/* SPDX-License-Identifier: GPL-2.0-only */
/*
 *  arch/arm/include/asm/atomic.h
 *
 *  Copyright (C) 1996 Russell King.
 *  Copyright (C) 2002 Deep Blue Solutions Ltd.
 */
#ifndef __ASM_ARM_ATOMIC_H
#define __ASM_ARM_ATOMIC_H

#include <linux/compiler.h>
#include <linux/prefetch.h>
#include <linux/types.h>
#include <linux/irqflags.h>
#include <asm/barrier.h>
#include <asm/cmpxchg.h>

#ifdef __KERNEL__

/*
 * On ARM, ordinary assignment (str instruction) doesn't clear the local
 * strex/ldrex monitor on some implementations. The reason we can use it for
 * atomic_set() is the clrex or dummy strex done on every exception return.
 */
#define atomic_read(v)	READ_ONCE((v)->counter)
#define atomic_set(v,i)	WRITE_ONCE(((v)->counter), (i))

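/*
 * Example use (illustrative; "nr_events" and "handle_events" are
 * hypothetical names, not part of this header):
 *
 *	static atomic_t nr_events = ATOMIC_INIT(0);
 *
 *	atomic_set(&nr_events, 0);
 *	if (atomic_read(&nr_events) > 0)
 *		handle_events();
 *
 * atomic_set() is the plain store described above; atomic_read() is a
 * READ_ONCE() load. Neither implies any ordering against other memory
 * accesses; use barriers or the _return/fetch_ variants for that.
 */
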
#if __LINUX_ARM_ARCH__ >= 6

/*
 * ARMv6 UP and SMP safe atomic ops.  We use load exclusive and
 * store exclusive to ensure that these are atomic.  We may loop
 * to ensure that the update happens.
 */

#define ATOMIC_OP(op, c_op, asm_op)					\
static inline void atomic_##op(int i, atomic_t *v)			\
{									\
	unsigned long tmp;						\
	int result;							\
									\
	prefetchw(&v->counter);						\
	__asm__ __volatile__("@ atomic_" #op "\n"			\
"1:	ldrex	%0, [%3]\n"						\
"	" #asm_op "	%0, %0, %4\n"					\
"	strex	%1, %0, [%3]\n"						\
"	teq	%1, #0\n"						\
"	bne	1b"							\
	: "=&r" (result), "=&r" (tmp), "+Qo" (v->counter)		\
	: "r" (&v->counter), "Ir" (i)					\
	: "cc");							\
}									\

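/*
 * Sketch of what ATOMIC_OP(add, +=, add) expands to (concrete registers
 * shown instead of the %-operands for readability):
 *
 *	static inline void atomic_add(int i, atomic_t *v)
 *	{
 *	1:	ldrex	r0, [&v->counter]	@ exclusive load of old value
 *		add	r0, r0, i		@ compute the new value
 *		strex	r1, r0, [&v->counter]	@ r1 = 0 only if still exclusive
 *		teq	r1, #0
 *		bne	1b			@ lost exclusivity: retry
 *	}
 *
 * The retry loop is what makes the read-modify-write atomic: the strex
 * fails whenever another observer touched the location since the ldrex.
 */
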
#define ATOMIC_OP_RETURN(op, c_op, asm_op)				\
static inline int atomic_##op##_return_relaxed(int i, atomic_t *v)	\
{									\
	unsigned long tmp;						\
	int result;							\
									\
	prefetchw(&v->counter);						\
									\
	__asm__ __volatile__("@ atomic_" #op "_return\n"		\
"1:	ldrex	%0, [%3]\n"						\
"	" #asm_op "	%0, %0, %4\n"					\
"	strex	%1, %0, [%3]\n"						\
"	teq	%1, #0\n"						\
"	bne	1b"							\
	: "=&r" (result), "=&r" (tmp), "+Qo" (v->counter)		\
	: "r" (&v->counter), "Ir" (i)					\
	: "cc");							\
									\
	return result;							\
}

#define ATOMIC_FETCH_OP(op, c_op, asm_op)				\
static inline int atomic_fetch_##op##_relaxed(int i, atomic_t *v)	\
{									\
	unsigned long tmp;						\
	int result, val;						\
									\
	prefetchw(&v->counter);						\
									\
	__asm__ __volatile__("@ atomic_fetch_" #op "\n"			\
"1:	ldrex	%0, [%4]\n"						\
"	" #asm_op "	%1, %0, %5\n"					\
"	strex	%2, %1, [%4]\n"						\
"	teq	%2, #0\n"						\
"	bne	1b"							\
	: "=&r" (result), "=&r" (val), "=&r" (tmp), "+Qo" (v->counter)	\
	: "r" (&v->counter), "Ir" (i)					\
	: "cc");							\
									\
	return result;							\
}

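/*
 * The three generators above differ only in what they hand back; with
 * v->counter == 2, for example:
 *
 *	atomic_add(3, v);			returns nothing
 *	atomic_add_return_relaxed(3, v);	returns 5 (the new value)
 *	atomic_fetch_add_relaxed(3, v);		returns 2 (the old value)
 *
 * The _relaxed forms are unordered; the generic atomic code builds the
 * fully ordered variants from them with explicit barriers.
 */
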
#define atomic_add_return_relaxed	atomic_add_return_relaxed
#define atomic_sub_return_relaxed	atomic_sub_return_relaxed
#define atomic_fetch_add_relaxed	atomic_fetch_add_relaxed
#define atomic_fetch_sub_relaxed	atomic_fetch_sub_relaxed

#define atomic_fetch_and_relaxed	atomic_fetch_and_relaxed
#define atomic_fetch_andnot_relaxed	atomic_fetch_andnot_relaxed
#define atomic_fetch_or_relaxed		atomic_fetch_or_relaxed
#define atomic_fetch_xor_relaxed	atomic_fetch_xor_relaxed

static inline int atomic_cmpxchg_relaxed(atomic_t *ptr, int old, int new)
{
	int oldval;
	unsigned long res;

	prefetchw(&ptr->counter);

	do {
		__asm__ __volatile__("@ atomic_cmpxchg\n"
		"ldrex	%1, [%3]\n"
		"mov	%0, #0\n"
		"teq	%1, %4\n"
		"strexeq %0, %5, [%3]\n"
		    : "=&r" (res), "=&r" (oldval), "+Qo" (ptr->counter)
		    : "r" (&ptr->counter), "Ir" (old), "r" (new)
		    : "cc");
	} while (res);

	return oldval;
}
#define atomic_cmpxchg_relaxed		atomic_cmpxchg_relaxed

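/*
 * cmpxchg is typically used in a loop that recomputes the new value from
 * a fresh snapshot whenever the race is lost. A sketch (the function is
 * hypothetical, not part of this header):
 *
 *	static bool saturating_inc(atomic_t *v, int max)
 *	{
 *		int old = atomic_read(v);
 *
 *		while (old < max) {
 *			int seen = atomic_cmpxchg(v, old, old + 1);
 *			if (seen == old)
 *				return true;
 *			old = seen;
 *		}
 *		return false;
 *	}
 *
 * seen != old means another CPU updated the counter first; the loop then
 * retries against the value that CPU stored.
 */
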
static inline int atomic_fetch_add_unless(atomic_t *v, int a, int u)
{
	int oldval, newval;
	unsigned long tmp;

	smp_mb();
	prefetchw(&v->counter);

	__asm__ __volatile__ ("@ atomic_add_unless\n"
"1:	ldrex	%0, [%4]\n"
"	teq	%0, %5\n"
"	beq	2f\n"
"	add	%1, %0, %6\n"
"	strex	%2, %1, [%4]\n"
"	teq	%2, #0\n"
"	bne	1b\n"
"2:"
	: "=&r" (oldval), "=&r" (newval), "=&r" (tmp), "+Qo" (v->counter)
	: "r" (&v->counter), "r" (u), "r" (a)
	: "cc");

	if (oldval != u)
		smp_mb();

	return oldval;
}
#define atomic_fetch_add_unless		atomic_fetch_add_unless

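/*
 * atomic_fetch_add_unless() is the building block for "take a reference
 * unless it already dropped to zero" patterns, e.g. (hypothetical helper):
 *
 *	static bool tryget(atomic_t *refcnt)
 *	{
 *		return atomic_fetch_add_unless(refcnt, 1, 0) != 0;
 *	}
 *
 * Note the conditional smp_mb() above: full ordering is only provided
 * when the addition actually took place.
 */
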
#else /* ARM_ARCH_6 */

#ifdef CONFIG_SMP
#error SMP not supported on pre-ARMv6 CPUs
#endif

#define ATOMIC_OP(op, c_op, asm_op)					\
static inline void atomic_##op(int i, atomic_t *v)			\
{									\
	unsigned long flags;						\
									\
	raw_local_irq_save(flags);					\
	v->counter c_op i;						\
	raw_local_irq_restore(flags);					\
}									\

#define ATOMIC_OP_RETURN(op, c_op, asm_op)				\
static inline int atomic_##op##_return(int i, atomic_t *v)		\
{									\
	unsigned long flags;						\
	int val;							\
									\
	raw_local_irq_save(flags);					\
	v->counter c_op i;						\
	val = v->counter;						\
	raw_local_irq_restore(flags);					\
									\
	return val;							\
}

#define ATOMIC_FETCH_OP(op, c_op, asm_op)				\
static inline int atomic_fetch_##op(int i, atomic_t *v)			\
{									\
	unsigned long flags;						\
	int val;							\
									\
	raw_local_irq_save(flags);					\
	val = v->counter;						\
	v->counter c_op i;						\
	raw_local_irq_restore(flags);					\
									\
	return val;							\
}

static inline int atomic_cmpxchg(atomic_t *v, int old, int new)
{
	int ret;
	unsigned long flags;

	raw_local_irq_save(flags);
	ret = v->counter;
	if (likely(ret == old))
		v->counter = new;
	raw_local_irq_restore(flags);

	return ret;
}

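/*
 * Pre-ARMv6 is necessarily UP (see the #error above), so masking local
 * interrupts is enough: the only code that could interleave with the
 * read-modify-write runs on the same CPU.  ATOMIC_OP_RETURN(add, +=, add),
 * for instance, reduces to:
 *
 *	raw_local_irq_save(flags);
 *	v->counter += i;
 *	val = v->counter;
 *	raw_local_irq_restore(flags);
 */
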
#define atomic_fetch_andnot		atomic_fetch_andnot

#endif /* __LINUX_ARM_ARCH__ */

#define ATOMIC_OPS(op, c_op, asm_op)					\
	ATOMIC_OP(op, c_op, asm_op)					\
	ATOMIC_OP_RETURN(op, c_op, asm_op)				\
	ATOMIC_FETCH_OP(op, c_op, asm_op)

ATOMIC_OPS(add, +=, add)
ATOMIC_OPS(sub, -=, sub)

#define atomic_andnot atomic_andnot

#undef ATOMIC_OPS
#define ATOMIC_OPS(op, c_op, asm_op)					\
	ATOMIC_OP(op, c_op, asm_op)					\
	ATOMIC_FETCH_OP(op, c_op, asm_op)

ATOMIC_OPS(and, &=, and)
ATOMIC_OPS(andnot, &= ~, bic)
ATOMIC_OPS(or,  |=, orr)
ATOMIC_OPS(xor, ^=, eor)

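/*
 * Note that the second ATOMIC_OPS() wave omits ATOMIC_OP_RETURN: the
 * bitwise ops only come in void and fetch flavours, so ATOMIC_OPS(or,
 * |=, orr) generates atomic_or() and atomic_fetch_or*() but no
 * atomic_or_return().
 */
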
#undef ATOMIC_OPS
#undef ATOMIC_FETCH_OP
#undef ATOMIC_OP_RETURN
#undef ATOMIC_OP

#define atomic_xchg(v, new) (xchg(&((v)->counter), new))

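/*
 * atomic_xchg() simply defers to the word-sized xchg().  Example use,
 * atomically reading and clearing a flag ("pending" and
 * "process_pending" are hypothetical names):
 *
 *	if (atomic_xchg(&pending, 0))
 *		process_pending();
 */
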
#ifndef CONFIG_GENERIC_ATOMIC64
typedef struct {
	s64 counter;
} atomic64_t;

#define ATOMIC64_INIT(i) { (i) }

#ifdef CONFIG_ARM_LPAE
static inline s64 atomic64_read(const atomic64_t *v)
{
	s64 result;

	__asm__ __volatile__("@ atomic64_read\n"
"	ldrd	%0, %H0, [%1]"
	: "=&r" (result)
	: "r" (&v->counter), "Qo" (v->counter)
	);

	return result;
}

static inline void atomic64_set(atomic64_t *v, s64 i)
{
	__asm__ __volatile__("@ atomic64_set\n"
"	strd	%2, %H2, [%1]"
	: "=Qo" (v->counter)
	: "r" (&v->counter), "r" (i)
	);
}
#else
static inline s64 atomic64_read(const atomic64_t *v)
{
	s64 result;

	__asm__ __volatile__("@ atomic64_read\n"
"	ldrexd	%0, %H0, [%1]"
	: "=&r" (result)
	: "r" (&v->counter), "Qo" (v->counter)
	);

	return result;
}

static inline void atomic64_set(atomic64_t *v, s64 i)
{
	s64 tmp;

	prefetchw(&v->counter);
	__asm__ __volatile__("@ atomic64_set\n"
"1:	ldrexd	%0, %H0, [%2]\n"
"	strexd	%0, %3, %H3, [%2]\n"
"	teq	%0, #0\n"
"	bne	1b"
	: "=&r" (tmp), "=Qo" (v->counter)
	: "r" (&v->counter), "r" (i)
	: "cc");
}
#endif

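/*
 * Why the LPAE split above: with LPAE, ldrd/strd to a 64-bit-aligned
 * address are architecturally single-copy atomic, so plain loads and
 * stores suffice.  Without LPAE, only the exclusive pair is atomic for
 * 64-bit data, so even atomic64_set() must loop:
 *
 *	1:	ldrexd	r0, r1, [&v->counter]	@ claim the exclusive monitor
 *		strexd	r0, lo(i), hi(i), [&v->counter]
 *		teq	r0, #0
 *		bne	1b
 */
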
#define ATOMIC64_OP(op, op1, op2)					\
static inline void atomic64_##op(s64 i, atomic64_t *v)			\
{									\
	s64 result;							\
	unsigned long tmp;						\
									\
	prefetchw(&v->counter);						\
	__asm__ __volatile__("@ atomic64_" #op "\n"			\
"1:	ldrexd	%0, %H0, [%3]\n"					\
"	" #op1 " %Q0, %Q0, %Q4\n"					\
"	" #op2 " %R0, %R0, %R4\n"					\
"	strexd	%1, %0, %H0, [%3]\n"					\
"	teq	%1, #0\n"						\
"	bne	1b"							\
	: "=&r" (result), "=&r" (tmp), "+Qo" (v->counter)		\
	: "r" (&v->counter), "r" (i)					\
	: "cc");							\
}									\

#define ATOMIC64_OP_RETURN(op, op1, op2)				\
static inline s64							\
atomic64_##op##_return_relaxed(s64 i, atomic64_t *v)			\
{									\
	s64 result;							\
	unsigned long tmp;						\
									\
	prefetchw(&v->counter);						\
									\
	__asm__ __volatile__("@ atomic64_" #op "_return\n"		\
"1:	ldrexd	%0, %H0, [%3]\n"					\
"	" #op1 " %Q0, %Q0, %Q4\n"					\
"	" #op2 " %R0, %R0, %R4\n"					\
"	strexd	%1, %0, %H0, [%3]\n"					\
"	teq	%1, #0\n"						\
"	bne	1b"							\
	: "=&r" (result), "=&r" (tmp), "+Qo" (v->counter)		\
	: "r" (&v->counter), "r" (i)					\
	: "cc");							\
									\
	return result;							\
}

#define ATOMIC64_FETCH_OP(op, op1, op2)					\
static inline s64							\
atomic64_fetch_##op##_relaxed(s64 i, atomic64_t *v)			\
{									\
	s64 result, val;						\
	unsigned long tmp;						\
									\
	prefetchw(&v->counter);						\
									\
	__asm__ __volatile__("@ atomic64_fetch_" #op "\n"		\
"1:	ldrexd	%0, %H0, [%4]\n"					\
"	" #op1 " %Q1, %Q0, %Q5\n"					\
"	" #op2 " %R1, %R0, %R5\n"					\
"	strexd	%2, %1, %H1, [%4]\n"					\
"	teq	%2, #0\n"						\
"	bne	1b"							\
	: "=&r" (result), "=&r" (val), "=&r" (tmp), "+Qo" (v->counter)	\
	: "r" (&v->counter), "r" (i)					\
	: "cc");							\
									\
	return result;							\
}

#define ATOMIC64_OPS(op, op1, op2)					\
	ATOMIC64_OP(op, op1, op2)					\
	ATOMIC64_OP_RETURN(op, op1, op2)				\
	ATOMIC64_FETCH_OP(op, op1, op2)

ATOMIC64_OPS(add, adds, adc)
ATOMIC64_OPS(sub, subs, sbc)

#define atomic64_add_return_relaxed	atomic64_add_return_relaxed
#define atomic64_sub_return_relaxed	atomic64_sub_return_relaxed
#define atomic64_fetch_add_relaxed	atomic64_fetch_add_relaxed
#define atomic64_fetch_sub_relaxed	atomic64_fetch_sub_relaxed

#undef ATOMIC64_OPS
#define ATOMIC64_OPS(op, op1, op2)					\
	ATOMIC64_OP(op, op1, op2)					\
	ATOMIC64_FETCH_OP(op, op1, op2)

#define atomic64_andnot atomic64_andnot

ATOMIC64_OPS(and, and, and)
ATOMIC64_OPS(andnot, bic, bic)
ATOMIC64_OPS(or,  orr, orr)
ATOMIC64_OPS(xor, eor, eor)

#define atomic64_fetch_and_relaxed	atomic64_fetch_and_relaxed
#define atomic64_fetch_andnot_relaxed	atomic64_fetch_andnot_relaxed
#define atomic64_fetch_or_relaxed	atomic64_fetch_or_relaxed
#define atomic64_fetch_xor_relaxed	atomic64_fetch_xor_relaxed

#undef ATOMIC64_OPS
#undef ATOMIC64_FETCH_OP
#undef ATOMIC64_OP_RETURN
#undef ATOMIC64_OP

static inline s64 atomic64_cmpxchg_relaxed(atomic64_t *ptr, s64 old, s64 new)
{
	s64 oldval;
	unsigned long res;

	prefetchw(&ptr->counter);

	do {
		__asm__ __volatile__("@ atomic64_cmpxchg\n"
		"ldrexd		%1, %H1, [%3]\n"
		"mov		%0, #0\n"
		"teq		%1, %4\n"
		"teqeq		%H1, %H4\n"
		"strexdeq	%0, %5, %H5, [%3]"
		: "=&r" (res), "=&r" (oldval), "+Qo" (ptr->counter)
		: "r" (&ptr->counter), "r" (old), "r" (new)
		: "cc");
	} while (res);

	return oldval;
}
#define atomic64_cmpxchg_relaxed	atomic64_cmpxchg_relaxed

static inline s64 atomic64_xchg_relaxed(atomic64_t *ptr, s64 new)
{
	s64 result;
	unsigned long tmp;

	prefetchw(&ptr->counter);

	__asm__ __volatile__("@ atomic64_xchg\n"
"1:	ldrexd	%0, %H0, [%3]\n"
"	strexd	%1, %4, %H4, [%3]\n"
"	teq	%1, #0\n"
"	bne	1b"
	: "=&r" (result), "=&r" (tmp), "+Qo" (ptr->counter)
	: "r" (&ptr->counter), "r" (new)
	: "cc");

	return result;
}
#define atomic64_xchg_relaxed		atomic64_xchg_relaxed

static inline s64 atomic64_dec_if_positive(atomic64_t *v)
{
	s64 result;
	unsigned long tmp;

	smp_mb();
	prefetchw(&v->counter);

	__asm__ __volatile__("@ atomic64_dec_if_positive\n"
"1:	ldrexd	%0, %H0, [%3]\n"
"	subs	%Q0, %Q0, #1\n"
"	sbc	%R0, %R0, #0\n"
"	teq	%R0, #0\n"
"	bmi	2f\n"
"	strexd	%1, %0, %H0, [%3]\n"
"	teq	%1, #0\n"
"	bne	1b\n"
"2:"
	: "=&r" (result), "=&r" (tmp), "+Qo" (v->counter)
	: "r" (&v->counter)
	: "cc");

	smp_mb();

	return result;
}
#define atomic64_dec_if_positive atomic64_dec_if_positive

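/*
 * atomic64_dec_if_positive() only stores when the decremented value is
 * still >= 0, and returns the decremented value either way (without
 * storing it when negative), e.g. ("budget" is a hypothetical counter):
 *
 *	if (atomic64_dec_if_positive(&budget) < 0)
 *		return -EBUSY;	budget was already 0, nothing consumed
 *
 * Unlike the _relaxed cmpxchg/xchg above, it is fully ordered via the
 * smp_mb() calls on both sides.
 */
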
static inline s64 atomic64_fetch_add_unless(atomic64_t *v, s64 a, s64 u)
{
	s64 oldval, newval;
	unsigned long tmp;

	smp_mb();
	prefetchw(&v->counter);

	__asm__ __volatile__("@ atomic64_add_unless\n"
"1:	ldrexd	%0, %H0, [%4]\n"
"	teq	%0, %5\n"
"	teqeq	%H0, %H5\n"
"	beq	2f\n"
"	adds	%Q1, %Q0, %Q6\n"
"	adc	%R1, %R0, %R6\n"
"	strexd	%2, %1, %H1, [%4]\n"
"	teq	%2, #0\n"
"	bne	1b\n"
"2:"
	: "=&r" (oldval), "=&r" (newval), "=&r" (tmp), "+Qo" (v->counter)
	: "r" (&v->counter), "r" (u), "r" (a)
	: "cc");

	if (oldval != u)
		smp_mb();

	return oldval;
}
#define atomic64_fetch_add_unless atomic64_fetch_add_unless

#endif /* !CONFIG_GENERIC_ATOMIC64 */
#endif
#endif