/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * Copyright (C) 2004, 2007-2010, 2011-2012 Synopsys, Inc. (www.synopsys.com)
 */

#ifndef _ASM_ARC_ATOMIC_H
#define _ASM_ARC_ATOMIC_H

#ifndef __ASSEMBLY__

#include <linux/types.h>
#include <linux/compiler.h>
#include <asm/cmpxchg.h>
#include <asm/barrier.h>
#include <asm/smp.h>

#define atomic_read(v)  READ_ONCE((v)->counter)

#ifdef CONFIG_ARC_HAS_LLSC

#define atomic_set(v, i) WRITE_ONCE(((v)->counter), (i))

#define ATOMIC_OP(op, c_op, asm_op) \
static inline void atomic_##op(int i, atomic_t *v) \
{ \
        unsigned int val; \
 \
        __asm__ __volatile__( \
        "1:     llock   %[val], [%[ctr]]                \n" \
        "       " #asm_op " %[val], %[val], %[i]        \n" \
        "       scond   %[val], [%[ctr]]                \n" \
        "       bnz     1b                              \n" \
        : [val] "=&r" (val) /* Early clobber to prevent reg reuse */ \
        : [ctr] "r" (&v->counter), /* Not "m": llock only supports reg direct addr mode */ \
          [i] "ir" (i) \
        : "cc"); \
} \

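/*
 * Purely illustrative sketch (not part of this header's API): with
 * CONFIG_ARC_HAS_LLSC, ATOMIC_OP(add, +=, add) above generates roughly the
 * following function. The c_op argument is unused here and only matters for
 * the spinlock-based fallback further down.
 *
 *	static inline void atomic_add(int i, atomic_t *v)
 *	{
 *		unsigned int val;
 *
 *		__asm__ __volatile__(
 *		"1:	llock   %[val], [%[ctr]]	\n"
 *		"	add     %[val], %[val], %[i]	\n"
 *		"	scond   %[val], [%[ctr]]	\n"
 *		"	bnz     1b			\n"
 *		: [val] "=&r" (val)
 *		: [ctr] "r" (&v->counter), [i] "ir" (i)
 *		: "cc");
 *	}
 *
 * i.e. the counter is reloaded and the add retried until the
 * store-conditional (scond) succeeds.
 */
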
#define ATOMIC_OP_RETURN(op, c_op, asm_op) \
static inline int atomic_##op##_return(int i, atomic_t *v) \
{ \
        unsigned int val; \
 \
        /* \
         * Explicit full memory barrier needed before/after as \
         * LLOCK/SCOND themselves don't provide any such semantics \
         */ \
        smp_mb(); \
 \
        __asm__ __volatile__( \
        "1:     llock   %[val], [%[ctr]]                \n" \
        "       " #asm_op " %[val], %[val], %[i]        \n" \
        "       scond   %[val], [%[ctr]]                \n" \
        "       bnz     1b                              \n" \
        : [val] "=&r" (val) \
        : [ctr] "r" (&v->counter), \
          [i] "ir" (i) \
        : "cc"); \
 \
        smp_mb(); \
 \
        return val; \
}

#define ATOMIC_FETCH_OP(op, c_op, asm_op) \
static inline int atomic_fetch_##op(int i, atomic_t *v) \
{ \
        unsigned int val, orig; \
 \
        /* \
         * Explicit full memory barrier needed before/after as \
         * LLOCK/SCOND themselves don't provide any such semantics \
         */ \
        smp_mb(); \
 \
        __asm__ __volatile__( \
        "1:     llock   %[orig], [%[ctr]]               \n" \
        "       " #asm_op " %[val], %[orig], %[i]       \n" \
        "       scond   %[val], [%[ctr]]                \n" \
        "       bnz     1b                              \n" \
        : [val] "=&r" (val), \
          [orig] "=&r" (orig) \
        : [ctr] "r" (&v->counter), \
          [i] "ir" (i) \
        : "cc"); \
 \
        smp_mb(); \
 \
        return orig; \
}
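
/*
 * Note on ordering (summarising the comments above): the plain atomic_##op()
 * helpers issue no barriers, whereas the _return and fetch_ variants bracket
 * the LLOCK/SCOND retry loop with smp_mb() so that they are fully ordered,
 * as the value-returning atomic API requires.
 */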

#else /* !CONFIG_ARC_HAS_LLSC */

#ifndef CONFIG_SMP

 /* violating atomic_xxx API locking protocol in UP for optimization sake */
#define atomic_set(v, i) WRITE_ONCE(((v)->counter), (i))

#else

static inline void atomic_set(atomic_t *v, int i)
{
        /*
         * Independent of hardware support, all of the atomic_xxx() APIs need
         * to follow the same locking rules to make sure that a "hardware"
         * atomic insn (e.g. LD) doesn't clobber an "emulated" atomic insn
         * sequence
         *
         * Thus atomic_set() despite being 1 insn (and seemingly atomic)
         * requires the locking.
         */
        unsigned long flags;

        atomic_ops_lock(flags);
        WRITE_ONCE(v->counter, i);
        atomic_ops_unlock(flags);
}

#define atomic_set_release(v, i) atomic_set((v), (i))

#endif

/*
 * Non hardware assisted Atomic-R-M-W
 * Locking would change to irq-disabling only (UP) and spinlocks (SMP)
 */

#define ATOMIC_OP(op, c_op, asm_op) \
static inline void atomic_##op(int i, atomic_t *v) \
{ \
        unsigned long flags; \
 \
        atomic_ops_lock(flags); \
        v->counter c_op i; \
        atomic_ops_unlock(flags); \
}
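
/*
 * Illustrative sketch only: in this !LLSC configuration the same
 * ATOMIC_OP(add, +=, add) instantiation expands to roughly
 *
 *	static inline void atomic_add(int i, atomic_t *v)
 *	{
 *		unsigned long flags;
 *
 *		atomic_ops_lock(flags);
 *		v->counter += i;
 *		atomic_ops_unlock(flags);
 *	}
 *
 * where atomic_ops_lock()/unlock() (provided via <asm/smp.h>) reduce to IRQ
 * disabling on UP and to a spinlock on SMP, per the comment above.
 */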

#define ATOMIC_OP_RETURN(op, c_op, asm_op) \
static inline int atomic_##op##_return(int i, atomic_t *v) \
{ \
        unsigned long flags; \
        unsigned long temp; \
 \
        /* \
         * spin lock/unlock provides the needed smp_mb() before/after \
         */ \
        atomic_ops_lock(flags); \
        temp = v->counter; \
        temp c_op i; \
        v->counter = temp; \
        atomic_ops_unlock(flags); \
 \
        return temp; \
}

#define ATOMIC_FETCH_OP(op, c_op, asm_op) \
static inline int atomic_fetch_##op(int i, atomic_t *v) \
{ \
        unsigned long flags; \
        unsigned long orig; \
 \
        /* \
         * spin lock/unlock provides the needed smp_mb() before/after \
         */ \
        atomic_ops_lock(flags); \
        orig = v->counter; \
        v->counter c_op i; \
        atomic_ops_unlock(flags); \
 \
        return orig; \
}

#endif /* !CONFIG_ARC_HAS_LLSC */

#define ATOMIC_OPS(op, c_op, asm_op) \
        ATOMIC_OP(op, c_op, asm_op) \
        ATOMIC_OP_RETURN(op, c_op, asm_op) \
        ATOMIC_FETCH_OP(op, c_op, asm_op)

ATOMIC_OPS(add, +=, add)
ATOMIC_OPS(sub, -=, sub)

#define atomic_andnot           atomic_andnot
#define atomic_fetch_andnot     atomic_fetch_andnot

#undef ATOMIC_OPS
#define ATOMIC_OPS(op, c_op, asm_op) \
        ATOMIC_OP(op, c_op, asm_op) \
        ATOMIC_FETCH_OP(op, c_op, asm_op)

ATOMIC_OPS(and, &=, and)
ATOMIC_OPS(andnot, &= ~, bic)
ATOMIC_OPS(or, |=, or)
ATOMIC_OPS(xor, ^=, xor)
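
/*
 * For reference, the ATOMIC_OPS() instantiations above generate:
 *   - atomic_add(), atomic_add_return(), atomic_fetch_add()
 *   - atomic_sub(), atomic_sub_return(), atomic_fetch_sub()
 *   - atomic_and(),    atomic_fetch_and()
 *   - atomic_andnot(), atomic_fetch_andnot()
 *   - atomic_or(),     atomic_fetch_or()
 *   - atomic_xor(),    atomic_fetch_xor()
 * The bitwise ops deliberately omit the _return flavour: the atomic_t API
 * does not define _return variants for those operations.
 */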

#undef ATOMIC_OPS
#undef ATOMIC_FETCH_OP
#undef ATOMIC_OP_RETURN
#undef ATOMIC_OP

#ifdef CONFIG_GENERIC_ATOMIC64

#include <asm-generic/atomic64.h>

#else /* Kconfig ensures this is only enabled with needed h/w assist */

/*
 * ARCv2 supports 64-bit exclusive load (LLOCKD) / store (SCONDD)
 *  - The address HAS to be 64-bit aligned
 *  - There are 2 semantics involved here:
 *    = exclusive implies no interim update between load/store to same addr
 *    = both words are observed/updated together: this is guaranteed even
 *      for regular 64-bit load (LDD) / store (STD). Thus atomic64_set()
 *      is NOT required to use LLOCKD+SCONDD, STD suffices
 */

typedef struct {
        s64 __aligned(8) counter;
} atomic64_t;

#define ATOMIC64_INIT(a) { (a) }

static inline s64 atomic64_read(const atomic64_t *v)
{
        s64 val;

        __asm__ __volatile__(
        "       ldd   %0, [%1]  \n"
        : "=r"(val)
        : "r"(&v->counter));

        return val;
}

static inline void atomic64_set(atomic64_t *v, s64 a)
{
        /*
         * This could have been a simple assignment in "C" but would need
         * explicit volatile. Otherwise gcc optimizers could elide the store
         * which borked atomic64 self-test
         * In the inline asm version, memory clobber needed for exact same
         * reason, to tell gcc about the store.
         *
         * This however is not needed for sibling atomic64_add() etc since both
         * load/store are explicitly done in inline asm. As long as API is used
         * for each access, gcc has no way to optimize away any load/store
         */
        __asm__ __volatile__(
        "       std   %0, [%1]  \n"
        :
        : "r"(a), "r"(&v->counter)
        : "memory");
}

#define ATOMIC64_OP(op, op1, op2) \
static inline void atomic64_##op(s64 a, atomic64_t *v) \
{ \
        s64 val; \
 \
        __asm__ __volatile__( \
        "1:                             \n" \
        "       llockd  %0, [%1]        \n" \
        "       " #op1 " %L0, %L0, %L2  \n" \
        "       " #op2 " %H0, %H0, %H2  \n" \
        "       scondd  %0, [%1]        \n" \
        "       bnz     1b              \n" \
        : "=&r"(val) \
        : "r"(&v->counter), "ir"(a) \
        : "cc"); \
} \

#define ATOMIC64_OP_RETURN(op, op1, op2) \
static inline s64 atomic64_##op##_return(s64 a, atomic64_t *v) \
{ \
        s64 val; \
 \
        smp_mb(); \
 \
        __asm__ __volatile__( \
        "1:                             \n" \
        "       llockd  %0, [%1]        \n" \
        "       " #op1 " %L0, %L0, %L2  \n" \
        "       " #op2 " %H0, %H0, %H2  \n" \
        "       scondd  %0, [%1]        \n" \
        "       bnz     1b              \n" \
        : [val] "=&r"(val) \
        : "r"(&v->counter), "ir"(a) \
        : "cc"); /* memory clobber comes from smp_mb() */ \
 \
        smp_mb(); \
 \
        return val; \
}

#define ATOMIC64_FETCH_OP(op, op1, op2) \
static inline s64 atomic64_fetch_##op(s64 a, atomic64_t *v) \
{ \
        s64 val, orig; \
 \
        smp_mb(); \
 \
        __asm__ __volatile__( \
        "1:                             \n" \
        "       llockd  %0, [%2]        \n" \
        "       " #op1 " %L1, %L0, %L3  \n" \
        "       " #op2 " %H1, %H0, %H3  \n" \
        "       scondd  %1, [%2]        \n" \
        "       bnz     1b              \n" \
        : "=&r"(orig), "=&r"(val) \
        : "r"(&v->counter), "ir"(a) \
        : "cc"); /* memory clobber comes from smp_mb() */ \
 \
        smp_mb(); \
 \
        return orig; \
}

#define ATOMIC64_OPS(op, op1, op2) \
        ATOMIC64_OP(op, op1, op2) \
        ATOMIC64_OP_RETURN(op, op1, op2) \
        ATOMIC64_FETCH_OP(op, op1, op2)

#define atomic64_andnot         atomic64_andnot
#define atomic64_fetch_andnot   atomic64_fetch_andnot

ATOMIC64_OPS(add, add.f, adc)
ATOMIC64_OPS(sub, sub.f, sbc)
ATOMIC64_OPS(and, and, and)
ATOMIC64_OPS(andnot, bic, bic)
ATOMIC64_OPS(or, or, or)
ATOMIC64_OPS(xor, xor, xor)
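
/*
 * Note on the (op1, op2) pairs above: the 64-bit value lives in a register
 * pair (%L = low word, %H = high word), so add/sub must propagate the carry
 * or borrow between the halves: add.f sets the carry flag which adc consumes,
 * and sub.f/sbc do the same for borrow. The bitwise ops act on each half
 * independently, hence the same mnemonic is used for both words.
 */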

#undef ATOMIC64_OPS
#undef ATOMIC64_FETCH_OP
#undef ATOMIC64_OP_RETURN
#undef ATOMIC64_OP

static inline s64
atomic64_cmpxchg(atomic64_t *ptr, s64 expected, s64 new)
{
        s64 prev;

        smp_mb();

        __asm__ __volatile__(
        "1:     llockd  %0, [%1]        \n"
        "       brne    %L0, %L2, 2f   \n"
        "       brne    %H0, %H2, 2f   \n"
        "       scondd  %3, [%1]        \n"
        "       bnz     1b              \n"
        "2:                             \n"
        : "=&r"(prev)
        : "r"(ptr), "ir"(expected), "r"(new)
        : "cc"); /* memory clobber comes from smp_mb() */

        smp_mb();

        return prev;
}

static inline s64 atomic64_xchg(atomic64_t *ptr, s64 new)
{
        s64 prev;

        smp_mb();

        __asm__ __volatile__(
        "1:     llockd  %0, [%1]        \n"
        "       scondd  %2, [%1]        \n"
        "       bnz     1b              \n"
        "2:                             \n"
        : "=&r"(prev)
        : "r"(ptr), "r"(new)
        : "cc"); /* memory clobber comes from smp_mb() */

        smp_mb();

        return prev;
}

/**
 * atomic64_dec_if_positive - decrement by 1 if old value positive
 * @v: pointer of type atomic64_t
 *
 * The function returns the old value of *v minus 1, even if
 * the atomic variable, v, was not decremented.
 */

static inline s64 atomic64_dec_if_positive(atomic64_t *v)
{
        s64 val;

        smp_mb();

        __asm__ __volatile__(
        "1:     llockd  %0, [%1]        \n"
        "       sub.f   %L0, %L0, 1     # w0 - 1, set C on borrow\n"
        "       sub.c   %H0, %H0, 1     # if C set, w1 - 1\n"
        "       brlt    %H0, 0, 2f      \n"
        "       scondd  %0, [%1]        \n"
        "       bnz     1b              \n"
        "2:                             \n"
        : "=&r"(val)
        : "r"(&v->counter)
        : "cc"); /* memory clobber comes from smp_mb() */

        smp_mb();

        return val;
}
#define atomic64_dec_if_positive atomic64_dec_if_positive
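
/*
 * Hypothetical usage sketch (illustration only): because the old value minus
 * one is returned even when no store was performed, a caller can use the sign
 * of the result to tell whether the decrement actually happened:
 *
 *	if (atomic64_dec_if_positive(&v) < 0)
 *		return -EBUSY;	// v was already <= 0 and was left untouched
 */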

/**
 * atomic64_fetch_add_unless - add unless the number is a given value
 * @v: pointer of type atomic64_t
 * @a: the amount to add to v...
 * @u: ...unless v is equal to u.
 *
 * Atomically adds @a to @v, if it was not @u.
 * Returns the old value of @v
 */
static inline s64 atomic64_fetch_add_unless(atomic64_t *v, s64 a, s64 u)
{
        s64 old, temp;

        smp_mb();

        __asm__ __volatile__(
        "1:     llockd  %0, [%2]        \n"
        "       brne    %L0, %L4, 2f    # continue to add since v != u \n"
        "       breq.d  %H0, %H4, 3f    # return since v == u \n"
        "2:                             \n"
        "       add.f   %L1, %L0, %L3   \n"
        "       adc     %H1, %H0, %H3   \n"
        "       scondd  %1, [%2]        \n"
        "       bnz     1b              \n"
        "3:                             \n"
        : "=&r"(old), "=&r" (temp)
        : "r"(&v->counter), "r"(a), "r"(u)
        : "cc"); /* memory clobber comes from smp_mb() */

        smp_mb();

        return old;
}
#define atomic64_fetch_add_unless atomic64_fetch_add_unless
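
/*
 * Illustration only: the generic atomic64_add_unless() helper is built on top
 * of this primitive by the common atomic fallbacks, roughly as
 *
 *	static inline bool atomic64_add_unless(atomic64_t *v, s64 a, s64 u)
 *	{
 *		return atomic64_fetch_add_unless(v, a, u) != u;
 *	}
 *
 * i.e. it reports whether the add was actually performed.
 */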

#endif /* !CONFIG_GENERIC_ATOMIC64 */

#endif /* !__ASSEMBLY__ */

#endif