/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * Bit operations for the Hexagon architecture
 *
 * Copyright (c) 2010-2011, The Linux Foundation. All rights reserved.
 */

#ifndef _ASM_BITOPS_H
#define _ASM_BITOPS_H

#include <linux/compiler.h>
#include <asm/byteorder.h>
#include <asm/atomic.h>
#include <asm/barrier.h>

#ifdef __KERNEL__

/*
 * The offset calculations for these are based on BITS_PER_LONG == 32
 * (i.e. I get to shift by #5-2 (32 bits per long, 4 bytes per access),
 * mask by 0x0000001F)
 *
 * Typically, R10 is clobbered for address, R11 bit nr, and R12 is temp
 */

/**
 * test_and_clear_bit - clear a bit and return its old value
 * @nr:  bit number to clear
 * @addr:  pointer to memory
 *
 * Clears bit @nr of the bitmap starting at @addr with a
 * load-locked/store-conditional retry loop on the 32-bit word that
 * contains the bit.
 *
 * Return: 1 if the bit was set before the operation, 0 otherwise.
 */
static inline int test_and_clear_bit(int nr, volatile void *addr)
{
	int oldval;

	__asm__ __volatile__ (
	/* R10 = addr, R11 = word index (nr >> 5) */
	" {R10 = %1; R11 = asr(%2,#5); }\n"
	/* R10 += word index * 4 bytes, R11 = bit within the word (nr & 31) */
	" {R10 += asl(R11,#2); R11 = and(%2,#0x1f)}\n"
	/* load-locked the word */
	"1: R12 = memw_locked(R10);\n"
	/* P0 = old bit value, R12 = word with the bit cleared */
	" { P0 = tstbit(R12,R11); R12 = clrbit(R12,R11); }\n"
	/* store-conditional; P1 reports whether the store succeeded */
	" memw_locked(R10,P1) = R12;\n"
	/* retry on failure; convert the saved predicate to 0/1 */
	" {if (!P1) jump 1b; %0 = mux(P0,#1,#0);}\n"
	: "=&r" (oldval)
	: "r" (addr), "r" (nr)
	: "r10", "r11", "r12", "p0", "p1", "memory"
	);

	return oldval;
}

/**
 * test_and_set_bit - set a bit and return its old value
 * @nr:  bit number to set
 * @addr:  pointer to memory
 *
 * Sets bit @nr of the bitmap starting at @addr with a
 * load-locked/store-conditional retry loop on the 32-bit word that
 * contains the bit.
 *
 * Return: 1 if the bit was set before the operation, 0 otherwise.
 */
static inline int test_and_set_bit(int nr, volatile void *addr)
{
	int oldval;

	__asm__ __volatile__ (
	/* R10 = addr, R11 = word index (nr >> 5) */
	" {R10 = %1; R11 = asr(%2,#5); }\n"
	/* R10 += word index * 4 bytes, R11 = bit within the word (nr & 31) */
	" {R10 += asl(R11,#2); R11 = and(%2,#0x1f)}\n"
	/* load-locked the word */
	"1: R12 = memw_locked(R10);\n"
	/* P0 = old bit value, R12 = word with the bit set */
	" { P0 = tstbit(R12,R11); R12 = setbit(R12,R11); }\n"
	/* store-conditional; P1 reports whether the store succeeded */
	" memw_locked(R10,P1) = R12;\n"
	/* retry on failure; convert the saved predicate to 0/1 */
	" {if (!P1) jump 1b; %0 = mux(P0,#1,#0);}\n"
	: "=&r" (oldval)
	: "r" (addr), "r" (nr)
	: "r10", "r11", "r12", "p0", "p1", "memory"
	);

	return oldval;
}

/**
 * test_and_change_bit - toggle a bit and return its old value
 * @nr:  bit number to toggle
 * @addr:  pointer to memory
 *
 * Inverts bit @nr of the bitmap starting at @addr with a
 * load-locked/store-conditional retry loop on the 32-bit word that
 * contains the bit.
 *
 * Return: 1 if the bit was set before the operation, 0 otherwise.
 */
static inline int test_and_change_bit(int nr, volatile void *addr)
{
	int oldval;

	__asm__ __volatile__ (
	/* R10 = addr, R11 = word index (nr >> 5) */
	" {R10 = %1; R11 = asr(%2,#5); }\n"
	/* R10 += word index * 4 bytes, R11 = bit within the word (nr & 31) */
	" {R10 += asl(R11,#2); R11 = and(%2,#0x1f)}\n"
	/* load-locked the word */
	"1: R12 = memw_locked(R10);\n"
	/* P0 = old bit value, R12 = word with the bit inverted */
	" { P0 = tstbit(R12,R11); R12 = togglebit(R12,R11); }\n"
	/* store-conditional; P1 reports whether the store succeeded */
	" memw_locked(R10,P1) = R12;\n"
	/* retry on failure; convert the saved predicate to 0/1 */
	" {if (!P1) jump 1b; %0 = mux(P0,#1,#0);}\n"
	: "=&r" (oldval)
	: "r" (addr), "r" (nr)
	: "r10", "r11", "r12", "p0", "p1", "memory"
	);

	return oldval;
}

/*
 * Atomic, but doesn't care about the return value.
 * Rewrite later to save a cycle or two.
 */

/*
 * clear_bit - clear bit @nr in the bitmap at @addr.
 *
 * Thin wrapper around test_and_clear_bit() that discards the old value.
 */
static inline void clear_bit(int nr, volatile void *addr)
{
	test_and_clear_bit(nr, addr);
}

/*
 * set_bit - set bit @nr in the bitmap at @addr.
 *
 * Thin wrapper around test_and_set_bit() that discards the old value.
 */
static inline void set_bit(int nr, volatile void *addr)
{
	test_and_set_bit(nr, addr);
}

/*
 * change_bit - toggle bit @nr in the bitmap at @addr.
 *
 * Thin wrapper around test_and_change_bit() that discards the old value.
 */
static inline void change_bit(int nr, volatile void *addr)
{
	test_and_change_bit(nr, addr);
}


/*
 * These are allowed to be non-atomic.  In fact the generic flavors are
 * in non-atomic.h.  Would it be better to use intrinsics for this?
 *
 * OK, writes in our architecture do not invalidate LL/SC, so this has to
 * be atomic, particularly for things like slab_lock and slab_unlock.
 *
 */
/*
 * __clear_bit - clear bit @nr in the bitmap at @addr.
 *
 * Deliberately routed through the LL/SC based test_and_clear_bit() rather
 * than a plain read-modify-write; the old value is discarded.
 */
static inline void __clear_bit(int nr, volatile unsigned long *addr)
{
	test_and_clear_bit(nr, addr);
}

/*
 * __set_bit - set bit @nr in the bitmap at @addr.
 *
 * Deliberately routed through the LL/SC based test_and_set_bit() rather
 * than a plain read-modify-write; the old value is discarded.
 */
static inline void __set_bit(int nr, volatile unsigned long *addr)
{
	test_and_set_bit(nr, addr);
}

/*
 * __change_bit - toggle bit @nr in the bitmap at @addr.
 *
 * Deliberately routed through the LL/SC based test_and_change_bit() rather
 * than a plain read-modify-write; the old value is discarded.
 */
static inline void __change_bit(int nr, volatile unsigned long *addr)
{
	test_and_change_bit(nr, addr);
}

/* Apparently, at least some of these are allowed to be non-atomic */
/*
 * __test_and_clear_bit - clear bit @nr at @addr and return its old value.
 *
 * Forwards to test_and_clear_bit(); returns 1 if the bit was previously
 * set, 0 otherwise.
 */
static inline int __test_and_clear_bit(int nr, volatile unsigned long *addr)
{
	return test_and_clear_bit(nr, addr);
}

/*
 * __test_and_set_bit - set bit @nr at @addr and return its old value.
 *
 * Forwards to test_and_set_bit(); returns 1 if the bit was previously
 * set, 0 otherwise.
 */
static inline int __test_and_set_bit(int nr, volatile unsigned long *addr)
{
	return test_and_set_bit(nr, addr);
}

/*
 * __test_and_change_bit - toggle bit @nr at @addr and return its old value.
 *
 * Forwards to test_and_change_bit(); returns 1 if the bit was previously
 * set, 0 otherwise.
 */
static inline int __test_and_change_bit(int nr, volatile unsigned long *addr)
{
	return test_and_change_bit(nr, addr);
}

__test_bit(int nr,const volatile unsigned long * addr)161*4882a593Smuzhiyun static inline int __test_bit(int nr, const volatile unsigned long *addr)
162*4882a593Smuzhiyun {
163*4882a593Smuzhiyun int retval;
164*4882a593Smuzhiyun
165*4882a593Smuzhiyun asm volatile(
166*4882a593Smuzhiyun "{P0 = tstbit(%1,%2); if (P0.new) %0 = #1; if (!P0.new) %0 = #0;}\n"
167*4882a593Smuzhiyun : "=&r" (retval)
168*4882a593Smuzhiyun : "r" (addr[BIT_WORD(nr)]), "r" (nr % BITS_PER_LONG)
169*4882a593Smuzhiyun : "p0"
170*4882a593Smuzhiyun );
171*4882a593Smuzhiyun
172*4882a593Smuzhiyun return retval;
173*4882a593Smuzhiyun }
174*4882a593Smuzhiyun
/* test_bit() is simply an alias for __test_bit() here. */
#define test_bit(nr, addr) __test_bit(nr, addr)

177*4882a593Smuzhiyun /*
178*4882a593Smuzhiyun * ffz - find first zero in word.
179*4882a593Smuzhiyun * @word: The word to search
180*4882a593Smuzhiyun *
181*4882a593Smuzhiyun * Undefined if no zero exists, so code should check against ~0UL first.
182*4882a593Smuzhiyun */
ffz(int x)183*4882a593Smuzhiyun static inline long ffz(int x)
184*4882a593Smuzhiyun {
185*4882a593Smuzhiyun int r;
186*4882a593Smuzhiyun
187*4882a593Smuzhiyun asm("%0 = ct1(%1);\n"
188*4882a593Smuzhiyun : "=&r" (r)
189*4882a593Smuzhiyun : "r" (x));
190*4882a593Smuzhiyun return r;
191*4882a593Smuzhiyun }
192*4882a593Smuzhiyun
193*4882a593Smuzhiyun /*
194*4882a593Smuzhiyun * fls - find last (most-significant) bit set
195*4882a593Smuzhiyun * @x: the word to search
196*4882a593Smuzhiyun *
197*4882a593Smuzhiyun * This is defined the same way as ffs.
198*4882a593Smuzhiyun * Note fls(0) = 0, fls(1) = 1, fls(0x80000000) = 32.
199*4882a593Smuzhiyun */
fls(unsigned int x)200*4882a593Smuzhiyun static inline int fls(unsigned int x)
201*4882a593Smuzhiyun {
202*4882a593Smuzhiyun int r;
203*4882a593Smuzhiyun
204*4882a593Smuzhiyun asm("{ %0 = cl0(%1);}\n"
205*4882a593Smuzhiyun "%0 = sub(#32,%0);\n"
206*4882a593Smuzhiyun : "=&r" (r)
207*4882a593Smuzhiyun : "r" (x)
208*4882a593Smuzhiyun : "p0");
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun return r;
211*4882a593Smuzhiyun }
212*4882a593Smuzhiyun
213*4882a593Smuzhiyun /*
214*4882a593Smuzhiyun * ffs - find first bit set
215*4882a593Smuzhiyun * @x: the word to search
216*4882a593Smuzhiyun *
217*4882a593Smuzhiyun * This is defined the same way as
218*4882a593Smuzhiyun * the libc and compiler builtin ffs routines, therefore
219*4882a593Smuzhiyun * differs in spirit from the above ffz (man ffs).
220*4882a593Smuzhiyun */
ffs(int x)221*4882a593Smuzhiyun static inline int ffs(int x)
222*4882a593Smuzhiyun {
223*4882a593Smuzhiyun int r;
224*4882a593Smuzhiyun
225*4882a593Smuzhiyun asm("{ P0 = cmp.eq(%1,#0); %0 = ct0(%1);}\n"
226*4882a593Smuzhiyun "{ if (P0) %0 = #0; if (!P0) %0 = add(%0,#1);}\n"
227*4882a593Smuzhiyun : "=&r" (r)
228*4882a593Smuzhiyun : "r" (x)
229*4882a593Smuzhiyun : "p0");
230*4882a593Smuzhiyun
231*4882a593Smuzhiyun return r;
232*4882a593Smuzhiyun }
233*4882a593Smuzhiyun
234*4882a593Smuzhiyun /*
235*4882a593Smuzhiyun * __ffs - find first bit in word.
236*4882a593Smuzhiyun * @word: The word to search
237*4882a593Smuzhiyun *
238*4882a593Smuzhiyun * Undefined if no bit exists, so code should check against 0 first.
239*4882a593Smuzhiyun *
240*4882a593Smuzhiyun * bits_per_long assumed to be 32
241*4882a593Smuzhiyun * numbering starts at 0 I think (instead of 1 like ffs)
242*4882a593Smuzhiyun */
__ffs(unsigned long word)243*4882a593Smuzhiyun static inline unsigned long __ffs(unsigned long word)
244*4882a593Smuzhiyun {
245*4882a593Smuzhiyun int num;
246*4882a593Smuzhiyun
247*4882a593Smuzhiyun asm("%0 = ct0(%1);\n"
248*4882a593Smuzhiyun : "=&r" (num)
249*4882a593Smuzhiyun : "r" (word));
250*4882a593Smuzhiyun
251*4882a593Smuzhiyun return num;
252*4882a593Smuzhiyun }
253*4882a593Smuzhiyun
254*4882a593Smuzhiyun /*
255*4882a593Smuzhiyun * __fls - find last (most-significant) set bit in a long word
256*4882a593Smuzhiyun * @word: the word to search
257*4882a593Smuzhiyun *
258*4882a593Smuzhiyun * Undefined if no set bit exists, so code should check against 0 first.
259*4882a593Smuzhiyun * bits_per_long assumed to be 32
260*4882a593Smuzhiyun */
__fls(unsigned long word)261*4882a593Smuzhiyun static inline unsigned long __fls(unsigned long word)
262*4882a593Smuzhiyun {
263*4882a593Smuzhiyun int num;
264*4882a593Smuzhiyun
265*4882a593Smuzhiyun asm("%0 = cl0(%1);\n"
266*4882a593Smuzhiyun "%0 = sub(#31,%0);\n"
267*4882a593Smuzhiyun : "=&r" (num)
268*4882a593Smuzhiyun : "r" (word));
269*4882a593Smuzhiyun
270*4882a593Smuzhiyun return num;
271*4882a593Smuzhiyun }
272*4882a593Smuzhiyun
#include <asm-generic/bitops/lock.h>
#include <asm-generic/bitops/find.h>

#include <asm-generic/bitops/fls64.h>
#include <asm-generic/bitops/sched.h>
#include <asm-generic/bitops/hweight.h>

#include <asm-generic/bitops/le.h>
#include <asm-generic/bitops/ext2-atomic.h>

#endif /* __KERNEL__ */
#endif