xref: /OK3568_Linux_fs/kernel/arch/hexagon/include/asm/bitops.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0-only */
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Bit operations for the Hexagon architecture
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Copyright (c) 2010-2011, The Linux Foundation. All rights reserved.
6*4882a593Smuzhiyun  */
7*4882a593Smuzhiyun 
8*4882a593Smuzhiyun #ifndef _ASM_BITOPS_H
9*4882a593Smuzhiyun #define _ASM_BITOPS_H
10*4882a593Smuzhiyun 
11*4882a593Smuzhiyun #include <linux/compiler.h>
12*4882a593Smuzhiyun #include <asm/byteorder.h>
13*4882a593Smuzhiyun #include <asm/atomic.h>
14*4882a593Smuzhiyun #include <asm/barrier.h>
15*4882a593Smuzhiyun 
16*4882a593Smuzhiyun #ifdef __KERNEL__
17*4882a593Smuzhiyun 
/*
 * The offset calculations for these are based on BITS_PER_LONG == 32:
 * the bit number is shifted right by 5 to get the word index (32 bits
 * per long), that index is shifted left by 2 to get the byte offset
 * (4 bytes per access), and the bit number is masked with 0x0000001F
 * to get the bit position within the word.
 *
 * Typically, R10 is clobbered for the address, R11 for the bit number,
 * and R12 is a temporary.
 */
25*4882a593Smuzhiyun 
26*4882a593Smuzhiyun /**
27*4882a593Smuzhiyun  * test_and_clear_bit - clear a bit and return its old value
28*4882a593Smuzhiyun  * @nr:  bit number to clear
29*4882a593Smuzhiyun  * @addr:  pointer to memory
30*4882a593Smuzhiyun  */
test_and_clear_bit(int nr,volatile void * addr)31*4882a593Smuzhiyun static inline int test_and_clear_bit(int nr, volatile void *addr)
32*4882a593Smuzhiyun {
33*4882a593Smuzhiyun 	int oldval;
34*4882a593Smuzhiyun 
35*4882a593Smuzhiyun 	__asm__ __volatile__ (
36*4882a593Smuzhiyun 	"	{R10 = %1; R11 = asr(%2,#5); }\n"
37*4882a593Smuzhiyun 	"	{R10 += asl(R11,#2); R11 = and(%2,#0x1f)}\n"
38*4882a593Smuzhiyun 	"1:	R12 = memw_locked(R10);\n"
39*4882a593Smuzhiyun 	"	{ P0 = tstbit(R12,R11); R12 = clrbit(R12,R11); }\n"
40*4882a593Smuzhiyun 	"	memw_locked(R10,P1) = R12;\n"
41*4882a593Smuzhiyun 	"	{if (!P1) jump 1b; %0 = mux(P0,#1,#0);}\n"
42*4882a593Smuzhiyun 	: "=&r" (oldval)
43*4882a593Smuzhiyun 	: "r" (addr), "r" (nr)
44*4882a593Smuzhiyun 	: "r10", "r11", "r12", "p0", "p1", "memory"
45*4882a593Smuzhiyun 	);
46*4882a593Smuzhiyun 
47*4882a593Smuzhiyun 	return oldval;
48*4882a593Smuzhiyun }
49*4882a593Smuzhiyun 
50*4882a593Smuzhiyun /**
51*4882a593Smuzhiyun  * test_and_set_bit - set a bit and return its old value
52*4882a593Smuzhiyun  * @nr:  bit number to set
53*4882a593Smuzhiyun  * @addr:  pointer to memory
54*4882a593Smuzhiyun  */
test_and_set_bit(int nr,volatile void * addr)55*4882a593Smuzhiyun static inline int test_and_set_bit(int nr, volatile void *addr)
56*4882a593Smuzhiyun {
57*4882a593Smuzhiyun 	int oldval;
58*4882a593Smuzhiyun 
59*4882a593Smuzhiyun 	__asm__ __volatile__ (
60*4882a593Smuzhiyun 	"	{R10 = %1; R11 = asr(%2,#5); }\n"
61*4882a593Smuzhiyun 	"	{R10 += asl(R11,#2); R11 = and(%2,#0x1f)}\n"
62*4882a593Smuzhiyun 	"1:	R12 = memw_locked(R10);\n"
63*4882a593Smuzhiyun 	"	{ P0 = tstbit(R12,R11); R12 = setbit(R12,R11); }\n"
64*4882a593Smuzhiyun 	"	memw_locked(R10,P1) = R12;\n"
65*4882a593Smuzhiyun 	"	{if (!P1) jump 1b; %0 = mux(P0,#1,#0);}\n"
66*4882a593Smuzhiyun 	: "=&r" (oldval)
67*4882a593Smuzhiyun 	: "r" (addr), "r" (nr)
68*4882a593Smuzhiyun 	: "r10", "r11", "r12", "p0", "p1", "memory"
69*4882a593Smuzhiyun 	);
70*4882a593Smuzhiyun 
71*4882a593Smuzhiyun 
72*4882a593Smuzhiyun 	return oldval;
73*4882a593Smuzhiyun 
74*4882a593Smuzhiyun }
75*4882a593Smuzhiyun 
76*4882a593Smuzhiyun /**
77*4882a593Smuzhiyun  * test_and_change_bit - toggle a bit and return its old value
78*4882a593Smuzhiyun  * @nr:  bit number to set
79*4882a593Smuzhiyun  * @addr:  pointer to memory
80*4882a593Smuzhiyun  */
test_and_change_bit(int nr,volatile void * addr)81*4882a593Smuzhiyun static inline int test_and_change_bit(int nr, volatile void *addr)
82*4882a593Smuzhiyun {
83*4882a593Smuzhiyun 	int oldval;
84*4882a593Smuzhiyun 
85*4882a593Smuzhiyun 	__asm__ __volatile__ (
86*4882a593Smuzhiyun 	"	{R10 = %1; R11 = asr(%2,#5); }\n"
87*4882a593Smuzhiyun 	"	{R10 += asl(R11,#2); R11 = and(%2,#0x1f)}\n"
88*4882a593Smuzhiyun 	"1:	R12 = memw_locked(R10);\n"
89*4882a593Smuzhiyun 	"	{ P0 = tstbit(R12,R11); R12 = togglebit(R12,R11); }\n"
90*4882a593Smuzhiyun 	"	memw_locked(R10,P1) = R12;\n"
91*4882a593Smuzhiyun 	"	{if (!P1) jump 1b; %0 = mux(P0,#1,#0);}\n"
92*4882a593Smuzhiyun 	: "=&r" (oldval)
93*4882a593Smuzhiyun 	: "r" (addr), "r" (nr)
94*4882a593Smuzhiyun 	: "r10", "r11", "r12", "p0", "p1", "memory"
95*4882a593Smuzhiyun 	);
96*4882a593Smuzhiyun 
97*4882a593Smuzhiyun 	return oldval;
98*4882a593Smuzhiyun 
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun 
101*4882a593Smuzhiyun /*
102*4882a593Smuzhiyun  * Atomic, but doesn't care about the return value.
103*4882a593Smuzhiyun  * Rewrite later to save a cycle or two.
104*4882a593Smuzhiyun  */
105*4882a593Smuzhiyun 
/**
 * clear_bit - clear a bit in memory
 * @nr:  bit number to clear
 * @addr:  pointer to memory
 *
 * Forwards to test_and_clear_bit() and discards the old bit value.
 */
static inline void clear_bit(int nr, volatile void *addr)
{
	(void)test_and_clear_bit(nr, addr);
}
110*4882a593Smuzhiyun 
/**
 * set_bit - set a bit in memory
 * @nr:  bit number to set
 * @addr:  pointer to memory
 *
 * Forwards to test_and_set_bit() and discards the old bit value.
 */
static inline void set_bit(int nr, volatile void *addr)
{
	(void)test_and_set_bit(nr, addr);
}
115*4882a593Smuzhiyun 
/**
 * change_bit - toggle a bit in memory
 * @nr:  bit number to toggle
 * @addr:  pointer to memory
 *
 * Forwards to test_and_change_bit() and discards the old bit value.
 */
static inline void change_bit(int nr, volatile void *addr)
{
	(void)test_and_change_bit(nr, addr);
}
120*4882a593Smuzhiyun 
121*4882a593Smuzhiyun 
/*
 * The double-underscore variants are normally allowed to be non-atomic;
 * in fact the generic flavors are in non-atomic.h.  Would it be better
 * to use intrinsics for this?
 *
 * However, writes on our architecture do not invalidate LL/SC, so these
 * have to be atomic as well, particularly for things like slab_lock and
 * slab_unlock.
 */
/**
 * __clear_bit - clear a bit in memory
 * @nr:  bit number to clear
 * @addr:  pointer to memory
 *
 * Implemented with test_and_clear_bit(); the old bit value is discarded.
 */
static inline void __clear_bit(int nr, volatile unsigned long *addr)
{
	(void)test_and_clear_bit(nr, addr);
}
134*4882a593Smuzhiyun 
/**
 * __set_bit - set a bit in memory
 * @nr:  bit number to set
 * @addr:  pointer to memory
 *
 * Implemented with test_and_set_bit(); the old bit value is discarded.
 */
static inline void __set_bit(int nr, volatile unsigned long *addr)
{
	(void)test_and_set_bit(nr, addr);
}
139*4882a593Smuzhiyun 
/**
 * __change_bit - toggle a bit in memory
 * @nr:  bit number to toggle
 * @addr:  pointer to memory
 *
 * Implemented with test_and_change_bit(); the old bit value is discarded.
 */
static inline void __change_bit(int nr, volatile unsigned long *addr)
{
	(void)test_and_change_bit(nr, addr);
}
144*4882a593Smuzhiyun 
145*4882a593Smuzhiyun /*  Apparently, at least some of these are allowed to be non-atomic  */
/**
 * __test_and_clear_bit - clear a bit and return its old value
 * @nr:  bit number to clear
 * @addr:  pointer to memory
 *
 * Forwards to test_and_clear_bit() and returns its result unchanged.
 */
static inline int __test_and_clear_bit(int nr, volatile unsigned long *addr)
{
	int was_set = test_and_clear_bit(nr, addr);

	return was_set;
}
150*4882a593Smuzhiyun 
/**
 * __test_and_set_bit - set a bit and return its old value
 * @nr:  bit number to set
 * @addr:  pointer to memory
 *
 * Forwards to test_and_set_bit() and returns its result unchanged.
 */
static inline int __test_and_set_bit(int nr, volatile unsigned long *addr)
{
	int was_set = test_and_set_bit(nr, addr);

	return was_set;
}
155*4882a593Smuzhiyun 
/**
 * __test_and_change_bit - toggle a bit and return its old value
 * @nr:  bit number to toggle
 * @addr:  pointer to memory
 *
 * Forwards to test_and_change_bit() and returns its result unchanged.
 */
static inline int __test_and_change_bit(int nr, volatile unsigned long *addr)
{
	int was_set = test_and_change_bit(nr, addr);

	return was_set;
}
160*4882a593Smuzhiyun 
__test_bit(int nr,const volatile unsigned long * addr)161*4882a593Smuzhiyun static inline int __test_bit(int nr, const volatile unsigned long *addr)
162*4882a593Smuzhiyun {
163*4882a593Smuzhiyun 	int retval;
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun 	asm volatile(
166*4882a593Smuzhiyun 	"{P0 = tstbit(%1,%2); if (P0.new) %0 = #1; if (!P0.new) %0 = #0;}\n"
167*4882a593Smuzhiyun 	: "=&r" (retval)
168*4882a593Smuzhiyun 	: "r" (addr[BIT_WORD(nr)]), "r" (nr % BITS_PER_LONG)
169*4882a593Smuzhiyun 	: "p0"
170*4882a593Smuzhiyun 	);
171*4882a593Smuzhiyun 
172*4882a593Smuzhiyun 	return retval;
173*4882a593Smuzhiyun }
174*4882a593Smuzhiyun 
175*4882a593Smuzhiyun #define test_bit(nr, addr) __test_bit(nr, addr)
176*4882a593Smuzhiyun 
/*
 * ffz - find first zero in word.
 * @x: The word to search
 *
 * Returns the zero-based index of the least-significant clear bit of @x.
 *
 * The result is formally undefined if no zero exists, so code should check
 * against ~0UL first.  For compatibility with the previous ct1-based
 * implementation an all-ones word still yields 32.
 *
 * Written with a compiler builtin rather than inline asm so the compiler
 * can constant-fold and schedule it.
 */
static inline long ffz(int x)
{
	/* The first zero of x is the first one of ~x. */
	unsigned int inverted = ~(unsigned int)x;

	/* __builtin_ctz() is undefined for 0, i.e. when x has no zero bit. */
	if (!inverted)
		return 32;

	return __builtin_ctz(inverted);
}
192*4882a593Smuzhiyun 
/*
 * fls - find last (most-significant) bit set
 * @x: the word to search
 *
 * This is defined the same way as ffs: bit positions are numbered from 1
 * and 0 means "no bit set".
 * Note fls(0) = 0, fls(1) = 1, fls(0x80000000) = 32.
 *
 * Written with a compiler builtin rather than inline asm so the compiler
 * can constant-fold and schedule it, and so no predicate register is
 * needlessly declared clobbered.
 */
static inline int fls(unsigned int x)
{
	/* __builtin_clz() is undefined for 0; fls(0) is defined to be 0. */
	if (!x)
		return 0;

	return 32 - __builtin_clz(x);
}
212*4882a593Smuzhiyun 
/*
 * ffs - find first bit set
 * @x: the word to search
 *
 * This is defined the same way as
 * the libc and compiler builtin ffs routines, therefore
 * differs in spirit from the above ffz (man ffs).
 *
 * Returns the one-based index of the least-significant set bit of @x,
 * or 0 if @x is 0.
 *
 * Written with a compiler builtin rather than inline asm so the compiler
 * can constant-fold and schedule it.
 */
static inline int ffs(int x)
{
	/* __builtin_ctz() is undefined for 0; ffs(0) is defined to be 0. */
	if (!x)
		return 0;

	return __builtin_ctz((unsigned int)x) + 1;
}
233*4882a593Smuzhiyun 
/*
 * __ffs - find first bit in word.
 * @word: The word to search
 *
 * Returns the zero-based index of the least-significant set bit of @word
 * (unlike ffs, which numbers bits from 1).
 *
 * The result is formally undefined if no bit exists, so code should check
 * against 0 first.  For compatibility with the previous ct0-based
 * implementation a zero word still yields the width of a long in bits
 * (32 on this architecture).
 *
 * Written with a compiler builtin rather than inline asm so the compiler
 * can constant-fold and schedule it.
 */
static inline unsigned long __ffs(unsigned long word)
{
	/* __builtin_ctzl() is undefined for 0. */
	if (!word)
		return 8 * sizeof(word);

	return (unsigned long)__builtin_ctzl(word);
}
253*4882a593Smuzhiyun 
/*
 * __fls - find last (most-significant) set bit in a long word
 * @word: the word to search
 *
 * Returns the zero-based index of the most-significant set bit of @word.
 *
 * The result is formally undefined if no set bit exists, so code should
 * check against 0 first.  For compatibility with the previous cl0-based
 * implementation a zero word still yields (unsigned long)-1.
 *
 * Written with a compiler builtin rather than inline asm so the compiler
 * can constant-fold and schedule it.
 */
static inline unsigned long __fls(unsigned long word)
{
	/* __builtin_clzl() is undefined for 0. */
	if (!word)
		return (unsigned long)-1;

	/* Index of the top bit of a long, minus the number of leading zeros. */
	return (8 * sizeof(word) - 1) - (unsigned long)__builtin_clzl(word);
}
272*4882a593Smuzhiyun 
273*4882a593Smuzhiyun #include <asm-generic/bitops/lock.h>
274*4882a593Smuzhiyun #include <asm-generic/bitops/find.h>
275*4882a593Smuzhiyun 
276*4882a593Smuzhiyun #include <asm-generic/bitops/fls64.h>
277*4882a593Smuzhiyun #include <asm-generic/bitops/sched.h>
278*4882a593Smuzhiyun #include <asm-generic/bitops/hweight.h>
279*4882a593Smuzhiyun 
280*4882a593Smuzhiyun #include <asm-generic/bitops/le.h>
281*4882a593Smuzhiyun #include <asm-generic/bitops/ext2-atomic.h>
282*4882a593Smuzhiyun 
283*4882a593Smuzhiyun #endif /* __KERNEL__ */
284*4882a593Smuzhiyun #endif
285