/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * BPF JIT compiler for ARM64
 *
 * Copyright (C) 2014-2016 Zi Shen Lim <zlim.lnx@gmail.com>
 */
#ifndef _BPF_JIT_H
#define _BPF_JIT_H

#include <asm/insn.h>

/* 5-bit Register Operand */
#define A64_R(x)	AARCH64_INSN_REG_##x
#define A64_FP		AARCH64_INSN_REG_FP
#define A64_LR		AARCH64_INSN_REG_LR
#define A64_ZR		AARCH64_INSN_REG_ZR
#define A64_SP		AARCH64_INSN_REG_SP

#define A64_VARIANT(sf) \
	((sf) ? AARCH64_INSN_VARIANT_64BIT : AARCH64_INSN_VARIANT_32BIT)

/* Compare & branch (immediate) */
#define A64_COMP_BRANCH(sf, Rt, offset, type) \
	aarch64_insn_gen_comp_branch_imm(0, offset, Rt, A64_VARIANT(sf), \
		AARCH64_INSN_BRANCH_COMP_##type)
#define A64_CBZ(sf, Rt, imm19) A64_COMP_BRANCH(sf, Rt, (imm19) << 2, ZERO)
#define A64_CBNZ(sf, Rt, imm19) A64_COMP_BRANCH(sf, Rt, (imm19) << 2, NONZERO)
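/*
 * Note: the imm19/imm26 arguments taken by the branch macros in this
 * file are offsets in instructions (AArch64 instructions are 4 bytes
 * each), hence the "<< 2" converting them to the byte offsets that the
 * insn generators expect.
 */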

/* Conditional branch (immediate) */
#define A64_COND_BRANCH(cond, offset) \
	aarch64_insn_gen_cond_branch_imm(0, offset, cond)
#define A64_COND_EQ	AARCH64_INSN_COND_EQ /* == */
#define A64_COND_NE	AARCH64_INSN_COND_NE /* != */
#define A64_COND_CS	AARCH64_INSN_COND_CS /* unsigned >= */
#define A64_COND_HI	AARCH64_INSN_COND_HI /* unsigned > */
#define A64_COND_LS	AARCH64_INSN_COND_LS /* unsigned <= */
#define A64_COND_CC	AARCH64_INSN_COND_CC /* unsigned < */
#define A64_COND_GE	AARCH64_INSN_COND_GE /* signed >= */
#define A64_COND_GT	AARCH64_INSN_COND_GT /* signed > */
#define A64_COND_LE	AARCH64_INSN_COND_LE /* signed <= */
#define A64_COND_LT	AARCH64_INSN_COND_LT /* signed < */
#define A64_B_(cond, imm19) A64_COND_BRANCH(cond, (imm19) << 2)
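/*
 * Usage sketch (illustrative): a BPF conditional jump such as JNE is
 * typically lowered as a compare followed by a conditional branch;
 * emit(), ctx, dst, src and jmp_offset belong to the compiler proper
 * (bpf_jit_comp.c), not this header.
 *
 *	emit(A64_CMP(is64, dst, src), ctx);
 *	emit(A64_B_(A64_COND_NE, jmp_offset), ctx);
 */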

/* Unconditional branch (immediate) */
#define A64_BRANCH(offset, type) aarch64_insn_gen_branch_imm(0, offset, \
	AARCH64_INSN_BRANCH_##type)
#define A64_B(imm26)  A64_BRANCH((imm26) << 2, NOLINK)
#define A64_BL(imm26) A64_BRANCH((imm26) << 2, LINK)

/* Unconditional branch (register) */
#define A64_BR(Rn)  aarch64_insn_gen_branch_reg(Rn, AARCH64_INSN_BRANCH_NOLINK)
#define A64_BLR(Rn) aarch64_insn_gen_branch_reg(Rn, AARCH64_INSN_BRANCH_LINK)
#define A64_RET(Rn) aarch64_insn_gen_branch_reg(Rn, AARCH64_INSN_BRANCH_RETURN)
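/*
 * Usage sketch (illustrative): BPF helper calls are typically emitted
 * by materializing the target address in a scratch register and
 * branching through it; the helper name and tmp are assumptions from
 * the compiler proper, not part of this header.
 *
 *	emit_addr_mov_i64(tmp, func_addr, ctx);
 *	emit(A64_BLR(tmp), ctx);
 */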

/* Load/store register (register offset) */
#define A64_LS_REG(Rt, Rn, Rm, size, type) \
	aarch64_insn_gen_load_store_reg(Rt, Rn, Rm, \
		AARCH64_INSN_SIZE_##size, \
		AARCH64_INSN_LDST_##type##_REG_OFFSET)
#define A64_STRB(Wt, Xn, Xm)  A64_LS_REG(Wt, Xn, Xm, 8, STORE)
#define A64_LDRB(Wt, Xn, Xm)  A64_LS_REG(Wt, Xn, Xm, 8, LOAD)
#define A64_STRH(Wt, Xn, Xm)  A64_LS_REG(Wt, Xn, Xm, 16, STORE)
#define A64_LDRH(Wt, Xn, Xm)  A64_LS_REG(Wt, Xn, Xm, 16, LOAD)
#define A64_STR32(Wt, Xn, Xm) A64_LS_REG(Wt, Xn, Xm, 32, STORE)
#define A64_LDR32(Wt, Xn, Xm) A64_LS_REG(Wt, Xn, Xm, 32, LOAD)
#define A64_STR64(Xt, Xn, Xm) A64_LS_REG(Xt, Xn, Xm, 64, STORE)
#define A64_LDR64(Xt, Xn, Xm) A64_LS_REG(Xt, Xn, Xm, 64, LOAD)
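/*
 * Usage sketch (illustrative): since only a register-offset form is
 * provided here, a BPF load like "dst = *(u32 *)(src + off)" is
 * lowered by first moving off into a scratch register; the helper
 * name and tmp are assumptions from the compiler proper.
 *
 *	emit_a64_mov_i(1, tmp, off, ctx);
 *	emit(A64_LDR32(dst, src, tmp), ctx);
 */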

/* Load/store register pair */
#define A64_LS_PAIR(Rt, Rt2, Rn, offset, ls, type) \
	aarch64_insn_gen_load_store_pair(Rt, Rt2, Rn, offset, \
		AARCH64_INSN_VARIANT_64BIT, \
		AARCH64_INSN_LDST_##ls##_PAIR_##type)
/* Rn -= 16; Rn[0] = Rt; Rn[8] = Rt2; */
#define A64_PUSH(Rt, Rt2, Rn) A64_LS_PAIR(Rt, Rt2, Rn, -16, STORE, PRE_INDEX)
/* Rt = Rn[0]; Rt2 = Rn[8]; Rn += 16; */
#define A64_POP(Rt, Rt2, Rn)  A64_LS_PAIR(Rt, Rt2, Rn, 16, LOAD, POST_INDEX)
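/*
 * Usage sketch (illustrative): the JIT prologue saves the frame
 * pointer and link register with a pre-indexed store pair, mirroring
 * "stp x29, x30, [sp, #-16]!", then establishes the frame pointer:
 *
 *	emit(A64_PUSH(A64_FP, A64_LR, A64_SP), ctx);
 *	emit(A64_MOV(1, A64_FP, A64_SP), ctx);
 */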

/* Load/store exclusive */
#define A64_SIZE(sf) \
	((sf) ? AARCH64_INSN_SIZE_64 : AARCH64_INSN_SIZE_32)
#define A64_LSX(sf, Rt, Rn, Rs, type) \
	aarch64_insn_gen_load_store_ex(Rt, Rn, Rs, A64_SIZE(sf), \
				       AARCH64_INSN_LDST_##type)
/* Rt = [Rn]; (atomic) */
#define A64_LDXR(sf, Rt, Rn) \
	A64_LSX(sf, Rt, Rn, A64_ZR, LOAD_EX)
/* [Rn] = Rt; (atomic) Rs = status (0 if the store succeeded) */
#define A64_STXR(sf, Rt, Rn, Rs) \
	A64_LSX(sf, Rt, Rn, Rs, STORE_EX)
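/*
 * Usage sketch (illustrative): without LSE atomics, an atomic add
 * (BPF_XADD) is a load-exclusive/store-exclusive loop that retries
 * until the exclusive store succeeds; tmp2/tmp3 are assumed scratch
 * registers from the compiler proper.
 *
 *	emit(A64_LDXR(isdw, tmp2, reg), ctx);
 *	emit(A64_ADD(isdw, tmp2, tmp2, src), ctx);
 *	emit(A64_STXR(isdw, tmp2, reg, tmp3), ctx);
 *	emit(A64_CBNZ(0, tmp3, -3), ctx);     (branch back 3 insns)
 */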

/* LSE atomics */
#define A64_STADD(sf, Rn, Rs) \
	aarch64_insn_gen_stadd(Rn, Rs, A64_SIZE(sf))
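/*
 * STADD is the no-result alias of LDADD (destination WZR/XZR) and
 * requires the ARMv8.1 LSE extension; the JIT is expected to fall
 * back to the LDXR/STXR loop above when LSE atomics are unavailable.
 */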

/* Add/subtract (immediate) */
#define A64_ADDSUB_IMM(sf, Rd, Rn, imm12, type) \
	aarch64_insn_gen_add_sub_imm(Rd, Rn, imm12, \
		A64_VARIANT(sf), AARCH64_INSN_ADSB_##type)
/* Rd = Rn OP imm12 */
#define A64_ADD_I(sf, Rd, Rn, imm12) A64_ADDSUB_IMM(sf, Rd, Rn, imm12, ADD)
#define A64_SUB_I(sf, Rd, Rn, imm12) A64_ADDSUB_IMM(sf, Rd, Rn, imm12, SUB)
#define A64_ADDS_I(sf, Rd, Rn, imm12) \
	A64_ADDSUB_IMM(sf, Rd, Rn, imm12, ADD_SETFLAGS)
#define A64_SUBS_I(sf, Rd, Rn, imm12) \
	A64_ADDSUB_IMM(sf, Rd, Rn, imm12, SUB_SETFLAGS)
/* Rn + imm12; set condition flags */
#define A64_CMN_I(sf, Rn, imm12) A64_ADDS_I(sf, A64_ZR, Rn, imm12)
/* Rn - imm12; set condition flags */
#define A64_CMP_I(sf, Rn, imm12) A64_SUBS_I(sf, A64_ZR, Rn, imm12)
/* Rd = Rn */
#define A64_MOV(sf, Rd, Rn) A64_ADD_I(sf, Rd, Rn, 0)
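/*
 * A64_MOV is encoded as "ADD Rd, Rn, #0" rather than as an ORR alias
 * so that it can copy to or from SP: the ORR (register) form treats
 * register 31 as XZR, while ADD (immediate) treats it as SP.
 */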

/* Bitfield move */
#define A64_BITFIELD(sf, Rd, Rn, immr, imms, type) \
	aarch64_insn_gen_bitfield(Rd, Rn, immr, imms, \
		A64_VARIANT(sf), AARCH64_INSN_BITFIELD_MOVE_##type)
/* Signed, with sign replication to left and zeros to right */
#define A64_SBFM(sf, Rd, Rn, ir, is) A64_BITFIELD(sf, Rd, Rn, ir, is, SIGNED)
/* Unsigned, with zeros to left and right */
#define A64_UBFM(sf, Rd, Rn, ir, is) A64_BITFIELD(sf, Rd, Rn, ir, is, UNSIGNED)

/* Rd = Rn << shift */
#define A64_LSL(sf, Rd, Rn, shift) ({	\
	int sz = (sf) ? 64 : 32;	\
	A64_UBFM(sf, Rd, Rn, (unsigned)-(shift) % sz, sz - 1 - (shift)); \
})
/* Rd = Rn >> shift */
#define A64_LSR(sf, Rd, Rn, shift) A64_UBFM(sf, Rd, Rn, shift, (sf) ? 63 : 31)
/* Rd = Rn >> shift; signed */
#define A64_ASR(sf, Rd, Rn, shift) A64_SBFM(sf, Rd, Rn, shift, (sf) ? 63 : 31)
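/*
 * Worked example: A64_LSL relies on the architectural alias
 * "LSL Rd, Rn, #shift" == "UBFM Rd, Rn, #(-shift MOD sz), #(sz-1-shift)".
 * For sf=1, shift=8 this yields UBFM Rd, Rn, #56, #55, i.e. LSL #8.
 */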

/* Zero extend */
#define A64_UXTH(sf, Rd, Rn) A64_UBFM(sf, Rd, Rn, 0, 15)
#define A64_UXTW(sf, Rd, Rn) A64_UBFM(sf, Rd, Rn, 0, 31)

/* Move wide (immediate) */
#define A64_MOVEW(sf, Rd, imm16, shift, type) \
	aarch64_insn_gen_movewide(Rd, imm16, shift, \
		A64_VARIANT(sf), AARCH64_INSN_MOVEWIDE_##type)
/* MOVZ: Rd = imm16 << shift
 * MOVK: insert imm16 at shift, keeping the other bits of Rd
 * MOVN: Rd = ~(imm16 << shift)
 * where shift is one of {0, 16, 32, 48} */
#define A64_MOVN(sf, Rd, imm16, shift) A64_MOVEW(sf, Rd, imm16, shift, INVERSE)
#define A64_MOVZ(sf, Rd, imm16, shift) A64_MOVEW(sf, Rd, imm16, shift, ZERO)
#define A64_MOVK(sf, Rd, imm16, shift) A64_MOVEW(sf, Rd, imm16, shift, KEEP)
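/*
 * Usage sketch (illustrative): an arbitrary 64-bit immediate is built
 * from one MOVZ plus up to three MOVKs, one per 16-bit chunk (the real
 * mov-immediate helper can skip all-zero chunks):
 *
 *	emit(A64_MOVZ(1, reg, val & 0xffff, 0), ctx);
 *	emit(A64_MOVK(1, reg, (val >> 16) & 0xffff, 16), ctx);
 *	emit(A64_MOVK(1, reg, (val >> 32) & 0xffff, 32), ctx);
 *	emit(A64_MOVK(1, reg, (val >> 48) & 0xffff, 48), ctx);
 */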

/* Add/subtract (shifted register) */
#define A64_ADDSUB_SREG(sf, Rd, Rn, Rm, type) \
	aarch64_insn_gen_add_sub_shifted_reg(Rd, Rn, Rm, 0, \
		A64_VARIANT(sf), AARCH64_INSN_ADSB_##type)
/* Rd = Rn OP Rm */
#define A64_ADD(sf, Rd, Rn, Rm)  A64_ADDSUB_SREG(sf, Rd, Rn, Rm, ADD)
#define A64_SUB(sf, Rd, Rn, Rm)  A64_ADDSUB_SREG(sf, Rd, Rn, Rm, SUB)
#define A64_SUBS(sf, Rd, Rn, Rm) A64_ADDSUB_SREG(sf, Rd, Rn, Rm, SUB_SETFLAGS)
/* Rd = -Rm */
#define A64_NEG(sf, Rd, Rm) A64_SUB(sf, Rd, A64_ZR, Rm)
/* Rn - Rm; set condition flags */
#define A64_CMP(sf, Rn, Rm) A64_SUBS(sf, A64_ZR, Rn, Rm)
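/*
 * Usage sketch (illustrative): BPF_NEG lowers directly to the NEG
 * alias, e.g. emit(A64_NEG(is64, dst, dst), ctx);
 */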

/* Data-processing (1 source) */
#define A64_DATA1(sf, Rd, Rn, type) aarch64_insn_gen_data1(Rd, Rn, \
	A64_VARIANT(sf), AARCH64_INSN_DATA1_##type)
/* Rd = BSWAPx(Rn) */
#define A64_REV16(sf, Rd, Rn) A64_DATA1(sf, Rd, Rn, REVERSE_16)
#define A64_REV32(sf, Rd, Rn) A64_DATA1(sf, Rd, Rn, REVERSE_32)
#define A64_REV64(Rd, Rn)     A64_DATA1(1, Rd, Rn, REVERSE_64)
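/*
 * Usage sketch (illustrative): a 16-bit BPF_END byte swap is a REV16
 * followed by a zero-extension of the low half-word:
 *
 *	emit(A64_REV16(is64, dst, dst), ctx);
 *	emit(A64_UXTH(is64, dst, dst), ctx);
 */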

/* Data-processing (2 source) */
/* Rd = Rn OP Rm */
#define A64_DATA2(sf, Rd, Rn, Rm, type) aarch64_insn_gen_data2(Rd, Rn, Rm, \
	A64_VARIANT(sf), AARCH64_INSN_DATA2_##type)
#define A64_UDIV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, UDIV)
#define A64_LSLV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, LSLV)
#define A64_LSRV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, LSRV)
#define A64_ASRV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, ASRV)

/* Data-processing (3 source) */
/* Rd = Ra + Rn * Rm */
#define A64_MADD(sf, Rd, Ra, Rn, Rm) aarch64_insn_gen_data3(Rd, Ra, Rn, Rm, \
	A64_VARIANT(sf), AARCH64_INSN_DATA3_MADD)
/* Rd = Ra - Rn * Rm */
#define A64_MSUB(sf, Rd, Ra, Rn, Rm) aarch64_insn_gen_data3(Rd, Ra, Rn, Rm, \
	A64_VARIANT(sf), AARCH64_INSN_DATA3_MSUB)
/* Rd = Rn * Rm */
#define A64_MUL(sf, Rd, Rn, Rm) A64_MADD(sf, Rd, A64_ZR, Rn, Rm)
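/*
 * Usage sketch (illustrative): AArch64 has no remainder instruction,
 * so BPF_MOD is computed as dst -= (dst / src) * src via UDIV + MSUB;
 * tmp is an assumed scratch register.
 *
 *	emit(A64_UDIV(is64, tmp, dst, src), ctx);
 *	emit(A64_MSUB(is64, dst, dst, tmp, src), ctx);
 */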

/* Logical (shifted register) */
#define A64_LOGIC_SREG(sf, Rd, Rn, Rm, type) \
	aarch64_insn_gen_logical_shifted_reg(Rd, Rn, Rm, 0, \
		A64_VARIANT(sf), AARCH64_INSN_LOGIC_##type)
/* Rd = Rn OP Rm */
#define A64_AND(sf, Rd, Rn, Rm)  A64_LOGIC_SREG(sf, Rd, Rn, Rm, AND)
#define A64_ORR(sf, Rd, Rn, Rm)  A64_LOGIC_SREG(sf, Rd, Rn, Rm, ORR)
#define A64_EOR(sf, Rd, Rn, Rm)  A64_LOGIC_SREG(sf, Rd, Rn, Rm, EOR)
#define A64_ANDS(sf, Rd, Rn, Rm) A64_LOGIC_SREG(sf, Rd, Rn, Rm, AND_SETFLAGS)
/* Rn & Rm; set condition flags */
#define A64_TST(sf, Rn, Rm) A64_ANDS(sf, A64_ZR, Rn, Rm)

/* Logical (immediate) */
#define A64_LOGIC_IMM(sf, Rd, Rn, imm, type) ({ \
	u64 imm64 = (sf) ? (u64)(imm) : (u64)(u32)(imm); \
	aarch64_insn_gen_logical_immediate(AARCH64_INSN_LOGIC_##type, \
		A64_VARIANT(sf), Rn, Rd, imm64); \
})
/* Rd = Rn OP imm */
#define A64_AND_I(sf, Rd, Rn, imm) A64_LOGIC_IMM(sf, Rd, Rn, imm, AND)
#define A64_ORR_I(sf, Rd, Rn, imm) A64_LOGIC_IMM(sf, Rd, Rn, imm, ORR)
#define A64_EOR_I(sf, Rd, Rn, imm) A64_LOGIC_IMM(sf, Rd, Rn, imm, EOR)
#define A64_ANDS_I(sf, Rd, Rn, imm) A64_LOGIC_IMM(sf, Rd, Rn, imm, AND_SETFLAGS)
/* Rn & imm; set condition flags */
#define A64_TST_I(sf, Rn, imm) A64_ANDS_I(sf, A64_ZR, Rn, imm)
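/*
 * Note: only values expressible as AArch64 "bitmask immediates" can be
 * encoded here; for anything else the insn generator returns an
 * invalid (BRK) encoding, so callers are expected to load the value
 * into a scratch register and use the register form instead.
 */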

/* HINTs */
#define A64_HINT(x) aarch64_insn_gen_hint(x)

/* BTI */
#define A64_BTI_C  A64_HINT(AARCH64_INSN_HINT_BTIC)
#define A64_BTI_J  A64_HINT(AARCH64_INSN_HINT_BTIJ)
#define A64_BTI_JC A64_HINT(AARCH64_INSN_HINT_BTIJC)
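/*
 * Usage note (illustrative): with in-kernel BTI enabled, the JIT is
 * expected to emit A64_BTI_C as the first prologue instruction so the
 * generated program is a valid indirect-branch target, e.g.
 * emit(A64_BTI_C, ctx);
 */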

#endif /* _BPF_JIT_H */