/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * BPF JIT compiler for ARM64
 *
 * Copyright (C) 2014-2016 Zi Shen Lim <zlim.lnx@gmail.com>
 */
#ifndef _BPF_JIT_H
#define _BPF_JIT_H

#include <asm/insn.h>

/* 5-bit Register Operand */
#define A64_R(x)	AARCH64_INSN_REG_##x
#define A64_FP		AARCH64_INSN_REG_FP
#define A64_LR		AARCH64_INSN_REG_LR
#define A64_ZR		AARCH64_INSN_REG_ZR
#define A64_SP		AARCH64_INSN_REG_SP

#define A64_VARIANT(sf) \
	((sf) ? AARCH64_INSN_VARIANT_64BIT : AARCH64_INSN_VARIANT_32BIT)

/* Compare & branch (immediate) */
#define A64_COMP_BRANCH(sf, Rt, offset, type) \
	aarch64_insn_gen_comp_branch_imm(0, offset, Rt, A64_VARIANT(sf), \
		AARCH64_INSN_BRANCH_COMP_##type)
#define A64_CBZ(sf, Rt, imm19) A64_COMP_BRANCH(sf, Rt, (imm19) << 2, ZERO)
#define A64_CBNZ(sf, Rt, imm19) A64_COMP_BRANCH(sf, Rt, (imm19) << 2, NONZERO)

/* Conditional branch (immediate) */
#define A64_COND_BRANCH(cond, offset) \
	aarch64_insn_gen_cond_branch_imm(0, offset, cond)
#define A64_COND_EQ	AARCH64_INSN_COND_EQ /* == */
#define A64_COND_NE	AARCH64_INSN_COND_NE /* != */
#define A64_COND_CS	AARCH64_INSN_COND_CS /* unsigned >= */
#define A64_COND_HI	AARCH64_INSN_COND_HI /* unsigned > */
#define A64_COND_LS	AARCH64_INSN_COND_LS /* unsigned <= */
#define A64_COND_CC	AARCH64_INSN_COND_CC /* unsigned < */
#define A64_COND_GE	AARCH64_INSN_COND_GE /* signed >= */
#define A64_COND_GT	AARCH64_INSN_COND_GT /* signed > */
#define A64_COND_LE	AARCH64_INSN_COND_LE /* signed <= */
#define A64_COND_LT	AARCH64_INSN_COND_LT /* signed < */
#define A64_B_(cond, imm19) A64_COND_BRANCH(cond, (imm19) << 2)

/* Unconditional branch (immediate) */
#define A64_BRANCH(offset, type) aarch64_insn_gen_branch_imm(0, offset, \
	AARCH64_INSN_BRANCH_##type)
#define A64_B(imm26)  A64_BRANCH((imm26) << 2, NOLINK)
#define A64_BL(imm26) A64_BRANCH((imm26) << 2, LINK)

/* Unconditional branch (register) */
#define A64_BR(Rn)  aarch64_insn_gen_branch_reg(Rn, AARCH64_INSN_BRANCH_NOLINK)
#define A64_BLR(Rn) aarch64_insn_gen_branch_reg(Rn, AARCH64_INSN_BRANCH_LINK)
#define A64_RET(Rn) aarch64_insn_gen_branch_reg(Rn, AARCH64_INSN_BRANCH_RETURN)
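
/*
 * Usage sketch (illustrative; emit() and struct jit_ctx live in
 * bpf_jit_comp.c, not in this header): each helper above returns a u32
 * encoding that the JIT core appends to its image, e.g.
 *
 *	emit(A64_CBZ(1, A64_R(0), jmp_offset), ctx);	// if (x0 == 0) branch
 *	emit(A64_B_(A64_COND_GE, jmp_offset), ctx);	// branch if signed >=
 *
 * Note the "(imm19) << 2" / "(imm26) << 2" above: branch immediates are
 * counted in instructions, while the generators take byte offsets.
 */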
/* Load/store register (register offset) */
#define A64_LS_REG(Rt, Rn, Rm, size, type) \
	aarch64_insn_gen_load_store_reg(Rt, Rn, Rm, \
		AARCH64_INSN_SIZE_##size, \
		AARCH64_INSN_LDST_##type##_REG_OFFSET)
#define A64_STRB(Wt, Xn, Xm)  A64_LS_REG(Wt, Xn, Xm, 8, STORE)
#define A64_LDRB(Wt, Xn, Xm)  A64_LS_REG(Wt, Xn, Xm, 8, LOAD)
#define A64_STRH(Wt, Xn, Xm)  A64_LS_REG(Wt, Xn, Xm, 16, STORE)
#define A64_LDRH(Wt, Xn, Xm)  A64_LS_REG(Wt, Xn, Xm, 16, LOAD)
#define A64_STR32(Wt, Xn, Xm) A64_LS_REG(Wt, Xn, Xm, 32, STORE)
#define A64_LDR32(Wt, Xn, Xm) A64_LS_REG(Wt, Xn, Xm, 32, LOAD)
#define A64_STR64(Xt, Xn, Xm) A64_LS_REG(Xt, Xn, Xm, 64, STORE)
#define A64_LDR64(Xt, Xn, Xm) A64_LS_REG(Xt, Xn, Xm, 64, LOAD)

/* Load/store register pair */
#define A64_LS_PAIR(Rt, Rt2, Rn, offset, ls, type) \
	aarch64_insn_gen_load_store_pair(Rt, Rt2, Rn, offset, \
		AARCH64_INSN_VARIANT_64BIT, \
		AARCH64_INSN_LDST_##ls##_PAIR_##type)
/* Rn -= 16; Rn[0] = Rt; Rn[8] = Rt2; */
#define A64_PUSH(Rt, Rt2, Rn) A64_LS_PAIR(Rt, Rt2, Rn, -16, STORE, PRE_INDEX)
/* Rt = Rn[0]; Rt2 = Rn[8]; Rn += 16; */
#define A64_POP(Rt, Rt2, Rn)  A64_LS_PAIR(Rt, Rt2, Rn, 16, LOAD, POST_INDEX)

/* Load/store exclusive */
#define A64_SIZE(sf) \
	((sf) ? AARCH64_INSN_SIZE_64 : AARCH64_INSN_SIZE_32)
#define A64_LSX(sf, Rt, Rn, Rs, type) \
	aarch64_insn_gen_load_store_ex(Rt, Rn, Rs, A64_SIZE(sf), \
				       AARCH64_INSN_LDST_##type)
/* Rt = [Rn]; (atomic) */
#define A64_LDXR(sf, Rt, Rn) \
	A64_LSX(sf, Rt, Rn, A64_ZR, LOAD_EX)
/* [Rn] = Rt; (atomic) Rs = [state] */
#define A64_STXR(sf, Rt, Rn, Rs) \
	A64_LSX(sf, Rt, Rn, Rs, STORE_EX)

/* LSE atomics */
#define A64_STADD(sf, Rn, Rs) \
	aarch64_insn_gen_stadd(Rn, Rs, A64_SIZE(sf))
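
/*
 * Sketch of how the exclusives above pair up (hedged; this mirrors the
 * BPF_XADD path in bpf_jit_comp.c on CPUs without LSE atomics): loop
 * until the exclusive store succeeds, with tmp2/tmp3 as scratch
 * registers and jmp_offset pointing back at the A64_LDXR.
 *
 *	emit(A64_LDXR(is64, tmp2, reg), ctx);		// tmp2 = *reg (exclusive)
 *	emit(A64_ADD(is64, tmp2, tmp2, src), ctx);	// tmp2 += src
 *	emit(A64_STXR(is64, tmp2, reg, tmp3), ctx);	// tmp3 = store status
 *	emit(A64_CBNZ(0, tmp3, jmp_offset), ctx);	// retry on failure
 *
 * With ARMv8.1 LSE, a single A64_STADD() replaces the whole loop.
 */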
/* Add/subtract (immediate) */
#define A64_ADDSUB_IMM(sf, Rd, Rn, imm12, type) \
	aarch64_insn_gen_add_sub_imm(Rd, Rn, imm12, \
		A64_VARIANT(sf), AARCH64_INSN_ADSB_##type)
/* Rd = Rn OP imm12 */
#define A64_ADD_I(sf, Rd, Rn, imm12) A64_ADDSUB_IMM(sf, Rd, Rn, imm12, ADD)
#define A64_SUB_I(sf, Rd, Rn, imm12) A64_ADDSUB_IMM(sf, Rd, Rn, imm12, SUB)
#define A64_ADDS_I(sf, Rd, Rn, imm12) \
	A64_ADDSUB_IMM(sf, Rd, Rn, imm12, ADD_SETFLAGS)
#define A64_SUBS_I(sf, Rd, Rn, imm12) \
	A64_ADDSUB_IMM(sf, Rd, Rn, imm12, SUB_SETFLAGS)
/* Rn + imm12; set condition flags */
#define A64_CMN_I(sf, Rn, imm12) A64_ADDS_I(sf, A64_ZR, Rn, imm12)
/* Rn - imm12; set condition flags */
#define A64_CMP_I(sf, Rn, imm12) A64_SUBS_I(sf, A64_ZR, Rn, imm12)
/* Rd = Rn */
#define A64_MOV(sf, Rd, Rn) A64_ADD_I(sf, Rd, Rn, 0)

/* Bitfield move */
#define A64_BITFIELD(sf, Rd, Rn, immr, imms, type) \
	aarch64_insn_gen_bitfield(Rd, Rn, immr, imms, \
		A64_VARIANT(sf), AARCH64_INSN_BITFIELD_MOVE_##type)
/* Signed, with sign replication to left and zeros to right */
#define A64_SBFM(sf, Rd, Rn, ir, is) A64_BITFIELD(sf, Rd, Rn, ir, is, SIGNED)
/* Unsigned, with zeros to left and right */
#define A64_UBFM(sf, Rd, Rn, ir, is) A64_BITFIELD(sf, Rd, Rn, ir, is, UNSIGNED)

/* Rd = Rn << shift */
#define A64_LSL(sf, Rd, Rn, shift) ({	\
	int sz = (sf) ? 64 : 32;	\
	A64_UBFM(sf, Rd, Rn, (unsigned)-(shift) % sz, sz - 1 - (shift)); \
})
/* Rd = Rn >> shift */
#define A64_LSR(sf, Rd, Rn, shift) A64_UBFM(sf, Rd, Rn, shift, (sf) ? 63 : 31)
/* Rd = Rn >> shift; signed */
#define A64_ASR(sf, Rd, Rn, shift) A64_SBFM(sf, Rd, Rn, shift, (sf) ? 63 : 31)

/* Zero extend */
#define A64_UXTH(sf, Rd, Rn) A64_UBFM(sf, Rd, Rn, 0, 15)
#define A64_UXTW(sf, Rd, Rn) A64_UBFM(sf, Rd, Rn, 0, 31)

/* Move wide (immediate) */
#define A64_MOVEW(sf, Rd, imm16, shift, type) \
	aarch64_insn_gen_movewide(Rd, imm16, shift, \
		A64_VARIANT(sf), AARCH64_INSN_MOVEWIDE_##type)
/* Rd = Zeros (for MOVZ);
 * Rd |= imm16 << shift (where shift is {0, 16, 32, 48});
 * Rd = ~Rd; (for MOVN); */
#define A64_MOVN(sf, Rd, imm16, shift) A64_MOVEW(sf, Rd, imm16, shift, INVERSE)
#define A64_MOVZ(sf, Rd, imm16, shift) A64_MOVEW(sf, Rd, imm16, shift, ZERO)
#define A64_MOVK(sf, Rd, imm16, shift) A64_MOVEW(sf, Rd, imm16, shift, KEEP)

/* Add/subtract (shifted register) */
#define A64_ADDSUB_SREG(sf, Rd, Rn, Rm, type) \
	aarch64_insn_gen_add_sub_shifted_reg(Rd, Rn, Rm, 0, \
		A64_VARIANT(sf), AARCH64_INSN_ADSB_##type)
/* Rd = Rn OP Rm */
#define A64_ADD(sf, Rd, Rn, Rm)  A64_ADDSUB_SREG(sf, Rd, Rn, Rm, ADD)
#define A64_SUB(sf, Rd, Rn, Rm)  A64_ADDSUB_SREG(sf, Rd, Rn, Rm, SUB)
#define A64_SUBS(sf, Rd, Rn, Rm) A64_ADDSUB_SREG(sf, Rd, Rn, Rm, SUB_SETFLAGS)
/* Rd = -Rm */
#define A64_NEG(sf, Rd, Rm) A64_SUB(sf, Rd, A64_ZR, Rm)
/* Rn - Rm; set condition flags */
#define A64_CMP(sf, Rn, Rm) A64_SUBS(sf, A64_ZR, Rn, Rm)

/* Data-processing (1 source) */
#define A64_DATA1(sf, Rd, Rn, type) aarch64_insn_gen_data1(Rd, Rn, \
	A64_VARIANT(sf), AARCH64_INSN_DATA1_##type)
/* Rd = BSWAPx(Rn) */
#define A64_REV16(sf, Rd, Rn) A64_DATA1(sf, Rd, Rn, REVERSE_16)
#define A64_REV32(sf, Rd, Rn) A64_DATA1(sf, Rd, Rn, REVERSE_32)
#define A64_REV64(Rd, Rn)     A64_DATA1(1, Rd, Rn, REVERSE_64)
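
/*
 * Sketch: a full 64-bit constant is built from the move-wide helpers
 * above, 16 bits at a time (hedged; the JIT's emit_a64_mov_i64() helper
 * in bpf_jit_comp.c follows this pattern, additionally using A64_MOVN
 * and skipping chunks that need no MOVK):
 *
 *	emit(A64_MOVZ(1, reg, val & 0xffff, 0), ctx);
 *	emit(A64_MOVK(1, reg, (val >> 16) & 0xffff, 16), ctx);
 *	emit(A64_MOVK(1, reg, (val >> 32) & 0xffff, 32), ctx);
 *	emit(A64_MOVK(1, reg, (val >> 48) & 0xffff, 48), ctx);
 */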
/* Data-processing (2 source) */
/* Rd = Rn OP Rm */
#define A64_DATA2(sf, Rd, Rn, Rm, type) aarch64_insn_gen_data2(Rd, Rn, Rm, \
	A64_VARIANT(sf), AARCH64_INSN_DATA2_##type)
#define A64_UDIV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, UDIV)
#define A64_LSLV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, LSLV)
#define A64_LSRV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, LSRV)
#define A64_ASRV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, ASRV)

/* Data-processing (3 source) */
/* Rd = Ra + Rn * Rm */
#define A64_MADD(sf, Rd, Ra, Rn, Rm) aarch64_insn_gen_data3(Rd, Ra, Rn, Rm, \
	A64_VARIANT(sf), AARCH64_INSN_DATA3_MADD)
/* Rd = Ra - Rn * Rm */
#define A64_MSUB(sf, Rd, Ra, Rn, Rm) aarch64_insn_gen_data3(Rd, Ra, Rn, Rm, \
	A64_VARIANT(sf), AARCH64_INSN_DATA3_MSUB)
/* Rd = Rn * Rm */
#define A64_MUL(sf, Rd, Rn, Rm) A64_MADD(sf, Rd, A64_ZR, Rn, Rm)

/* Logical (shifted register) */
#define A64_LOGIC_SREG(sf, Rd, Rn, Rm, type) \
	aarch64_insn_gen_logical_shifted_reg(Rd, Rn, Rm, 0, \
		A64_VARIANT(sf), AARCH64_INSN_LOGIC_##type)
/* Rd = Rn OP Rm */
#define A64_AND(sf, Rd, Rn, Rm)  A64_LOGIC_SREG(sf, Rd, Rn, Rm, AND)
#define A64_ORR(sf, Rd, Rn, Rm)  A64_LOGIC_SREG(sf, Rd, Rn, Rm, ORR)
#define A64_EOR(sf, Rd, Rn, Rm)  A64_LOGIC_SREG(sf, Rd, Rn, Rm, EOR)
#define A64_ANDS(sf, Rd, Rn, Rm) A64_LOGIC_SREG(sf, Rd, Rn, Rm, AND_SETFLAGS)
/* Rn & Rm; set condition flags */
#define A64_TST(sf, Rn, Rm) A64_ANDS(sf, A64_ZR, Rn, Rm)

/* Logical (immediate) */
#define A64_LOGIC_IMM(sf, Rd, Rn, imm, type) ({ \
	u64 imm64 = (sf) ? (u64)imm : (u64)(u32)imm; \
	aarch64_insn_gen_logical_immediate(AARCH64_INSN_LOGIC_##type, \
		A64_VARIANT(sf), Rn, Rd, imm64); \
})
/* Rd = Rn OP imm */
#define A64_AND_I(sf, Rd, Rn, imm)  A64_LOGIC_IMM(sf, Rd, Rn, imm, AND)
#define A64_ORR_I(sf, Rd, Rn, imm)  A64_LOGIC_IMM(sf, Rd, Rn, imm, ORR)
#define A64_EOR_I(sf, Rd, Rn, imm)  A64_LOGIC_IMM(sf, Rd, Rn, imm, EOR)
#define A64_ANDS_I(sf, Rd, Rn, imm) A64_LOGIC_IMM(sf, Rd, Rn, imm, AND_SETFLAGS)
/* Rn & imm; set condition flags */
#define A64_TST_I(sf, Rn, imm) A64_ANDS_I(sf, A64_ZR, Rn, imm)

/* HINTs */
#define A64_HINT(x) aarch64_insn_gen_hint(x)

/* BTI */
#define A64_BTI_C  A64_HINT(AARCH64_INSN_HINT_BTIC)
#define A64_BTI_J  A64_HINT(AARCH64_INSN_HINT_BTIJ)
#define A64_BTI_JC A64_HINT(AARCH64_INSN_HINT_BTIJC)

#endif /* _BPF_JIT_H */