bpf_jit.h
/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * BPF JIT compiler for ARM64
 *
 * Copyright (C) 2014-2016 Zi Shen Lim <[email protected]>
 */
#ifndef _BPF_JIT_H
#define _BPF_JIT_H

#include <asm/insn.h>

/* 5-bit Register Operand */
#define A64_R(x) AARCH64_INSN_REG_##x
#define A64_FP AARCH64_INSN_REG_FP
#define A64_LR AARCH64_INSN_REG_LR
#define A64_ZR AARCH64_INSN_REG_ZR
#define A64_SP AARCH64_INSN_REG_SP

#define A64_VARIANT(sf) \
	((sf) ? AARCH64_INSN_VARIANT_64BIT : AARCH64_INSN_VARIANT_32BIT)

/* Compare & branch (immediate) */
#define A64_COMP_BRANCH(sf, Rt, offset, type) \
	aarch64_insn_gen_comp_branch_imm(0, offset, Rt, A64_VARIANT(sf), \
		AARCH64_INSN_BRANCH_COMP_##type)
#define A64_CBZ(sf, Rt, imm19) A64_COMP_BRANCH(sf, Rt, (imm19) << 2, ZERO)
#define A64_CBNZ(sf, Rt, imm19) A64_COMP_BRANCH(sf, Rt, (imm19) << 2, NONZERO)

/* Conditional branch (immediate) */
#define A64_COND_BRANCH(cond, offset) \
	aarch64_insn_gen_cond_branch_imm(0, offset, cond)
#define A64_COND_EQ AARCH64_INSN_COND_EQ /* == */
#define A64_COND_NE AARCH64_INSN_COND_NE /* != */
#define A64_COND_CS AARCH64_INSN_COND_CS /* unsigned >= */
#define A64_COND_HI AARCH64_INSN_COND_HI /* unsigned > */
#define A64_COND_LS AARCH64_INSN_COND_LS /* unsigned <= */
#define A64_COND_CC AARCH64_INSN_COND_CC /* unsigned < */
#define A64_COND_GE AARCH64_INSN_COND_GE /* signed >= */
#define A64_COND_GT AARCH64_INSN_COND_GT /* signed > */
#define A64_COND_LE AARCH64_INSN_COND_LE /* signed <= */
#define A64_COND_LT AARCH64_INSN_COND_LT /* signed < */
#define A64_B_(cond, imm19) A64_COND_BRANCH(cond, (imm19) << 2)

/* Unconditional branch (immediate) */
#define A64_BRANCH(offset, type) aarch64_insn_gen_branch_imm(0, offset, \
	AARCH64_INSN_BRANCH_##type)
#define A64_B(imm26) A64_BRANCH((imm26) << 2, NOLINK)
#define A64_BL(imm26) A64_BRANCH((imm26) << 2, LINK)
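/*
 * Note: the imm19/imm26 arguments above are branch offsets counted in
 * instructions (AArch64 branch targets are 4-byte aligned); the "<< 2"
 * converts them to the byte offsets expected by the insn generators.
 */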
/* Unconditional branch (register) */
#define A64_BR(Rn) aarch64_insn_gen_branch_reg(Rn, AARCH64_INSN_BRANCH_NOLINK)
#define A64_BLR(Rn) aarch64_insn_gen_branch_reg(Rn, AARCH64_INSN_BRANCH_LINK)
#define A64_RET(Rn) aarch64_insn_gen_branch_reg(Rn, AARCH64_INSN_BRANCH_RETURN)

/* Load/store register (register offset) */
#define A64_LS_REG(Rt, Rn, Rm, size, type) \
	aarch64_insn_gen_load_store_reg(Rt, Rn, Rm, \
		AARCH64_INSN_SIZE_##size, \
		AARCH64_INSN_LDST_##type##_REG_OFFSET)
#define A64_STRB(Wt, Xn, Xm) A64_LS_REG(Wt, Xn, Xm, 8, STORE)
#define A64_LDRB(Wt, Xn, Xm) A64_LS_REG(Wt, Xn, Xm, 8, LOAD)
#define A64_STRH(Wt, Xn, Xm) A64_LS_REG(Wt, Xn, Xm, 16, STORE)
#define A64_LDRH(Wt, Xn, Xm) A64_LS_REG(Wt, Xn, Xm, 16, LOAD)
#define A64_STR32(Wt, Xn, Xm) A64_LS_REG(Wt, Xn, Xm, 32, STORE)
#define A64_LDR32(Wt, Xn, Xm) A64_LS_REG(Wt, Xn, Xm, 32, LOAD)
#define A64_STR64(Xt, Xn, Xm) A64_LS_REG(Xt, Xn, Xm, 64, STORE)
#define A64_LDR64(Xt, Xn, Xm) A64_LS_REG(Xt, Xn, Xm, 64, LOAD)

/* Load/store register (immediate offset) */
#define A64_LS_IMM(Rt, Rn, imm, size, type) \
	aarch64_insn_gen_load_store_imm(Rt, Rn, imm, \
		AARCH64_INSN_SIZE_##size, \
		AARCH64_INSN_LDST_##type##_IMM_OFFSET)
#define A64_STRBI(Wt, Xn, imm) A64_LS_IMM(Wt, Xn, imm, 8, STORE)
#define A64_LDRBI(Wt, Xn, imm) A64_LS_IMM(Wt, Xn, imm, 8, LOAD)
#define A64_STRHI(Wt, Xn, imm) A64_LS_IMM(Wt, Xn, imm, 16, STORE)
#define A64_LDRHI(Wt, Xn, imm) A64_LS_IMM(Wt, Xn, imm, 16, LOAD)
#define A64_STR32I(Wt, Xn, imm) A64_LS_IMM(Wt, Xn, imm, 32, STORE)
#define A64_LDR32I(Wt, Xn, imm) A64_LS_IMM(Wt, Xn, imm, 32, LOAD)
#define A64_STR64I(Xt, Xn, imm) A64_LS_IMM(Xt, Xn, imm, 64, STORE)
#define A64_LDR64I(Xt, Xn, imm) A64_LS_IMM(Xt, Xn, imm, 64, LOAD)

/* LDR (literal) */
#define A64_LDR32LIT(Wt, offset) \
	aarch64_insn_gen_load_literal(0, offset, Wt, false)
#define A64_LDR64LIT(Xt, offset) \
	aarch64_insn_gen_load_literal(0, offset, Xt, true)

/* Load/store register pair */
#define A64_LS_PAIR(Rt, Rt2, Rn, offset, ls, type) \
	aarch64_insn_gen_load_store_pair(Rt, Rt2, Rn, offset, \
		AARCH64_INSN_VARIANT_64BIT, \
		AARCH64_INSN_LDST_##ls##_PAIR_##type)
/* Rn -= 16; Rn[0] = Rt; Rn[8] = Rt2; */
#define A64_PUSH(Rt, Rt2, Rn) A64_LS_PAIR(Rt, Rt2, Rn, -16, STORE, PRE_INDEX)
/* Rt = Rn[0]; Rt2 = Rn[8]; Rn += 16; */
#define A64_POP(Rt, Rt2, Rn) A64_LS_PAIR(Rt, Rt2, Rn, 16, LOAD, POST_INDEX)
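/*
 * Example: a prologue can save the frame pointer and link register with
 * A64_PUSH(A64_FP, A64_LR, A64_SP), i.e. "stp x29, x30, [sp, #-16]!",
 * and the matching epilogue restores them with
 * A64_POP(A64_FP, A64_LR, A64_SP), i.e. "ldp x29, x30, [sp], #16".
 */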
/* Load/store exclusive */
#define A64_SIZE(sf) \
	((sf) ? AARCH64_INSN_SIZE_64 : AARCH64_INSN_SIZE_32)
#define A64_LSX(sf, Rt, Rn, Rs, type) \
	aarch64_insn_gen_load_store_ex(Rt, Rn, Rs, A64_SIZE(sf), \
		AARCH64_INSN_LDST_##type)
/* Rt = [Rn]; (atomic) */
#define A64_LDXR(sf, Rt, Rn) \
	A64_LSX(sf, Rt, Rn, A64_ZR, LOAD_EX)
/* [Rn] = Rt; (atomic) Rs = [state] */
#define A64_STXR(sf, Rt, Rn, Rs) \
	A64_LSX(sf, Rt, Rn, Rs, STORE_EX)
/* [Rn] = Rt (store release); (atomic) Rs = [state] */
#define A64_STLXR(sf, Rt, Rn, Rs) \
	aarch64_insn_gen_load_store_ex(Rt, Rn, Rs, A64_SIZE(sf), \
		AARCH64_INSN_LDST_STORE_REL_EX)
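/*
 * Example: without LSE atomics, an atomic "[Rn] += Rs" can be built from the
 * exclusive pair as a retry loop, sketched below (emit(), tmp and state are
 * illustrative names, not defined in this header):
 *
 *	emit(A64_LDXR(sf, tmp, Rn), ctx);        // tmp = [Rn], marked exclusive
 *	emit(A64_ADD(sf, tmp, tmp, Rs), ctx);    // tmp += Rs
 *	emit(A64_STXR(sf, tmp, Rn, state), ctx); // [Rn] = tmp; state = 0 on success
 *	emit(A64_CBNZ(0, state, back_to_ldxr), ctx); // retry if the store failed
 */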
/*
 * LSE atomics
 *
 * ST{ADD,CLR,SET,EOR} is simply encoded as an alias for
 * LD{ADD,CLR,SET,EOR} with XZR as the destination register.
 */
#define A64_ST_OP(sf, Rn, Rs, op) \
	aarch64_insn_gen_atomic_ld_op(A64_ZR, Rn, Rs, \
		A64_SIZE(sf), AARCH64_INSN_MEM_ATOMIC_##op, \
		AARCH64_INSN_MEM_ORDER_NONE)
/* [Rn] <op>= Rs */
#define A64_STADD(sf, Rn, Rs) A64_ST_OP(sf, Rn, Rs, ADD)
#define A64_STCLR(sf, Rn, Rs) A64_ST_OP(sf, Rn, Rs, CLR)
#define A64_STEOR(sf, Rn, Rs) A64_ST_OP(sf, Rn, Rs, EOR)
#define A64_STSET(sf, Rn, Rs) A64_ST_OP(sf, Rn, Rs, SET)
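/*
 * Example: A64_STADD(1, Rn, Rs) therefore encodes "ldadd xs, xzr, [xn]",
 * which the architecture defines as the alias "stadd xs, [xn]".
 */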
#define A64_LD_OP_AL(sf, Rt, Rn, Rs, op) \
	aarch64_insn_gen_atomic_ld_op(Rt, Rn, Rs, \
		A64_SIZE(sf), AARCH64_INSN_MEM_ATOMIC_##op, \
		AARCH64_INSN_MEM_ORDER_ACQREL)
/* Rt = [Rn] (load acquire); [Rn] <op>= Rs (store release) */
#define A64_LDADDAL(sf, Rt, Rn, Rs) A64_LD_OP_AL(sf, Rt, Rn, Rs, ADD)
#define A64_LDCLRAL(sf, Rt, Rn, Rs) A64_LD_OP_AL(sf, Rt, Rn, Rs, CLR)
#define A64_LDEORAL(sf, Rt, Rn, Rs) A64_LD_OP_AL(sf, Rt, Rn, Rs, EOR)
#define A64_LDSETAL(sf, Rt, Rn, Rs) A64_LD_OP_AL(sf, Rt, Rn, Rs, SET)
/* Rt = [Rn] (load acquire); [Rn] = Rs (store release) */
#define A64_SWPAL(sf, Rt, Rn, Rs) A64_LD_OP_AL(sf, Rt, Rn, Rs, SWP)
/* Rs = CAS(Rn, Rs, Rt) (load acquire & store release) */
#define A64_CASAL(sf, Rt, Rn, Rs) \
	aarch64_insn_gen_cas(Rt, Rn, Rs, A64_SIZE(sf), \
		AARCH64_INSN_MEM_ORDER_ACQREL)

/* Add/subtract (immediate) */
#define A64_ADDSUB_IMM(sf, Rd, Rn, imm12, type) \
	aarch64_insn_gen_add_sub_imm(Rd, Rn, imm12, \
		A64_VARIANT(sf), AARCH64_INSN_ADSB_##type)
/* Rd = Rn OP imm12 */
#define A64_ADD_I(sf, Rd, Rn, imm12) A64_ADDSUB_IMM(sf, Rd, Rn, imm12, ADD)
#define A64_SUB_I(sf, Rd, Rn, imm12) A64_ADDSUB_IMM(sf, Rd, Rn, imm12, SUB)
#define A64_ADDS_I(sf, Rd, Rn, imm12) \
	A64_ADDSUB_IMM(sf, Rd, Rn, imm12, ADD_SETFLAGS)
#define A64_SUBS_I(sf, Rd, Rn, imm12) \
	A64_ADDSUB_IMM(sf, Rd, Rn, imm12, SUB_SETFLAGS)
/* Rn + imm12; set condition flags */
#define A64_CMN_I(sf, Rn, imm12) A64_ADDS_I(sf, A64_ZR, Rn, imm12)
/* Rn - imm12; set condition flags */
#define A64_CMP_I(sf, Rn, imm12) A64_SUBS_I(sf, A64_ZR, Rn, imm12)
/* Rd = Rn */
#define A64_MOV(sf, Rd, Rn) A64_ADD_I(sf, Rd, Rn, 0)

/* Bitfield move */
#define A64_BITFIELD(sf, Rd, Rn, immr, imms, type) \
	aarch64_insn_gen_bitfield(Rd, Rn, immr, imms, \
		A64_VARIANT(sf), AARCH64_INSN_BITFIELD_MOVE_##type)
/* Signed, with sign replication to left and zeros to right */
#define A64_SBFM(sf, Rd, Rn, ir, is) A64_BITFIELD(sf, Rd, Rn, ir, is, SIGNED)
/* Unsigned, with zeros to left and right */
#define A64_UBFM(sf, Rd, Rn, ir, is) A64_BITFIELD(sf, Rd, Rn, ir, is, UNSIGNED)
/* Rd = Rn << shift */
#define A64_LSL(sf, Rd, Rn, shift) ({ \
	int sz = (sf) ? 64 : 32; \
	A64_UBFM(sf, Rd, Rn, (unsigned)-(shift) % sz, sz - 1 - (shift)); \
})
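/*
 * Example: for sf = 1 and shift = 8, the expression above yields
 * immr = (unsigned)-8 % 64 = 56 and imms = 64 - 1 - 8 = 55, i.e.
 * "ubfm xd, xn, #56, #55", the canonical encoding of "lsl xd, xn, #8".
 */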
/* Rd = Rn >> shift */
#define A64_LSR(sf, Rd, Rn, shift) A64_UBFM(sf, Rd, Rn, shift, (sf) ? 63 : 31)
/* Rd = Rn >> shift; signed */
#define A64_ASR(sf, Rd, Rn, shift) A64_SBFM(sf, Rd, Rn, shift, (sf) ? 63 : 31)
/* Zero extend */
#define A64_UXTH(sf, Rd, Rn) A64_UBFM(sf, Rd, Rn, 0, 15)
#define A64_UXTW(sf, Rd, Rn) A64_UBFM(sf, Rd, Rn, 0, 31)

/* Move wide (immediate) */
#define A64_MOVEW(sf, Rd, imm16, shift, type) \
	aarch64_insn_gen_movewide(Rd, imm16, shift, \
		A64_VARIANT(sf), AARCH64_INSN_MOVEWIDE_##type)
/* Rd = Zeros (for MOVZ);
 * Rd |= imm16 << shift (where shift is {0, 16, 32, 48});
 * Rd = ~Rd; (for MOVN); */
#define A64_MOVN(sf, Rd, imm16, shift) A64_MOVEW(sf, Rd, imm16, shift, INVERSE)
#define A64_MOVZ(sf, Rd, imm16, shift) A64_MOVEW(sf, Rd, imm16, shift, ZERO)
#define A64_MOVK(sf, Rd, imm16, shift) A64_MOVEW(sf, Rd, imm16, shift, KEEP)
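/*
 * Example: an arbitrary 64-bit constant is typically materialized with one
 * A64_MOVZ followed by A64_MOVK for the remaining 16-bit chunks, e.g. for
 * 0x123456789abcdef0:
 *
 *	A64_MOVZ(1, Rd, 0xdef0, 0);
 *	A64_MOVK(1, Rd, 0x9abc, 16);
 *	A64_MOVK(1, Rd, 0x5678, 32);
 *	A64_MOVK(1, Rd, 0x1234, 48);
 */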
/* Add/subtract (shifted register) */
#define A64_ADDSUB_SREG(sf, Rd, Rn, Rm, type) \
	aarch64_insn_gen_add_sub_shifted_reg(Rd, Rn, Rm, 0, \
		A64_VARIANT(sf), AARCH64_INSN_ADSB_##type)
/* Rd = Rn OP Rm */
#define A64_ADD(sf, Rd, Rn, Rm) A64_ADDSUB_SREG(sf, Rd, Rn, Rm, ADD)
#define A64_SUB(sf, Rd, Rn, Rm) A64_ADDSUB_SREG(sf, Rd, Rn, Rm, SUB)
#define A64_SUBS(sf, Rd, Rn, Rm) A64_ADDSUB_SREG(sf, Rd, Rn, Rm, SUB_SETFLAGS)
/* Rd = -Rm */
#define A64_NEG(sf, Rd, Rm) A64_SUB(sf, Rd, A64_ZR, Rm)
/* Rn - Rm; set condition flags */
#define A64_CMP(sf, Rn, Rm) A64_SUBS(sf, A64_ZR, Rn, Rm)

/* Data-processing (1 source) */
#define A64_DATA1(sf, Rd, Rn, type) aarch64_insn_gen_data1(Rd, Rn, \
	A64_VARIANT(sf), AARCH64_INSN_DATA1_##type)
/* Rd = BSWAPx(Rn) */
#define A64_REV16(sf, Rd, Rn) A64_DATA1(sf, Rd, Rn, REVERSE_16)
#define A64_REV32(sf, Rd, Rn) A64_DATA1(sf, Rd, Rn, REVERSE_32)
#define A64_REV64(Rd, Rn) A64_DATA1(1, Rd, Rn, REVERSE_64)

/* Data-processing (2 source) */
/* Rd = Rn OP Rm */
#define A64_DATA2(sf, Rd, Rn, Rm, type) aarch64_insn_gen_data2(Rd, Rn, Rm, \
	A64_VARIANT(sf), AARCH64_INSN_DATA2_##type)
#define A64_UDIV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, UDIV)
#define A64_LSLV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, LSLV)
#define A64_LSRV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, LSRV)
#define A64_ASRV(sf, Rd, Rn, Rm) A64_DATA2(sf, Rd, Rn, Rm, ASRV)

/* Data-processing (3 source) */
/* Rd = Ra + Rn * Rm */
#define A64_MADD(sf, Rd, Ra, Rn, Rm) aarch64_insn_gen_data3(Rd, Ra, Rn, Rm, \
	A64_VARIANT(sf), AARCH64_INSN_DATA3_MADD)
/* Rd = Ra - Rn * Rm */
#define A64_MSUB(sf, Rd, Ra, Rn, Rm) aarch64_insn_gen_data3(Rd, Ra, Rn, Rm, \
	A64_VARIANT(sf), AARCH64_INSN_DATA3_MSUB)
/* Rd = Rn * Rm */
#define A64_MUL(sf, Rd, Rn, Rm) A64_MADD(sf, Rd, A64_ZR, Rn, Rm)

/* Logical (shifted register) */
#define A64_LOGIC_SREG(sf, Rd, Rn, Rm, type) \
	aarch64_insn_gen_logical_shifted_reg(Rd, Rn, Rm, 0, \
		A64_VARIANT(sf), AARCH64_INSN_LOGIC_##type)
/* Rd = Rn OP Rm */
#define A64_AND(sf, Rd, Rn, Rm) A64_LOGIC_SREG(sf, Rd, Rn, Rm, AND)
#define A64_ORR(sf, Rd, Rn, Rm) A64_LOGIC_SREG(sf, Rd, Rn, Rm, ORR)
#define A64_EOR(sf, Rd, Rn, Rm) A64_LOGIC_SREG(sf, Rd, Rn, Rm, EOR)
#define A64_ANDS(sf, Rd, Rn, Rm) A64_LOGIC_SREG(sf, Rd, Rn, Rm, AND_SETFLAGS)
/* Rn & Rm; set condition flags */
#define A64_TST(sf, Rn, Rm) A64_ANDS(sf, A64_ZR, Rn, Rm)
/* Rd = ~Rm (alias of ORN with A64_ZR as Rn) */
#define A64_MVN(sf, Rd, Rm) \
	A64_LOGIC_SREG(sf, Rd, A64_ZR, Rm, ORN)

/* Logical (immediate) */
#define A64_LOGIC_IMM(sf, Rd, Rn, imm, type) ({ \
	u64 imm64 = (sf) ? (u64)imm : (u64)(u32)imm; \
	aarch64_insn_gen_logical_immediate(AARCH64_INSN_LOGIC_##type, \
		A64_VARIANT(sf), Rn, Rd, imm64); \
})
/* Rd = Rn OP imm */
#define A64_AND_I(sf, Rd, Rn, imm) A64_LOGIC_IMM(sf, Rd, Rn, imm, AND)
#define A64_ORR_I(sf, Rd, Rn, imm) A64_LOGIC_IMM(sf, Rd, Rn, imm, ORR)
#define A64_EOR_I(sf, Rd, Rn, imm) A64_LOGIC_IMM(sf, Rd, Rn, imm, EOR)
#define A64_ANDS_I(sf, Rd, Rn, imm) A64_LOGIC_IMM(sf, Rd, Rn, imm, AND_SETFLAGS)
/* Rn & imm; set condition flags */
#define A64_TST_I(sf, Rn, imm) A64_ANDS_I(sf, A64_ZR, Rn, imm)
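/*
 * Note: the logical (immediate) class only encodes AArch64 "bitmask
 * immediates" (repeating patterns of a rotated run of ones); values such as
 * 0 or all-ones cannot be encoded, so callers typically fall back to loading
 * the constant into a scratch register and using the shifted-register forms.
 */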
/* HINTs */
#define A64_HINT(x) aarch64_insn_gen_hint(x)

#define A64_PACIASP A64_HINT(AARCH64_INSN_HINT_PACIASP)
#define A64_AUTIASP A64_HINT(AARCH64_INSN_HINT_AUTIASP)

/* BTI */
#define A64_BTI_C A64_HINT(AARCH64_INSN_HINT_BTIC)
#define A64_BTI_J A64_HINT(AARCH64_INSN_HINT_BTIJ)
#define A64_BTI_JC A64_HINT(AARCH64_INSN_HINT_BTIJC)

#define A64_NOP A64_HINT(AARCH64_INSN_HINT_NOP)

/* DMB */
#define A64_DMB_ISH aarch64_insn_gen_dmb(AARCH64_INSN_MB_ISH)

/* ADR */
#define A64_ADR(Rd, offset) \
	aarch64_insn_gen_adr(0, offset, Rd, AARCH64_INSN_ADR_TYPE_ADR)

#endif /* _BPF_JIT_H */