18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0
28c2ecf20Sopenharmony_ci/*
38c2ecf20Sopenharmony_ci * Just-In-Time compiler for eBPF filters on IA32 (32bit x86)
48c2ecf20Sopenharmony_ci *
58c2ecf20Sopenharmony_ci * Author: Wang YanQing (udknight@gmail.com)
68c2ecf20Sopenharmony_ci * The code based on code and ideas from:
78c2ecf20Sopenharmony_ci * Eric Dumazet (eric.dumazet@gmail.com)
88c2ecf20Sopenharmony_ci * and from:
98c2ecf20Sopenharmony_ci * Shubham Bansal <illusionist.neo@gmail.com>
108c2ecf20Sopenharmony_ci */
118c2ecf20Sopenharmony_ci
128c2ecf20Sopenharmony_ci#include <linux/netdevice.h>
138c2ecf20Sopenharmony_ci#include <linux/filter.h>
148c2ecf20Sopenharmony_ci#include <linux/if_vlan.h>
158c2ecf20Sopenharmony_ci#include <asm/cacheflush.h>
168c2ecf20Sopenharmony_ci#include <asm/set_memory.h>
178c2ecf20Sopenharmony_ci#include <asm/nospec-branch.h>
188c2ecf20Sopenharmony_ci#include <asm/asm-prototypes.h>
198c2ecf20Sopenharmony_ci#include <linux/bpf.h>
208c2ecf20Sopenharmony_ci
218c2ecf20Sopenharmony_ci/*
228c2ecf20Sopenharmony_ci * eBPF prog stack layout:
238c2ecf20Sopenharmony_ci *
248c2ecf20Sopenharmony_ci *                         high
258c2ecf20Sopenharmony_ci * original ESP =>        +-----+
268c2ecf20Sopenharmony_ci *                        |     | callee saved registers
278c2ecf20Sopenharmony_ci *                        +-----+
288c2ecf20Sopenharmony_ci *                        | ... | eBPF JIT scratch space
298c2ecf20Sopenharmony_ci * BPF_FP,IA32_EBP  =>    +-----+
308c2ecf20Sopenharmony_ci *                        | ... | eBPF prog stack
318c2ecf20Sopenharmony_ci *                        +-----+
328c2ecf20Sopenharmony_ci *                        |RSVD | JIT scratchpad
338c2ecf20Sopenharmony_ci * current ESP =>         +-----+
348c2ecf20Sopenharmony_ci *                        |     |
358c2ecf20Sopenharmony_ci *                        | ... | Function call stack
368c2ecf20Sopenharmony_ci *                        |     |
378c2ecf20Sopenharmony_ci *                        +-----+
388c2ecf20Sopenharmony_ci *                          low
398c2ecf20Sopenharmony_ci *
408c2ecf20Sopenharmony_ci * The callee saved registers:
418c2ecf20Sopenharmony_ci *
428c2ecf20Sopenharmony_ci *                                high
438c2ecf20Sopenharmony_ci * original ESP =>        +------------------+ \
448c2ecf20Sopenharmony_ci *                        |        ebp       | |
458c2ecf20Sopenharmony_ci * current EBP =>         +------------------+ } callee saved registers
468c2ecf20Sopenharmony_ci *                        |    ebx,esi,edi   | |
478c2ecf20Sopenharmony_ci *                        +------------------+ /
488c2ecf20Sopenharmony_ci *                                low
498c2ecf20Sopenharmony_ci */
508c2ecf20Sopenharmony_ci
518c2ecf20Sopenharmony_cistatic u8 *emit_code(u8 *ptr, u32 bytes, unsigned int len)
528c2ecf20Sopenharmony_ci{
538c2ecf20Sopenharmony_ci	if (len == 1)
548c2ecf20Sopenharmony_ci		*ptr = bytes;
558c2ecf20Sopenharmony_ci	else if (len == 2)
568c2ecf20Sopenharmony_ci		*(u16 *)ptr = bytes;
578c2ecf20Sopenharmony_ci	else {
588c2ecf20Sopenharmony_ci		*(u32 *)ptr = bytes;
598c2ecf20Sopenharmony_ci		barrier();
608c2ecf20Sopenharmony_ci	}
618c2ecf20Sopenharmony_ci	return ptr + len;
628c2ecf20Sopenharmony_ci}
638c2ecf20Sopenharmony_ci
648c2ecf20Sopenharmony_ci#define EMIT(bytes, len) \
658c2ecf20Sopenharmony_ci	do { prog = emit_code(prog, bytes, len); cnt += len; } while (0)
668c2ecf20Sopenharmony_ci
678c2ecf20Sopenharmony_ci#define EMIT1(b1)		EMIT(b1, 1)
688c2ecf20Sopenharmony_ci#define EMIT2(b1, b2)		EMIT((b1) + ((b2) << 8), 2)
698c2ecf20Sopenharmony_ci#define EMIT3(b1, b2, b3)	EMIT((b1) + ((b2) << 8) + ((b3) << 16), 3)
708c2ecf20Sopenharmony_ci#define EMIT4(b1, b2, b3, b4)   \
718c2ecf20Sopenharmony_ci	EMIT((b1) + ((b2) << 8) + ((b3) << 16) + ((b4) << 24), 4)
728c2ecf20Sopenharmony_ci
738c2ecf20Sopenharmony_ci#define EMIT1_off32(b1, off) \
748c2ecf20Sopenharmony_ci	do { EMIT1(b1); EMIT(off, 4); } while (0)
758c2ecf20Sopenharmony_ci#define EMIT2_off32(b1, b2, off) \
768c2ecf20Sopenharmony_ci	do { EMIT2(b1, b2); EMIT(off, 4); } while (0)
778c2ecf20Sopenharmony_ci#define EMIT3_off32(b1, b2, b3, off) \
788c2ecf20Sopenharmony_ci	do { EMIT3(b1, b2, b3); EMIT(off, 4); } while (0)
798c2ecf20Sopenharmony_ci#define EMIT4_off32(b1, b2, b3, b4, off) \
808c2ecf20Sopenharmony_ci	do { EMIT4(b1, b2, b3, b4); EMIT(off, 4); } while (0)
818c2ecf20Sopenharmony_ci
828c2ecf20Sopenharmony_ci#define jmp_label(label, jmp_insn_len) (label - cnt - jmp_insn_len)
838c2ecf20Sopenharmony_ci
848c2ecf20Sopenharmony_cistatic bool is_imm8(int value)
858c2ecf20Sopenharmony_ci{
868c2ecf20Sopenharmony_ci	return value <= 127 && value >= -128;
878c2ecf20Sopenharmony_ci}
888c2ecf20Sopenharmony_ci
898c2ecf20Sopenharmony_cistatic bool is_simm32(s64 value)
908c2ecf20Sopenharmony_ci{
918c2ecf20Sopenharmony_ci	return value == (s64) (s32) value;
928c2ecf20Sopenharmony_ci}
938c2ecf20Sopenharmony_ci
948c2ecf20Sopenharmony_ci#define STACK_OFFSET(k)	(k)
958c2ecf20Sopenharmony_ci#define TCALL_CNT	(MAX_BPF_JIT_REG + 0)	/* Tail Call Count */
968c2ecf20Sopenharmony_ci
978c2ecf20Sopenharmony_ci#define IA32_EAX	(0x0)
988c2ecf20Sopenharmony_ci#define IA32_EBX	(0x3)
998c2ecf20Sopenharmony_ci#define IA32_ECX	(0x1)
1008c2ecf20Sopenharmony_ci#define IA32_EDX	(0x2)
1018c2ecf20Sopenharmony_ci#define IA32_ESI	(0x6)
1028c2ecf20Sopenharmony_ci#define IA32_EDI	(0x7)
1038c2ecf20Sopenharmony_ci#define IA32_EBP	(0x5)
1048c2ecf20Sopenharmony_ci#define IA32_ESP	(0x4)
1058c2ecf20Sopenharmony_ci
1068c2ecf20Sopenharmony_ci/*
1078c2ecf20Sopenharmony_ci * List of x86 cond jumps opcodes (. + s8)
1088c2ecf20Sopenharmony_ci * Add 0x10 (and an extra 0x0f) to generate far jumps (. + s32)
1098c2ecf20Sopenharmony_ci */
1108c2ecf20Sopenharmony_ci#define IA32_JB  0x72
1118c2ecf20Sopenharmony_ci#define IA32_JAE 0x73
1128c2ecf20Sopenharmony_ci#define IA32_JE  0x74
1138c2ecf20Sopenharmony_ci#define IA32_JNE 0x75
1148c2ecf20Sopenharmony_ci#define IA32_JBE 0x76
1158c2ecf20Sopenharmony_ci#define IA32_JA  0x77
1168c2ecf20Sopenharmony_ci#define IA32_JL  0x7C
1178c2ecf20Sopenharmony_ci#define IA32_JGE 0x7D
1188c2ecf20Sopenharmony_ci#define IA32_JLE 0x7E
1198c2ecf20Sopenharmony_ci#define IA32_JG  0x7F
1208c2ecf20Sopenharmony_ci
1218c2ecf20Sopenharmony_ci#define COND_JMP_OPCODE_INVALID	(0xFF)
1228c2ecf20Sopenharmony_ci
1238c2ecf20Sopenharmony_ci/*
1248c2ecf20Sopenharmony_ci * Map eBPF registers to IA32 32bit registers or stack scratch space.
1258c2ecf20Sopenharmony_ci *
1268c2ecf20Sopenharmony_ci * 1. All the registers, R0-R10, are mapped to scratch space on stack.
1278c2ecf20Sopenharmony_ci * 2. We need two 64 bit temp registers to do complex operations on eBPF
1288c2ecf20Sopenharmony_ci *    registers.
1298c2ecf20Sopenharmony_ci * 3. For performance reason, the BPF_REG_AX for blinding constant, is
1308c2ecf20Sopenharmony_ci *    mapped to real hardware register pair, IA32_ESI and IA32_EDI.
1318c2ecf20Sopenharmony_ci *
1328c2ecf20Sopenharmony_ci * As the eBPF registers are all 64 bit registers and IA32 has only 32 bit
1338c2ecf20Sopenharmony_ci * registers, we have to map each eBPF registers with two IA32 32 bit regs
1348c2ecf20Sopenharmony_ci * or scratch memory space and we have to build eBPF 64 bit register from those.
1358c2ecf20Sopenharmony_ci *
1368c2ecf20Sopenharmony_ci * We use IA32_EAX, IA32_EDX, IA32_ECX, IA32_EBX as temporary registers.
1378c2ecf20Sopenharmony_ci */
1388c2ecf20Sopenharmony_cistatic const u8 bpf2ia32[][2] = {
1398c2ecf20Sopenharmony_ci	/* Return value from in-kernel function, and exit value from eBPF */
1408c2ecf20Sopenharmony_ci	[BPF_REG_0] = {STACK_OFFSET(0), STACK_OFFSET(4)},
1418c2ecf20Sopenharmony_ci
1428c2ecf20Sopenharmony_ci	/* The arguments from eBPF program to in-kernel function */
1438c2ecf20Sopenharmony_ci	/* Stored on stack scratch space */
1448c2ecf20Sopenharmony_ci	[BPF_REG_1] = {STACK_OFFSET(8), STACK_OFFSET(12)},
1458c2ecf20Sopenharmony_ci	[BPF_REG_2] = {STACK_OFFSET(16), STACK_OFFSET(20)},
1468c2ecf20Sopenharmony_ci	[BPF_REG_3] = {STACK_OFFSET(24), STACK_OFFSET(28)},
1478c2ecf20Sopenharmony_ci	[BPF_REG_4] = {STACK_OFFSET(32), STACK_OFFSET(36)},
1488c2ecf20Sopenharmony_ci	[BPF_REG_5] = {STACK_OFFSET(40), STACK_OFFSET(44)},
1498c2ecf20Sopenharmony_ci
1508c2ecf20Sopenharmony_ci	/* Callee saved registers that in-kernel function will preserve */
1518c2ecf20Sopenharmony_ci	/* Stored on stack scratch space */
1528c2ecf20Sopenharmony_ci	[BPF_REG_6] = {STACK_OFFSET(48), STACK_OFFSET(52)},
1538c2ecf20Sopenharmony_ci	[BPF_REG_7] = {STACK_OFFSET(56), STACK_OFFSET(60)},
1548c2ecf20Sopenharmony_ci	[BPF_REG_8] = {STACK_OFFSET(64), STACK_OFFSET(68)},
1558c2ecf20Sopenharmony_ci	[BPF_REG_9] = {STACK_OFFSET(72), STACK_OFFSET(76)},
1568c2ecf20Sopenharmony_ci
1578c2ecf20Sopenharmony_ci	/* Read only Frame Pointer to access Stack */
1588c2ecf20Sopenharmony_ci	[BPF_REG_FP] = {STACK_OFFSET(80), STACK_OFFSET(84)},
1598c2ecf20Sopenharmony_ci
1608c2ecf20Sopenharmony_ci	/* Temporary register for blinding constants. */
1618c2ecf20Sopenharmony_ci	[BPF_REG_AX] = {IA32_ESI, IA32_EDI},
1628c2ecf20Sopenharmony_ci
1638c2ecf20Sopenharmony_ci	/* Tail call count. Stored on stack scratch space. */
1648c2ecf20Sopenharmony_ci	[TCALL_CNT] = {STACK_OFFSET(88), STACK_OFFSET(92)},
1658c2ecf20Sopenharmony_ci};
1668c2ecf20Sopenharmony_ci
1678c2ecf20Sopenharmony_ci#define dst_lo	dst[0]
1688c2ecf20Sopenharmony_ci#define dst_hi	dst[1]
1698c2ecf20Sopenharmony_ci#define src_lo	src[0]
1708c2ecf20Sopenharmony_ci#define src_hi	src[1]
1718c2ecf20Sopenharmony_ci
1728c2ecf20Sopenharmony_ci#define STACK_ALIGNMENT	8
1738c2ecf20Sopenharmony_ci/*
1748c2ecf20Sopenharmony_ci * Stack space for BPF_REG_1, BPF_REG_2, BPF_REG_3, BPF_REG_4,
1758c2ecf20Sopenharmony_ci * BPF_REG_5, BPF_REG_6, BPF_REG_7, BPF_REG_8, BPF_REG_9,
1768c2ecf20Sopenharmony_ci * BPF_REG_FP, BPF_REG_AX and Tail call counts.
1778c2ecf20Sopenharmony_ci */
1788c2ecf20Sopenharmony_ci#define SCRATCH_SIZE 96
1798c2ecf20Sopenharmony_ci
1808c2ecf20Sopenharmony_ci/* Total stack size used in JITed code */
1818c2ecf20Sopenharmony_ci#define _STACK_SIZE	(stack_depth + SCRATCH_SIZE)
1828c2ecf20Sopenharmony_ci
1838c2ecf20Sopenharmony_ci#define STACK_SIZE ALIGN(_STACK_SIZE, STACK_ALIGNMENT)
1848c2ecf20Sopenharmony_ci
1858c2ecf20Sopenharmony_ci/* Get the offset of eBPF REGISTERs stored on scratch space. */
1868c2ecf20Sopenharmony_ci#define STACK_VAR(off) (off)
1878c2ecf20Sopenharmony_ci
1888c2ecf20Sopenharmony_ci/* Encode 'dst_reg' register into IA32 opcode 'byte' */
1898c2ecf20Sopenharmony_cistatic u8 add_1reg(u8 byte, u32 dst_reg)
1908c2ecf20Sopenharmony_ci{
1918c2ecf20Sopenharmony_ci	return byte + dst_reg;
1928c2ecf20Sopenharmony_ci}
1938c2ecf20Sopenharmony_ci
1948c2ecf20Sopenharmony_ci/* Encode 'dst_reg' and 'src_reg' registers into IA32 opcode 'byte' */
1958c2ecf20Sopenharmony_cistatic u8 add_2reg(u8 byte, u32 dst_reg, u32 src_reg)
1968c2ecf20Sopenharmony_ci{
1978c2ecf20Sopenharmony_ci	return byte + dst_reg + (src_reg << 3);
1988c2ecf20Sopenharmony_ci}
1998c2ecf20Sopenharmony_ci
2008c2ecf20Sopenharmony_cistatic void jit_fill_hole(void *area, unsigned int size)
2018c2ecf20Sopenharmony_ci{
2028c2ecf20Sopenharmony_ci	/* Fill whole space with int3 instructions */
2038c2ecf20Sopenharmony_ci	memset(area, 0xcc, size);
2048c2ecf20Sopenharmony_ci}
2058c2ecf20Sopenharmony_ci
2068c2ecf20Sopenharmony_cistatic inline void emit_ia32_mov_i(const u8 dst, const u32 val, bool dstk,
2078c2ecf20Sopenharmony_ci				   u8 **pprog)
2088c2ecf20Sopenharmony_ci{
2098c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
2108c2ecf20Sopenharmony_ci	int cnt = 0;
2118c2ecf20Sopenharmony_ci
2128c2ecf20Sopenharmony_ci	if (dstk) {
2138c2ecf20Sopenharmony_ci		if (val == 0) {
2148c2ecf20Sopenharmony_ci			/* xor eax,eax */
2158c2ecf20Sopenharmony_ci			EMIT2(0x33, add_2reg(0xC0, IA32_EAX, IA32_EAX));
2168c2ecf20Sopenharmony_ci			/* mov dword ptr [ebp+off],eax */
2178c2ecf20Sopenharmony_ci			EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EAX),
2188c2ecf20Sopenharmony_ci			      STACK_VAR(dst));
2198c2ecf20Sopenharmony_ci		} else {
2208c2ecf20Sopenharmony_ci			EMIT3_off32(0xC7, add_1reg(0x40, IA32_EBP),
2218c2ecf20Sopenharmony_ci				    STACK_VAR(dst), val);
2228c2ecf20Sopenharmony_ci		}
2238c2ecf20Sopenharmony_ci	} else {
2248c2ecf20Sopenharmony_ci		if (val == 0)
2258c2ecf20Sopenharmony_ci			EMIT2(0x33, add_2reg(0xC0, dst, dst));
2268c2ecf20Sopenharmony_ci		else
2278c2ecf20Sopenharmony_ci			EMIT2_off32(0xC7, add_1reg(0xC0, dst),
2288c2ecf20Sopenharmony_ci				    val);
2298c2ecf20Sopenharmony_ci	}
2308c2ecf20Sopenharmony_ci	*pprog = prog;
2318c2ecf20Sopenharmony_ci}
2328c2ecf20Sopenharmony_ci
2338c2ecf20Sopenharmony_ci/* dst = imm (4 bytes)*/
2348c2ecf20Sopenharmony_cistatic inline void emit_ia32_mov_r(const u8 dst, const u8 src, bool dstk,
2358c2ecf20Sopenharmony_ci				   bool sstk, u8 **pprog)
2368c2ecf20Sopenharmony_ci{
2378c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
2388c2ecf20Sopenharmony_ci	int cnt = 0;
2398c2ecf20Sopenharmony_ci	u8 sreg = sstk ? IA32_EAX : src;
2408c2ecf20Sopenharmony_ci
2418c2ecf20Sopenharmony_ci	if (sstk)
2428c2ecf20Sopenharmony_ci		/* mov eax,dword ptr [ebp+off] */
2438c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX), STACK_VAR(src));
2448c2ecf20Sopenharmony_ci	if (dstk)
2458c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],eax */
2468c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, sreg), STACK_VAR(dst));
2478c2ecf20Sopenharmony_ci	else
2488c2ecf20Sopenharmony_ci		/* mov dst,sreg */
2498c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dst, sreg));
2508c2ecf20Sopenharmony_ci
2518c2ecf20Sopenharmony_ci	*pprog = prog;
2528c2ecf20Sopenharmony_ci}
2538c2ecf20Sopenharmony_ci
2548c2ecf20Sopenharmony_ci/* dst = src */
2558c2ecf20Sopenharmony_cistatic inline void emit_ia32_mov_r64(const bool is64, const u8 dst[],
2568c2ecf20Sopenharmony_ci				     const u8 src[], bool dstk,
2578c2ecf20Sopenharmony_ci				     bool sstk, u8 **pprog,
2588c2ecf20Sopenharmony_ci				     const struct bpf_prog_aux *aux)
2598c2ecf20Sopenharmony_ci{
2608c2ecf20Sopenharmony_ci	emit_ia32_mov_r(dst_lo, src_lo, dstk, sstk, pprog);
2618c2ecf20Sopenharmony_ci	if (is64)
2628c2ecf20Sopenharmony_ci		/* complete 8 byte move */
2638c2ecf20Sopenharmony_ci		emit_ia32_mov_r(dst_hi, src_hi, dstk, sstk, pprog);
2648c2ecf20Sopenharmony_ci	else if (!aux->verifier_zext)
2658c2ecf20Sopenharmony_ci		/* zero out high 4 bytes */
2668c2ecf20Sopenharmony_ci		emit_ia32_mov_i(dst_hi, 0, dstk, pprog);
2678c2ecf20Sopenharmony_ci}
2688c2ecf20Sopenharmony_ci
2698c2ecf20Sopenharmony_ci/* Sign extended move */
2708c2ecf20Sopenharmony_cistatic inline void emit_ia32_mov_i64(const bool is64, const u8 dst[],
2718c2ecf20Sopenharmony_ci				     const u32 val, bool dstk, u8 **pprog)
2728c2ecf20Sopenharmony_ci{
2738c2ecf20Sopenharmony_ci	u32 hi = 0;
2748c2ecf20Sopenharmony_ci
2758c2ecf20Sopenharmony_ci	if (is64 && (val & (1<<31)))
2768c2ecf20Sopenharmony_ci		hi = (u32)~0;
2778c2ecf20Sopenharmony_ci	emit_ia32_mov_i(dst_lo, val, dstk, pprog);
2788c2ecf20Sopenharmony_ci	emit_ia32_mov_i(dst_hi, hi, dstk, pprog);
2798c2ecf20Sopenharmony_ci}
2808c2ecf20Sopenharmony_ci
2818c2ecf20Sopenharmony_ci/*
2828c2ecf20Sopenharmony_ci * ALU operation (32 bit)
2838c2ecf20Sopenharmony_ci * dst = dst * src
2848c2ecf20Sopenharmony_ci */
2858c2ecf20Sopenharmony_cistatic inline void emit_ia32_mul_r(const u8 dst, const u8 src, bool dstk,
2868c2ecf20Sopenharmony_ci				   bool sstk, u8 **pprog)
2878c2ecf20Sopenharmony_ci{
2888c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
2898c2ecf20Sopenharmony_ci	int cnt = 0;
2908c2ecf20Sopenharmony_ci	u8 sreg = sstk ? IA32_ECX : src;
2918c2ecf20Sopenharmony_ci
2928c2ecf20Sopenharmony_ci	if (sstk)
2938c2ecf20Sopenharmony_ci		/* mov ecx,dword ptr [ebp+off] */
2948c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX), STACK_VAR(src));
2958c2ecf20Sopenharmony_ci
2968c2ecf20Sopenharmony_ci	if (dstk)
2978c2ecf20Sopenharmony_ci		/* mov eax,dword ptr [ebp+off] */
2988c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX), STACK_VAR(dst));
2998c2ecf20Sopenharmony_ci	else
3008c2ecf20Sopenharmony_ci		/* mov eax,dst */
3018c2ecf20Sopenharmony_ci		EMIT2(0x8B, add_2reg(0xC0, dst, IA32_EAX));
3028c2ecf20Sopenharmony_ci
3038c2ecf20Sopenharmony_ci
3048c2ecf20Sopenharmony_ci	EMIT2(0xF7, add_1reg(0xE0, sreg));
3058c2ecf20Sopenharmony_ci
3068c2ecf20Sopenharmony_ci	if (dstk)
3078c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],eax */
3088c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EAX),
3098c2ecf20Sopenharmony_ci		      STACK_VAR(dst));
3108c2ecf20Sopenharmony_ci	else
3118c2ecf20Sopenharmony_ci		/* mov dst,eax */
3128c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dst, IA32_EAX));
3138c2ecf20Sopenharmony_ci
3148c2ecf20Sopenharmony_ci	*pprog = prog;
3158c2ecf20Sopenharmony_ci}
3168c2ecf20Sopenharmony_ci
3178c2ecf20Sopenharmony_cistatic inline void emit_ia32_to_le_r64(const u8 dst[], s32 val,
3188c2ecf20Sopenharmony_ci					 bool dstk, u8 **pprog,
3198c2ecf20Sopenharmony_ci					 const struct bpf_prog_aux *aux)
3208c2ecf20Sopenharmony_ci{
3218c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
3228c2ecf20Sopenharmony_ci	int cnt = 0;
3238c2ecf20Sopenharmony_ci	u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
3248c2ecf20Sopenharmony_ci	u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
3258c2ecf20Sopenharmony_ci
3268c2ecf20Sopenharmony_ci	if (dstk && val != 64) {
3278c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
3288c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
3298c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
3308c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
3318c2ecf20Sopenharmony_ci	}
3328c2ecf20Sopenharmony_ci	switch (val) {
3338c2ecf20Sopenharmony_ci	case 16:
3348c2ecf20Sopenharmony_ci		/*
3358c2ecf20Sopenharmony_ci		 * Emit 'movzwl eax,ax' to zero extend 16-bit
3368c2ecf20Sopenharmony_ci		 * into 64 bit
3378c2ecf20Sopenharmony_ci		 */
3388c2ecf20Sopenharmony_ci		EMIT2(0x0F, 0xB7);
3398c2ecf20Sopenharmony_ci		EMIT1(add_2reg(0xC0, dreg_lo, dreg_lo));
3408c2ecf20Sopenharmony_ci		if (!aux->verifier_zext)
3418c2ecf20Sopenharmony_ci			/* xor dreg_hi,dreg_hi */
3428c2ecf20Sopenharmony_ci			EMIT2(0x33, add_2reg(0xC0, dreg_hi, dreg_hi));
3438c2ecf20Sopenharmony_ci		break;
3448c2ecf20Sopenharmony_ci	case 32:
3458c2ecf20Sopenharmony_ci		if (!aux->verifier_zext)
3468c2ecf20Sopenharmony_ci			/* xor dreg_hi,dreg_hi */
3478c2ecf20Sopenharmony_ci			EMIT2(0x33, add_2reg(0xC0, dreg_hi, dreg_hi));
3488c2ecf20Sopenharmony_ci		break;
3498c2ecf20Sopenharmony_ci	case 64:
3508c2ecf20Sopenharmony_ci		/* nop */
3518c2ecf20Sopenharmony_ci		break;
3528c2ecf20Sopenharmony_ci	}
3538c2ecf20Sopenharmony_ci
3548c2ecf20Sopenharmony_ci	if (dstk && val != 64) {
3558c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_lo */
3568c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_lo),
3578c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
3588c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_hi */
3598c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_hi),
3608c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
3618c2ecf20Sopenharmony_ci	}
3628c2ecf20Sopenharmony_ci	*pprog = prog;
3638c2ecf20Sopenharmony_ci}
3648c2ecf20Sopenharmony_ci
3658c2ecf20Sopenharmony_cistatic inline void emit_ia32_to_be_r64(const u8 dst[], s32 val,
3668c2ecf20Sopenharmony_ci				       bool dstk, u8 **pprog,
3678c2ecf20Sopenharmony_ci				       const struct bpf_prog_aux *aux)
3688c2ecf20Sopenharmony_ci{
3698c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
3708c2ecf20Sopenharmony_ci	int cnt = 0;
3718c2ecf20Sopenharmony_ci	u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
3728c2ecf20Sopenharmony_ci	u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
3738c2ecf20Sopenharmony_ci
3748c2ecf20Sopenharmony_ci	if (dstk) {
3758c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
3768c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
3778c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
3788c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
3798c2ecf20Sopenharmony_ci	}
3808c2ecf20Sopenharmony_ci	switch (val) {
3818c2ecf20Sopenharmony_ci	case 16:
3828c2ecf20Sopenharmony_ci		/* Emit 'ror %ax, 8' to swap lower 2 bytes */
3838c2ecf20Sopenharmony_ci		EMIT1(0x66);
3848c2ecf20Sopenharmony_ci		EMIT3(0xC1, add_1reg(0xC8, dreg_lo), 8);
3858c2ecf20Sopenharmony_ci
3868c2ecf20Sopenharmony_ci		EMIT2(0x0F, 0xB7);
3878c2ecf20Sopenharmony_ci		EMIT1(add_2reg(0xC0, dreg_lo, dreg_lo));
3888c2ecf20Sopenharmony_ci
3898c2ecf20Sopenharmony_ci		if (!aux->verifier_zext)
3908c2ecf20Sopenharmony_ci			/* xor dreg_hi,dreg_hi */
3918c2ecf20Sopenharmony_ci			EMIT2(0x33, add_2reg(0xC0, dreg_hi, dreg_hi));
3928c2ecf20Sopenharmony_ci		break;
3938c2ecf20Sopenharmony_ci	case 32:
3948c2ecf20Sopenharmony_ci		/* Emit 'bswap eax' to swap lower 4 bytes */
3958c2ecf20Sopenharmony_ci		EMIT1(0x0F);
3968c2ecf20Sopenharmony_ci		EMIT1(add_1reg(0xC8, dreg_lo));
3978c2ecf20Sopenharmony_ci
3988c2ecf20Sopenharmony_ci		if (!aux->verifier_zext)
3998c2ecf20Sopenharmony_ci			/* xor dreg_hi,dreg_hi */
4008c2ecf20Sopenharmony_ci			EMIT2(0x33, add_2reg(0xC0, dreg_hi, dreg_hi));
4018c2ecf20Sopenharmony_ci		break;
4028c2ecf20Sopenharmony_ci	case 64:
4038c2ecf20Sopenharmony_ci		/* Emit 'bswap eax' to swap lower 4 bytes */
4048c2ecf20Sopenharmony_ci		EMIT1(0x0F);
4058c2ecf20Sopenharmony_ci		EMIT1(add_1reg(0xC8, dreg_lo));
4068c2ecf20Sopenharmony_ci
4078c2ecf20Sopenharmony_ci		/* Emit 'bswap edx' to swap lower 4 bytes */
4088c2ecf20Sopenharmony_ci		EMIT1(0x0F);
4098c2ecf20Sopenharmony_ci		EMIT1(add_1reg(0xC8, dreg_hi));
4108c2ecf20Sopenharmony_ci
4118c2ecf20Sopenharmony_ci		/* mov ecx,dreg_hi */
4128c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, IA32_ECX, dreg_hi));
4138c2ecf20Sopenharmony_ci		/* mov dreg_hi,dreg_lo */
4148c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dreg_hi, dreg_lo));
4158c2ecf20Sopenharmony_ci		/* mov dreg_lo,ecx */
4168c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dreg_lo, IA32_ECX));
4178c2ecf20Sopenharmony_ci
4188c2ecf20Sopenharmony_ci		break;
4198c2ecf20Sopenharmony_ci	}
4208c2ecf20Sopenharmony_ci	if (dstk) {
4218c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_lo */
4228c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_lo),
4238c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
4248c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_hi */
4258c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_hi),
4268c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
4278c2ecf20Sopenharmony_ci	}
4288c2ecf20Sopenharmony_ci	*pprog = prog;
4298c2ecf20Sopenharmony_ci}
4308c2ecf20Sopenharmony_ci
4318c2ecf20Sopenharmony_ci/*
4328c2ecf20Sopenharmony_ci * ALU operation (32 bit)
4338c2ecf20Sopenharmony_ci * dst = dst (div|mod) src
4348c2ecf20Sopenharmony_ci */
4358c2ecf20Sopenharmony_cistatic inline void emit_ia32_div_mod_r(const u8 op, const u8 dst, const u8 src,
4368c2ecf20Sopenharmony_ci				       bool dstk, bool sstk, u8 **pprog)
4378c2ecf20Sopenharmony_ci{
4388c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
4398c2ecf20Sopenharmony_ci	int cnt = 0;
4408c2ecf20Sopenharmony_ci
4418c2ecf20Sopenharmony_ci	if (sstk)
4428c2ecf20Sopenharmony_ci		/* mov ecx,dword ptr [ebp+off] */
4438c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX),
4448c2ecf20Sopenharmony_ci		      STACK_VAR(src));
4458c2ecf20Sopenharmony_ci	else if (src != IA32_ECX)
4468c2ecf20Sopenharmony_ci		/* mov ecx,src */
4478c2ecf20Sopenharmony_ci		EMIT2(0x8B, add_2reg(0xC0, src, IA32_ECX));
4488c2ecf20Sopenharmony_ci
4498c2ecf20Sopenharmony_ci	if (dstk)
4508c2ecf20Sopenharmony_ci		/* mov eax,dword ptr [ebp+off] */
4518c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
4528c2ecf20Sopenharmony_ci		      STACK_VAR(dst));
4538c2ecf20Sopenharmony_ci	else
4548c2ecf20Sopenharmony_ci		/* mov eax,dst */
4558c2ecf20Sopenharmony_ci		EMIT2(0x8B, add_2reg(0xC0, dst, IA32_EAX));
4568c2ecf20Sopenharmony_ci
4578c2ecf20Sopenharmony_ci	/* xor edx,edx */
4588c2ecf20Sopenharmony_ci	EMIT2(0x31, add_2reg(0xC0, IA32_EDX, IA32_EDX));
4598c2ecf20Sopenharmony_ci	/* div ecx */
4608c2ecf20Sopenharmony_ci	EMIT2(0xF7, add_1reg(0xF0, IA32_ECX));
4618c2ecf20Sopenharmony_ci
4628c2ecf20Sopenharmony_ci	if (op == BPF_MOD) {
4638c2ecf20Sopenharmony_ci		if (dstk)
4648c2ecf20Sopenharmony_ci			EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EDX),
4658c2ecf20Sopenharmony_ci			      STACK_VAR(dst));
4668c2ecf20Sopenharmony_ci		else
4678c2ecf20Sopenharmony_ci			EMIT2(0x89, add_2reg(0xC0, dst, IA32_EDX));
4688c2ecf20Sopenharmony_ci	} else {
4698c2ecf20Sopenharmony_ci		if (dstk)
4708c2ecf20Sopenharmony_ci			EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EAX),
4718c2ecf20Sopenharmony_ci			      STACK_VAR(dst));
4728c2ecf20Sopenharmony_ci		else
4738c2ecf20Sopenharmony_ci			EMIT2(0x89, add_2reg(0xC0, dst, IA32_EAX));
4748c2ecf20Sopenharmony_ci	}
4758c2ecf20Sopenharmony_ci	*pprog = prog;
4768c2ecf20Sopenharmony_ci}
4778c2ecf20Sopenharmony_ci
4788c2ecf20Sopenharmony_ci/*
4798c2ecf20Sopenharmony_ci * ALU operation (32 bit)
4808c2ecf20Sopenharmony_ci * dst = dst (shift) src
4818c2ecf20Sopenharmony_ci */
4828c2ecf20Sopenharmony_cistatic inline void emit_ia32_shift_r(const u8 op, const u8 dst, const u8 src,
4838c2ecf20Sopenharmony_ci				     bool dstk, bool sstk, u8 **pprog)
4848c2ecf20Sopenharmony_ci{
4858c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
4868c2ecf20Sopenharmony_ci	int cnt = 0;
4878c2ecf20Sopenharmony_ci	u8 dreg = dstk ? IA32_EAX : dst;
4888c2ecf20Sopenharmony_ci	u8 b2;
4898c2ecf20Sopenharmony_ci
4908c2ecf20Sopenharmony_ci	if (dstk)
4918c2ecf20Sopenharmony_ci		/* mov eax,dword ptr [ebp+off] */
4928c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX), STACK_VAR(dst));
4938c2ecf20Sopenharmony_ci
4948c2ecf20Sopenharmony_ci	if (sstk)
4958c2ecf20Sopenharmony_ci		/* mov ecx,dword ptr [ebp+off] */
4968c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX), STACK_VAR(src));
4978c2ecf20Sopenharmony_ci	else if (src != IA32_ECX)
4988c2ecf20Sopenharmony_ci		/* mov ecx,src */
4998c2ecf20Sopenharmony_ci		EMIT2(0x8B, add_2reg(0xC0, src, IA32_ECX));
5008c2ecf20Sopenharmony_ci
5018c2ecf20Sopenharmony_ci	switch (op) {
5028c2ecf20Sopenharmony_ci	case BPF_LSH:
5038c2ecf20Sopenharmony_ci		b2 = 0xE0; break;
5048c2ecf20Sopenharmony_ci	case BPF_RSH:
5058c2ecf20Sopenharmony_ci		b2 = 0xE8; break;
5068c2ecf20Sopenharmony_ci	case BPF_ARSH:
5078c2ecf20Sopenharmony_ci		b2 = 0xF8; break;
5088c2ecf20Sopenharmony_ci	default:
5098c2ecf20Sopenharmony_ci		return;
5108c2ecf20Sopenharmony_ci	}
5118c2ecf20Sopenharmony_ci	EMIT2(0xD3, add_1reg(b2, dreg));
5128c2ecf20Sopenharmony_ci
5138c2ecf20Sopenharmony_ci	if (dstk)
5148c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg */
5158c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg), STACK_VAR(dst));
5168c2ecf20Sopenharmony_ci	*pprog = prog;
5178c2ecf20Sopenharmony_ci}
5188c2ecf20Sopenharmony_ci
5198c2ecf20Sopenharmony_ci/*
5208c2ecf20Sopenharmony_ci * ALU operation (32 bit)
5218c2ecf20Sopenharmony_ci * dst = dst (op) src
5228c2ecf20Sopenharmony_ci */
5238c2ecf20Sopenharmony_cistatic inline void emit_ia32_alu_r(const bool is64, const bool hi, const u8 op,
5248c2ecf20Sopenharmony_ci				   const u8 dst, const u8 src, bool dstk,
5258c2ecf20Sopenharmony_ci				   bool sstk, u8 **pprog)
5268c2ecf20Sopenharmony_ci{
5278c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
5288c2ecf20Sopenharmony_ci	int cnt = 0;
5298c2ecf20Sopenharmony_ci	u8 sreg = sstk ? IA32_EAX : src;
5308c2ecf20Sopenharmony_ci	u8 dreg = dstk ? IA32_EDX : dst;
5318c2ecf20Sopenharmony_ci
5328c2ecf20Sopenharmony_ci	if (sstk)
5338c2ecf20Sopenharmony_ci		/* mov eax,dword ptr [ebp+off] */
5348c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX), STACK_VAR(src));
5358c2ecf20Sopenharmony_ci
5368c2ecf20Sopenharmony_ci	if (dstk)
5378c2ecf20Sopenharmony_ci		/* mov eax,dword ptr [ebp+off] */
5388c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX), STACK_VAR(dst));
5398c2ecf20Sopenharmony_ci
5408c2ecf20Sopenharmony_ci	switch (BPF_OP(op)) {
5418c2ecf20Sopenharmony_ci	/* dst = dst + src */
5428c2ecf20Sopenharmony_ci	case BPF_ADD:
5438c2ecf20Sopenharmony_ci		if (hi && is64)
5448c2ecf20Sopenharmony_ci			EMIT2(0x11, add_2reg(0xC0, dreg, sreg));
5458c2ecf20Sopenharmony_ci		else
5468c2ecf20Sopenharmony_ci			EMIT2(0x01, add_2reg(0xC0, dreg, sreg));
5478c2ecf20Sopenharmony_ci		break;
5488c2ecf20Sopenharmony_ci	/* dst = dst - src */
5498c2ecf20Sopenharmony_ci	case BPF_SUB:
5508c2ecf20Sopenharmony_ci		if (hi && is64)
5518c2ecf20Sopenharmony_ci			EMIT2(0x19, add_2reg(0xC0, dreg, sreg));
5528c2ecf20Sopenharmony_ci		else
5538c2ecf20Sopenharmony_ci			EMIT2(0x29, add_2reg(0xC0, dreg, sreg));
5548c2ecf20Sopenharmony_ci		break;
5558c2ecf20Sopenharmony_ci	/* dst = dst | src */
5568c2ecf20Sopenharmony_ci	case BPF_OR:
5578c2ecf20Sopenharmony_ci		EMIT2(0x09, add_2reg(0xC0, dreg, sreg));
5588c2ecf20Sopenharmony_ci		break;
5598c2ecf20Sopenharmony_ci	/* dst = dst & src */
5608c2ecf20Sopenharmony_ci	case BPF_AND:
5618c2ecf20Sopenharmony_ci		EMIT2(0x21, add_2reg(0xC0, dreg, sreg));
5628c2ecf20Sopenharmony_ci		break;
5638c2ecf20Sopenharmony_ci	/* dst = dst ^ src */
5648c2ecf20Sopenharmony_ci	case BPF_XOR:
5658c2ecf20Sopenharmony_ci		EMIT2(0x31, add_2reg(0xC0, dreg, sreg));
5668c2ecf20Sopenharmony_ci		break;
5678c2ecf20Sopenharmony_ci	}
5688c2ecf20Sopenharmony_ci
5698c2ecf20Sopenharmony_ci	if (dstk)
5708c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg */
5718c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg),
5728c2ecf20Sopenharmony_ci		      STACK_VAR(dst));
5738c2ecf20Sopenharmony_ci	*pprog = prog;
5748c2ecf20Sopenharmony_ci}
5758c2ecf20Sopenharmony_ci
5768c2ecf20Sopenharmony_ci/* ALU operation (64 bit) */
5778c2ecf20Sopenharmony_cistatic inline void emit_ia32_alu_r64(const bool is64, const u8 op,
5788c2ecf20Sopenharmony_ci				     const u8 dst[], const u8 src[],
5798c2ecf20Sopenharmony_ci				     bool dstk,  bool sstk,
5808c2ecf20Sopenharmony_ci				     u8 **pprog, const struct bpf_prog_aux *aux)
5818c2ecf20Sopenharmony_ci{
5828c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
5838c2ecf20Sopenharmony_ci
5848c2ecf20Sopenharmony_ci	emit_ia32_alu_r(is64, false, op, dst_lo, src_lo, dstk, sstk, &prog);
5858c2ecf20Sopenharmony_ci	if (is64)
5868c2ecf20Sopenharmony_ci		emit_ia32_alu_r(is64, true, op, dst_hi, src_hi, dstk, sstk,
5878c2ecf20Sopenharmony_ci				&prog);
5888c2ecf20Sopenharmony_ci	else if (!aux->verifier_zext)
5898c2ecf20Sopenharmony_ci		emit_ia32_mov_i(dst_hi, 0, dstk, &prog);
5908c2ecf20Sopenharmony_ci	*pprog = prog;
5918c2ecf20Sopenharmony_ci}
5928c2ecf20Sopenharmony_ci
5938c2ecf20Sopenharmony_ci/*
5948c2ecf20Sopenharmony_ci * ALU operation (32 bit)
5958c2ecf20Sopenharmony_ci * dst = dst (op) val
5968c2ecf20Sopenharmony_ci */
5978c2ecf20Sopenharmony_cistatic inline void emit_ia32_alu_i(const bool is64, const bool hi, const u8 op,
5988c2ecf20Sopenharmony_ci				   const u8 dst, const s32 val, bool dstk,
5998c2ecf20Sopenharmony_ci				   u8 **pprog)
6008c2ecf20Sopenharmony_ci{
6018c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
6028c2ecf20Sopenharmony_ci	int cnt = 0;
6038c2ecf20Sopenharmony_ci	u8 dreg = dstk ? IA32_EAX : dst;
6048c2ecf20Sopenharmony_ci	u8 sreg = IA32_EDX;
6058c2ecf20Sopenharmony_ci
6068c2ecf20Sopenharmony_ci	if (dstk)
6078c2ecf20Sopenharmony_ci		/* mov eax,dword ptr [ebp+off] */
6088c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX), STACK_VAR(dst));
6098c2ecf20Sopenharmony_ci
6108c2ecf20Sopenharmony_ci	if (!is_imm8(val))
6118c2ecf20Sopenharmony_ci		/* mov edx,imm32*/
6128c2ecf20Sopenharmony_ci		EMIT2_off32(0xC7, add_1reg(0xC0, IA32_EDX), val);
6138c2ecf20Sopenharmony_ci
6148c2ecf20Sopenharmony_ci	switch (op) {
6158c2ecf20Sopenharmony_ci	/* dst = dst + val */
6168c2ecf20Sopenharmony_ci	case BPF_ADD:
6178c2ecf20Sopenharmony_ci		if (hi && is64) {
6188c2ecf20Sopenharmony_ci			if (is_imm8(val))
6198c2ecf20Sopenharmony_ci				EMIT3(0x83, add_1reg(0xD0, dreg), val);
6208c2ecf20Sopenharmony_ci			else
6218c2ecf20Sopenharmony_ci				EMIT2(0x11, add_2reg(0xC0, dreg, sreg));
6228c2ecf20Sopenharmony_ci		} else {
6238c2ecf20Sopenharmony_ci			if (is_imm8(val))
6248c2ecf20Sopenharmony_ci				EMIT3(0x83, add_1reg(0xC0, dreg), val);
6258c2ecf20Sopenharmony_ci			else
6268c2ecf20Sopenharmony_ci				EMIT2(0x01, add_2reg(0xC0, dreg, sreg));
6278c2ecf20Sopenharmony_ci		}
6288c2ecf20Sopenharmony_ci		break;
6298c2ecf20Sopenharmony_ci	/* dst = dst - val */
6308c2ecf20Sopenharmony_ci	case BPF_SUB:
6318c2ecf20Sopenharmony_ci		if (hi && is64) {
6328c2ecf20Sopenharmony_ci			if (is_imm8(val))
6338c2ecf20Sopenharmony_ci				EMIT3(0x83, add_1reg(0xD8, dreg), val);
6348c2ecf20Sopenharmony_ci			else
6358c2ecf20Sopenharmony_ci				EMIT2(0x19, add_2reg(0xC0, dreg, sreg));
6368c2ecf20Sopenharmony_ci		} else {
6378c2ecf20Sopenharmony_ci			if (is_imm8(val))
6388c2ecf20Sopenharmony_ci				EMIT3(0x83, add_1reg(0xE8, dreg), val);
6398c2ecf20Sopenharmony_ci			else
6408c2ecf20Sopenharmony_ci				EMIT2(0x29, add_2reg(0xC0, dreg, sreg));
6418c2ecf20Sopenharmony_ci		}
6428c2ecf20Sopenharmony_ci		break;
6438c2ecf20Sopenharmony_ci	/* dst = dst | val */
6448c2ecf20Sopenharmony_ci	case BPF_OR:
6458c2ecf20Sopenharmony_ci		if (is_imm8(val))
6468c2ecf20Sopenharmony_ci			EMIT3(0x83, add_1reg(0xC8, dreg), val);
6478c2ecf20Sopenharmony_ci		else
6488c2ecf20Sopenharmony_ci			EMIT2(0x09, add_2reg(0xC0, dreg, sreg));
6498c2ecf20Sopenharmony_ci		break;
6508c2ecf20Sopenharmony_ci	/* dst = dst & val */
6518c2ecf20Sopenharmony_ci	case BPF_AND:
6528c2ecf20Sopenharmony_ci		if (is_imm8(val))
6538c2ecf20Sopenharmony_ci			EMIT3(0x83, add_1reg(0xE0, dreg), val);
6548c2ecf20Sopenharmony_ci		else
6558c2ecf20Sopenharmony_ci			EMIT2(0x21, add_2reg(0xC0, dreg, sreg));
6568c2ecf20Sopenharmony_ci		break;
6578c2ecf20Sopenharmony_ci	/* dst = dst ^ val */
6588c2ecf20Sopenharmony_ci	case BPF_XOR:
6598c2ecf20Sopenharmony_ci		if (is_imm8(val))
6608c2ecf20Sopenharmony_ci			EMIT3(0x83, add_1reg(0xF0, dreg), val);
6618c2ecf20Sopenharmony_ci		else
6628c2ecf20Sopenharmony_ci			EMIT2(0x31, add_2reg(0xC0, dreg, sreg));
6638c2ecf20Sopenharmony_ci		break;
6648c2ecf20Sopenharmony_ci	case BPF_NEG:
6658c2ecf20Sopenharmony_ci		EMIT2(0xF7, add_1reg(0xD8, dreg));
6668c2ecf20Sopenharmony_ci		break;
6678c2ecf20Sopenharmony_ci	}
6688c2ecf20Sopenharmony_ci
6698c2ecf20Sopenharmony_ci	if (dstk)
6708c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg */
6718c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg),
6728c2ecf20Sopenharmony_ci		      STACK_VAR(dst));
6738c2ecf20Sopenharmony_ci	*pprog = prog;
6748c2ecf20Sopenharmony_ci}
6758c2ecf20Sopenharmony_ci
6768c2ecf20Sopenharmony_ci/* ALU operation (64 bit) */
6778c2ecf20Sopenharmony_cistatic inline void emit_ia32_alu_i64(const bool is64, const u8 op,
6788c2ecf20Sopenharmony_ci				     const u8 dst[], const u32 val,
6798c2ecf20Sopenharmony_ci				     bool dstk, u8 **pprog,
6808c2ecf20Sopenharmony_ci				     const struct bpf_prog_aux *aux)
6818c2ecf20Sopenharmony_ci{
6828c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
6838c2ecf20Sopenharmony_ci	u32 hi = 0;
6848c2ecf20Sopenharmony_ci
6858c2ecf20Sopenharmony_ci	if (is64 && (val & (1<<31)))
6868c2ecf20Sopenharmony_ci		hi = (u32)~0;
6878c2ecf20Sopenharmony_ci
6888c2ecf20Sopenharmony_ci	emit_ia32_alu_i(is64, false, op, dst_lo, val, dstk, &prog);
6898c2ecf20Sopenharmony_ci	if (is64)
6908c2ecf20Sopenharmony_ci		emit_ia32_alu_i(is64, true, op, dst_hi, hi, dstk, &prog);
6918c2ecf20Sopenharmony_ci	else if (!aux->verifier_zext)
6928c2ecf20Sopenharmony_ci		emit_ia32_mov_i(dst_hi, 0, dstk, &prog);
6938c2ecf20Sopenharmony_ci
6948c2ecf20Sopenharmony_ci	*pprog = prog;
6958c2ecf20Sopenharmony_ci}
6968c2ecf20Sopenharmony_ci
6978c2ecf20Sopenharmony_ci/* dst = ~dst (64 bit) */
6988c2ecf20Sopenharmony_cistatic inline void emit_ia32_neg64(const u8 dst[], bool dstk, u8 **pprog)
6998c2ecf20Sopenharmony_ci{
7008c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
7018c2ecf20Sopenharmony_ci	int cnt = 0;
7028c2ecf20Sopenharmony_ci	u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
7038c2ecf20Sopenharmony_ci	u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
7048c2ecf20Sopenharmony_ci
7058c2ecf20Sopenharmony_ci	if (dstk) {
7068c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
7078c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
7088c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
7098c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
7108c2ecf20Sopenharmony_ci	}
7118c2ecf20Sopenharmony_ci
7128c2ecf20Sopenharmony_ci	/* neg dreg_lo */
7138c2ecf20Sopenharmony_ci	EMIT2(0xF7, add_1reg(0xD8, dreg_lo));
7148c2ecf20Sopenharmony_ci	/* adc dreg_hi,0x0 */
7158c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xD0, dreg_hi), 0x00);
7168c2ecf20Sopenharmony_ci	/* neg dreg_hi */
7178c2ecf20Sopenharmony_ci	EMIT2(0xF7, add_1reg(0xD8, dreg_hi));
7188c2ecf20Sopenharmony_ci
7198c2ecf20Sopenharmony_ci	if (dstk) {
7208c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_lo */
7218c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_lo),
7228c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
7238c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_hi */
7248c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_hi),
7258c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
7268c2ecf20Sopenharmony_ci	}
7278c2ecf20Sopenharmony_ci	*pprog = prog;
7288c2ecf20Sopenharmony_ci}
7298c2ecf20Sopenharmony_ci
7308c2ecf20Sopenharmony_ci/* dst = dst << src */
7318c2ecf20Sopenharmony_cistatic inline void emit_ia32_lsh_r64(const u8 dst[], const u8 src[],
7328c2ecf20Sopenharmony_ci				     bool dstk, bool sstk, u8 **pprog)
7338c2ecf20Sopenharmony_ci{
7348c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
7358c2ecf20Sopenharmony_ci	int cnt = 0;
7368c2ecf20Sopenharmony_ci	u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
7378c2ecf20Sopenharmony_ci	u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
7388c2ecf20Sopenharmony_ci
7398c2ecf20Sopenharmony_ci	if (dstk) {
7408c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
7418c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
7428c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
7438c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
7448c2ecf20Sopenharmony_ci	}
7458c2ecf20Sopenharmony_ci
7468c2ecf20Sopenharmony_ci	if (sstk)
7478c2ecf20Sopenharmony_ci		/* mov ecx,dword ptr [ebp+off] */
7488c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX),
7498c2ecf20Sopenharmony_ci		      STACK_VAR(src_lo));
7508c2ecf20Sopenharmony_ci	else
7518c2ecf20Sopenharmony_ci		/* mov ecx,src_lo */
7528c2ecf20Sopenharmony_ci		EMIT2(0x8B, add_2reg(0xC0, src_lo, IA32_ECX));
7538c2ecf20Sopenharmony_ci
7548c2ecf20Sopenharmony_ci	/* shld dreg_hi,dreg_lo,cl */
7558c2ecf20Sopenharmony_ci	EMIT3(0x0F, 0xA5, add_2reg(0xC0, dreg_hi, dreg_lo));
7568c2ecf20Sopenharmony_ci	/* shl dreg_lo,cl */
7578c2ecf20Sopenharmony_ci	EMIT2(0xD3, add_1reg(0xE0, dreg_lo));
7588c2ecf20Sopenharmony_ci
7598c2ecf20Sopenharmony_ci	/* if ecx >= 32, mov dreg_lo into dreg_hi and clear dreg_lo */
7608c2ecf20Sopenharmony_ci
7618c2ecf20Sopenharmony_ci	/* cmp ecx,32 */
7628c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xF8, IA32_ECX), 32);
7638c2ecf20Sopenharmony_ci	/* skip the next two instructions (4 bytes) when < 32 */
7648c2ecf20Sopenharmony_ci	EMIT2(IA32_JB, 4);
7658c2ecf20Sopenharmony_ci
7668c2ecf20Sopenharmony_ci	/* mov dreg_hi,dreg_lo */
7678c2ecf20Sopenharmony_ci	EMIT2(0x89, add_2reg(0xC0, dreg_hi, dreg_lo));
7688c2ecf20Sopenharmony_ci	/* xor dreg_lo,dreg_lo */
7698c2ecf20Sopenharmony_ci	EMIT2(0x33, add_2reg(0xC0, dreg_lo, dreg_lo));
7708c2ecf20Sopenharmony_ci
7718c2ecf20Sopenharmony_ci	if (dstk) {
7728c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_lo */
7738c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_lo),
7748c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
7758c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_hi */
7768c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_hi),
7778c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
7788c2ecf20Sopenharmony_ci	}
7798c2ecf20Sopenharmony_ci	/* out: */
7808c2ecf20Sopenharmony_ci	*pprog = prog;
7818c2ecf20Sopenharmony_ci}
7828c2ecf20Sopenharmony_ci
7838c2ecf20Sopenharmony_ci/* dst = dst >> src (signed)*/
7848c2ecf20Sopenharmony_cistatic inline void emit_ia32_arsh_r64(const u8 dst[], const u8 src[],
7858c2ecf20Sopenharmony_ci				      bool dstk, bool sstk, u8 **pprog)
7868c2ecf20Sopenharmony_ci{
7878c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
7888c2ecf20Sopenharmony_ci	int cnt = 0;
7898c2ecf20Sopenharmony_ci	u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
7908c2ecf20Sopenharmony_ci	u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
7918c2ecf20Sopenharmony_ci
7928c2ecf20Sopenharmony_ci	if (dstk) {
7938c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
7948c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
7958c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
7968c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
7978c2ecf20Sopenharmony_ci	}
7988c2ecf20Sopenharmony_ci
7998c2ecf20Sopenharmony_ci	if (sstk)
8008c2ecf20Sopenharmony_ci		/* mov ecx,dword ptr [ebp+off] */
8018c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX),
8028c2ecf20Sopenharmony_ci		      STACK_VAR(src_lo));
8038c2ecf20Sopenharmony_ci	else
8048c2ecf20Sopenharmony_ci		/* mov ecx,src_lo */
8058c2ecf20Sopenharmony_ci		EMIT2(0x8B, add_2reg(0xC0, src_lo, IA32_ECX));
8068c2ecf20Sopenharmony_ci
8078c2ecf20Sopenharmony_ci	/* shrd dreg_lo,dreg_hi,cl */
8088c2ecf20Sopenharmony_ci	EMIT3(0x0F, 0xAD, add_2reg(0xC0, dreg_lo, dreg_hi));
8098c2ecf20Sopenharmony_ci	/* sar dreg_hi,cl */
8108c2ecf20Sopenharmony_ci	EMIT2(0xD3, add_1reg(0xF8, dreg_hi));
8118c2ecf20Sopenharmony_ci
8128c2ecf20Sopenharmony_ci	/* if ecx >= 32, mov dreg_hi to dreg_lo and set/clear dreg_hi depending on sign */
8138c2ecf20Sopenharmony_ci
8148c2ecf20Sopenharmony_ci	/* cmp ecx,32 */
8158c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xF8, IA32_ECX), 32);
8168c2ecf20Sopenharmony_ci	/* skip the next two instructions (5 bytes) when < 32 */
8178c2ecf20Sopenharmony_ci	EMIT2(IA32_JB, 5);
8188c2ecf20Sopenharmony_ci
8198c2ecf20Sopenharmony_ci	/* mov dreg_lo,dreg_hi */
8208c2ecf20Sopenharmony_ci	EMIT2(0x89, add_2reg(0xC0, dreg_lo, dreg_hi));
8218c2ecf20Sopenharmony_ci	/* sar dreg_hi,31 */
8228c2ecf20Sopenharmony_ci	EMIT3(0xC1, add_1reg(0xF8, dreg_hi), 31);
8238c2ecf20Sopenharmony_ci
8248c2ecf20Sopenharmony_ci	if (dstk) {
8258c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_lo */
8268c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_lo),
8278c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
8288c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_hi */
8298c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_hi),
8308c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
8318c2ecf20Sopenharmony_ci	}
8328c2ecf20Sopenharmony_ci	/* out: */
8338c2ecf20Sopenharmony_ci	*pprog = prog;
8348c2ecf20Sopenharmony_ci}
8358c2ecf20Sopenharmony_ci
8368c2ecf20Sopenharmony_ci/* dst = dst >> src */
8378c2ecf20Sopenharmony_cistatic inline void emit_ia32_rsh_r64(const u8 dst[], const u8 src[], bool dstk,
8388c2ecf20Sopenharmony_ci				     bool sstk, u8 **pprog)
8398c2ecf20Sopenharmony_ci{
8408c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
8418c2ecf20Sopenharmony_ci	int cnt = 0;
8428c2ecf20Sopenharmony_ci	u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
8438c2ecf20Sopenharmony_ci	u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
8448c2ecf20Sopenharmony_ci
8458c2ecf20Sopenharmony_ci	if (dstk) {
8468c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
8478c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
8488c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
8498c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
8508c2ecf20Sopenharmony_ci	}
8518c2ecf20Sopenharmony_ci
8528c2ecf20Sopenharmony_ci	if (sstk)
8538c2ecf20Sopenharmony_ci		/* mov ecx,dword ptr [ebp+off] */
8548c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX),
8558c2ecf20Sopenharmony_ci		      STACK_VAR(src_lo));
8568c2ecf20Sopenharmony_ci	else
8578c2ecf20Sopenharmony_ci		/* mov ecx,src_lo */
8588c2ecf20Sopenharmony_ci		EMIT2(0x8B, add_2reg(0xC0, src_lo, IA32_ECX));
8598c2ecf20Sopenharmony_ci
8608c2ecf20Sopenharmony_ci	/* shrd dreg_lo,dreg_hi,cl */
8618c2ecf20Sopenharmony_ci	EMIT3(0x0F, 0xAD, add_2reg(0xC0, dreg_lo, dreg_hi));
8628c2ecf20Sopenharmony_ci	/* shr dreg_hi,cl */
8638c2ecf20Sopenharmony_ci	EMIT2(0xD3, add_1reg(0xE8, dreg_hi));
8648c2ecf20Sopenharmony_ci
8658c2ecf20Sopenharmony_ci	/* if ecx >= 32, mov dreg_hi to dreg_lo and clear dreg_hi */
8668c2ecf20Sopenharmony_ci
8678c2ecf20Sopenharmony_ci	/* cmp ecx,32 */
8688c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xF8, IA32_ECX), 32);
8698c2ecf20Sopenharmony_ci	/* skip the next two instructions (4 bytes) when < 32 */
8708c2ecf20Sopenharmony_ci	EMIT2(IA32_JB, 4);
8718c2ecf20Sopenharmony_ci
8728c2ecf20Sopenharmony_ci	/* mov dreg_lo,dreg_hi */
8738c2ecf20Sopenharmony_ci	EMIT2(0x89, add_2reg(0xC0, dreg_lo, dreg_hi));
8748c2ecf20Sopenharmony_ci	/* xor dreg_hi,dreg_hi */
8758c2ecf20Sopenharmony_ci	EMIT2(0x33, add_2reg(0xC0, dreg_hi, dreg_hi));
8768c2ecf20Sopenharmony_ci
8778c2ecf20Sopenharmony_ci	if (dstk) {
8788c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_lo */
8798c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_lo),
8808c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
8818c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_hi */
8828c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_hi),
8838c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
8848c2ecf20Sopenharmony_ci	}
8858c2ecf20Sopenharmony_ci	/* out: */
8868c2ecf20Sopenharmony_ci	*pprog = prog;
8878c2ecf20Sopenharmony_ci}
8888c2ecf20Sopenharmony_ci
8898c2ecf20Sopenharmony_ci/* dst = dst << val */
8908c2ecf20Sopenharmony_cistatic inline void emit_ia32_lsh_i64(const u8 dst[], const u32 val,
8918c2ecf20Sopenharmony_ci				     bool dstk, u8 **pprog)
8928c2ecf20Sopenharmony_ci{
8938c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
8948c2ecf20Sopenharmony_ci	int cnt = 0;
8958c2ecf20Sopenharmony_ci	u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
8968c2ecf20Sopenharmony_ci	u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
8978c2ecf20Sopenharmony_ci
8988c2ecf20Sopenharmony_ci	if (dstk) {
8998c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
9008c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
9018c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
9028c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
9038c2ecf20Sopenharmony_ci	}
9048c2ecf20Sopenharmony_ci	/* Do LSH operation */
9058c2ecf20Sopenharmony_ci	if (val < 32) {
9068c2ecf20Sopenharmony_ci		/* shld dreg_hi,dreg_lo,imm8 */
9078c2ecf20Sopenharmony_ci		EMIT4(0x0F, 0xA4, add_2reg(0xC0, dreg_hi, dreg_lo), val);
9088c2ecf20Sopenharmony_ci		/* shl dreg_lo,imm8 */
9098c2ecf20Sopenharmony_ci		EMIT3(0xC1, add_1reg(0xE0, dreg_lo), val);
9108c2ecf20Sopenharmony_ci	} else if (val >= 32 && val < 64) {
9118c2ecf20Sopenharmony_ci		u32 value = val - 32;
9128c2ecf20Sopenharmony_ci
9138c2ecf20Sopenharmony_ci		/* shl dreg_lo,imm8 */
9148c2ecf20Sopenharmony_ci		EMIT3(0xC1, add_1reg(0xE0, dreg_lo), value);
9158c2ecf20Sopenharmony_ci		/* mov dreg_hi,dreg_lo */
9168c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dreg_hi, dreg_lo));
9178c2ecf20Sopenharmony_ci		/* xor dreg_lo,dreg_lo */
9188c2ecf20Sopenharmony_ci		EMIT2(0x33, add_2reg(0xC0, dreg_lo, dreg_lo));
9198c2ecf20Sopenharmony_ci	} else {
9208c2ecf20Sopenharmony_ci		/* xor dreg_lo,dreg_lo */
9218c2ecf20Sopenharmony_ci		EMIT2(0x33, add_2reg(0xC0, dreg_lo, dreg_lo));
9228c2ecf20Sopenharmony_ci		/* xor dreg_hi,dreg_hi */
9238c2ecf20Sopenharmony_ci		EMIT2(0x33, add_2reg(0xC0, dreg_hi, dreg_hi));
9248c2ecf20Sopenharmony_ci	}
9258c2ecf20Sopenharmony_ci
9268c2ecf20Sopenharmony_ci	if (dstk) {
9278c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_lo */
9288c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_lo),
9298c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
9308c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_hi */
9318c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_hi),
9328c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
9338c2ecf20Sopenharmony_ci	}
9348c2ecf20Sopenharmony_ci	*pprog = prog;
9358c2ecf20Sopenharmony_ci}
9368c2ecf20Sopenharmony_ci
9378c2ecf20Sopenharmony_ci/* dst = dst >> val */
9388c2ecf20Sopenharmony_cistatic inline void emit_ia32_rsh_i64(const u8 dst[], const u32 val,
9398c2ecf20Sopenharmony_ci				     bool dstk, u8 **pprog)
9408c2ecf20Sopenharmony_ci{
9418c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
9428c2ecf20Sopenharmony_ci	int cnt = 0;
9438c2ecf20Sopenharmony_ci	u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
9448c2ecf20Sopenharmony_ci	u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
9458c2ecf20Sopenharmony_ci
9468c2ecf20Sopenharmony_ci	if (dstk) {
9478c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
9488c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
9498c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
9508c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
9518c2ecf20Sopenharmony_ci	}
9528c2ecf20Sopenharmony_ci
9538c2ecf20Sopenharmony_ci	/* Do RSH operation */
9548c2ecf20Sopenharmony_ci	if (val < 32) {
9558c2ecf20Sopenharmony_ci		/* shrd dreg_lo,dreg_hi,imm8 */
9568c2ecf20Sopenharmony_ci		EMIT4(0x0F, 0xAC, add_2reg(0xC0, dreg_lo, dreg_hi), val);
9578c2ecf20Sopenharmony_ci		/* shr dreg_hi,imm8 */
9588c2ecf20Sopenharmony_ci		EMIT3(0xC1, add_1reg(0xE8, dreg_hi), val);
9598c2ecf20Sopenharmony_ci	} else if (val >= 32 && val < 64) {
9608c2ecf20Sopenharmony_ci		u32 value = val - 32;
9618c2ecf20Sopenharmony_ci
9628c2ecf20Sopenharmony_ci		/* shr dreg_hi,imm8 */
9638c2ecf20Sopenharmony_ci		EMIT3(0xC1, add_1reg(0xE8, dreg_hi), value);
9648c2ecf20Sopenharmony_ci		/* mov dreg_lo,dreg_hi */
9658c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dreg_lo, dreg_hi));
9668c2ecf20Sopenharmony_ci		/* xor dreg_hi,dreg_hi */
9678c2ecf20Sopenharmony_ci		EMIT2(0x33, add_2reg(0xC0, dreg_hi, dreg_hi));
9688c2ecf20Sopenharmony_ci	} else {
9698c2ecf20Sopenharmony_ci		/* xor dreg_lo,dreg_lo */
9708c2ecf20Sopenharmony_ci		EMIT2(0x33, add_2reg(0xC0, dreg_lo, dreg_lo));
9718c2ecf20Sopenharmony_ci		/* xor dreg_hi,dreg_hi */
9728c2ecf20Sopenharmony_ci		EMIT2(0x33, add_2reg(0xC0, dreg_hi, dreg_hi));
9738c2ecf20Sopenharmony_ci	}
9748c2ecf20Sopenharmony_ci
9758c2ecf20Sopenharmony_ci	if (dstk) {
9768c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_lo */
9778c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_lo),
9788c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
9798c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_hi */
9808c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_hi),
9818c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
9828c2ecf20Sopenharmony_ci	}
9838c2ecf20Sopenharmony_ci	*pprog = prog;
9848c2ecf20Sopenharmony_ci}
9858c2ecf20Sopenharmony_ci
9868c2ecf20Sopenharmony_ci/* dst = dst >> val (signed) */
9878c2ecf20Sopenharmony_cistatic inline void emit_ia32_arsh_i64(const u8 dst[], const u32 val,
9888c2ecf20Sopenharmony_ci				      bool dstk, u8 **pprog)
9898c2ecf20Sopenharmony_ci{
9908c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
9918c2ecf20Sopenharmony_ci	int cnt = 0;
9928c2ecf20Sopenharmony_ci	u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
9938c2ecf20Sopenharmony_ci	u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
9948c2ecf20Sopenharmony_ci
9958c2ecf20Sopenharmony_ci	if (dstk) {
9968c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
9978c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
9988c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
9998c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
10008c2ecf20Sopenharmony_ci	}
10018c2ecf20Sopenharmony_ci	/* Do RSH operation */
10028c2ecf20Sopenharmony_ci	if (val < 32) {
10038c2ecf20Sopenharmony_ci		/* shrd dreg_lo,dreg_hi,imm8 */
10048c2ecf20Sopenharmony_ci		EMIT4(0x0F, 0xAC, add_2reg(0xC0, dreg_lo, dreg_hi), val);
10058c2ecf20Sopenharmony_ci		/* ashr dreg_hi,imm8 */
10068c2ecf20Sopenharmony_ci		EMIT3(0xC1, add_1reg(0xF8, dreg_hi), val);
10078c2ecf20Sopenharmony_ci	} else if (val >= 32 && val < 64) {
10088c2ecf20Sopenharmony_ci		u32 value = val - 32;
10098c2ecf20Sopenharmony_ci
10108c2ecf20Sopenharmony_ci		/* ashr dreg_hi,imm8 */
10118c2ecf20Sopenharmony_ci		EMIT3(0xC1, add_1reg(0xF8, dreg_hi), value);
10128c2ecf20Sopenharmony_ci		/* mov dreg_lo,dreg_hi */
10138c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dreg_lo, dreg_hi));
10148c2ecf20Sopenharmony_ci
10158c2ecf20Sopenharmony_ci		/* ashr dreg_hi,imm8 */
10168c2ecf20Sopenharmony_ci		EMIT3(0xC1, add_1reg(0xF8, dreg_hi), 31);
10178c2ecf20Sopenharmony_ci	} else {
10188c2ecf20Sopenharmony_ci		/* ashr dreg_hi,imm8 */
10198c2ecf20Sopenharmony_ci		EMIT3(0xC1, add_1reg(0xF8, dreg_hi), 31);
10208c2ecf20Sopenharmony_ci		/* mov dreg_lo,dreg_hi */
10218c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dreg_lo, dreg_hi));
10228c2ecf20Sopenharmony_ci	}
10238c2ecf20Sopenharmony_ci
10248c2ecf20Sopenharmony_ci	if (dstk) {
10258c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_lo */
10268c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_lo),
10278c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
10288c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],dreg_hi */
10298c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, dreg_hi),
10308c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
10318c2ecf20Sopenharmony_ci	}
10328c2ecf20Sopenharmony_ci	*pprog = prog;
10338c2ecf20Sopenharmony_ci}
10348c2ecf20Sopenharmony_ci
10358c2ecf20Sopenharmony_cistatic inline void emit_ia32_mul_r64(const u8 dst[], const u8 src[], bool dstk,
10368c2ecf20Sopenharmony_ci				     bool sstk, u8 **pprog)
10378c2ecf20Sopenharmony_ci{
10388c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
10398c2ecf20Sopenharmony_ci	int cnt = 0;
10408c2ecf20Sopenharmony_ci
10418c2ecf20Sopenharmony_ci	if (dstk)
10428c2ecf20Sopenharmony_ci		/* mov eax,dword ptr [ebp+off] */
10438c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
10448c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
10458c2ecf20Sopenharmony_ci	else
10468c2ecf20Sopenharmony_ci		/* mov eax,dst_hi */
10478c2ecf20Sopenharmony_ci		EMIT2(0x8B, add_2reg(0xC0, dst_hi, IA32_EAX));
10488c2ecf20Sopenharmony_ci
10498c2ecf20Sopenharmony_ci	if (sstk)
10508c2ecf20Sopenharmony_ci		/* mul dword ptr [ebp+off] */
10518c2ecf20Sopenharmony_ci		EMIT3(0xF7, add_1reg(0x60, IA32_EBP), STACK_VAR(src_lo));
10528c2ecf20Sopenharmony_ci	else
10538c2ecf20Sopenharmony_ci		/* mul src_lo */
10548c2ecf20Sopenharmony_ci		EMIT2(0xF7, add_1reg(0xE0, src_lo));
10558c2ecf20Sopenharmony_ci
10568c2ecf20Sopenharmony_ci	/* mov ecx,eax */
10578c2ecf20Sopenharmony_ci	EMIT2(0x89, add_2reg(0xC0, IA32_ECX, IA32_EAX));
10588c2ecf20Sopenharmony_ci
10598c2ecf20Sopenharmony_ci	if (dstk)
10608c2ecf20Sopenharmony_ci		/* mov eax,dword ptr [ebp+off] */
10618c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
10628c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
10638c2ecf20Sopenharmony_ci	else
10648c2ecf20Sopenharmony_ci		/* mov eax,dst_lo */
10658c2ecf20Sopenharmony_ci		EMIT2(0x8B, add_2reg(0xC0, dst_lo, IA32_EAX));
10668c2ecf20Sopenharmony_ci
10678c2ecf20Sopenharmony_ci	if (sstk)
10688c2ecf20Sopenharmony_ci		/* mul dword ptr [ebp+off] */
10698c2ecf20Sopenharmony_ci		EMIT3(0xF7, add_1reg(0x60, IA32_EBP), STACK_VAR(src_hi));
10708c2ecf20Sopenharmony_ci	else
10718c2ecf20Sopenharmony_ci		/* mul src_hi */
10728c2ecf20Sopenharmony_ci		EMIT2(0xF7, add_1reg(0xE0, src_hi));
10738c2ecf20Sopenharmony_ci
10748c2ecf20Sopenharmony_ci	/* add eax,eax */
10758c2ecf20Sopenharmony_ci	EMIT2(0x01, add_2reg(0xC0, IA32_ECX, IA32_EAX));
10768c2ecf20Sopenharmony_ci
10778c2ecf20Sopenharmony_ci	if (dstk)
10788c2ecf20Sopenharmony_ci		/* mov eax,dword ptr [ebp+off] */
10798c2ecf20Sopenharmony_ci		EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
10808c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
10818c2ecf20Sopenharmony_ci	else
10828c2ecf20Sopenharmony_ci		/* mov eax,dst_lo */
10838c2ecf20Sopenharmony_ci		EMIT2(0x8B, add_2reg(0xC0, dst_lo, IA32_EAX));
10848c2ecf20Sopenharmony_ci
10858c2ecf20Sopenharmony_ci	if (sstk)
10868c2ecf20Sopenharmony_ci		/* mul dword ptr [ebp+off] */
10878c2ecf20Sopenharmony_ci		EMIT3(0xF7, add_1reg(0x60, IA32_EBP), STACK_VAR(src_lo));
10888c2ecf20Sopenharmony_ci	else
10898c2ecf20Sopenharmony_ci		/* mul src_lo */
10908c2ecf20Sopenharmony_ci		EMIT2(0xF7, add_1reg(0xE0, src_lo));
10918c2ecf20Sopenharmony_ci
10928c2ecf20Sopenharmony_ci	/* add ecx,edx */
10938c2ecf20Sopenharmony_ci	EMIT2(0x01, add_2reg(0xC0, IA32_ECX, IA32_EDX));
10948c2ecf20Sopenharmony_ci
10958c2ecf20Sopenharmony_ci	if (dstk) {
10968c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],eax */
10978c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EAX),
10988c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
10998c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],ecx */
11008c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_ECX),
11018c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
11028c2ecf20Sopenharmony_ci	} else {
11038c2ecf20Sopenharmony_ci		/* mov dst_lo,eax */
11048c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dst_lo, IA32_EAX));
11058c2ecf20Sopenharmony_ci		/* mov dst_hi,ecx */
11068c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dst_hi, IA32_ECX));
11078c2ecf20Sopenharmony_ci	}
11088c2ecf20Sopenharmony_ci
11098c2ecf20Sopenharmony_ci	*pprog = prog;
11108c2ecf20Sopenharmony_ci}
11118c2ecf20Sopenharmony_ci
11128c2ecf20Sopenharmony_cistatic inline void emit_ia32_mul_i64(const u8 dst[], const u32 val,
11138c2ecf20Sopenharmony_ci				     bool dstk, u8 **pprog)
11148c2ecf20Sopenharmony_ci{
11158c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
11168c2ecf20Sopenharmony_ci	int cnt = 0;
11178c2ecf20Sopenharmony_ci	u32 hi;
11188c2ecf20Sopenharmony_ci
11198c2ecf20Sopenharmony_ci	hi = val & (1<<31) ? (u32)~0 : 0;
11208c2ecf20Sopenharmony_ci	/* movl eax,imm32 */
11218c2ecf20Sopenharmony_ci	EMIT2_off32(0xC7, add_1reg(0xC0, IA32_EAX), val);
11228c2ecf20Sopenharmony_ci	if (dstk)
11238c2ecf20Sopenharmony_ci		/* mul dword ptr [ebp+off] */
11248c2ecf20Sopenharmony_ci		EMIT3(0xF7, add_1reg(0x60, IA32_EBP), STACK_VAR(dst_hi));
11258c2ecf20Sopenharmony_ci	else
11268c2ecf20Sopenharmony_ci		/* mul dst_hi */
11278c2ecf20Sopenharmony_ci		EMIT2(0xF7, add_1reg(0xE0, dst_hi));
11288c2ecf20Sopenharmony_ci
11298c2ecf20Sopenharmony_ci	/* mov ecx,eax */
11308c2ecf20Sopenharmony_ci	EMIT2(0x89, add_2reg(0xC0, IA32_ECX, IA32_EAX));
11318c2ecf20Sopenharmony_ci
11328c2ecf20Sopenharmony_ci	/* movl eax,imm32 */
11338c2ecf20Sopenharmony_ci	EMIT2_off32(0xC7, add_1reg(0xC0, IA32_EAX), hi);
11348c2ecf20Sopenharmony_ci	if (dstk)
11358c2ecf20Sopenharmony_ci		/* mul dword ptr [ebp+off] */
11368c2ecf20Sopenharmony_ci		EMIT3(0xF7, add_1reg(0x60, IA32_EBP), STACK_VAR(dst_lo));
11378c2ecf20Sopenharmony_ci	else
11388c2ecf20Sopenharmony_ci		/* mul dst_lo */
11398c2ecf20Sopenharmony_ci		EMIT2(0xF7, add_1reg(0xE0, dst_lo));
11408c2ecf20Sopenharmony_ci	/* add ecx,eax */
11418c2ecf20Sopenharmony_ci	EMIT2(0x01, add_2reg(0xC0, IA32_ECX, IA32_EAX));
11428c2ecf20Sopenharmony_ci
11438c2ecf20Sopenharmony_ci	/* movl eax,imm32 */
11448c2ecf20Sopenharmony_ci	EMIT2_off32(0xC7, add_1reg(0xC0, IA32_EAX), val);
11458c2ecf20Sopenharmony_ci	if (dstk)
11468c2ecf20Sopenharmony_ci		/* mul dword ptr [ebp+off] */
11478c2ecf20Sopenharmony_ci		EMIT3(0xF7, add_1reg(0x60, IA32_EBP), STACK_VAR(dst_lo));
11488c2ecf20Sopenharmony_ci	else
11498c2ecf20Sopenharmony_ci		/* mul dst_lo */
11508c2ecf20Sopenharmony_ci		EMIT2(0xF7, add_1reg(0xE0, dst_lo));
11518c2ecf20Sopenharmony_ci
11528c2ecf20Sopenharmony_ci	/* add ecx,edx */
11538c2ecf20Sopenharmony_ci	EMIT2(0x01, add_2reg(0xC0, IA32_ECX, IA32_EDX));
11548c2ecf20Sopenharmony_ci
11558c2ecf20Sopenharmony_ci	if (dstk) {
11568c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],eax */
11578c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EAX),
11588c2ecf20Sopenharmony_ci		      STACK_VAR(dst_lo));
11598c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],ecx */
11608c2ecf20Sopenharmony_ci		EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_ECX),
11618c2ecf20Sopenharmony_ci		      STACK_VAR(dst_hi));
11628c2ecf20Sopenharmony_ci	} else {
11638c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],eax */
11648c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dst_lo, IA32_EAX));
11658c2ecf20Sopenharmony_ci		/* mov dword ptr [ebp+off],ecx */
11668c2ecf20Sopenharmony_ci		EMIT2(0x89, add_2reg(0xC0, dst_hi, IA32_ECX));
11678c2ecf20Sopenharmony_ci	}
11688c2ecf20Sopenharmony_ci
11698c2ecf20Sopenharmony_ci	*pprog = prog;
11708c2ecf20Sopenharmony_ci}
11718c2ecf20Sopenharmony_ci
11728c2ecf20Sopenharmony_cistatic int bpf_size_to_x86_bytes(int bpf_size)
11738c2ecf20Sopenharmony_ci{
11748c2ecf20Sopenharmony_ci	if (bpf_size == BPF_W)
11758c2ecf20Sopenharmony_ci		return 4;
11768c2ecf20Sopenharmony_ci	else if (bpf_size == BPF_H)
11778c2ecf20Sopenharmony_ci		return 2;
11788c2ecf20Sopenharmony_ci	else if (bpf_size == BPF_B)
11798c2ecf20Sopenharmony_ci		return 1;
11808c2ecf20Sopenharmony_ci	else if (bpf_size == BPF_DW)
11818c2ecf20Sopenharmony_ci		return 4; /* imm32 */
11828c2ecf20Sopenharmony_ci	else
11838c2ecf20Sopenharmony_ci		return 0;
11848c2ecf20Sopenharmony_ci}
11858c2ecf20Sopenharmony_ci
11868c2ecf20Sopenharmony_cistruct jit_context {
11878c2ecf20Sopenharmony_ci	int cleanup_addr; /* Epilogue code offset */
11888c2ecf20Sopenharmony_ci};
11898c2ecf20Sopenharmony_ci
11908c2ecf20Sopenharmony_ci/* Maximum number of bytes emitted while JITing one eBPF insn */
11918c2ecf20Sopenharmony_ci#define BPF_MAX_INSN_SIZE	128
11928c2ecf20Sopenharmony_ci#define BPF_INSN_SAFETY		64
11938c2ecf20Sopenharmony_ci
11948c2ecf20Sopenharmony_ci#define PROLOGUE_SIZE 35
11958c2ecf20Sopenharmony_ci
11968c2ecf20Sopenharmony_ci/*
11978c2ecf20Sopenharmony_ci * Emit prologue code for BPF program and check it's size.
11988c2ecf20Sopenharmony_ci * bpf_tail_call helper will skip it while jumping into another program.
11998c2ecf20Sopenharmony_ci */
12008c2ecf20Sopenharmony_cistatic void emit_prologue(u8 **pprog, u32 stack_depth)
12018c2ecf20Sopenharmony_ci{
12028c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
12038c2ecf20Sopenharmony_ci	int cnt = 0;
12048c2ecf20Sopenharmony_ci	const u8 *r1 = bpf2ia32[BPF_REG_1];
12058c2ecf20Sopenharmony_ci	const u8 fplo = bpf2ia32[BPF_REG_FP][0];
12068c2ecf20Sopenharmony_ci	const u8 fphi = bpf2ia32[BPF_REG_FP][1];
12078c2ecf20Sopenharmony_ci	const u8 *tcc = bpf2ia32[TCALL_CNT];
12088c2ecf20Sopenharmony_ci
12098c2ecf20Sopenharmony_ci	/* push ebp */
12108c2ecf20Sopenharmony_ci	EMIT1(0x55);
12118c2ecf20Sopenharmony_ci	/* mov ebp,esp */
12128c2ecf20Sopenharmony_ci	EMIT2(0x89, 0xE5);
12138c2ecf20Sopenharmony_ci	/* push edi */
12148c2ecf20Sopenharmony_ci	EMIT1(0x57);
12158c2ecf20Sopenharmony_ci	/* push esi */
12168c2ecf20Sopenharmony_ci	EMIT1(0x56);
12178c2ecf20Sopenharmony_ci	/* push ebx */
12188c2ecf20Sopenharmony_ci	EMIT1(0x53);
12198c2ecf20Sopenharmony_ci
12208c2ecf20Sopenharmony_ci	/* sub esp,STACK_SIZE */
12218c2ecf20Sopenharmony_ci	EMIT2_off32(0x81, 0xEC, STACK_SIZE);
12228c2ecf20Sopenharmony_ci	/* sub ebp,SCRATCH_SIZE+12*/
12238c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xE8, IA32_EBP), SCRATCH_SIZE + 12);
12248c2ecf20Sopenharmony_ci	/* xor ebx,ebx */
12258c2ecf20Sopenharmony_ci	EMIT2(0x31, add_2reg(0xC0, IA32_EBX, IA32_EBX));
12268c2ecf20Sopenharmony_ci
12278c2ecf20Sopenharmony_ci	/* Set up BPF prog stack base register */
12288c2ecf20Sopenharmony_ci	EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EBP), STACK_VAR(fplo));
12298c2ecf20Sopenharmony_ci	EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EBX), STACK_VAR(fphi));
12308c2ecf20Sopenharmony_ci
12318c2ecf20Sopenharmony_ci	/* Move BPF_CTX (EAX) to BPF_REG_R1 */
12328c2ecf20Sopenharmony_ci	/* mov dword ptr [ebp+off],eax */
12338c2ecf20Sopenharmony_ci	EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EAX), STACK_VAR(r1[0]));
12348c2ecf20Sopenharmony_ci	EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EBX), STACK_VAR(r1[1]));
12358c2ecf20Sopenharmony_ci
12368c2ecf20Sopenharmony_ci	/* Initialize Tail Count */
12378c2ecf20Sopenharmony_ci	EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EBX), STACK_VAR(tcc[0]));
12388c2ecf20Sopenharmony_ci	EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EBX), STACK_VAR(tcc[1]));
12398c2ecf20Sopenharmony_ci
12408c2ecf20Sopenharmony_ci	BUILD_BUG_ON(cnt != PROLOGUE_SIZE);
12418c2ecf20Sopenharmony_ci	*pprog = prog;
12428c2ecf20Sopenharmony_ci}
12438c2ecf20Sopenharmony_ci
12448c2ecf20Sopenharmony_ci/* Emit epilogue code for BPF program */
12458c2ecf20Sopenharmony_cistatic void emit_epilogue(u8 **pprog, u32 stack_depth)
12468c2ecf20Sopenharmony_ci{
12478c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
12488c2ecf20Sopenharmony_ci	const u8 *r0 = bpf2ia32[BPF_REG_0];
12498c2ecf20Sopenharmony_ci	int cnt = 0;
12508c2ecf20Sopenharmony_ci
12518c2ecf20Sopenharmony_ci	/* mov eax,dword ptr [ebp+off]*/
12528c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX), STACK_VAR(r0[0]));
12538c2ecf20Sopenharmony_ci	/* mov edx,dword ptr [ebp+off]*/
12548c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX), STACK_VAR(r0[1]));
12558c2ecf20Sopenharmony_ci
12568c2ecf20Sopenharmony_ci	/* add ebp,SCRATCH_SIZE+12*/
12578c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xC0, IA32_EBP), SCRATCH_SIZE + 12);
12588c2ecf20Sopenharmony_ci
12598c2ecf20Sopenharmony_ci	/* mov ebx,dword ptr [ebp-12]*/
12608c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EBX), -12);
12618c2ecf20Sopenharmony_ci	/* mov esi,dword ptr [ebp-8]*/
12628c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ESI), -8);
12638c2ecf20Sopenharmony_ci	/* mov edi,dword ptr [ebp-4]*/
12648c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDI), -4);
12658c2ecf20Sopenharmony_ci
12668c2ecf20Sopenharmony_ci	EMIT1(0xC9); /* leave */
12678c2ecf20Sopenharmony_ci	EMIT1(0xC3); /* ret */
12688c2ecf20Sopenharmony_ci	*pprog = prog;
12698c2ecf20Sopenharmony_ci}
12708c2ecf20Sopenharmony_ci
12718c2ecf20Sopenharmony_cistatic int emit_jmp_edx(u8 **pprog, u8 *ip)
12728c2ecf20Sopenharmony_ci{
12738c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
12748c2ecf20Sopenharmony_ci	int cnt = 0;
12758c2ecf20Sopenharmony_ci
12768c2ecf20Sopenharmony_ci#ifdef CONFIG_RETPOLINE
12778c2ecf20Sopenharmony_ci	EMIT1_off32(0xE9, (u8 *)__x86_indirect_thunk_edx - (ip + 5));
12788c2ecf20Sopenharmony_ci#else
12798c2ecf20Sopenharmony_ci	EMIT2(0xFF, 0xE2);
12808c2ecf20Sopenharmony_ci#endif
12818c2ecf20Sopenharmony_ci	*pprog = prog;
12828c2ecf20Sopenharmony_ci
12838c2ecf20Sopenharmony_ci	return cnt;
12848c2ecf20Sopenharmony_ci}
12858c2ecf20Sopenharmony_ci
12868c2ecf20Sopenharmony_ci/*
12878c2ecf20Sopenharmony_ci * Generate the following code:
12888c2ecf20Sopenharmony_ci * ... bpf_tail_call(void *ctx, struct bpf_array *array, u64 index) ...
12898c2ecf20Sopenharmony_ci *   if (index >= array->map.max_entries)
12908c2ecf20Sopenharmony_ci *     goto out;
12918c2ecf20Sopenharmony_ci *   if (++tail_call_cnt > MAX_TAIL_CALL_CNT)
12928c2ecf20Sopenharmony_ci *     goto out;
12938c2ecf20Sopenharmony_ci *   prog = array->ptrs[index];
12948c2ecf20Sopenharmony_ci *   if (prog == NULL)
12958c2ecf20Sopenharmony_ci *     goto out;
12968c2ecf20Sopenharmony_ci *   goto *(prog->bpf_func + prologue_size);
12978c2ecf20Sopenharmony_ci * out:
12988c2ecf20Sopenharmony_ci */
12998c2ecf20Sopenharmony_cistatic void emit_bpf_tail_call(u8 **pprog, u8 *ip)
13008c2ecf20Sopenharmony_ci{
13018c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
13028c2ecf20Sopenharmony_ci	int cnt = 0;
13038c2ecf20Sopenharmony_ci	const u8 *r1 = bpf2ia32[BPF_REG_1];
13048c2ecf20Sopenharmony_ci	const u8 *r2 = bpf2ia32[BPF_REG_2];
13058c2ecf20Sopenharmony_ci	const u8 *r3 = bpf2ia32[BPF_REG_3];
13068c2ecf20Sopenharmony_ci	const u8 *tcc = bpf2ia32[TCALL_CNT];
13078c2ecf20Sopenharmony_ci	u32 lo, hi;
13088c2ecf20Sopenharmony_ci	static int jmp_label1 = -1;
13098c2ecf20Sopenharmony_ci
13108c2ecf20Sopenharmony_ci	/*
13118c2ecf20Sopenharmony_ci	 * if (index >= array->map.max_entries)
13128c2ecf20Sopenharmony_ci	 *     goto out;
13138c2ecf20Sopenharmony_ci	 */
13148c2ecf20Sopenharmony_ci	/* mov eax,dword ptr [ebp+off] */
13158c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX), STACK_VAR(r2[0]));
13168c2ecf20Sopenharmony_ci	/* mov edx,dword ptr [ebp+off] */
13178c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX), STACK_VAR(r3[0]));
13188c2ecf20Sopenharmony_ci
13198c2ecf20Sopenharmony_ci	/* cmp dword ptr [eax+off],edx */
13208c2ecf20Sopenharmony_ci	EMIT3(0x39, add_2reg(0x40, IA32_EAX, IA32_EDX),
13218c2ecf20Sopenharmony_ci	      offsetof(struct bpf_array, map.max_entries));
13228c2ecf20Sopenharmony_ci	/* jbe out */
13238c2ecf20Sopenharmony_ci	EMIT2(IA32_JBE, jmp_label(jmp_label1, 2));
13248c2ecf20Sopenharmony_ci
13258c2ecf20Sopenharmony_ci	/*
13268c2ecf20Sopenharmony_ci	 * if (tail_call_cnt > MAX_TAIL_CALL_CNT)
13278c2ecf20Sopenharmony_ci	 *     goto out;
13288c2ecf20Sopenharmony_ci	 */
13298c2ecf20Sopenharmony_ci	lo = (u32)MAX_TAIL_CALL_CNT;
13308c2ecf20Sopenharmony_ci	hi = (u32)((u64)MAX_TAIL_CALL_CNT >> 32);
13318c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX), STACK_VAR(tcc[0]));
13328c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EBX), STACK_VAR(tcc[1]));
13338c2ecf20Sopenharmony_ci
13348c2ecf20Sopenharmony_ci	/* cmp edx,hi */
13358c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xF8, IA32_EBX), hi);
13368c2ecf20Sopenharmony_ci	EMIT2(IA32_JNE, 3);
13378c2ecf20Sopenharmony_ci	/* cmp ecx,lo */
13388c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xF8, IA32_ECX), lo);
13398c2ecf20Sopenharmony_ci
13408c2ecf20Sopenharmony_ci	/* ja out */
13418c2ecf20Sopenharmony_ci	EMIT2(IA32_JAE, jmp_label(jmp_label1, 2));
13428c2ecf20Sopenharmony_ci
13438c2ecf20Sopenharmony_ci	/* add eax,0x1 */
13448c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xC0, IA32_ECX), 0x01);
13458c2ecf20Sopenharmony_ci	/* adc ebx,0x0 */
13468c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xD0, IA32_EBX), 0x00);
13478c2ecf20Sopenharmony_ci
13488c2ecf20Sopenharmony_ci	/* mov dword ptr [ebp+off],eax */
13498c2ecf20Sopenharmony_ci	EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_ECX), STACK_VAR(tcc[0]));
13508c2ecf20Sopenharmony_ci	/* mov dword ptr [ebp+off],edx */
13518c2ecf20Sopenharmony_ci	EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EBX), STACK_VAR(tcc[1]));
13528c2ecf20Sopenharmony_ci
13538c2ecf20Sopenharmony_ci	/* prog = array->ptrs[index]; */
13548c2ecf20Sopenharmony_ci	/* mov edx, [eax + edx * 4 + offsetof(...)] */
13558c2ecf20Sopenharmony_ci	EMIT3_off32(0x8B, 0x94, 0x90, offsetof(struct bpf_array, ptrs));
13568c2ecf20Sopenharmony_ci
13578c2ecf20Sopenharmony_ci	/*
13588c2ecf20Sopenharmony_ci	 * if (prog == NULL)
13598c2ecf20Sopenharmony_ci	 *     goto out;
13608c2ecf20Sopenharmony_ci	 */
13618c2ecf20Sopenharmony_ci	/* test edx,edx */
13628c2ecf20Sopenharmony_ci	EMIT2(0x85, add_2reg(0xC0, IA32_EDX, IA32_EDX));
13638c2ecf20Sopenharmony_ci	/* je out */
13648c2ecf20Sopenharmony_ci	EMIT2(IA32_JE, jmp_label(jmp_label1, 2));
13658c2ecf20Sopenharmony_ci
13668c2ecf20Sopenharmony_ci	/* goto *(prog->bpf_func + prologue_size); */
13678c2ecf20Sopenharmony_ci	/* mov edx, dword ptr [edx + 32] */
13688c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EDX, IA32_EDX),
13698c2ecf20Sopenharmony_ci	      offsetof(struct bpf_prog, bpf_func));
13708c2ecf20Sopenharmony_ci	/* add edx,prologue_size */
13718c2ecf20Sopenharmony_ci	EMIT3(0x83, add_1reg(0xC0, IA32_EDX), PROLOGUE_SIZE);
13728c2ecf20Sopenharmony_ci
13738c2ecf20Sopenharmony_ci	/* mov eax,dword ptr [ebp+off] */
13748c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX), STACK_VAR(r1[0]));
13758c2ecf20Sopenharmony_ci
13768c2ecf20Sopenharmony_ci	/*
13778c2ecf20Sopenharmony_ci	 * Now we're ready to jump into next BPF program:
13788c2ecf20Sopenharmony_ci	 * eax == ctx (1st arg)
13798c2ecf20Sopenharmony_ci	 * edx == prog->bpf_func + prologue_size
13808c2ecf20Sopenharmony_ci	 */
13818c2ecf20Sopenharmony_ci	cnt += emit_jmp_edx(&prog, ip + cnt);
13828c2ecf20Sopenharmony_ci
13838c2ecf20Sopenharmony_ci	if (jmp_label1 == -1)
13848c2ecf20Sopenharmony_ci		jmp_label1 = cnt;
13858c2ecf20Sopenharmony_ci
13868c2ecf20Sopenharmony_ci	/* out: */
13878c2ecf20Sopenharmony_ci	*pprog = prog;
13888c2ecf20Sopenharmony_ci}
13898c2ecf20Sopenharmony_ci
13908c2ecf20Sopenharmony_ci/* Push the scratch stack register on top of the stack. */
13918c2ecf20Sopenharmony_cistatic inline void emit_push_r64(const u8 src[], u8 **pprog)
13928c2ecf20Sopenharmony_ci{
13938c2ecf20Sopenharmony_ci	u8 *prog = *pprog;
13948c2ecf20Sopenharmony_ci	int cnt = 0;
13958c2ecf20Sopenharmony_ci
13968c2ecf20Sopenharmony_ci	/* mov ecx,dword ptr [ebp+off] */
13978c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX), STACK_VAR(src_hi));
13988c2ecf20Sopenharmony_ci	/* push ecx */
13998c2ecf20Sopenharmony_ci	EMIT1(0x51);
14008c2ecf20Sopenharmony_ci
14018c2ecf20Sopenharmony_ci	/* mov ecx,dword ptr [ebp+off] */
14028c2ecf20Sopenharmony_ci	EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX), STACK_VAR(src_lo));
14038c2ecf20Sopenharmony_ci	/* push ecx */
14048c2ecf20Sopenharmony_ci	EMIT1(0x51);
14058c2ecf20Sopenharmony_ci
14068c2ecf20Sopenharmony_ci	*pprog = prog;
14078c2ecf20Sopenharmony_ci}
14088c2ecf20Sopenharmony_ci
14098c2ecf20Sopenharmony_cistatic u8 get_cond_jmp_opcode(const u8 op, bool is_cmp_lo)
14108c2ecf20Sopenharmony_ci{
14118c2ecf20Sopenharmony_ci	u8 jmp_cond;
14128c2ecf20Sopenharmony_ci
14138c2ecf20Sopenharmony_ci	/* Convert BPF opcode to x86 */
14148c2ecf20Sopenharmony_ci	switch (op) {
14158c2ecf20Sopenharmony_ci	case BPF_JEQ:
14168c2ecf20Sopenharmony_ci		jmp_cond = IA32_JE;
14178c2ecf20Sopenharmony_ci		break;
14188c2ecf20Sopenharmony_ci	case BPF_JSET:
14198c2ecf20Sopenharmony_ci	case BPF_JNE:
14208c2ecf20Sopenharmony_ci		jmp_cond = IA32_JNE;
14218c2ecf20Sopenharmony_ci		break;
14228c2ecf20Sopenharmony_ci	case BPF_JGT:
14238c2ecf20Sopenharmony_ci		/* GT is unsigned '>', JA in x86 */
14248c2ecf20Sopenharmony_ci		jmp_cond = IA32_JA;
14258c2ecf20Sopenharmony_ci		break;
14268c2ecf20Sopenharmony_ci	case BPF_JLT:
14278c2ecf20Sopenharmony_ci		/* LT is unsigned '<', JB in x86 */
14288c2ecf20Sopenharmony_ci		jmp_cond = IA32_JB;
14298c2ecf20Sopenharmony_ci		break;
14308c2ecf20Sopenharmony_ci	case BPF_JGE:
14318c2ecf20Sopenharmony_ci		/* GE is unsigned '>=', JAE in x86 */
14328c2ecf20Sopenharmony_ci		jmp_cond = IA32_JAE;
14338c2ecf20Sopenharmony_ci		break;
14348c2ecf20Sopenharmony_ci	case BPF_JLE:
14358c2ecf20Sopenharmony_ci		/* LE is unsigned '<=', JBE in x86 */
14368c2ecf20Sopenharmony_ci		jmp_cond = IA32_JBE;
14378c2ecf20Sopenharmony_ci		break;
14388c2ecf20Sopenharmony_ci	case BPF_JSGT:
14398c2ecf20Sopenharmony_ci		if (!is_cmp_lo)
14408c2ecf20Sopenharmony_ci			/* Signed '>', GT in x86 */
14418c2ecf20Sopenharmony_ci			jmp_cond = IA32_JG;
14428c2ecf20Sopenharmony_ci		else
14438c2ecf20Sopenharmony_ci			/* GT is unsigned '>', JA in x86 */
14448c2ecf20Sopenharmony_ci			jmp_cond = IA32_JA;
14458c2ecf20Sopenharmony_ci		break;
14468c2ecf20Sopenharmony_ci	case BPF_JSLT:
14478c2ecf20Sopenharmony_ci		if (!is_cmp_lo)
14488c2ecf20Sopenharmony_ci			/* Signed '<', LT in x86 */
14498c2ecf20Sopenharmony_ci			jmp_cond = IA32_JL;
14508c2ecf20Sopenharmony_ci		else
14518c2ecf20Sopenharmony_ci			/* LT is unsigned '<', JB in x86 */
14528c2ecf20Sopenharmony_ci			jmp_cond = IA32_JB;
14538c2ecf20Sopenharmony_ci		break;
14548c2ecf20Sopenharmony_ci	case BPF_JSGE:
14558c2ecf20Sopenharmony_ci		if (!is_cmp_lo)
14568c2ecf20Sopenharmony_ci			/* Signed '>=', GE in x86 */
14578c2ecf20Sopenharmony_ci			jmp_cond = IA32_JGE;
14588c2ecf20Sopenharmony_ci		else
14598c2ecf20Sopenharmony_ci			/* GE is unsigned '>=', JAE in x86 */
14608c2ecf20Sopenharmony_ci			jmp_cond = IA32_JAE;
14618c2ecf20Sopenharmony_ci		break;
14628c2ecf20Sopenharmony_ci	case BPF_JSLE:
14638c2ecf20Sopenharmony_ci		if (!is_cmp_lo)
14648c2ecf20Sopenharmony_ci			/* Signed '<=', LE in x86 */
14658c2ecf20Sopenharmony_ci			jmp_cond = IA32_JLE;
14668c2ecf20Sopenharmony_ci		else
14678c2ecf20Sopenharmony_ci			/* LE is unsigned '<=', JBE in x86 */
14688c2ecf20Sopenharmony_ci			jmp_cond = IA32_JBE;
14698c2ecf20Sopenharmony_ci		break;
14708c2ecf20Sopenharmony_ci	default: /* to silence GCC warning */
14718c2ecf20Sopenharmony_ci		jmp_cond = COND_JMP_OPCODE_INVALID;
14728c2ecf20Sopenharmony_ci		break;
14738c2ecf20Sopenharmony_ci	}
14748c2ecf20Sopenharmony_ci
14758c2ecf20Sopenharmony_ci	return jmp_cond;
14768c2ecf20Sopenharmony_ci}
14778c2ecf20Sopenharmony_ci
14788c2ecf20Sopenharmony_cistatic int do_jit(struct bpf_prog *bpf_prog, int *addrs, u8 *image,
14798c2ecf20Sopenharmony_ci		  int oldproglen, struct jit_context *ctx)
14808c2ecf20Sopenharmony_ci{
14818c2ecf20Sopenharmony_ci	struct bpf_insn *insn = bpf_prog->insnsi;
14828c2ecf20Sopenharmony_ci	int insn_cnt = bpf_prog->len;
14838c2ecf20Sopenharmony_ci	bool seen_exit = false;
14848c2ecf20Sopenharmony_ci	u8 temp[BPF_MAX_INSN_SIZE + BPF_INSN_SAFETY];
14858c2ecf20Sopenharmony_ci	int i, cnt = 0;
14868c2ecf20Sopenharmony_ci	int proglen = 0;
14878c2ecf20Sopenharmony_ci	u8 *prog = temp;
14888c2ecf20Sopenharmony_ci
14898c2ecf20Sopenharmony_ci	emit_prologue(&prog, bpf_prog->aux->stack_depth);
14908c2ecf20Sopenharmony_ci
14918c2ecf20Sopenharmony_ci	for (i = 0; i < insn_cnt; i++, insn++) {
14928c2ecf20Sopenharmony_ci		const s32 imm32 = insn->imm;
14938c2ecf20Sopenharmony_ci		const bool is64 = BPF_CLASS(insn->code) == BPF_ALU64;
14948c2ecf20Sopenharmony_ci		const bool dstk = insn->dst_reg != BPF_REG_AX;
14958c2ecf20Sopenharmony_ci		const bool sstk = insn->src_reg != BPF_REG_AX;
14968c2ecf20Sopenharmony_ci		const u8 code = insn->code;
14978c2ecf20Sopenharmony_ci		const u8 *dst = bpf2ia32[insn->dst_reg];
14988c2ecf20Sopenharmony_ci		const u8 *src = bpf2ia32[insn->src_reg];
14998c2ecf20Sopenharmony_ci		const u8 *r0 = bpf2ia32[BPF_REG_0];
15008c2ecf20Sopenharmony_ci		s64 jmp_offset;
15018c2ecf20Sopenharmony_ci		u8 jmp_cond;
15028c2ecf20Sopenharmony_ci		int ilen;
15038c2ecf20Sopenharmony_ci		u8 *func;
15048c2ecf20Sopenharmony_ci
15058c2ecf20Sopenharmony_ci		switch (code) {
15068c2ecf20Sopenharmony_ci		/* ALU operations */
15078c2ecf20Sopenharmony_ci		/* dst = src */
15088c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_MOV | BPF_K:
15098c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_MOV | BPF_X:
15108c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_MOV | BPF_K:
15118c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_MOV | BPF_X:
15128c2ecf20Sopenharmony_ci			switch (BPF_SRC(code)) {
15138c2ecf20Sopenharmony_ci			case BPF_X:
15148c2ecf20Sopenharmony_ci				if (imm32 == 1) {
15158c2ecf20Sopenharmony_ci					/* Special mov32 for zext. */
15168c2ecf20Sopenharmony_ci					emit_ia32_mov_i(dst_hi, 0, dstk, &prog);
15178c2ecf20Sopenharmony_ci					break;
15188c2ecf20Sopenharmony_ci				}
15198c2ecf20Sopenharmony_ci				emit_ia32_mov_r64(is64, dst, src, dstk, sstk,
15208c2ecf20Sopenharmony_ci						  &prog, bpf_prog->aux);
15218c2ecf20Sopenharmony_ci				break;
15228c2ecf20Sopenharmony_ci			case BPF_K:
15238c2ecf20Sopenharmony_ci				/* Sign-extend immediate value to dst reg */
15248c2ecf20Sopenharmony_ci				emit_ia32_mov_i64(is64, dst, imm32,
15258c2ecf20Sopenharmony_ci						  dstk, &prog);
15268c2ecf20Sopenharmony_ci				break;
15278c2ecf20Sopenharmony_ci			}
15288c2ecf20Sopenharmony_ci			break;
15298c2ecf20Sopenharmony_ci		/* dst = dst + src/imm */
15308c2ecf20Sopenharmony_ci		/* dst = dst - src/imm */
15318c2ecf20Sopenharmony_ci		/* dst = dst | src/imm */
15328c2ecf20Sopenharmony_ci		/* dst = dst & src/imm */
15338c2ecf20Sopenharmony_ci		/* dst = dst ^ src/imm */
15348c2ecf20Sopenharmony_ci		/* dst = dst * src/imm */
15358c2ecf20Sopenharmony_ci		/* dst = dst << src */
15368c2ecf20Sopenharmony_ci		/* dst = dst >> src */
15378c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_ADD | BPF_K:
15388c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_ADD | BPF_X:
15398c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_SUB | BPF_K:
15408c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_SUB | BPF_X:
15418c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_OR | BPF_K:
15428c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_OR | BPF_X:
15438c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_AND | BPF_K:
15448c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_AND | BPF_X:
15458c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_XOR | BPF_K:
15468c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_XOR | BPF_X:
15478c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_ADD | BPF_K:
15488c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_ADD | BPF_X:
15498c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_SUB | BPF_K:
15508c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_SUB | BPF_X:
15518c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_OR | BPF_K:
15528c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_OR | BPF_X:
15538c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_AND | BPF_K:
15548c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_AND | BPF_X:
15558c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_XOR | BPF_K:
15568c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_XOR | BPF_X:
15578c2ecf20Sopenharmony_ci			switch (BPF_SRC(code)) {
15588c2ecf20Sopenharmony_ci			case BPF_X:
15598c2ecf20Sopenharmony_ci				emit_ia32_alu_r64(is64, BPF_OP(code), dst,
15608c2ecf20Sopenharmony_ci						  src, dstk, sstk, &prog,
15618c2ecf20Sopenharmony_ci						  bpf_prog->aux);
15628c2ecf20Sopenharmony_ci				break;
15638c2ecf20Sopenharmony_ci			case BPF_K:
15648c2ecf20Sopenharmony_ci				emit_ia32_alu_i64(is64, BPF_OP(code), dst,
15658c2ecf20Sopenharmony_ci						  imm32, dstk, &prog,
15668c2ecf20Sopenharmony_ci						  bpf_prog->aux);
15678c2ecf20Sopenharmony_ci				break;
15688c2ecf20Sopenharmony_ci			}
15698c2ecf20Sopenharmony_ci			break;
15708c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_MUL | BPF_K:
15718c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_MUL | BPF_X:
15728c2ecf20Sopenharmony_ci			switch (BPF_SRC(code)) {
15738c2ecf20Sopenharmony_ci			case BPF_X:
15748c2ecf20Sopenharmony_ci				emit_ia32_mul_r(dst_lo, src_lo, dstk,
15758c2ecf20Sopenharmony_ci						sstk, &prog);
15768c2ecf20Sopenharmony_ci				break;
15778c2ecf20Sopenharmony_ci			case BPF_K:
15788c2ecf20Sopenharmony_ci				/* mov ecx,imm32*/
15798c2ecf20Sopenharmony_ci				EMIT2_off32(0xC7, add_1reg(0xC0, IA32_ECX),
15808c2ecf20Sopenharmony_ci					    imm32);
15818c2ecf20Sopenharmony_ci				emit_ia32_mul_r(dst_lo, IA32_ECX, dstk,
15828c2ecf20Sopenharmony_ci						false, &prog);
15838c2ecf20Sopenharmony_ci				break;
15848c2ecf20Sopenharmony_ci			}
15858c2ecf20Sopenharmony_ci			if (!bpf_prog->aux->verifier_zext)
15868c2ecf20Sopenharmony_ci				emit_ia32_mov_i(dst_hi, 0, dstk, &prog);
15878c2ecf20Sopenharmony_ci			break;
15888c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_LSH | BPF_X:
15898c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_RSH | BPF_X:
15908c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_ARSH | BPF_K:
15918c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_ARSH | BPF_X:
15928c2ecf20Sopenharmony_ci			switch (BPF_SRC(code)) {
15938c2ecf20Sopenharmony_ci			case BPF_X:
15948c2ecf20Sopenharmony_ci				emit_ia32_shift_r(BPF_OP(code), dst_lo, src_lo,
15958c2ecf20Sopenharmony_ci						  dstk, sstk, &prog);
15968c2ecf20Sopenharmony_ci				break;
15978c2ecf20Sopenharmony_ci			case BPF_K:
15988c2ecf20Sopenharmony_ci				/* mov ecx,imm32*/
15998c2ecf20Sopenharmony_ci				EMIT2_off32(0xC7, add_1reg(0xC0, IA32_ECX),
16008c2ecf20Sopenharmony_ci					    imm32);
16018c2ecf20Sopenharmony_ci				emit_ia32_shift_r(BPF_OP(code), dst_lo,
16028c2ecf20Sopenharmony_ci						  IA32_ECX, dstk, false,
16038c2ecf20Sopenharmony_ci						  &prog);
16048c2ecf20Sopenharmony_ci				break;
16058c2ecf20Sopenharmony_ci			}
16068c2ecf20Sopenharmony_ci			if (!bpf_prog->aux->verifier_zext)
16078c2ecf20Sopenharmony_ci				emit_ia32_mov_i(dst_hi, 0, dstk, &prog);
16088c2ecf20Sopenharmony_ci			break;
16098c2ecf20Sopenharmony_ci		/* dst = dst / src(imm) */
16108c2ecf20Sopenharmony_ci		/* dst = dst % src(imm) */
16118c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_DIV | BPF_K:
16128c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_DIV | BPF_X:
16138c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_MOD | BPF_K:
16148c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_MOD | BPF_X:
16158c2ecf20Sopenharmony_ci			switch (BPF_SRC(code)) {
16168c2ecf20Sopenharmony_ci			case BPF_X:
16178c2ecf20Sopenharmony_ci				emit_ia32_div_mod_r(BPF_OP(code), dst_lo,
16188c2ecf20Sopenharmony_ci						    src_lo, dstk, sstk, &prog);
16198c2ecf20Sopenharmony_ci				break;
16208c2ecf20Sopenharmony_ci			case BPF_K:
16218c2ecf20Sopenharmony_ci				/* mov ecx,imm32*/
16228c2ecf20Sopenharmony_ci				EMIT2_off32(0xC7, add_1reg(0xC0, IA32_ECX),
16238c2ecf20Sopenharmony_ci					    imm32);
16248c2ecf20Sopenharmony_ci				emit_ia32_div_mod_r(BPF_OP(code), dst_lo,
16258c2ecf20Sopenharmony_ci						    IA32_ECX, dstk, false,
16268c2ecf20Sopenharmony_ci						    &prog);
16278c2ecf20Sopenharmony_ci				break;
16288c2ecf20Sopenharmony_ci			}
16298c2ecf20Sopenharmony_ci			if (!bpf_prog->aux->verifier_zext)
16308c2ecf20Sopenharmony_ci				emit_ia32_mov_i(dst_hi, 0, dstk, &prog);
16318c2ecf20Sopenharmony_ci			break;
16328c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_DIV | BPF_K:
16338c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_DIV | BPF_X:
16348c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_MOD | BPF_K:
16358c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_MOD | BPF_X:
16368c2ecf20Sopenharmony_ci			goto notyet;
16378c2ecf20Sopenharmony_ci		/* dst = dst >> imm */
16388c2ecf20Sopenharmony_ci		/* dst = dst << imm */
16398c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_RSH | BPF_K:
16408c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_LSH | BPF_K:
16418c2ecf20Sopenharmony_ci			if (unlikely(imm32 > 31))
16428c2ecf20Sopenharmony_ci				return -EINVAL;
16438c2ecf20Sopenharmony_ci			/* mov ecx,imm32*/
16448c2ecf20Sopenharmony_ci			EMIT2_off32(0xC7, add_1reg(0xC0, IA32_ECX), imm32);
16458c2ecf20Sopenharmony_ci			emit_ia32_shift_r(BPF_OP(code), dst_lo, IA32_ECX, dstk,
16468c2ecf20Sopenharmony_ci					  false, &prog);
16478c2ecf20Sopenharmony_ci			if (!bpf_prog->aux->verifier_zext)
16488c2ecf20Sopenharmony_ci				emit_ia32_mov_i(dst_hi, 0, dstk, &prog);
16498c2ecf20Sopenharmony_ci			break;
16508c2ecf20Sopenharmony_ci		/* dst = dst << imm */
16518c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_LSH | BPF_K:
16528c2ecf20Sopenharmony_ci			if (unlikely(imm32 > 63))
16538c2ecf20Sopenharmony_ci				return -EINVAL;
16548c2ecf20Sopenharmony_ci			emit_ia32_lsh_i64(dst, imm32, dstk, &prog);
16558c2ecf20Sopenharmony_ci			break;
16568c2ecf20Sopenharmony_ci		/* dst = dst >> imm */
16578c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_RSH | BPF_K:
16588c2ecf20Sopenharmony_ci			if (unlikely(imm32 > 63))
16598c2ecf20Sopenharmony_ci				return -EINVAL;
16608c2ecf20Sopenharmony_ci			emit_ia32_rsh_i64(dst, imm32, dstk, &prog);
16618c2ecf20Sopenharmony_ci			break;
16628c2ecf20Sopenharmony_ci		/* dst = dst << src */
16638c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_LSH | BPF_X:
16648c2ecf20Sopenharmony_ci			emit_ia32_lsh_r64(dst, src, dstk, sstk, &prog);
16658c2ecf20Sopenharmony_ci			break;
16668c2ecf20Sopenharmony_ci		/* dst = dst >> src */
16678c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_RSH | BPF_X:
16688c2ecf20Sopenharmony_ci			emit_ia32_rsh_r64(dst, src, dstk, sstk, &prog);
16698c2ecf20Sopenharmony_ci			break;
16708c2ecf20Sopenharmony_ci		/* dst = dst >> src (signed) */
16718c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_ARSH | BPF_X:
16728c2ecf20Sopenharmony_ci			emit_ia32_arsh_r64(dst, src, dstk, sstk, &prog);
16738c2ecf20Sopenharmony_ci			break;
16748c2ecf20Sopenharmony_ci		/* dst = dst >> imm (signed) */
16758c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_ARSH | BPF_K:
16768c2ecf20Sopenharmony_ci			if (unlikely(imm32 > 63))
16778c2ecf20Sopenharmony_ci				return -EINVAL;
16788c2ecf20Sopenharmony_ci			emit_ia32_arsh_i64(dst, imm32, dstk, &prog);
16798c2ecf20Sopenharmony_ci			break;
16808c2ecf20Sopenharmony_ci		/* dst = ~dst */
16818c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_NEG:
16828c2ecf20Sopenharmony_ci			emit_ia32_alu_i(is64, false, BPF_OP(code),
16838c2ecf20Sopenharmony_ci					dst_lo, 0, dstk, &prog);
16848c2ecf20Sopenharmony_ci			if (!bpf_prog->aux->verifier_zext)
16858c2ecf20Sopenharmony_ci				emit_ia32_mov_i(dst_hi, 0, dstk, &prog);
16868c2ecf20Sopenharmony_ci			break;
16878c2ecf20Sopenharmony_ci		/* dst = ~dst (64 bit) */
16888c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_NEG:
16898c2ecf20Sopenharmony_ci			emit_ia32_neg64(dst, dstk, &prog);
16908c2ecf20Sopenharmony_ci			break;
16918c2ecf20Sopenharmony_ci		/* dst = dst * src/imm */
16928c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_MUL | BPF_X:
16938c2ecf20Sopenharmony_ci		case BPF_ALU64 | BPF_MUL | BPF_K:
16948c2ecf20Sopenharmony_ci			switch (BPF_SRC(code)) {
16958c2ecf20Sopenharmony_ci			case BPF_X:
16968c2ecf20Sopenharmony_ci				emit_ia32_mul_r64(dst, src, dstk, sstk, &prog);
16978c2ecf20Sopenharmony_ci				break;
16988c2ecf20Sopenharmony_ci			case BPF_K:
16998c2ecf20Sopenharmony_ci				emit_ia32_mul_i64(dst, imm32, dstk, &prog);
17008c2ecf20Sopenharmony_ci				break;
17018c2ecf20Sopenharmony_ci			}
17028c2ecf20Sopenharmony_ci			break;
17038c2ecf20Sopenharmony_ci		/* dst = htole(dst) */
17048c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_END | BPF_FROM_LE:
17058c2ecf20Sopenharmony_ci			emit_ia32_to_le_r64(dst, imm32, dstk, &prog,
17068c2ecf20Sopenharmony_ci					    bpf_prog->aux);
17078c2ecf20Sopenharmony_ci			break;
17088c2ecf20Sopenharmony_ci		/* dst = htobe(dst) */
17098c2ecf20Sopenharmony_ci		case BPF_ALU | BPF_END | BPF_FROM_BE:
17108c2ecf20Sopenharmony_ci			emit_ia32_to_be_r64(dst, imm32, dstk, &prog,
17118c2ecf20Sopenharmony_ci					    bpf_prog->aux);
17128c2ecf20Sopenharmony_ci			break;
17138c2ecf20Sopenharmony_ci		/* dst = imm64 */
17148c2ecf20Sopenharmony_ci		case BPF_LD | BPF_IMM | BPF_DW: {
17158c2ecf20Sopenharmony_ci			s32 hi, lo = imm32;
17168c2ecf20Sopenharmony_ci
17178c2ecf20Sopenharmony_ci			hi = insn[1].imm;
17188c2ecf20Sopenharmony_ci			emit_ia32_mov_i(dst_lo, lo, dstk, &prog);
17198c2ecf20Sopenharmony_ci			emit_ia32_mov_i(dst_hi, hi, dstk, &prog);
17208c2ecf20Sopenharmony_ci			insn++;
17218c2ecf20Sopenharmony_ci			i++;
17228c2ecf20Sopenharmony_ci			break;
17238c2ecf20Sopenharmony_ci		}
17248c2ecf20Sopenharmony_ci		/* speculation barrier */
17258c2ecf20Sopenharmony_ci		case BPF_ST | BPF_NOSPEC:
17268c2ecf20Sopenharmony_ci			if (boot_cpu_has(X86_FEATURE_XMM2))
17278c2ecf20Sopenharmony_ci				/* Emit 'lfence' */
17288c2ecf20Sopenharmony_ci				EMIT3(0x0F, 0xAE, 0xE8);
17298c2ecf20Sopenharmony_ci			break;
17308c2ecf20Sopenharmony_ci		/* ST: *(u8*)(dst_reg + off) = imm */
17318c2ecf20Sopenharmony_ci		case BPF_ST | BPF_MEM | BPF_H:
17328c2ecf20Sopenharmony_ci		case BPF_ST | BPF_MEM | BPF_B:
17338c2ecf20Sopenharmony_ci		case BPF_ST | BPF_MEM | BPF_W:
17348c2ecf20Sopenharmony_ci		case BPF_ST | BPF_MEM | BPF_DW:
17358c2ecf20Sopenharmony_ci			if (dstk)
17368c2ecf20Sopenharmony_ci				/* mov eax,dword ptr [ebp+off] */
17378c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
17388c2ecf20Sopenharmony_ci				      STACK_VAR(dst_lo));
17398c2ecf20Sopenharmony_ci			else
17408c2ecf20Sopenharmony_ci				/* mov eax,dst_lo */
17418c2ecf20Sopenharmony_ci				EMIT2(0x8B, add_2reg(0xC0, dst_lo, IA32_EAX));
17428c2ecf20Sopenharmony_ci
17438c2ecf20Sopenharmony_ci			switch (BPF_SIZE(code)) {
17448c2ecf20Sopenharmony_ci			case BPF_B:
17458c2ecf20Sopenharmony_ci				EMIT(0xC6, 1); break;
17468c2ecf20Sopenharmony_ci			case BPF_H:
17478c2ecf20Sopenharmony_ci				EMIT2(0x66, 0xC7); break;
17488c2ecf20Sopenharmony_ci			case BPF_W:
17498c2ecf20Sopenharmony_ci			case BPF_DW:
17508c2ecf20Sopenharmony_ci				EMIT(0xC7, 1); break;
17518c2ecf20Sopenharmony_ci			}
17528c2ecf20Sopenharmony_ci
17538c2ecf20Sopenharmony_ci			if (is_imm8(insn->off))
17548c2ecf20Sopenharmony_ci				EMIT2(add_1reg(0x40, IA32_EAX), insn->off);
17558c2ecf20Sopenharmony_ci			else
17568c2ecf20Sopenharmony_ci				EMIT1_off32(add_1reg(0x80, IA32_EAX),
17578c2ecf20Sopenharmony_ci					    insn->off);
17588c2ecf20Sopenharmony_ci			EMIT(imm32, bpf_size_to_x86_bytes(BPF_SIZE(code)));
17598c2ecf20Sopenharmony_ci
17608c2ecf20Sopenharmony_ci			if (BPF_SIZE(code) == BPF_DW) {
17618c2ecf20Sopenharmony_ci				u32 hi;
17628c2ecf20Sopenharmony_ci
17638c2ecf20Sopenharmony_ci				hi = imm32 & (1<<31) ? (u32)~0 : 0;
17648c2ecf20Sopenharmony_ci				EMIT2_off32(0xC7, add_1reg(0x80, IA32_EAX),
17658c2ecf20Sopenharmony_ci					    insn->off + 4);
17668c2ecf20Sopenharmony_ci				EMIT(hi, 4);
17678c2ecf20Sopenharmony_ci			}
17688c2ecf20Sopenharmony_ci			break;
17698c2ecf20Sopenharmony_ci
17708c2ecf20Sopenharmony_ci		/* STX: *(u8*)(dst_reg + off) = src_reg */
17718c2ecf20Sopenharmony_ci		case BPF_STX | BPF_MEM | BPF_B:
17728c2ecf20Sopenharmony_ci		case BPF_STX | BPF_MEM | BPF_H:
17738c2ecf20Sopenharmony_ci		case BPF_STX | BPF_MEM | BPF_W:
17748c2ecf20Sopenharmony_ci		case BPF_STX | BPF_MEM | BPF_DW:
17758c2ecf20Sopenharmony_ci			if (dstk)
17768c2ecf20Sopenharmony_ci				/* mov eax,dword ptr [ebp+off] */
17778c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
17788c2ecf20Sopenharmony_ci				      STACK_VAR(dst_lo));
17798c2ecf20Sopenharmony_ci			else
17808c2ecf20Sopenharmony_ci				/* mov eax,dst_lo */
17818c2ecf20Sopenharmony_ci				EMIT2(0x8B, add_2reg(0xC0, dst_lo, IA32_EAX));
17828c2ecf20Sopenharmony_ci
17838c2ecf20Sopenharmony_ci			if (sstk)
17848c2ecf20Sopenharmony_ci				/* mov edx,dword ptr [ebp+off] */
17858c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
17868c2ecf20Sopenharmony_ci				      STACK_VAR(src_lo));
17878c2ecf20Sopenharmony_ci			else
17888c2ecf20Sopenharmony_ci				/* mov edx,src_lo */
17898c2ecf20Sopenharmony_ci				EMIT2(0x8B, add_2reg(0xC0, src_lo, IA32_EDX));
17908c2ecf20Sopenharmony_ci
17918c2ecf20Sopenharmony_ci			switch (BPF_SIZE(code)) {
17928c2ecf20Sopenharmony_ci			case BPF_B:
17938c2ecf20Sopenharmony_ci				EMIT(0x88, 1); break;
17948c2ecf20Sopenharmony_ci			case BPF_H:
17958c2ecf20Sopenharmony_ci				EMIT2(0x66, 0x89); break;
17968c2ecf20Sopenharmony_ci			case BPF_W:
17978c2ecf20Sopenharmony_ci			case BPF_DW:
17988c2ecf20Sopenharmony_ci				EMIT(0x89, 1); break;
17998c2ecf20Sopenharmony_ci			}
18008c2ecf20Sopenharmony_ci
18018c2ecf20Sopenharmony_ci			if (is_imm8(insn->off))
18028c2ecf20Sopenharmony_ci				EMIT2(add_2reg(0x40, IA32_EAX, IA32_EDX),
18038c2ecf20Sopenharmony_ci				      insn->off);
18048c2ecf20Sopenharmony_ci			else
18058c2ecf20Sopenharmony_ci				EMIT1_off32(add_2reg(0x80, IA32_EAX, IA32_EDX),
18068c2ecf20Sopenharmony_ci					    insn->off);
18078c2ecf20Sopenharmony_ci
18088c2ecf20Sopenharmony_ci			if (BPF_SIZE(code) == BPF_DW) {
18098c2ecf20Sopenharmony_ci				if (sstk)
18108c2ecf20Sopenharmony_ci					/* mov edi,dword ptr [ebp+off] */
18118c2ecf20Sopenharmony_ci					EMIT3(0x8B, add_2reg(0x40, IA32_EBP,
18128c2ecf20Sopenharmony_ci							     IA32_EDX),
18138c2ecf20Sopenharmony_ci					      STACK_VAR(src_hi));
18148c2ecf20Sopenharmony_ci				else
18158c2ecf20Sopenharmony_ci					/* mov edi,src_hi */
18168c2ecf20Sopenharmony_ci					EMIT2(0x8B, add_2reg(0xC0, src_hi,
18178c2ecf20Sopenharmony_ci							     IA32_EDX));
18188c2ecf20Sopenharmony_ci				EMIT1(0x89);
18198c2ecf20Sopenharmony_ci				if (is_imm8(insn->off + 4)) {
18208c2ecf20Sopenharmony_ci					EMIT2(add_2reg(0x40, IA32_EAX,
18218c2ecf20Sopenharmony_ci						       IA32_EDX),
18228c2ecf20Sopenharmony_ci					      insn->off + 4);
18238c2ecf20Sopenharmony_ci				} else {
18248c2ecf20Sopenharmony_ci					EMIT1(add_2reg(0x80, IA32_EAX,
18258c2ecf20Sopenharmony_ci						       IA32_EDX));
18268c2ecf20Sopenharmony_ci					EMIT(insn->off + 4, 4);
18278c2ecf20Sopenharmony_ci				}
18288c2ecf20Sopenharmony_ci			}
18298c2ecf20Sopenharmony_ci			break;
18308c2ecf20Sopenharmony_ci
18318c2ecf20Sopenharmony_ci		/* LDX: dst_reg = *(u8*)(src_reg + off) */
18328c2ecf20Sopenharmony_ci		case BPF_LDX | BPF_MEM | BPF_B:
18338c2ecf20Sopenharmony_ci		case BPF_LDX | BPF_MEM | BPF_H:
18348c2ecf20Sopenharmony_ci		case BPF_LDX | BPF_MEM | BPF_W:
18358c2ecf20Sopenharmony_ci		case BPF_LDX | BPF_MEM | BPF_DW:
18368c2ecf20Sopenharmony_ci			if (sstk)
18378c2ecf20Sopenharmony_ci				/* mov eax,dword ptr [ebp+off] */
18388c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
18398c2ecf20Sopenharmony_ci				      STACK_VAR(src_lo));
18408c2ecf20Sopenharmony_ci			else
18418c2ecf20Sopenharmony_ci				/* mov eax,dword ptr [ebp+off] */
18428c2ecf20Sopenharmony_ci				EMIT2(0x8B, add_2reg(0xC0, src_lo, IA32_EAX));
18438c2ecf20Sopenharmony_ci
18448c2ecf20Sopenharmony_ci			switch (BPF_SIZE(code)) {
18458c2ecf20Sopenharmony_ci			case BPF_B:
18468c2ecf20Sopenharmony_ci				EMIT2(0x0F, 0xB6); break;
18478c2ecf20Sopenharmony_ci			case BPF_H:
18488c2ecf20Sopenharmony_ci				EMIT2(0x0F, 0xB7); break;
18498c2ecf20Sopenharmony_ci			case BPF_W:
18508c2ecf20Sopenharmony_ci			case BPF_DW:
18518c2ecf20Sopenharmony_ci				EMIT(0x8B, 1); break;
18528c2ecf20Sopenharmony_ci			}
18538c2ecf20Sopenharmony_ci
18548c2ecf20Sopenharmony_ci			if (is_imm8(insn->off))
18558c2ecf20Sopenharmony_ci				EMIT2(add_2reg(0x40, IA32_EAX, IA32_EDX),
18568c2ecf20Sopenharmony_ci				      insn->off);
18578c2ecf20Sopenharmony_ci			else
18588c2ecf20Sopenharmony_ci				EMIT1_off32(add_2reg(0x80, IA32_EAX, IA32_EDX),
18598c2ecf20Sopenharmony_ci					    insn->off);
18608c2ecf20Sopenharmony_ci
18618c2ecf20Sopenharmony_ci			if (dstk)
18628c2ecf20Sopenharmony_ci				/* mov dword ptr [ebp+off],edx */
18638c2ecf20Sopenharmony_ci				EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EDX),
18648c2ecf20Sopenharmony_ci				      STACK_VAR(dst_lo));
18658c2ecf20Sopenharmony_ci			else
18668c2ecf20Sopenharmony_ci				/* mov dst_lo,edx */
18678c2ecf20Sopenharmony_ci				EMIT2(0x89, add_2reg(0xC0, dst_lo, IA32_EDX));
18688c2ecf20Sopenharmony_ci			switch (BPF_SIZE(code)) {
18698c2ecf20Sopenharmony_ci			case BPF_B:
18708c2ecf20Sopenharmony_ci			case BPF_H:
18718c2ecf20Sopenharmony_ci			case BPF_W:
18728c2ecf20Sopenharmony_ci				if (bpf_prog->aux->verifier_zext)
18738c2ecf20Sopenharmony_ci					break;
18748c2ecf20Sopenharmony_ci				if (dstk) {
18758c2ecf20Sopenharmony_ci					EMIT3(0xC7, add_1reg(0x40, IA32_EBP),
18768c2ecf20Sopenharmony_ci					      STACK_VAR(dst_hi));
18778c2ecf20Sopenharmony_ci					EMIT(0x0, 4);
18788c2ecf20Sopenharmony_ci				} else {
18798c2ecf20Sopenharmony_ci					/* xor dst_hi,dst_hi */
18808c2ecf20Sopenharmony_ci					EMIT2(0x33,
18818c2ecf20Sopenharmony_ci					      add_2reg(0xC0, dst_hi, dst_hi));
18828c2ecf20Sopenharmony_ci				}
18838c2ecf20Sopenharmony_ci				break;
18848c2ecf20Sopenharmony_ci			case BPF_DW:
18858c2ecf20Sopenharmony_ci				EMIT2_off32(0x8B,
18868c2ecf20Sopenharmony_ci					    add_2reg(0x80, IA32_EAX, IA32_EDX),
18878c2ecf20Sopenharmony_ci					    insn->off + 4);
18888c2ecf20Sopenharmony_ci				if (dstk)
18898c2ecf20Sopenharmony_ci					EMIT3(0x89,
18908c2ecf20Sopenharmony_ci					      add_2reg(0x40, IA32_EBP,
18918c2ecf20Sopenharmony_ci						       IA32_EDX),
18928c2ecf20Sopenharmony_ci					      STACK_VAR(dst_hi));
18938c2ecf20Sopenharmony_ci				else
18948c2ecf20Sopenharmony_ci					EMIT2(0x89,
18958c2ecf20Sopenharmony_ci					      add_2reg(0xC0, dst_hi, IA32_EDX));
18968c2ecf20Sopenharmony_ci				break;
18978c2ecf20Sopenharmony_ci			default:
18988c2ecf20Sopenharmony_ci				break;
18998c2ecf20Sopenharmony_ci			}
19008c2ecf20Sopenharmony_ci			break;
19018c2ecf20Sopenharmony_ci		/* call */
19028c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_CALL:
19038c2ecf20Sopenharmony_ci		{
19048c2ecf20Sopenharmony_ci			const u8 *r1 = bpf2ia32[BPF_REG_1];
19058c2ecf20Sopenharmony_ci			const u8 *r2 = bpf2ia32[BPF_REG_2];
19068c2ecf20Sopenharmony_ci			const u8 *r3 = bpf2ia32[BPF_REG_3];
19078c2ecf20Sopenharmony_ci			const u8 *r4 = bpf2ia32[BPF_REG_4];
19088c2ecf20Sopenharmony_ci			const u8 *r5 = bpf2ia32[BPF_REG_5];
19098c2ecf20Sopenharmony_ci
19108c2ecf20Sopenharmony_ci			if (insn->src_reg == BPF_PSEUDO_CALL)
19118c2ecf20Sopenharmony_ci				goto notyet;
19128c2ecf20Sopenharmony_ci
19138c2ecf20Sopenharmony_ci			func = (u8 *) __bpf_call_base + imm32;
19148c2ecf20Sopenharmony_ci			jmp_offset = func - (image + addrs[i]);
19158c2ecf20Sopenharmony_ci
19168c2ecf20Sopenharmony_ci			if (!imm32 || !is_simm32(jmp_offset)) {
19178c2ecf20Sopenharmony_ci				pr_err("unsupported BPF func %d addr %p image %p\n",
19188c2ecf20Sopenharmony_ci				       imm32, func, image);
19198c2ecf20Sopenharmony_ci				return -EINVAL;
19208c2ecf20Sopenharmony_ci			}
19218c2ecf20Sopenharmony_ci
19228c2ecf20Sopenharmony_ci			/* mov eax,dword ptr [ebp+off] */
19238c2ecf20Sopenharmony_ci			EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
19248c2ecf20Sopenharmony_ci			      STACK_VAR(r1[0]));
19258c2ecf20Sopenharmony_ci			/* mov edx,dword ptr [ebp+off] */
19268c2ecf20Sopenharmony_ci			EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EDX),
19278c2ecf20Sopenharmony_ci			      STACK_VAR(r1[1]));
19288c2ecf20Sopenharmony_ci
19298c2ecf20Sopenharmony_ci			emit_push_r64(r5, &prog);
19308c2ecf20Sopenharmony_ci			emit_push_r64(r4, &prog);
19318c2ecf20Sopenharmony_ci			emit_push_r64(r3, &prog);
19328c2ecf20Sopenharmony_ci			emit_push_r64(r2, &prog);
19338c2ecf20Sopenharmony_ci
19348c2ecf20Sopenharmony_ci			EMIT1_off32(0xE8, jmp_offset + 9);
19358c2ecf20Sopenharmony_ci
19368c2ecf20Sopenharmony_ci			/* mov dword ptr [ebp+off],eax */
19378c2ecf20Sopenharmony_ci			EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EAX),
19388c2ecf20Sopenharmony_ci			      STACK_VAR(r0[0]));
19398c2ecf20Sopenharmony_ci			/* mov dword ptr [ebp+off],edx */
19408c2ecf20Sopenharmony_ci			EMIT3(0x89, add_2reg(0x40, IA32_EBP, IA32_EDX),
19418c2ecf20Sopenharmony_ci			      STACK_VAR(r0[1]));
19428c2ecf20Sopenharmony_ci
19438c2ecf20Sopenharmony_ci			/* add esp,32 */
19448c2ecf20Sopenharmony_ci			EMIT3(0x83, add_1reg(0xC0, IA32_ESP), 32);
19458c2ecf20Sopenharmony_ci			break;
19468c2ecf20Sopenharmony_ci		}
19478c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_TAIL_CALL:
19488c2ecf20Sopenharmony_ci			emit_bpf_tail_call(&prog, image + addrs[i - 1]);
19498c2ecf20Sopenharmony_ci			break;
19508c2ecf20Sopenharmony_ci
19518c2ecf20Sopenharmony_ci		/* cond jump */
19528c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JEQ | BPF_X:
19538c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JNE | BPF_X:
19548c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JGT | BPF_X:
19558c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JLT | BPF_X:
19568c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JGE | BPF_X:
19578c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JLE | BPF_X:
19588c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JEQ | BPF_X:
19598c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JNE | BPF_X:
19608c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JGT | BPF_X:
19618c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JLT | BPF_X:
19628c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JGE | BPF_X:
19638c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JLE | BPF_X:
19648c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JSGT | BPF_X:
19658c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JSLE | BPF_X:
19668c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JSLT | BPF_X:
19678c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JSGE | BPF_X: {
19688c2ecf20Sopenharmony_ci			bool is_jmp64 = BPF_CLASS(insn->code) == BPF_JMP;
19698c2ecf20Sopenharmony_ci			u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
19708c2ecf20Sopenharmony_ci			u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
19718c2ecf20Sopenharmony_ci			u8 sreg_lo = sstk ? IA32_ECX : src_lo;
19728c2ecf20Sopenharmony_ci			u8 sreg_hi = sstk ? IA32_EBX : src_hi;
19738c2ecf20Sopenharmony_ci
19748c2ecf20Sopenharmony_ci			if (dstk) {
19758c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
19768c2ecf20Sopenharmony_ci				      STACK_VAR(dst_lo));
19778c2ecf20Sopenharmony_ci				if (is_jmp64)
19788c2ecf20Sopenharmony_ci					EMIT3(0x8B,
19798c2ecf20Sopenharmony_ci					      add_2reg(0x40, IA32_EBP,
19808c2ecf20Sopenharmony_ci						       IA32_EDX),
19818c2ecf20Sopenharmony_ci					      STACK_VAR(dst_hi));
19828c2ecf20Sopenharmony_ci			}
19838c2ecf20Sopenharmony_ci
19848c2ecf20Sopenharmony_ci			if (sstk) {
19858c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX),
19868c2ecf20Sopenharmony_ci				      STACK_VAR(src_lo));
19878c2ecf20Sopenharmony_ci				if (is_jmp64)
19888c2ecf20Sopenharmony_ci					EMIT3(0x8B,
19898c2ecf20Sopenharmony_ci					      add_2reg(0x40, IA32_EBP,
19908c2ecf20Sopenharmony_ci						       IA32_EBX),
19918c2ecf20Sopenharmony_ci					      STACK_VAR(src_hi));
19928c2ecf20Sopenharmony_ci			}
19938c2ecf20Sopenharmony_ci
19948c2ecf20Sopenharmony_ci			if (is_jmp64) {
19958c2ecf20Sopenharmony_ci				/* cmp dreg_hi,sreg_hi */
19968c2ecf20Sopenharmony_ci				EMIT2(0x39, add_2reg(0xC0, dreg_hi, sreg_hi));
19978c2ecf20Sopenharmony_ci				EMIT2(IA32_JNE, 2);
19988c2ecf20Sopenharmony_ci			}
19998c2ecf20Sopenharmony_ci			/* cmp dreg_lo,sreg_lo */
20008c2ecf20Sopenharmony_ci			EMIT2(0x39, add_2reg(0xC0, dreg_lo, sreg_lo));
20018c2ecf20Sopenharmony_ci			goto emit_cond_jmp;
20028c2ecf20Sopenharmony_ci		}
20038c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JSGT | BPF_X:
20048c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JSLE | BPF_X:
20058c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JSLT | BPF_X:
20068c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JSGE | BPF_X: {
20078c2ecf20Sopenharmony_ci			u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
20088c2ecf20Sopenharmony_ci			u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
20098c2ecf20Sopenharmony_ci			u8 sreg_lo = sstk ? IA32_ECX : src_lo;
20108c2ecf20Sopenharmony_ci			u8 sreg_hi = sstk ? IA32_EBX : src_hi;
20118c2ecf20Sopenharmony_ci
20128c2ecf20Sopenharmony_ci			if (dstk) {
20138c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
20148c2ecf20Sopenharmony_ci				      STACK_VAR(dst_lo));
20158c2ecf20Sopenharmony_ci				EMIT3(0x8B,
20168c2ecf20Sopenharmony_ci				      add_2reg(0x40, IA32_EBP,
20178c2ecf20Sopenharmony_ci					       IA32_EDX),
20188c2ecf20Sopenharmony_ci				      STACK_VAR(dst_hi));
20198c2ecf20Sopenharmony_ci			}
20208c2ecf20Sopenharmony_ci
20218c2ecf20Sopenharmony_ci			if (sstk) {
20228c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX),
20238c2ecf20Sopenharmony_ci				      STACK_VAR(src_lo));
20248c2ecf20Sopenharmony_ci				EMIT3(0x8B,
20258c2ecf20Sopenharmony_ci				      add_2reg(0x40, IA32_EBP,
20268c2ecf20Sopenharmony_ci					       IA32_EBX),
20278c2ecf20Sopenharmony_ci				      STACK_VAR(src_hi));
20288c2ecf20Sopenharmony_ci			}
20298c2ecf20Sopenharmony_ci
20308c2ecf20Sopenharmony_ci			/* cmp dreg_hi,sreg_hi */
20318c2ecf20Sopenharmony_ci			EMIT2(0x39, add_2reg(0xC0, dreg_hi, sreg_hi));
20328c2ecf20Sopenharmony_ci			EMIT2(IA32_JNE, 10);
20338c2ecf20Sopenharmony_ci			/* cmp dreg_lo,sreg_lo */
20348c2ecf20Sopenharmony_ci			EMIT2(0x39, add_2reg(0xC0, dreg_lo, sreg_lo));
20358c2ecf20Sopenharmony_ci			goto emit_cond_jmp_signed;
20368c2ecf20Sopenharmony_ci		}
20378c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JSET | BPF_X:
20388c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JSET | BPF_X: {
20398c2ecf20Sopenharmony_ci			bool is_jmp64 = BPF_CLASS(insn->code) == BPF_JMP;
20408c2ecf20Sopenharmony_ci			u8 dreg_lo = IA32_EAX;
20418c2ecf20Sopenharmony_ci			u8 dreg_hi = IA32_EDX;
20428c2ecf20Sopenharmony_ci			u8 sreg_lo = sstk ? IA32_ECX : src_lo;
20438c2ecf20Sopenharmony_ci			u8 sreg_hi = sstk ? IA32_EBX : src_hi;
20448c2ecf20Sopenharmony_ci
20458c2ecf20Sopenharmony_ci			if (dstk) {
20468c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
20478c2ecf20Sopenharmony_ci				      STACK_VAR(dst_lo));
20488c2ecf20Sopenharmony_ci				if (is_jmp64)
20498c2ecf20Sopenharmony_ci					EMIT3(0x8B,
20508c2ecf20Sopenharmony_ci					      add_2reg(0x40, IA32_EBP,
20518c2ecf20Sopenharmony_ci						       IA32_EDX),
20528c2ecf20Sopenharmony_ci					      STACK_VAR(dst_hi));
20538c2ecf20Sopenharmony_ci			} else {
20548c2ecf20Sopenharmony_ci				/* mov dreg_lo,dst_lo */
20558c2ecf20Sopenharmony_ci				EMIT2(0x89, add_2reg(0xC0, dreg_lo, dst_lo));
20568c2ecf20Sopenharmony_ci				if (is_jmp64)
20578c2ecf20Sopenharmony_ci					/* mov dreg_hi,dst_hi */
20588c2ecf20Sopenharmony_ci					EMIT2(0x89,
20598c2ecf20Sopenharmony_ci					      add_2reg(0xC0, dreg_hi, dst_hi));
20608c2ecf20Sopenharmony_ci			}
20618c2ecf20Sopenharmony_ci
20628c2ecf20Sopenharmony_ci			if (sstk) {
20638c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_ECX),
20648c2ecf20Sopenharmony_ci				      STACK_VAR(src_lo));
20658c2ecf20Sopenharmony_ci				if (is_jmp64)
20668c2ecf20Sopenharmony_ci					EMIT3(0x8B,
20678c2ecf20Sopenharmony_ci					      add_2reg(0x40, IA32_EBP,
20688c2ecf20Sopenharmony_ci						       IA32_EBX),
20698c2ecf20Sopenharmony_ci					      STACK_VAR(src_hi));
20708c2ecf20Sopenharmony_ci			}
20718c2ecf20Sopenharmony_ci			/* and dreg_lo,sreg_lo */
20728c2ecf20Sopenharmony_ci			EMIT2(0x23, add_2reg(0xC0, sreg_lo, dreg_lo));
20738c2ecf20Sopenharmony_ci			if (is_jmp64) {
20748c2ecf20Sopenharmony_ci				/* and dreg_hi,sreg_hi */
20758c2ecf20Sopenharmony_ci				EMIT2(0x23, add_2reg(0xC0, sreg_hi, dreg_hi));
20768c2ecf20Sopenharmony_ci				/* or dreg_lo,dreg_hi */
20778c2ecf20Sopenharmony_ci				EMIT2(0x09, add_2reg(0xC0, dreg_lo, dreg_hi));
20788c2ecf20Sopenharmony_ci			}
20798c2ecf20Sopenharmony_ci			goto emit_cond_jmp;
20808c2ecf20Sopenharmony_ci		}
20818c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JSET | BPF_K:
20828c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JSET | BPF_K: {
20838c2ecf20Sopenharmony_ci			bool is_jmp64 = BPF_CLASS(insn->code) == BPF_JMP;
20848c2ecf20Sopenharmony_ci			u8 dreg_lo = IA32_EAX;
20858c2ecf20Sopenharmony_ci			u8 dreg_hi = IA32_EDX;
20868c2ecf20Sopenharmony_ci			u8 sreg_lo = IA32_ECX;
20878c2ecf20Sopenharmony_ci			u8 sreg_hi = IA32_EBX;
20888c2ecf20Sopenharmony_ci			u32 hi;
20898c2ecf20Sopenharmony_ci
20908c2ecf20Sopenharmony_ci			if (dstk) {
20918c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
20928c2ecf20Sopenharmony_ci				      STACK_VAR(dst_lo));
20938c2ecf20Sopenharmony_ci				if (is_jmp64)
20948c2ecf20Sopenharmony_ci					EMIT3(0x8B,
20958c2ecf20Sopenharmony_ci					      add_2reg(0x40, IA32_EBP,
20968c2ecf20Sopenharmony_ci						       IA32_EDX),
20978c2ecf20Sopenharmony_ci					      STACK_VAR(dst_hi));
20988c2ecf20Sopenharmony_ci			} else {
20998c2ecf20Sopenharmony_ci				/* mov dreg_lo,dst_lo */
21008c2ecf20Sopenharmony_ci				EMIT2(0x89, add_2reg(0xC0, dreg_lo, dst_lo));
21018c2ecf20Sopenharmony_ci				if (is_jmp64)
21028c2ecf20Sopenharmony_ci					/* mov dreg_hi,dst_hi */
21038c2ecf20Sopenharmony_ci					EMIT2(0x89,
21048c2ecf20Sopenharmony_ci					      add_2reg(0xC0, dreg_hi, dst_hi));
21058c2ecf20Sopenharmony_ci			}
21068c2ecf20Sopenharmony_ci
21078c2ecf20Sopenharmony_ci			/* mov ecx,imm32 */
21088c2ecf20Sopenharmony_ci			EMIT2_off32(0xC7, add_1reg(0xC0, sreg_lo), imm32);
21098c2ecf20Sopenharmony_ci
21108c2ecf20Sopenharmony_ci			/* and dreg_lo,sreg_lo */
21118c2ecf20Sopenharmony_ci			EMIT2(0x23, add_2reg(0xC0, sreg_lo, dreg_lo));
21128c2ecf20Sopenharmony_ci			if (is_jmp64) {
21138c2ecf20Sopenharmony_ci				hi = imm32 & (1 << 31) ? (u32)~0 : 0;
21148c2ecf20Sopenharmony_ci				/* mov ebx,imm32 */
21158c2ecf20Sopenharmony_ci				EMIT2_off32(0xC7, add_1reg(0xC0, sreg_hi), hi);
21168c2ecf20Sopenharmony_ci				/* and dreg_hi,sreg_hi */
21178c2ecf20Sopenharmony_ci				EMIT2(0x23, add_2reg(0xC0, sreg_hi, dreg_hi));
21188c2ecf20Sopenharmony_ci				/* or dreg_lo,dreg_hi */
21198c2ecf20Sopenharmony_ci				EMIT2(0x09, add_2reg(0xC0, dreg_lo, dreg_hi));
21208c2ecf20Sopenharmony_ci			}
21218c2ecf20Sopenharmony_ci			goto emit_cond_jmp;
21228c2ecf20Sopenharmony_ci		}
21238c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JEQ | BPF_K:
21248c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JNE | BPF_K:
21258c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JGT | BPF_K:
21268c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JLT | BPF_K:
21278c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JGE | BPF_K:
21288c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JLE | BPF_K:
21298c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JEQ | BPF_K:
21308c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JNE | BPF_K:
21318c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JGT | BPF_K:
21328c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JLT | BPF_K:
21338c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JGE | BPF_K:
21348c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JLE | BPF_K:
21358c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JSGT | BPF_K:
21368c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JSLE | BPF_K:
21378c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JSLT | BPF_K:
21388c2ecf20Sopenharmony_ci		case BPF_JMP32 | BPF_JSGE | BPF_K: {
21398c2ecf20Sopenharmony_ci			bool is_jmp64 = BPF_CLASS(insn->code) == BPF_JMP;
21408c2ecf20Sopenharmony_ci			u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
21418c2ecf20Sopenharmony_ci			u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
21428c2ecf20Sopenharmony_ci			u8 sreg_lo = IA32_ECX;
21438c2ecf20Sopenharmony_ci			u8 sreg_hi = IA32_EBX;
21448c2ecf20Sopenharmony_ci			u32 hi;
21458c2ecf20Sopenharmony_ci
21468c2ecf20Sopenharmony_ci			if (dstk) {
21478c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
21488c2ecf20Sopenharmony_ci				      STACK_VAR(dst_lo));
21498c2ecf20Sopenharmony_ci				if (is_jmp64)
21508c2ecf20Sopenharmony_ci					EMIT3(0x8B,
21518c2ecf20Sopenharmony_ci					      add_2reg(0x40, IA32_EBP,
21528c2ecf20Sopenharmony_ci						       IA32_EDX),
21538c2ecf20Sopenharmony_ci					      STACK_VAR(dst_hi));
21548c2ecf20Sopenharmony_ci			}
21558c2ecf20Sopenharmony_ci
21568c2ecf20Sopenharmony_ci			/* mov ecx,imm32 */
21578c2ecf20Sopenharmony_ci			EMIT2_off32(0xC7, add_1reg(0xC0, IA32_ECX), imm32);
21588c2ecf20Sopenharmony_ci			if (is_jmp64) {
21598c2ecf20Sopenharmony_ci				hi = imm32 & (1 << 31) ? (u32)~0 : 0;
21608c2ecf20Sopenharmony_ci				/* mov ebx,imm32 */
21618c2ecf20Sopenharmony_ci				EMIT2_off32(0xC7, add_1reg(0xC0, IA32_EBX), hi);
21628c2ecf20Sopenharmony_ci				/* cmp dreg_hi,sreg_hi */
21638c2ecf20Sopenharmony_ci				EMIT2(0x39, add_2reg(0xC0, dreg_hi, sreg_hi));
21648c2ecf20Sopenharmony_ci				EMIT2(IA32_JNE, 2);
21658c2ecf20Sopenharmony_ci			}
21668c2ecf20Sopenharmony_ci			/* cmp dreg_lo,sreg_lo */
21678c2ecf20Sopenharmony_ci			EMIT2(0x39, add_2reg(0xC0, dreg_lo, sreg_lo));
21688c2ecf20Sopenharmony_ci
21698c2ecf20Sopenharmony_ciemit_cond_jmp:		jmp_cond = get_cond_jmp_opcode(BPF_OP(code), false);
21708c2ecf20Sopenharmony_ci			if (jmp_cond == COND_JMP_OPCODE_INVALID)
21718c2ecf20Sopenharmony_ci				return -EFAULT;
21728c2ecf20Sopenharmony_ci			jmp_offset = addrs[i + insn->off] - addrs[i];
21738c2ecf20Sopenharmony_ci			if (is_imm8(jmp_offset)) {
21748c2ecf20Sopenharmony_ci				EMIT2(jmp_cond, jmp_offset);
21758c2ecf20Sopenharmony_ci			} else if (is_simm32(jmp_offset)) {
21768c2ecf20Sopenharmony_ci				EMIT2_off32(0x0F, jmp_cond + 0x10, jmp_offset);
21778c2ecf20Sopenharmony_ci			} else {
21788c2ecf20Sopenharmony_ci				pr_err("cond_jmp gen bug %llx\n", jmp_offset);
21798c2ecf20Sopenharmony_ci				return -EFAULT;
21808c2ecf20Sopenharmony_ci			}
21818c2ecf20Sopenharmony_ci			break;
21828c2ecf20Sopenharmony_ci		}
21838c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JSGT | BPF_K:
21848c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JSLE | BPF_K:
21858c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JSLT | BPF_K:
21868c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JSGE | BPF_K: {
21878c2ecf20Sopenharmony_ci			u8 dreg_lo = dstk ? IA32_EAX : dst_lo;
21888c2ecf20Sopenharmony_ci			u8 dreg_hi = dstk ? IA32_EDX : dst_hi;
21898c2ecf20Sopenharmony_ci			u8 sreg_lo = IA32_ECX;
21908c2ecf20Sopenharmony_ci			u8 sreg_hi = IA32_EBX;
21918c2ecf20Sopenharmony_ci			u32 hi;
21928c2ecf20Sopenharmony_ci
21938c2ecf20Sopenharmony_ci			if (dstk) {
21948c2ecf20Sopenharmony_ci				EMIT3(0x8B, add_2reg(0x40, IA32_EBP, IA32_EAX),
21958c2ecf20Sopenharmony_ci				      STACK_VAR(dst_lo));
21968c2ecf20Sopenharmony_ci				EMIT3(0x8B,
21978c2ecf20Sopenharmony_ci				      add_2reg(0x40, IA32_EBP,
21988c2ecf20Sopenharmony_ci					       IA32_EDX),
21998c2ecf20Sopenharmony_ci				      STACK_VAR(dst_hi));
22008c2ecf20Sopenharmony_ci			}
22018c2ecf20Sopenharmony_ci
22028c2ecf20Sopenharmony_ci			/* mov ecx,imm32 */
22038c2ecf20Sopenharmony_ci			EMIT2_off32(0xC7, add_1reg(0xC0, IA32_ECX), imm32);
22048c2ecf20Sopenharmony_ci			hi = imm32 & (1 << 31) ? (u32)~0 : 0;
22058c2ecf20Sopenharmony_ci			/* mov ebx,imm32 */
22068c2ecf20Sopenharmony_ci			EMIT2_off32(0xC7, add_1reg(0xC0, IA32_EBX), hi);
22078c2ecf20Sopenharmony_ci			/* cmp dreg_hi,sreg_hi */
22088c2ecf20Sopenharmony_ci			EMIT2(0x39, add_2reg(0xC0, dreg_hi, sreg_hi));
22098c2ecf20Sopenharmony_ci			EMIT2(IA32_JNE, 10);
22108c2ecf20Sopenharmony_ci			/* cmp dreg_lo,sreg_lo */
22118c2ecf20Sopenharmony_ci			EMIT2(0x39, add_2reg(0xC0, dreg_lo, sreg_lo));
22128c2ecf20Sopenharmony_ci
22138c2ecf20Sopenharmony_ci			/*
22148c2ecf20Sopenharmony_ci			 * For simplicity of branch offset computation,
22158c2ecf20Sopenharmony_ci			 * let's use fixed jump coding here.
22168c2ecf20Sopenharmony_ci			 */
22178c2ecf20Sopenharmony_ciemit_cond_jmp_signed:	/* Check the condition for low 32-bit comparison */
22188c2ecf20Sopenharmony_ci			jmp_cond = get_cond_jmp_opcode(BPF_OP(code), true);
22198c2ecf20Sopenharmony_ci			if (jmp_cond == COND_JMP_OPCODE_INVALID)
22208c2ecf20Sopenharmony_ci				return -EFAULT;
22218c2ecf20Sopenharmony_ci			jmp_offset = addrs[i + insn->off] - addrs[i] + 8;
22228c2ecf20Sopenharmony_ci			if (is_simm32(jmp_offset)) {
22238c2ecf20Sopenharmony_ci				EMIT2_off32(0x0F, jmp_cond + 0x10, jmp_offset);
22248c2ecf20Sopenharmony_ci			} else {
22258c2ecf20Sopenharmony_ci				pr_err("cond_jmp gen bug %llx\n", jmp_offset);
22268c2ecf20Sopenharmony_ci				return -EFAULT;
22278c2ecf20Sopenharmony_ci			}
22288c2ecf20Sopenharmony_ci			EMIT2(0xEB, 6);
22298c2ecf20Sopenharmony_ci
22308c2ecf20Sopenharmony_ci			/* Check the condition for high 32-bit comparison */
22318c2ecf20Sopenharmony_ci			jmp_cond = get_cond_jmp_opcode(BPF_OP(code), false);
22328c2ecf20Sopenharmony_ci			if (jmp_cond == COND_JMP_OPCODE_INVALID)
22338c2ecf20Sopenharmony_ci				return -EFAULT;
22348c2ecf20Sopenharmony_ci			jmp_offset = addrs[i + insn->off] - addrs[i];
22358c2ecf20Sopenharmony_ci			if (is_simm32(jmp_offset)) {
22368c2ecf20Sopenharmony_ci				EMIT2_off32(0x0F, jmp_cond + 0x10, jmp_offset);
22378c2ecf20Sopenharmony_ci			} else {
22388c2ecf20Sopenharmony_ci				pr_err("cond_jmp gen bug %llx\n", jmp_offset);
22398c2ecf20Sopenharmony_ci				return -EFAULT;
22408c2ecf20Sopenharmony_ci			}
22418c2ecf20Sopenharmony_ci			break;
22428c2ecf20Sopenharmony_ci		}
22438c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_JA:
22448c2ecf20Sopenharmony_ci			if (insn->off == -1)
22458c2ecf20Sopenharmony_ci				/* -1 jmp instructions will always jump
22468c2ecf20Sopenharmony_ci				 * backwards two bytes. Explicitly handling
22478c2ecf20Sopenharmony_ci				 * this case avoids wasting too many passes
22488c2ecf20Sopenharmony_ci				 * when there are long sequences of replaced
22498c2ecf20Sopenharmony_ci				 * dead code.
22508c2ecf20Sopenharmony_ci				 */
22518c2ecf20Sopenharmony_ci				jmp_offset = -2;
22528c2ecf20Sopenharmony_ci			else
22538c2ecf20Sopenharmony_ci				jmp_offset = addrs[i + insn->off] - addrs[i];
22548c2ecf20Sopenharmony_ci
22558c2ecf20Sopenharmony_ci			if (!jmp_offset)
22568c2ecf20Sopenharmony_ci				/* Optimize out nop jumps */
22578c2ecf20Sopenharmony_ci				break;
22588c2ecf20Sopenharmony_ciemit_jmp:
22598c2ecf20Sopenharmony_ci			if (is_imm8(jmp_offset)) {
22608c2ecf20Sopenharmony_ci				EMIT2(0xEB, jmp_offset);
22618c2ecf20Sopenharmony_ci			} else if (is_simm32(jmp_offset)) {
22628c2ecf20Sopenharmony_ci				EMIT1_off32(0xE9, jmp_offset);
22638c2ecf20Sopenharmony_ci			} else {
22648c2ecf20Sopenharmony_ci				pr_err("jmp gen bug %llx\n", jmp_offset);
22658c2ecf20Sopenharmony_ci				return -EFAULT;
22668c2ecf20Sopenharmony_ci			}
22678c2ecf20Sopenharmony_ci			break;
22688c2ecf20Sopenharmony_ci		/* STX XADD: lock *(u32 *)(dst + off) += src */
22698c2ecf20Sopenharmony_ci		case BPF_STX | BPF_XADD | BPF_W:
22708c2ecf20Sopenharmony_ci		/* STX XADD: lock *(u64 *)(dst + off) += src */
22718c2ecf20Sopenharmony_ci		case BPF_STX | BPF_XADD | BPF_DW:
22728c2ecf20Sopenharmony_ci			goto notyet;
22738c2ecf20Sopenharmony_ci		case BPF_JMP | BPF_EXIT:
22748c2ecf20Sopenharmony_ci			if (seen_exit) {
22758c2ecf20Sopenharmony_ci				jmp_offset = ctx->cleanup_addr - addrs[i];
22768c2ecf20Sopenharmony_ci				goto emit_jmp;
22778c2ecf20Sopenharmony_ci			}
22788c2ecf20Sopenharmony_ci			seen_exit = true;
22798c2ecf20Sopenharmony_ci			/* Update cleanup_addr */
22808c2ecf20Sopenharmony_ci			ctx->cleanup_addr = proglen;
22818c2ecf20Sopenharmony_ci			emit_epilogue(&prog, bpf_prog->aux->stack_depth);
22828c2ecf20Sopenharmony_ci			break;
22838c2ecf20Sopenharmony_cinotyet:
22848c2ecf20Sopenharmony_ci			pr_info_once("*** NOT YET: opcode %02x ***\n", code);
22858c2ecf20Sopenharmony_ci			return -EFAULT;
22868c2ecf20Sopenharmony_ci		default:
22878c2ecf20Sopenharmony_ci			/*
22888c2ecf20Sopenharmony_ci			 * This error will be seen if new instruction was added
22898c2ecf20Sopenharmony_ci			 * to interpreter, but not to JIT or if there is junk in
22908c2ecf20Sopenharmony_ci			 * bpf_prog
22918c2ecf20Sopenharmony_ci			 */
22928c2ecf20Sopenharmony_ci			pr_err("bpf_jit: unknown opcode %02x\n", code);
22938c2ecf20Sopenharmony_ci			return -EINVAL;
22948c2ecf20Sopenharmony_ci		}
22958c2ecf20Sopenharmony_ci
22968c2ecf20Sopenharmony_ci		ilen = prog - temp;
22978c2ecf20Sopenharmony_ci		if (ilen > BPF_MAX_INSN_SIZE) {
22988c2ecf20Sopenharmony_ci			pr_err("bpf_jit: fatal insn size error\n");
22998c2ecf20Sopenharmony_ci			return -EFAULT;
23008c2ecf20Sopenharmony_ci		}
23018c2ecf20Sopenharmony_ci
23028c2ecf20Sopenharmony_ci		if (image) {
23038c2ecf20Sopenharmony_ci			/*
23048c2ecf20Sopenharmony_ci			 * When populating the image, assert that:
23058c2ecf20Sopenharmony_ci			 *
23068c2ecf20Sopenharmony_ci			 *  i) We do not write beyond the allocated space, and
23078c2ecf20Sopenharmony_ci			 * ii) addrs[i] did not change from the prior run, in order
23088c2ecf20Sopenharmony_ci			 *     to validate assumptions made for computing branch
23098c2ecf20Sopenharmony_ci			 *     displacements.
23108c2ecf20Sopenharmony_ci			 */
23118c2ecf20Sopenharmony_ci			if (unlikely(proglen + ilen > oldproglen ||
23128c2ecf20Sopenharmony_ci				     proglen + ilen != addrs[i])) {
23138c2ecf20Sopenharmony_ci				pr_err("bpf_jit: fatal error\n");
23148c2ecf20Sopenharmony_ci				return -EFAULT;
23158c2ecf20Sopenharmony_ci			}
23168c2ecf20Sopenharmony_ci			memcpy(image + proglen, temp, ilen);
23178c2ecf20Sopenharmony_ci		}
23188c2ecf20Sopenharmony_ci		proglen += ilen;
23198c2ecf20Sopenharmony_ci		addrs[i] = proglen;
23208c2ecf20Sopenharmony_ci		prog = temp;
23218c2ecf20Sopenharmony_ci	}
23228c2ecf20Sopenharmony_ci	return proglen;
23238c2ecf20Sopenharmony_ci}
23248c2ecf20Sopenharmony_ci
23258c2ecf20Sopenharmony_cibool bpf_jit_needs_zext(void)
23268c2ecf20Sopenharmony_ci{
23278c2ecf20Sopenharmony_ci	return true;
23288c2ecf20Sopenharmony_ci}
23298c2ecf20Sopenharmony_ci
23308c2ecf20Sopenharmony_cistruct bpf_prog *bpf_int_jit_compile(struct bpf_prog *prog)
23318c2ecf20Sopenharmony_ci{
23328c2ecf20Sopenharmony_ci	struct bpf_binary_header *header = NULL;
23338c2ecf20Sopenharmony_ci	struct bpf_prog *tmp, *orig_prog = prog;
23348c2ecf20Sopenharmony_ci	int proglen, oldproglen = 0;
23358c2ecf20Sopenharmony_ci	struct jit_context ctx = {};
23368c2ecf20Sopenharmony_ci	bool tmp_blinded = false;
23378c2ecf20Sopenharmony_ci	u8 *image = NULL;
23388c2ecf20Sopenharmony_ci	int *addrs;
23398c2ecf20Sopenharmony_ci	int pass;
23408c2ecf20Sopenharmony_ci	int i;
23418c2ecf20Sopenharmony_ci
23428c2ecf20Sopenharmony_ci	if (!prog->jit_requested)
23438c2ecf20Sopenharmony_ci		return orig_prog;
23448c2ecf20Sopenharmony_ci
23458c2ecf20Sopenharmony_ci	tmp = bpf_jit_blind_constants(prog);
23468c2ecf20Sopenharmony_ci	/*
23478c2ecf20Sopenharmony_ci	 * If blinding was requested and we failed during blinding,
23488c2ecf20Sopenharmony_ci	 * we must fall back to the interpreter.
23498c2ecf20Sopenharmony_ci	 */
23508c2ecf20Sopenharmony_ci	if (IS_ERR(tmp))
23518c2ecf20Sopenharmony_ci		return orig_prog;
23528c2ecf20Sopenharmony_ci	if (tmp != prog) {
23538c2ecf20Sopenharmony_ci		tmp_blinded = true;
23548c2ecf20Sopenharmony_ci		prog = tmp;
23558c2ecf20Sopenharmony_ci	}
23568c2ecf20Sopenharmony_ci
23578c2ecf20Sopenharmony_ci	addrs = kmalloc_array(prog->len, sizeof(*addrs), GFP_KERNEL);
23588c2ecf20Sopenharmony_ci	if (!addrs) {
23598c2ecf20Sopenharmony_ci		prog = orig_prog;
23608c2ecf20Sopenharmony_ci		goto out;
23618c2ecf20Sopenharmony_ci	}
23628c2ecf20Sopenharmony_ci
23638c2ecf20Sopenharmony_ci	/*
23648c2ecf20Sopenharmony_ci	 * Before first pass, make a rough estimation of addrs[]
23658c2ecf20Sopenharmony_ci	 * each BPF instruction is translated to less than 64 bytes
23668c2ecf20Sopenharmony_ci	 */
23678c2ecf20Sopenharmony_ci	for (proglen = 0, i = 0; i < prog->len; i++) {
23688c2ecf20Sopenharmony_ci		proglen += 64;
23698c2ecf20Sopenharmony_ci		addrs[i] = proglen;
23708c2ecf20Sopenharmony_ci	}
23718c2ecf20Sopenharmony_ci	ctx.cleanup_addr = proglen;
23728c2ecf20Sopenharmony_ci
23738c2ecf20Sopenharmony_ci	/*
23748c2ecf20Sopenharmony_ci	 * JITed image shrinks with every pass and the loop iterates
23758c2ecf20Sopenharmony_ci	 * until the image stops shrinking. Very large BPF programs
23768c2ecf20Sopenharmony_ci	 * may converge on the last pass. In such case do one more
23778c2ecf20Sopenharmony_ci	 * pass to emit the final image.
23788c2ecf20Sopenharmony_ci	 */
23798c2ecf20Sopenharmony_ci	for (pass = 0; pass < 20 || image; pass++) {
23808c2ecf20Sopenharmony_ci		proglen = do_jit(prog, addrs, image, oldproglen, &ctx);
23818c2ecf20Sopenharmony_ci		if (proglen <= 0) {
23828c2ecf20Sopenharmony_ciout_image:
23838c2ecf20Sopenharmony_ci			image = NULL;
23848c2ecf20Sopenharmony_ci			if (header)
23858c2ecf20Sopenharmony_ci				bpf_jit_binary_free(header);
23868c2ecf20Sopenharmony_ci			prog = orig_prog;
23878c2ecf20Sopenharmony_ci			goto out_addrs;
23888c2ecf20Sopenharmony_ci		}
23898c2ecf20Sopenharmony_ci		if (image) {
23908c2ecf20Sopenharmony_ci			if (proglen != oldproglen) {
23918c2ecf20Sopenharmony_ci				pr_err("bpf_jit: proglen=%d != oldproglen=%d\n",
23928c2ecf20Sopenharmony_ci				       proglen, oldproglen);
23938c2ecf20Sopenharmony_ci				goto out_image;
23948c2ecf20Sopenharmony_ci			}
23958c2ecf20Sopenharmony_ci			break;
23968c2ecf20Sopenharmony_ci		}
23978c2ecf20Sopenharmony_ci		if (proglen == oldproglen) {
23988c2ecf20Sopenharmony_ci			header = bpf_jit_binary_alloc(proglen, &image,
23998c2ecf20Sopenharmony_ci						      1, jit_fill_hole);
24008c2ecf20Sopenharmony_ci			if (!header) {
24018c2ecf20Sopenharmony_ci				prog = orig_prog;
24028c2ecf20Sopenharmony_ci				goto out_addrs;
24038c2ecf20Sopenharmony_ci			}
24048c2ecf20Sopenharmony_ci		}
24058c2ecf20Sopenharmony_ci		oldproglen = proglen;
24068c2ecf20Sopenharmony_ci		cond_resched();
24078c2ecf20Sopenharmony_ci	}
24088c2ecf20Sopenharmony_ci
24098c2ecf20Sopenharmony_ci	if (bpf_jit_enable > 1)
24108c2ecf20Sopenharmony_ci		bpf_jit_dump(prog->len, proglen, pass + 1, image);
24118c2ecf20Sopenharmony_ci
24128c2ecf20Sopenharmony_ci	if (image) {
24138c2ecf20Sopenharmony_ci		bpf_jit_binary_lock_ro(header);
24148c2ecf20Sopenharmony_ci		prog->bpf_func = (void *)image;
24158c2ecf20Sopenharmony_ci		prog->jited = 1;
24168c2ecf20Sopenharmony_ci		prog->jited_len = proglen;
24178c2ecf20Sopenharmony_ci	} else {
24188c2ecf20Sopenharmony_ci		prog = orig_prog;
24198c2ecf20Sopenharmony_ci	}
24208c2ecf20Sopenharmony_ci
24218c2ecf20Sopenharmony_ciout_addrs:
24228c2ecf20Sopenharmony_ci	kfree(addrs);
24238c2ecf20Sopenharmony_ciout:
24248c2ecf20Sopenharmony_ci	if (tmp_blinded)
24258c2ecf20Sopenharmony_ci		bpf_jit_prog_release_other(prog, prog == orig_prog ?
24268c2ecf20Sopenharmony_ci					   tmp : orig_prog);
24278c2ecf20Sopenharmony_ci	return prog;
24288c2ecf20Sopenharmony_ci}
2429