162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * BPF JIT compiler for LoongArch
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * Copyright (C) 2022 Loongson Technology Corporation Limited
662306a36Sopenharmony_ci */
762306a36Sopenharmony_ci#include "bpf_jit.h"
862306a36Sopenharmony_ci
962306a36Sopenharmony_ci#define REG_TCC		LOONGARCH_GPR_A6
1062306a36Sopenharmony_ci#define TCC_SAVED	LOONGARCH_GPR_S5
1162306a36Sopenharmony_ci
1262306a36Sopenharmony_ci#define SAVE_RA		BIT(0)
1362306a36Sopenharmony_ci#define SAVE_TCC	BIT(1)
1462306a36Sopenharmony_ci
1562306a36Sopenharmony_cistatic const int regmap[] = {
1662306a36Sopenharmony_ci	/* return value from in-kernel function, and exit value for eBPF program */
1762306a36Sopenharmony_ci	[BPF_REG_0] = LOONGARCH_GPR_A5,
1862306a36Sopenharmony_ci	/* arguments from eBPF program to in-kernel function */
1962306a36Sopenharmony_ci	[BPF_REG_1] = LOONGARCH_GPR_A0,
2062306a36Sopenharmony_ci	[BPF_REG_2] = LOONGARCH_GPR_A1,
2162306a36Sopenharmony_ci	[BPF_REG_3] = LOONGARCH_GPR_A2,
2262306a36Sopenharmony_ci	[BPF_REG_4] = LOONGARCH_GPR_A3,
2362306a36Sopenharmony_ci	[BPF_REG_5] = LOONGARCH_GPR_A4,
2462306a36Sopenharmony_ci	/* callee saved registers that in-kernel function will preserve */
2562306a36Sopenharmony_ci	[BPF_REG_6] = LOONGARCH_GPR_S0,
2662306a36Sopenharmony_ci	[BPF_REG_7] = LOONGARCH_GPR_S1,
2762306a36Sopenharmony_ci	[BPF_REG_8] = LOONGARCH_GPR_S2,
2862306a36Sopenharmony_ci	[BPF_REG_9] = LOONGARCH_GPR_S3,
2962306a36Sopenharmony_ci	/* read-only frame pointer to access stack */
3062306a36Sopenharmony_ci	[BPF_REG_FP] = LOONGARCH_GPR_S4,
3162306a36Sopenharmony_ci	/* temporary register for blinding constants */
3262306a36Sopenharmony_ci	[BPF_REG_AX] = LOONGARCH_GPR_T0,
3362306a36Sopenharmony_ci};
3462306a36Sopenharmony_ci
3562306a36Sopenharmony_cistatic void mark_call(struct jit_ctx *ctx)
3662306a36Sopenharmony_ci{
3762306a36Sopenharmony_ci	ctx->flags |= SAVE_RA;
3862306a36Sopenharmony_ci}
3962306a36Sopenharmony_ci
4062306a36Sopenharmony_cistatic void mark_tail_call(struct jit_ctx *ctx)
4162306a36Sopenharmony_ci{
4262306a36Sopenharmony_ci	ctx->flags |= SAVE_TCC;
4362306a36Sopenharmony_ci}
4462306a36Sopenharmony_ci
4562306a36Sopenharmony_cistatic bool seen_call(struct jit_ctx *ctx)
4662306a36Sopenharmony_ci{
4762306a36Sopenharmony_ci	return (ctx->flags & SAVE_RA);
4862306a36Sopenharmony_ci}
4962306a36Sopenharmony_ci
5062306a36Sopenharmony_cistatic bool seen_tail_call(struct jit_ctx *ctx)
5162306a36Sopenharmony_ci{
5262306a36Sopenharmony_ci	return (ctx->flags & SAVE_TCC);
5362306a36Sopenharmony_ci}
5462306a36Sopenharmony_ci
5562306a36Sopenharmony_cistatic u8 tail_call_reg(struct jit_ctx *ctx)
5662306a36Sopenharmony_ci{
5762306a36Sopenharmony_ci	if (seen_call(ctx))
5862306a36Sopenharmony_ci		return TCC_SAVED;
5962306a36Sopenharmony_ci
6062306a36Sopenharmony_ci	return REG_TCC;
6162306a36Sopenharmony_ci}
6262306a36Sopenharmony_ci
6362306a36Sopenharmony_ci/*
6462306a36Sopenharmony_ci * eBPF prog stack layout:
6562306a36Sopenharmony_ci *
6662306a36Sopenharmony_ci *                                        high
6762306a36Sopenharmony_ci * original $sp ------------> +-------------------------+ <--LOONGARCH_GPR_FP
6862306a36Sopenharmony_ci *                            |           $ra           |
6962306a36Sopenharmony_ci *                            +-------------------------+
7062306a36Sopenharmony_ci *                            |           $fp           |
7162306a36Sopenharmony_ci *                            +-------------------------+
7262306a36Sopenharmony_ci *                            |           $s0           |
7362306a36Sopenharmony_ci *                            +-------------------------+
7462306a36Sopenharmony_ci *                            |           $s1           |
7562306a36Sopenharmony_ci *                            +-------------------------+
7662306a36Sopenharmony_ci *                            |           $s2           |
7762306a36Sopenharmony_ci *                            +-------------------------+
7862306a36Sopenharmony_ci *                            |           $s3           |
7962306a36Sopenharmony_ci *                            +-------------------------+
8062306a36Sopenharmony_ci *                            |           $s4           |
8162306a36Sopenharmony_ci *                            +-------------------------+
8262306a36Sopenharmony_ci *                            |           $s5           |
8362306a36Sopenharmony_ci *                            +-------------------------+ <--BPF_REG_FP
8462306a36Sopenharmony_ci *                            |  prog->aux->stack_depth |
8562306a36Sopenharmony_ci *                            |        (optional)       |
8662306a36Sopenharmony_ci * current $sp -------------> +-------------------------+
8762306a36Sopenharmony_ci *                                        low
8862306a36Sopenharmony_ci */
8962306a36Sopenharmony_cistatic void build_prologue(struct jit_ctx *ctx)
9062306a36Sopenharmony_ci{
9162306a36Sopenharmony_ci	int stack_adjust = 0, store_offset, bpf_stack_adjust;
9262306a36Sopenharmony_ci
9362306a36Sopenharmony_ci	bpf_stack_adjust = round_up(ctx->prog->aux->stack_depth, 16);
9462306a36Sopenharmony_ci
9562306a36Sopenharmony_ci	/* To store ra, fp, s0, s1, s2, s3, s4 and s5. */
9662306a36Sopenharmony_ci	stack_adjust += sizeof(long) * 8;
9762306a36Sopenharmony_ci
9862306a36Sopenharmony_ci	stack_adjust = round_up(stack_adjust, 16);
9962306a36Sopenharmony_ci	stack_adjust += bpf_stack_adjust;
10062306a36Sopenharmony_ci
10162306a36Sopenharmony_ci	/*
10262306a36Sopenharmony_ci	 * First instruction initializes the tail call count (TCC).
10362306a36Sopenharmony_ci	 * On tail call we skip this instruction, and the TCC is
10462306a36Sopenharmony_ci	 * passed in REG_TCC from the caller.
10562306a36Sopenharmony_ci	 */
10662306a36Sopenharmony_ci	emit_insn(ctx, addid, REG_TCC, LOONGARCH_GPR_ZERO, MAX_TAIL_CALL_CNT);
10762306a36Sopenharmony_ci
10862306a36Sopenharmony_ci	emit_insn(ctx, addid, LOONGARCH_GPR_SP, LOONGARCH_GPR_SP, -stack_adjust);
10962306a36Sopenharmony_ci
11062306a36Sopenharmony_ci	store_offset = stack_adjust - sizeof(long);
11162306a36Sopenharmony_ci	emit_insn(ctx, std, LOONGARCH_GPR_RA, LOONGARCH_GPR_SP, store_offset);
11262306a36Sopenharmony_ci
11362306a36Sopenharmony_ci	store_offset -= sizeof(long);
11462306a36Sopenharmony_ci	emit_insn(ctx, std, LOONGARCH_GPR_FP, LOONGARCH_GPR_SP, store_offset);
11562306a36Sopenharmony_ci
11662306a36Sopenharmony_ci	store_offset -= sizeof(long);
11762306a36Sopenharmony_ci	emit_insn(ctx, std, LOONGARCH_GPR_S0, LOONGARCH_GPR_SP, store_offset);
11862306a36Sopenharmony_ci
11962306a36Sopenharmony_ci	store_offset -= sizeof(long);
12062306a36Sopenharmony_ci	emit_insn(ctx, std, LOONGARCH_GPR_S1, LOONGARCH_GPR_SP, store_offset);
12162306a36Sopenharmony_ci
12262306a36Sopenharmony_ci	store_offset -= sizeof(long);
12362306a36Sopenharmony_ci	emit_insn(ctx, std, LOONGARCH_GPR_S2, LOONGARCH_GPR_SP, store_offset);
12462306a36Sopenharmony_ci
12562306a36Sopenharmony_ci	store_offset -= sizeof(long);
12662306a36Sopenharmony_ci	emit_insn(ctx, std, LOONGARCH_GPR_S3, LOONGARCH_GPR_SP, store_offset);
12762306a36Sopenharmony_ci
12862306a36Sopenharmony_ci	store_offset -= sizeof(long);
12962306a36Sopenharmony_ci	emit_insn(ctx, std, LOONGARCH_GPR_S4, LOONGARCH_GPR_SP, store_offset);
13062306a36Sopenharmony_ci
13162306a36Sopenharmony_ci	store_offset -= sizeof(long);
13262306a36Sopenharmony_ci	emit_insn(ctx, std, LOONGARCH_GPR_S5, LOONGARCH_GPR_SP, store_offset);
13362306a36Sopenharmony_ci
13462306a36Sopenharmony_ci	emit_insn(ctx, addid, LOONGARCH_GPR_FP, LOONGARCH_GPR_SP, stack_adjust);
13562306a36Sopenharmony_ci
13662306a36Sopenharmony_ci	if (bpf_stack_adjust)
13762306a36Sopenharmony_ci		emit_insn(ctx, addid, regmap[BPF_REG_FP], LOONGARCH_GPR_SP, bpf_stack_adjust);
13862306a36Sopenharmony_ci
13962306a36Sopenharmony_ci	/*
14062306a36Sopenharmony_ci	 * Program contains calls and tail calls, so REG_TCC need
14162306a36Sopenharmony_ci	 * to be saved across calls.
14262306a36Sopenharmony_ci	 */
14362306a36Sopenharmony_ci	if (seen_tail_call(ctx) && seen_call(ctx))
14462306a36Sopenharmony_ci		move_reg(ctx, TCC_SAVED, REG_TCC);
14562306a36Sopenharmony_ci
14662306a36Sopenharmony_ci	ctx->stack_size = stack_adjust;
14762306a36Sopenharmony_ci}
14862306a36Sopenharmony_ci
14962306a36Sopenharmony_cistatic void __build_epilogue(struct jit_ctx *ctx, bool is_tail_call)
15062306a36Sopenharmony_ci{
15162306a36Sopenharmony_ci	int stack_adjust = ctx->stack_size;
15262306a36Sopenharmony_ci	int load_offset;
15362306a36Sopenharmony_ci
15462306a36Sopenharmony_ci	load_offset = stack_adjust - sizeof(long);
15562306a36Sopenharmony_ci	emit_insn(ctx, ldd, LOONGARCH_GPR_RA, LOONGARCH_GPR_SP, load_offset);
15662306a36Sopenharmony_ci
15762306a36Sopenharmony_ci	load_offset -= sizeof(long);
15862306a36Sopenharmony_ci	emit_insn(ctx, ldd, LOONGARCH_GPR_FP, LOONGARCH_GPR_SP, load_offset);
15962306a36Sopenharmony_ci
16062306a36Sopenharmony_ci	load_offset -= sizeof(long);
16162306a36Sopenharmony_ci	emit_insn(ctx, ldd, LOONGARCH_GPR_S0, LOONGARCH_GPR_SP, load_offset);
16262306a36Sopenharmony_ci
16362306a36Sopenharmony_ci	load_offset -= sizeof(long);
16462306a36Sopenharmony_ci	emit_insn(ctx, ldd, LOONGARCH_GPR_S1, LOONGARCH_GPR_SP, load_offset);
16562306a36Sopenharmony_ci
16662306a36Sopenharmony_ci	load_offset -= sizeof(long);
16762306a36Sopenharmony_ci	emit_insn(ctx, ldd, LOONGARCH_GPR_S2, LOONGARCH_GPR_SP, load_offset);
16862306a36Sopenharmony_ci
16962306a36Sopenharmony_ci	load_offset -= sizeof(long);
17062306a36Sopenharmony_ci	emit_insn(ctx, ldd, LOONGARCH_GPR_S3, LOONGARCH_GPR_SP, load_offset);
17162306a36Sopenharmony_ci
17262306a36Sopenharmony_ci	load_offset -= sizeof(long);
17362306a36Sopenharmony_ci	emit_insn(ctx, ldd, LOONGARCH_GPR_S4, LOONGARCH_GPR_SP, load_offset);
17462306a36Sopenharmony_ci
17562306a36Sopenharmony_ci	load_offset -= sizeof(long);
17662306a36Sopenharmony_ci	emit_insn(ctx, ldd, LOONGARCH_GPR_S5, LOONGARCH_GPR_SP, load_offset);
17762306a36Sopenharmony_ci
17862306a36Sopenharmony_ci	emit_insn(ctx, addid, LOONGARCH_GPR_SP, LOONGARCH_GPR_SP, stack_adjust);
17962306a36Sopenharmony_ci
18062306a36Sopenharmony_ci	if (!is_tail_call) {
18162306a36Sopenharmony_ci		/* Set return value */
18262306a36Sopenharmony_ci		move_reg(ctx, LOONGARCH_GPR_A0, regmap[BPF_REG_0]);
18362306a36Sopenharmony_ci		/* Return to the caller */
18462306a36Sopenharmony_ci		emit_insn(ctx, jirl, LOONGARCH_GPR_RA, LOONGARCH_GPR_ZERO, 0);
18562306a36Sopenharmony_ci	} else {
18662306a36Sopenharmony_ci		/*
18762306a36Sopenharmony_ci		 * Call the next bpf prog and skip the first instruction
18862306a36Sopenharmony_ci		 * of TCC initialization.
18962306a36Sopenharmony_ci		 */
19062306a36Sopenharmony_ci		emit_insn(ctx, jirl, LOONGARCH_GPR_T3, LOONGARCH_GPR_ZERO, 1);
19162306a36Sopenharmony_ci	}
19262306a36Sopenharmony_ci}
19362306a36Sopenharmony_ci
19462306a36Sopenharmony_cistatic void build_epilogue(struct jit_ctx *ctx)
19562306a36Sopenharmony_ci{
19662306a36Sopenharmony_ci	__build_epilogue(ctx, false);
19762306a36Sopenharmony_ci}
19862306a36Sopenharmony_ci
19962306a36Sopenharmony_cibool bpf_jit_supports_kfunc_call(void)
20062306a36Sopenharmony_ci{
20162306a36Sopenharmony_ci	return true;
20262306a36Sopenharmony_ci}
20362306a36Sopenharmony_ci
20462306a36Sopenharmony_ci/* initialized on the first pass of build_body() */
20562306a36Sopenharmony_cistatic int out_offset = -1;
20662306a36Sopenharmony_cistatic int emit_bpf_tail_call(struct jit_ctx *ctx)
20762306a36Sopenharmony_ci{
20862306a36Sopenharmony_ci	int off;
20962306a36Sopenharmony_ci	u8 tcc = tail_call_reg(ctx);
21062306a36Sopenharmony_ci	u8 a1 = LOONGARCH_GPR_A1;
21162306a36Sopenharmony_ci	u8 a2 = LOONGARCH_GPR_A2;
21262306a36Sopenharmony_ci	u8 t1 = LOONGARCH_GPR_T1;
21362306a36Sopenharmony_ci	u8 t2 = LOONGARCH_GPR_T2;
21462306a36Sopenharmony_ci	u8 t3 = LOONGARCH_GPR_T3;
21562306a36Sopenharmony_ci	const int idx0 = ctx->idx;
21662306a36Sopenharmony_ci
21762306a36Sopenharmony_ci#define cur_offset (ctx->idx - idx0)
21862306a36Sopenharmony_ci#define jmp_offset (out_offset - (cur_offset))
21962306a36Sopenharmony_ci
22062306a36Sopenharmony_ci	/*
22162306a36Sopenharmony_ci	 * a0: &ctx
22262306a36Sopenharmony_ci	 * a1: &array
22362306a36Sopenharmony_ci	 * a2: index
22462306a36Sopenharmony_ci	 *
22562306a36Sopenharmony_ci	 * if (index >= array->map.max_entries)
22662306a36Sopenharmony_ci	 *	 goto out;
22762306a36Sopenharmony_ci	 */
22862306a36Sopenharmony_ci	off = offsetof(struct bpf_array, map.max_entries);
22962306a36Sopenharmony_ci	emit_insn(ctx, ldwu, t1, a1, off);
23062306a36Sopenharmony_ci	/* bgeu $a2, $t1, jmp_offset */
23162306a36Sopenharmony_ci	if (emit_tailcall_jmp(ctx, BPF_JGE, a2, t1, jmp_offset) < 0)
23262306a36Sopenharmony_ci		goto toofar;
23362306a36Sopenharmony_ci
23462306a36Sopenharmony_ci	/*
23562306a36Sopenharmony_ci	 * if (--TCC < 0)
23662306a36Sopenharmony_ci	 *	 goto out;
23762306a36Sopenharmony_ci	 */
23862306a36Sopenharmony_ci	emit_insn(ctx, addid, REG_TCC, tcc, -1);
23962306a36Sopenharmony_ci	if (emit_tailcall_jmp(ctx, BPF_JSLT, REG_TCC, LOONGARCH_GPR_ZERO, jmp_offset) < 0)
24062306a36Sopenharmony_ci		goto toofar;
24162306a36Sopenharmony_ci
24262306a36Sopenharmony_ci	/*
24362306a36Sopenharmony_ci	 * prog = array->ptrs[index];
24462306a36Sopenharmony_ci	 * if (!prog)
24562306a36Sopenharmony_ci	 *	 goto out;
24662306a36Sopenharmony_ci	 */
24762306a36Sopenharmony_ci	emit_insn(ctx, alsld, t2, a2, a1, 2);
24862306a36Sopenharmony_ci	off = offsetof(struct bpf_array, ptrs);
24962306a36Sopenharmony_ci	emit_insn(ctx, ldd, t2, t2, off);
25062306a36Sopenharmony_ci	/* beq $t2, $zero, jmp_offset */
25162306a36Sopenharmony_ci	if (emit_tailcall_jmp(ctx, BPF_JEQ, t2, LOONGARCH_GPR_ZERO, jmp_offset) < 0)
25262306a36Sopenharmony_ci		goto toofar;
25362306a36Sopenharmony_ci
25462306a36Sopenharmony_ci	/* goto *(prog->bpf_func + 4); */
25562306a36Sopenharmony_ci	off = offsetof(struct bpf_prog, bpf_func);
25662306a36Sopenharmony_ci	emit_insn(ctx, ldd, t3, t2, off);
25762306a36Sopenharmony_ci	__build_epilogue(ctx, true);
25862306a36Sopenharmony_ci
25962306a36Sopenharmony_ci	/* out: */
26062306a36Sopenharmony_ci	if (out_offset == -1)
26162306a36Sopenharmony_ci		out_offset = cur_offset;
26262306a36Sopenharmony_ci	if (cur_offset != out_offset) {
26362306a36Sopenharmony_ci		pr_err_once("tail_call out_offset = %d, expected %d!\n",
26462306a36Sopenharmony_ci			    cur_offset, out_offset);
26562306a36Sopenharmony_ci		return -1;
26662306a36Sopenharmony_ci	}
26762306a36Sopenharmony_ci
26862306a36Sopenharmony_ci	return 0;
26962306a36Sopenharmony_ci
27062306a36Sopenharmony_citoofar:
27162306a36Sopenharmony_ci	pr_info_once("tail_call: jump too far\n");
27262306a36Sopenharmony_ci	return -1;
27362306a36Sopenharmony_ci#undef cur_offset
27462306a36Sopenharmony_ci#undef jmp_offset
27562306a36Sopenharmony_ci}
27662306a36Sopenharmony_ci
27762306a36Sopenharmony_cistatic void emit_atomic(const struct bpf_insn *insn, struct jit_ctx *ctx)
27862306a36Sopenharmony_ci{
27962306a36Sopenharmony_ci	const u8 t1 = LOONGARCH_GPR_T1;
28062306a36Sopenharmony_ci	const u8 t2 = LOONGARCH_GPR_T2;
28162306a36Sopenharmony_ci	const u8 t3 = LOONGARCH_GPR_T3;
28262306a36Sopenharmony_ci	const u8 r0 = regmap[BPF_REG_0];
28362306a36Sopenharmony_ci	const u8 src = regmap[insn->src_reg];
28462306a36Sopenharmony_ci	const u8 dst = regmap[insn->dst_reg];
28562306a36Sopenharmony_ci	const s16 off = insn->off;
28662306a36Sopenharmony_ci	const s32 imm = insn->imm;
28762306a36Sopenharmony_ci	const bool isdw = BPF_SIZE(insn->code) == BPF_DW;
28862306a36Sopenharmony_ci
28962306a36Sopenharmony_ci	move_imm(ctx, t1, off, false);
29062306a36Sopenharmony_ci	emit_insn(ctx, addd, t1, dst, t1);
29162306a36Sopenharmony_ci	move_reg(ctx, t3, src);
29262306a36Sopenharmony_ci
29362306a36Sopenharmony_ci	switch (imm) {
29462306a36Sopenharmony_ci	/* lock *(size *)(dst + off) <op>= src */
29562306a36Sopenharmony_ci	case BPF_ADD:
29662306a36Sopenharmony_ci		if (isdw)
29762306a36Sopenharmony_ci			emit_insn(ctx, amaddd, t2, t1, src);
29862306a36Sopenharmony_ci		else
29962306a36Sopenharmony_ci			emit_insn(ctx, amaddw, t2, t1, src);
30062306a36Sopenharmony_ci		break;
30162306a36Sopenharmony_ci	case BPF_AND:
30262306a36Sopenharmony_ci		if (isdw)
30362306a36Sopenharmony_ci			emit_insn(ctx, amandd, t2, t1, src);
30462306a36Sopenharmony_ci		else
30562306a36Sopenharmony_ci			emit_insn(ctx, amandw, t2, t1, src);
30662306a36Sopenharmony_ci		break;
30762306a36Sopenharmony_ci	case BPF_OR:
30862306a36Sopenharmony_ci		if (isdw)
30962306a36Sopenharmony_ci			emit_insn(ctx, amord, t2, t1, src);
31062306a36Sopenharmony_ci		else
31162306a36Sopenharmony_ci			emit_insn(ctx, amorw, t2, t1, src);
31262306a36Sopenharmony_ci		break;
31362306a36Sopenharmony_ci	case BPF_XOR:
31462306a36Sopenharmony_ci		if (isdw)
31562306a36Sopenharmony_ci			emit_insn(ctx, amxord, t2, t1, src);
31662306a36Sopenharmony_ci		else
31762306a36Sopenharmony_ci			emit_insn(ctx, amxorw, t2, t1, src);
31862306a36Sopenharmony_ci		break;
31962306a36Sopenharmony_ci	/* src = atomic_fetch_<op>(dst + off, src) */
32062306a36Sopenharmony_ci	case BPF_ADD | BPF_FETCH:
32162306a36Sopenharmony_ci		if (isdw) {
32262306a36Sopenharmony_ci			emit_insn(ctx, amaddd, src, t1, t3);
32362306a36Sopenharmony_ci		} else {
32462306a36Sopenharmony_ci			emit_insn(ctx, amaddw, src, t1, t3);
32562306a36Sopenharmony_ci			emit_zext_32(ctx, src, true);
32662306a36Sopenharmony_ci		}
32762306a36Sopenharmony_ci		break;
32862306a36Sopenharmony_ci	case BPF_AND | BPF_FETCH:
32962306a36Sopenharmony_ci		if (isdw) {
33062306a36Sopenharmony_ci			emit_insn(ctx, amandd, src, t1, t3);
33162306a36Sopenharmony_ci		} else {
33262306a36Sopenharmony_ci			emit_insn(ctx, amandw, src, t1, t3);
33362306a36Sopenharmony_ci			emit_zext_32(ctx, src, true);
33462306a36Sopenharmony_ci		}
33562306a36Sopenharmony_ci		break;
33662306a36Sopenharmony_ci	case BPF_OR | BPF_FETCH:
33762306a36Sopenharmony_ci		if (isdw) {
33862306a36Sopenharmony_ci			emit_insn(ctx, amord, src, t1, t3);
33962306a36Sopenharmony_ci		} else {
34062306a36Sopenharmony_ci			emit_insn(ctx, amorw, src, t1, t3);
34162306a36Sopenharmony_ci			emit_zext_32(ctx, src, true);
34262306a36Sopenharmony_ci		}
34362306a36Sopenharmony_ci		break;
34462306a36Sopenharmony_ci	case BPF_XOR | BPF_FETCH:
34562306a36Sopenharmony_ci		if (isdw) {
34662306a36Sopenharmony_ci			emit_insn(ctx, amxord, src, t1, t3);
34762306a36Sopenharmony_ci		} else {
34862306a36Sopenharmony_ci			emit_insn(ctx, amxorw, src, t1, t3);
34962306a36Sopenharmony_ci			emit_zext_32(ctx, src, true);
35062306a36Sopenharmony_ci		}
35162306a36Sopenharmony_ci		break;
35262306a36Sopenharmony_ci	/* src = atomic_xchg(dst + off, src); */
35362306a36Sopenharmony_ci	case BPF_XCHG:
35462306a36Sopenharmony_ci		if (isdw) {
35562306a36Sopenharmony_ci			emit_insn(ctx, amswapd, src, t1, t3);
35662306a36Sopenharmony_ci		} else {
35762306a36Sopenharmony_ci			emit_insn(ctx, amswapw, src, t1, t3);
35862306a36Sopenharmony_ci			emit_zext_32(ctx, src, true);
35962306a36Sopenharmony_ci		}
36062306a36Sopenharmony_ci		break;
36162306a36Sopenharmony_ci	/* r0 = atomic_cmpxchg(dst + off, r0, src); */
36262306a36Sopenharmony_ci	case BPF_CMPXCHG:
36362306a36Sopenharmony_ci		move_reg(ctx, t2, r0);
36462306a36Sopenharmony_ci		if (isdw) {
36562306a36Sopenharmony_ci			emit_insn(ctx, lld, r0, t1, 0);
36662306a36Sopenharmony_ci			emit_insn(ctx, bne, t2, r0, 4);
36762306a36Sopenharmony_ci			move_reg(ctx, t3, src);
36862306a36Sopenharmony_ci			emit_insn(ctx, scd, t3, t1, 0);
36962306a36Sopenharmony_ci			emit_insn(ctx, beq, t3, LOONGARCH_GPR_ZERO, -4);
37062306a36Sopenharmony_ci		} else {
37162306a36Sopenharmony_ci			emit_insn(ctx, llw, r0, t1, 0);
37262306a36Sopenharmony_ci			emit_zext_32(ctx, t2, true);
37362306a36Sopenharmony_ci			emit_zext_32(ctx, r0, true);
37462306a36Sopenharmony_ci			emit_insn(ctx, bne, t2, r0, 4);
37562306a36Sopenharmony_ci			move_reg(ctx, t3, src);
37662306a36Sopenharmony_ci			emit_insn(ctx, scw, t3, t1, 0);
37762306a36Sopenharmony_ci			emit_insn(ctx, beq, t3, LOONGARCH_GPR_ZERO, -6);
37862306a36Sopenharmony_ci			emit_zext_32(ctx, r0, true);
37962306a36Sopenharmony_ci		}
38062306a36Sopenharmony_ci		break;
38162306a36Sopenharmony_ci	}
38262306a36Sopenharmony_ci}
38362306a36Sopenharmony_ci
38462306a36Sopenharmony_cistatic bool is_signed_bpf_cond(u8 cond)
38562306a36Sopenharmony_ci{
38662306a36Sopenharmony_ci	return cond == BPF_JSGT || cond == BPF_JSLT ||
38762306a36Sopenharmony_ci	       cond == BPF_JSGE || cond == BPF_JSLE;
38862306a36Sopenharmony_ci}
38962306a36Sopenharmony_ci
39062306a36Sopenharmony_ci#define BPF_FIXUP_REG_MASK	GENMASK(31, 27)
39162306a36Sopenharmony_ci#define BPF_FIXUP_OFFSET_MASK	GENMASK(26, 0)
39262306a36Sopenharmony_ci
39362306a36Sopenharmony_cibool ex_handler_bpf(const struct exception_table_entry *ex,
39462306a36Sopenharmony_ci		    struct pt_regs *regs)
39562306a36Sopenharmony_ci{
39662306a36Sopenharmony_ci	int dst_reg = FIELD_GET(BPF_FIXUP_REG_MASK, ex->fixup);
39762306a36Sopenharmony_ci	off_t offset = FIELD_GET(BPF_FIXUP_OFFSET_MASK, ex->fixup);
39862306a36Sopenharmony_ci
39962306a36Sopenharmony_ci	regs->regs[dst_reg] = 0;
40062306a36Sopenharmony_ci	regs->csr_era = (unsigned long)&ex->fixup - offset;
40162306a36Sopenharmony_ci
40262306a36Sopenharmony_ci	return true;
40362306a36Sopenharmony_ci}
40462306a36Sopenharmony_ci
40562306a36Sopenharmony_ci/* For accesses to BTF pointers, add an entry to the exception table */
40662306a36Sopenharmony_cistatic int add_exception_handler(const struct bpf_insn *insn,
40762306a36Sopenharmony_ci				 struct jit_ctx *ctx,
40862306a36Sopenharmony_ci				 int dst_reg)
40962306a36Sopenharmony_ci{
41062306a36Sopenharmony_ci	unsigned long pc;
41162306a36Sopenharmony_ci	off_t offset;
41262306a36Sopenharmony_ci	struct exception_table_entry *ex;
41362306a36Sopenharmony_ci
41462306a36Sopenharmony_ci	if (!ctx->image || !ctx->prog->aux->extable || BPF_MODE(insn->code) != BPF_PROBE_MEM)
41562306a36Sopenharmony_ci		return 0;
41662306a36Sopenharmony_ci
41762306a36Sopenharmony_ci	if (WARN_ON_ONCE(ctx->num_exentries >= ctx->prog->aux->num_exentries))
41862306a36Sopenharmony_ci		return -EINVAL;
41962306a36Sopenharmony_ci
42062306a36Sopenharmony_ci	ex = &ctx->prog->aux->extable[ctx->num_exentries];
42162306a36Sopenharmony_ci	pc = (unsigned long)&ctx->image[ctx->idx - 1];
42262306a36Sopenharmony_ci
42362306a36Sopenharmony_ci	offset = pc - (long)&ex->insn;
42462306a36Sopenharmony_ci	if (WARN_ON_ONCE(offset >= 0 || offset < INT_MIN))
42562306a36Sopenharmony_ci		return -ERANGE;
42662306a36Sopenharmony_ci
42762306a36Sopenharmony_ci	ex->insn = offset;
42862306a36Sopenharmony_ci
42962306a36Sopenharmony_ci	/*
43062306a36Sopenharmony_ci	 * Since the extable follows the program, the fixup offset is always
43162306a36Sopenharmony_ci	 * negative and limited to BPF_JIT_REGION_SIZE. Store a positive value
43262306a36Sopenharmony_ci	 * to keep things simple, and put the destination register in the upper
43362306a36Sopenharmony_ci	 * bits. We don't need to worry about buildtime or runtime sort
43462306a36Sopenharmony_ci	 * modifying the upper bits because the table is already sorted, and
43562306a36Sopenharmony_ci	 * isn't part of the main exception table.
43662306a36Sopenharmony_ci	 */
43762306a36Sopenharmony_ci	offset = (long)&ex->fixup - (pc + LOONGARCH_INSN_SIZE);
43862306a36Sopenharmony_ci	if (!FIELD_FIT(BPF_FIXUP_OFFSET_MASK, offset))
43962306a36Sopenharmony_ci		return -ERANGE;
44062306a36Sopenharmony_ci
44162306a36Sopenharmony_ci	ex->type = EX_TYPE_BPF;
44262306a36Sopenharmony_ci	ex->fixup = FIELD_PREP(BPF_FIXUP_OFFSET_MASK, offset) | FIELD_PREP(BPF_FIXUP_REG_MASK, dst_reg);
44362306a36Sopenharmony_ci
44462306a36Sopenharmony_ci	ctx->num_exentries++;
44562306a36Sopenharmony_ci
44662306a36Sopenharmony_ci	return 0;
44762306a36Sopenharmony_ci}
44862306a36Sopenharmony_ci
44962306a36Sopenharmony_cistatic int build_insn(const struct bpf_insn *insn, struct jit_ctx *ctx, bool extra_pass)
45062306a36Sopenharmony_ci{
45162306a36Sopenharmony_ci	u8 tm = -1;
45262306a36Sopenharmony_ci	u64 func_addr;
45362306a36Sopenharmony_ci	bool func_addr_fixed;
45462306a36Sopenharmony_ci	int i = insn - ctx->prog->insnsi;
45562306a36Sopenharmony_ci	int ret, jmp_offset;
45662306a36Sopenharmony_ci	const u8 code = insn->code;
45762306a36Sopenharmony_ci	const u8 cond = BPF_OP(code);
45862306a36Sopenharmony_ci	const u8 t1 = LOONGARCH_GPR_T1;
45962306a36Sopenharmony_ci	const u8 t2 = LOONGARCH_GPR_T2;
46062306a36Sopenharmony_ci	const u8 src = regmap[insn->src_reg];
46162306a36Sopenharmony_ci	const u8 dst = regmap[insn->dst_reg];
46262306a36Sopenharmony_ci	const s16 off = insn->off;
46362306a36Sopenharmony_ci	const s32 imm = insn->imm;
46462306a36Sopenharmony_ci	const bool is32 = BPF_CLASS(insn->code) == BPF_ALU || BPF_CLASS(insn->code) == BPF_JMP32;
46562306a36Sopenharmony_ci
46662306a36Sopenharmony_ci	switch (code) {
46762306a36Sopenharmony_ci	/* dst = src */
46862306a36Sopenharmony_ci	case BPF_ALU | BPF_MOV | BPF_X:
46962306a36Sopenharmony_ci	case BPF_ALU64 | BPF_MOV | BPF_X:
47062306a36Sopenharmony_ci		move_reg(ctx, dst, src);
47162306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
47262306a36Sopenharmony_ci		break;
47362306a36Sopenharmony_ci
47462306a36Sopenharmony_ci	/* dst = imm */
47562306a36Sopenharmony_ci	case BPF_ALU | BPF_MOV | BPF_K:
47662306a36Sopenharmony_ci	case BPF_ALU64 | BPF_MOV | BPF_K:
47762306a36Sopenharmony_ci		move_imm(ctx, dst, imm, is32);
47862306a36Sopenharmony_ci		break;
47962306a36Sopenharmony_ci
48062306a36Sopenharmony_ci	/* dst = dst + src */
48162306a36Sopenharmony_ci	case BPF_ALU | BPF_ADD | BPF_X:
48262306a36Sopenharmony_ci	case BPF_ALU64 | BPF_ADD | BPF_X:
48362306a36Sopenharmony_ci		emit_insn(ctx, addd, dst, dst, src);
48462306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
48562306a36Sopenharmony_ci		break;
48662306a36Sopenharmony_ci
48762306a36Sopenharmony_ci	/* dst = dst + imm */
48862306a36Sopenharmony_ci	case BPF_ALU | BPF_ADD | BPF_K:
48962306a36Sopenharmony_ci	case BPF_ALU64 | BPF_ADD | BPF_K:
49062306a36Sopenharmony_ci		if (is_signed_imm12(imm)) {
49162306a36Sopenharmony_ci			emit_insn(ctx, addid, dst, dst, imm);
49262306a36Sopenharmony_ci		} else {
49362306a36Sopenharmony_ci			move_imm(ctx, t1, imm, is32);
49462306a36Sopenharmony_ci			emit_insn(ctx, addd, dst, dst, t1);
49562306a36Sopenharmony_ci		}
49662306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
49762306a36Sopenharmony_ci		break;
49862306a36Sopenharmony_ci
49962306a36Sopenharmony_ci	/* dst = dst - src */
50062306a36Sopenharmony_ci	case BPF_ALU | BPF_SUB | BPF_X:
50162306a36Sopenharmony_ci	case BPF_ALU64 | BPF_SUB | BPF_X:
50262306a36Sopenharmony_ci		emit_insn(ctx, subd, dst, dst, src);
50362306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
50462306a36Sopenharmony_ci		break;
50562306a36Sopenharmony_ci
50662306a36Sopenharmony_ci	/* dst = dst - imm */
50762306a36Sopenharmony_ci	case BPF_ALU | BPF_SUB | BPF_K:
50862306a36Sopenharmony_ci	case BPF_ALU64 | BPF_SUB | BPF_K:
50962306a36Sopenharmony_ci		if (is_signed_imm12(-imm)) {
51062306a36Sopenharmony_ci			emit_insn(ctx, addid, dst, dst, -imm);
51162306a36Sopenharmony_ci		} else {
51262306a36Sopenharmony_ci			move_imm(ctx, t1, imm, is32);
51362306a36Sopenharmony_ci			emit_insn(ctx, subd, dst, dst, t1);
51462306a36Sopenharmony_ci		}
51562306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
51662306a36Sopenharmony_ci		break;
51762306a36Sopenharmony_ci
51862306a36Sopenharmony_ci	/* dst = dst * src */
51962306a36Sopenharmony_ci	case BPF_ALU | BPF_MUL | BPF_X:
52062306a36Sopenharmony_ci	case BPF_ALU64 | BPF_MUL | BPF_X:
52162306a36Sopenharmony_ci		emit_insn(ctx, muld, dst, dst, src);
52262306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
52362306a36Sopenharmony_ci		break;
52462306a36Sopenharmony_ci
52562306a36Sopenharmony_ci	/* dst = dst * imm */
52662306a36Sopenharmony_ci	case BPF_ALU | BPF_MUL | BPF_K:
52762306a36Sopenharmony_ci	case BPF_ALU64 | BPF_MUL | BPF_K:
52862306a36Sopenharmony_ci		move_imm(ctx, t1, imm, is32);
52962306a36Sopenharmony_ci		emit_insn(ctx, muld, dst, dst, t1);
53062306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
53162306a36Sopenharmony_ci		break;
53262306a36Sopenharmony_ci
53362306a36Sopenharmony_ci	/* dst = dst / src */
53462306a36Sopenharmony_ci	case BPF_ALU | BPF_DIV | BPF_X:
53562306a36Sopenharmony_ci	case BPF_ALU64 | BPF_DIV | BPF_X:
53662306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
53762306a36Sopenharmony_ci		move_reg(ctx, t1, src);
53862306a36Sopenharmony_ci		emit_zext_32(ctx, t1, is32);
53962306a36Sopenharmony_ci		emit_insn(ctx, divdu, dst, dst, t1);
54062306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
54162306a36Sopenharmony_ci		break;
54262306a36Sopenharmony_ci
54362306a36Sopenharmony_ci	/* dst = dst / imm */
54462306a36Sopenharmony_ci	case BPF_ALU | BPF_DIV | BPF_K:
54562306a36Sopenharmony_ci	case BPF_ALU64 | BPF_DIV | BPF_K:
54662306a36Sopenharmony_ci		move_imm(ctx, t1, imm, is32);
54762306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
54862306a36Sopenharmony_ci		emit_insn(ctx, divdu, dst, dst, t1);
54962306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
55062306a36Sopenharmony_ci		break;
55162306a36Sopenharmony_ci
55262306a36Sopenharmony_ci	/* dst = dst % src */
55362306a36Sopenharmony_ci	case BPF_ALU | BPF_MOD | BPF_X:
55462306a36Sopenharmony_ci	case BPF_ALU64 | BPF_MOD | BPF_X:
55562306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
55662306a36Sopenharmony_ci		move_reg(ctx, t1, src);
55762306a36Sopenharmony_ci		emit_zext_32(ctx, t1, is32);
55862306a36Sopenharmony_ci		emit_insn(ctx, moddu, dst, dst, t1);
55962306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
56062306a36Sopenharmony_ci		break;
56162306a36Sopenharmony_ci
56262306a36Sopenharmony_ci	/* dst = dst % imm */
56362306a36Sopenharmony_ci	case BPF_ALU | BPF_MOD | BPF_K:
56462306a36Sopenharmony_ci	case BPF_ALU64 | BPF_MOD | BPF_K:
56562306a36Sopenharmony_ci		move_imm(ctx, t1, imm, is32);
56662306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
56762306a36Sopenharmony_ci		emit_insn(ctx, moddu, dst, dst, t1);
56862306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
56962306a36Sopenharmony_ci		break;
57062306a36Sopenharmony_ci
57162306a36Sopenharmony_ci	/* dst = -dst */
57262306a36Sopenharmony_ci	case BPF_ALU | BPF_NEG:
57362306a36Sopenharmony_ci	case BPF_ALU64 | BPF_NEG:
57462306a36Sopenharmony_ci		move_imm(ctx, t1, imm, is32);
57562306a36Sopenharmony_ci		emit_insn(ctx, subd, dst, LOONGARCH_GPR_ZERO, dst);
57662306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
57762306a36Sopenharmony_ci		break;
57862306a36Sopenharmony_ci
57962306a36Sopenharmony_ci	/* dst = dst & src */
58062306a36Sopenharmony_ci	case BPF_ALU | BPF_AND | BPF_X:
58162306a36Sopenharmony_ci	case BPF_ALU64 | BPF_AND | BPF_X:
58262306a36Sopenharmony_ci		emit_insn(ctx, and, dst, dst, src);
58362306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
58462306a36Sopenharmony_ci		break;
58562306a36Sopenharmony_ci
58662306a36Sopenharmony_ci	/* dst = dst & imm */
58762306a36Sopenharmony_ci	case BPF_ALU | BPF_AND | BPF_K:
58862306a36Sopenharmony_ci	case BPF_ALU64 | BPF_AND | BPF_K:
58962306a36Sopenharmony_ci		if (is_unsigned_imm12(imm)) {
59062306a36Sopenharmony_ci			emit_insn(ctx, andi, dst, dst, imm);
59162306a36Sopenharmony_ci		} else {
59262306a36Sopenharmony_ci			move_imm(ctx, t1, imm, is32);
59362306a36Sopenharmony_ci			emit_insn(ctx, and, dst, dst, t1);
59462306a36Sopenharmony_ci		}
59562306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
59662306a36Sopenharmony_ci		break;
59762306a36Sopenharmony_ci
59862306a36Sopenharmony_ci	/* dst = dst | src */
59962306a36Sopenharmony_ci	case BPF_ALU | BPF_OR | BPF_X:
60062306a36Sopenharmony_ci	case BPF_ALU64 | BPF_OR | BPF_X:
60162306a36Sopenharmony_ci		emit_insn(ctx, or, dst, dst, src);
60262306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
60362306a36Sopenharmony_ci		break;
60462306a36Sopenharmony_ci
60562306a36Sopenharmony_ci	/* dst = dst | imm */
60662306a36Sopenharmony_ci	case BPF_ALU | BPF_OR | BPF_K:
60762306a36Sopenharmony_ci	case BPF_ALU64 | BPF_OR | BPF_K:
60862306a36Sopenharmony_ci		if (is_unsigned_imm12(imm)) {
60962306a36Sopenharmony_ci			emit_insn(ctx, ori, dst, dst, imm);
61062306a36Sopenharmony_ci		} else {
61162306a36Sopenharmony_ci			move_imm(ctx, t1, imm, is32);
61262306a36Sopenharmony_ci			emit_insn(ctx, or, dst, dst, t1);
61362306a36Sopenharmony_ci		}
61462306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
61562306a36Sopenharmony_ci		break;
61662306a36Sopenharmony_ci
61762306a36Sopenharmony_ci	/* dst = dst ^ src */
61862306a36Sopenharmony_ci	case BPF_ALU | BPF_XOR | BPF_X:
61962306a36Sopenharmony_ci	case BPF_ALU64 | BPF_XOR | BPF_X:
62062306a36Sopenharmony_ci		emit_insn(ctx, xor, dst, dst, src);
62162306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
62262306a36Sopenharmony_ci		break;
62362306a36Sopenharmony_ci
62462306a36Sopenharmony_ci	/* dst = dst ^ imm */
62562306a36Sopenharmony_ci	case BPF_ALU | BPF_XOR | BPF_K:
62662306a36Sopenharmony_ci	case BPF_ALU64 | BPF_XOR | BPF_K:
62762306a36Sopenharmony_ci		if (is_unsigned_imm12(imm)) {
62862306a36Sopenharmony_ci			emit_insn(ctx, xori, dst, dst, imm);
62962306a36Sopenharmony_ci		} else {
63062306a36Sopenharmony_ci			move_imm(ctx, t1, imm, is32);
63162306a36Sopenharmony_ci			emit_insn(ctx, xor, dst, dst, t1);
63262306a36Sopenharmony_ci		}
63362306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
63462306a36Sopenharmony_ci		break;
63562306a36Sopenharmony_ci
63662306a36Sopenharmony_ci	/* dst = dst << src (logical) */
63762306a36Sopenharmony_ci	case BPF_ALU | BPF_LSH | BPF_X:
63862306a36Sopenharmony_ci		emit_insn(ctx, sllw, dst, dst, src);
63962306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
64062306a36Sopenharmony_ci		break;
64162306a36Sopenharmony_ci
64262306a36Sopenharmony_ci	case BPF_ALU64 | BPF_LSH | BPF_X:
64362306a36Sopenharmony_ci		emit_insn(ctx, slld, dst, dst, src);
64462306a36Sopenharmony_ci		break;
64562306a36Sopenharmony_ci
64662306a36Sopenharmony_ci	/* dst = dst << imm (logical) */
64762306a36Sopenharmony_ci	case BPF_ALU | BPF_LSH | BPF_K:
64862306a36Sopenharmony_ci		emit_insn(ctx, slliw, dst, dst, imm);
64962306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
65062306a36Sopenharmony_ci		break;
65162306a36Sopenharmony_ci
65262306a36Sopenharmony_ci	case BPF_ALU64 | BPF_LSH | BPF_K:
65362306a36Sopenharmony_ci		emit_insn(ctx, sllid, dst, dst, imm);
65462306a36Sopenharmony_ci		break;
65562306a36Sopenharmony_ci
65662306a36Sopenharmony_ci	/* dst = dst >> src (logical) */
65762306a36Sopenharmony_ci	case BPF_ALU | BPF_RSH | BPF_X:
65862306a36Sopenharmony_ci		emit_insn(ctx, srlw, dst, dst, src);
65962306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
66062306a36Sopenharmony_ci		break;
66162306a36Sopenharmony_ci
66262306a36Sopenharmony_ci	case BPF_ALU64 | BPF_RSH | BPF_X:
66362306a36Sopenharmony_ci		emit_insn(ctx, srld, dst, dst, src);
66462306a36Sopenharmony_ci		break;
66562306a36Sopenharmony_ci
66662306a36Sopenharmony_ci	/* dst = dst >> imm (logical) */
66762306a36Sopenharmony_ci	case BPF_ALU | BPF_RSH | BPF_K:
66862306a36Sopenharmony_ci		emit_insn(ctx, srliw, dst, dst, imm);
66962306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
67062306a36Sopenharmony_ci		break;
67162306a36Sopenharmony_ci
67262306a36Sopenharmony_ci	case BPF_ALU64 | BPF_RSH | BPF_K:
67362306a36Sopenharmony_ci		emit_insn(ctx, srlid, dst, dst, imm);
67462306a36Sopenharmony_ci		break;
67562306a36Sopenharmony_ci
67662306a36Sopenharmony_ci	/* dst = dst >> src (arithmetic) */
67762306a36Sopenharmony_ci	case BPF_ALU | BPF_ARSH | BPF_X:
67862306a36Sopenharmony_ci		emit_insn(ctx, sraw, dst, dst, src);
67962306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
68062306a36Sopenharmony_ci		break;
68162306a36Sopenharmony_ci
68262306a36Sopenharmony_ci	case BPF_ALU64 | BPF_ARSH | BPF_X:
68362306a36Sopenharmony_ci		emit_insn(ctx, srad, dst, dst, src);
68462306a36Sopenharmony_ci		break;
68562306a36Sopenharmony_ci
68662306a36Sopenharmony_ci	/* dst = dst >> imm (arithmetic) */
68762306a36Sopenharmony_ci	case BPF_ALU | BPF_ARSH | BPF_K:
68862306a36Sopenharmony_ci		emit_insn(ctx, sraiw, dst, dst, imm);
68962306a36Sopenharmony_ci		emit_zext_32(ctx, dst, is32);
69062306a36Sopenharmony_ci		break;
69162306a36Sopenharmony_ci
69262306a36Sopenharmony_ci	case BPF_ALU64 | BPF_ARSH | BPF_K:
69362306a36Sopenharmony_ci		emit_insn(ctx, sraid, dst, dst, imm);
69462306a36Sopenharmony_ci		break;
69562306a36Sopenharmony_ci
69662306a36Sopenharmony_ci	/* dst = BSWAP##imm(dst) */
69762306a36Sopenharmony_ci	case BPF_ALU | BPF_END | BPF_FROM_LE:
69862306a36Sopenharmony_ci		switch (imm) {
69962306a36Sopenharmony_ci		case 16:
70062306a36Sopenharmony_ci			/* zero-extend 16 bits into 64 bits */
70162306a36Sopenharmony_ci			emit_insn(ctx, bstrpickd, dst, dst, 15, 0);
70262306a36Sopenharmony_ci			break;
70362306a36Sopenharmony_ci		case 32:
70462306a36Sopenharmony_ci			/* zero-extend 32 bits into 64 bits */
70562306a36Sopenharmony_ci			emit_zext_32(ctx, dst, is32);
70662306a36Sopenharmony_ci			break;
70762306a36Sopenharmony_ci		case 64:
70862306a36Sopenharmony_ci			/* do nothing */
70962306a36Sopenharmony_ci			break;
71062306a36Sopenharmony_ci		}
71162306a36Sopenharmony_ci		break;
71262306a36Sopenharmony_ci
71362306a36Sopenharmony_ci	case BPF_ALU | BPF_END | BPF_FROM_BE:
71462306a36Sopenharmony_ci		switch (imm) {
71562306a36Sopenharmony_ci		case 16:
71662306a36Sopenharmony_ci			emit_insn(ctx, revb2h, dst, dst);
71762306a36Sopenharmony_ci			/* zero-extend 16 bits into 64 bits */
71862306a36Sopenharmony_ci			emit_insn(ctx, bstrpickd, dst, dst, 15, 0);
71962306a36Sopenharmony_ci			break;
72062306a36Sopenharmony_ci		case 32:
72162306a36Sopenharmony_ci			emit_insn(ctx, revb2w, dst, dst);
72262306a36Sopenharmony_ci			/* zero-extend 32 bits into 64 bits */
72362306a36Sopenharmony_ci			emit_zext_32(ctx, dst, is32);
72462306a36Sopenharmony_ci			break;
72562306a36Sopenharmony_ci		case 64:
72662306a36Sopenharmony_ci			emit_insn(ctx, revbd, dst, dst);
72762306a36Sopenharmony_ci			break;
72862306a36Sopenharmony_ci		}
72962306a36Sopenharmony_ci		break;
73062306a36Sopenharmony_ci
73162306a36Sopenharmony_ci	/* PC += off if dst cond src */
73262306a36Sopenharmony_ci	case BPF_JMP | BPF_JEQ | BPF_X:
73362306a36Sopenharmony_ci	case BPF_JMP | BPF_JNE | BPF_X:
73462306a36Sopenharmony_ci	case BPF_JMP | BPF_JGT | BPF_X:
73562306a36Sopenharmony_ci	case BPF_JMP | BPF_JGE | BPF_X:
73662306a36Sopenharmony_ci	case BPF_JMP | BPF_JLT | BPF_X:
73762306a36Sopenharmony_ci	case BPF_JMP | BPF_JLE | BPF_X:
73862306a36Sopenharmony_ci	case BPF_JMP | BPF_JSGT | BPF_X:
73962306a36Sopenharmony_ci	case BPF_JMP | BPF_JSGE | BPF_X:
74062306a36Sopenharmony_ci	case BPF_JMP | BPF_JSLT | BPF_X:
74162306a36Sopenharmony_ci	case BPF_JMP | BPF_JSLE | BPF_X:
74262306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JEQ | BPF_X:
74362306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JNE | BPF_X:
74462306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JGT | BPF_X:
74562306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JGE | BPF_X:
74662306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JLT | BPF_X:
74762306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JLE | BPF_X:
74862306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JSGT | BPF_X:
74962306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JSGE | BPF_X:
75062306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JSLT | BPF_X:
75162306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JSLE | BPF_X:
75262306a36Sopenharmony_ci		jmp_offset = bpf2la_offset(i, off, ctx);
75362306a36Sopenharmony_ci		move_reg(ctx, t1, dst);
75462306a36Sopenharmony_ci		move_reg(ctx, t2, src);
75562306a36Sopenharmony_ci		if (is_signed_bpf_cond(BPF_OP(code))) {
75662306a36Sopenharmony_ci			emit_sext_32(ctx, t1, is32);
75762306a36Sopenharmony_ci			emit_sext_32(ctx, t2, is32);
75862306a36Sopenharmony_ci		} else {
75962306a36Sopenharmony_ci			emit_zext_32(ctx, t1, is32);
76062306a36Sopenharmony_ci			emit_zext_32(ctx, t2, is32);
76162306a36Sopenharmony_ci		}
76262306a36Sopenharmony_ci		if (emit_cond_jmp(ctx, cond, t1, t2, jmp_offset) < 0)
76362306a36Sopenharmony_ci			goto toofar;
76462306a36Sopenharmony_ci		break;
76562306a36Sopenharmony_ci
76662306a36Sopenharmony_ci	/* PC += off if dst cond imm */
76762306a36Sopenharmony_ci	case BPF_JMP | BPF_JEQ | BPF_K:
76862306a36Sopenharmony_ci	case BPF_JMP | BPF_JNE | BPF_K:
76962306a36Sopenharmony_ci	case BPF_JMP | BPF_JGT | BPF_K:
77062306a36Sopenharmony_ci	case BPF_JMP | BPF_JGE | BPF_K:
77162306a36Sopenharmony_ci	case BPF_JMP | BPF_JLT | BPF_K:
77262306a36Sopenharmony_ci	case BPF_JMP | BPF_JLE | BPF_K:
77362306a36Sopenharmony_ci	case BPF_JMP | BPF_JSGT | BPF_K:
77462306a36Sopenharmony_ci	case BPF_JMP | BPF_JSGE | BPF_K:
77562306a36Sopenharmony_ci	case BPF_JMP | BPF_JSLT | BPF_K:
77662306a36Sopenharmony_ci	case BPF_JMP | BPF_JSLE | BPF_K:
77762306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JEQ | BPF_K:
77862306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JNE | BPF_K:
77962306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JGT | BPF_K:
78062306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JGE | BPF_K:
78162306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JLT | BPF_K:
78262306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JLE | BPF_K:
78362306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JSGT | BPF_K:
78462306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JSGE | BPF_K:
78562306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JSLT | BPF_K:
78662306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JSLE | BPF_K:
78762306a36Sopenharmony_ci		jmp_offset = bpf2la_offset(i, off, ctx);
78862306a36Sopenharmony_ci		if (imm) {
78962306a36Sopenharmony_ci			move_imm(ctx, t1, imm, false);
79062306a36Sopenharmony_ci			tm = t1;
79162306a36Sopenharmony_ci		} else {
79262306a36Sopenharmony_ci			/* If imm is 0, simply use zero register. */
79362306a36Sopenharmony_ci			tm = LOONGARCH_GPR_ZERO;
79462306a36Sopenharmony_ci		}
79562306a36Sopenharmony_ci		move_reg(ctx, t2, dst);
79662306a36Sopenharmony_ci		if (is_signed_bpf_cond(BPF_OP(code))) {
79762306a36Sopenharmony_ci			emit_sext_32(ctx, tm, is32);
79862306a36Sopenharmony_ci			emit_sext_32(ctx, t2, is32);
79962306a36Sopenharmony_ci		} else {
80062306a36Sopenharmony_ci			emit_zext_32(ctx, tm, is32);
80162306a36Sopenharmony_ci			emit_zext_32(ctx, t2, is32);
80262306a36Sopenharmony_ci		}
80362306a36Sopenharmony_ci		if (emit_cond_jmp(ctx, cond, t2, tm, jmp_offset) < 0)
80462306a36Sopenharmony_ci			goto toofar;
80562306a36Sopenharmony_ci		break;
80662306a36Sopenharmony_ci
80762306a36Sopenharmony_ci	/* PC += off if dst & src */
80862306a36Sopenharmony_ci	case BPF_JMP | BPF_JSET | BPF_X:
80962306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JSET | BPF_X:
81062306a36Sopenharmony_ci		jmp_offset = bpf2la_offset(i, off, ctx);
81162306a36Sopenharmony_ci		emit_insn(ctx, and, t1, dst, src);
81262306a36Sopenharmony_ci		emit_zext_32(ctx, t1, is32);
81362306a36Sopenharmony_ci		if (emit_cond_jmp(ctx, cond, t1, LOONGARCH_GPR_ZERO, jmp_offset) < 0)
81462306a36Sopenharmony_ci			goto toofar;
81562306a36Sopenharmony_ci		break;
81662306a36Sopenharmony_ci
81762306a36Sopenharmony_ci	/* PC += off if dst & imm */
81862306a36Sopenharmony_ci	case BPF_JMP | BPF_JSET | BPF_K:
81962306a36Sopenharmony_ci	case BPF_JMP32 | BPF_JSET | BPF_K:
82062306a36Sopenharmony_ci		jmp_offset = bpf2la_offset(i, off, ctx);
82162306a36Sopenharmony_ci		move_imm(ctx, t1, imm, is32);
82262306a36Sopenharmony_ci		emit_insn(ctx, and, t1, dst, t1);
82362306a36Sopenharmony_ci		emit_zext_32(ctx, t1, is32);
82462306a36Sopenharmony_ci		if (emit_cond_jmp(ctx, cond, t1, LOONGARCH_GPR_ZERO, jmp_offset) < 0)
82562306a36Sopenharmony_ci			goto toofar;
82662306a36Sopenharmony_ci		break;
82762306a36Sopenharmony_ci
82862306a36Sopenharmony_ci	/* PC += off */
82962306a36Sopenharmony_ci	case BPF_JMP | BPF_JA:
83062306a36Sopenharmony_ci		jmp_offset = bpf2la_offset(i, off, ctx);
83162306a36Sopenharmony_ci		if (emit_uncond_jmp(ctx, jmp_offset) < 0)
83262306a36Sopenharmony_ci			goto toofar;
83362306a36Sopenharmony_ci		break;
83462306a36Sopenharmony_ci
83562306a36Sopenharmony_ci	/* function call */
83662306a36Sopenharmony_ci	case BPF_JMP | BPF_CALL:
83762306a36Sopenharmony_ci		mark_call(ctx);
83862306a36Sopenharmony_ci		ret = bpf_jit_get_func_addr(ctx->prog, insn, extra_pass,
83962306a36Sopenharmony_ci					    &func_addr, &func_addr_fixed);
84062306a36Sopenharmony_ci		if (ret < 0)
84162306a36Sopenharmony_ci			return ret;
84262306a36Sopenharmony_ci
84362306a36Sopenharmony_ci		move_addr(ctx, t1, func_addr);
84462306a36Sopenharmony_ci		emit_insn(ctx, jirl, t1, LOONGARCH_GPR_RA, 0);
84562306a36Sopenharmony_ci		move_reg(ctx, regmap[BPF_REG_0], LOONGARCH_GPR_A0);
84662306a36Sopenharmony_ci		break;
84762306a36Sopenharmony_ci
84862306a36Sopenharmony_ci	/* tail call */
84962306a36Sopenharmony_ci	case BPF_JMP | BPF_TAIL_CALL:
85062306a36Sopenharmony_ci		mark_tail_call(ctx);
85162306a36Sopenharmony_ci		if (emit_bpf_tail_call(ctx) < 0)
85262306a36Sopenharmony_ci			return -EINVAL;
85362306a36Sopenharmony_ci		break;
85462306a36Sopenharmony_ci
85562306a36Sopenharmony_ci	/* function return */
85662306a36Sopenharmony_ci	case BPF_JMP | BPF_EXIT:
85762306a36Sopenharmony_ci		if (i == ctx->prog->len - 1)
85862306a36Sopenharmony_ci			break;
85962306a36Sopenharmony_ci
86062306a36Sopenharmony_ci		jmp_offset = epilogue_offset(ctx);
86162306a36Sopenharmony_ci		if (emit_uncond_jmp(ctx, jmp_offset) < 0)
86262306a36Sopenharmony_ci			goto toofar;
86362306a36Sopenharmony_ci		break;
86462306a36Sopenharmony_ci
86562306a36Sopenharmony_ci	/* dst = imm64 */
86662306a36Sopenharmony_ci	case BPF_LD | BPF_IMM | BPF_DW:
86762306a36Sopenharmony_ci	{
86862306a36Sopenharmony_ci		const u64 imm64 = (u64)(insn + 1)->imm << 32 | (u32)insn->imm;
86962306a36Sopenharmony_ci
87062306a36Sopenharmony_ci		move_imm(ctx, dst, imm64, is32);
87162306a36Sopenharmony_ci		return 1;
87262306a36Sopenharmony_ci	}
87362306a36Sopenharmony_ci
87462306a36Sopenharmony_ci	/* dst = *(size *)(src + off) */
87562306a36Sopenharmony_ci	case BPF_LDX | BPF_MEM | BPF_B:
87662306a36Sopenharmony_ci	case BPF_LDX | BPF_MEM | BPF_H:
87762306a36Sopenharmony_ci	case BPF_LDX | BPF_MEM | BPF_W:
87862306a36Sopenharmony_ci	case BPF_LDX | BPF_MEM | BPF_DW:
87962306a36Sopenharmony_ci	case BPF_LDX | BPF_PROBE_MEM | BPF_DW:
88062306a36Sopenharmony_ci	case BPF_LDX | BPF_PROBE_MEM | BPF_W:
88162306a36Sopenharmony_ci	case BPF_LDX | BPF_PROBE_MEM | BPF_H:
88262306a36Sopenharmony_ci	case BPF_LDX | BPF_PROBE_MEM | BPF_B:
88362306a36Sopenharmony_ci		switch (BPF_SIZE(code)) {
88462306a36Sopenharmony_ci		case BPF_B:
88562306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
88662306a36Sopenharmony_ci				emit_insn(ctx, ldbu, dst, src, off);
88762306a36Sopenharmony_ci			} else {
88862306a36Sopenharmony_ci				move_imm(ctx, t1, off, is32);
88962306a36Sopenharmony_ci				emit_insn(ctx, ldxbu, dst, src, t1);
89062306a36Sopenharmony_ci			}
89162306a36Sopenharmony_ci			break;
89262306a36Sopenharmony_ci		case BPF_H:
89362306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
89462306a36Sopenharmony_ci				emit_insn(ctx, ldhu, dst, src, off);
89562306a36Sopenharmony_ci			} else {
89662306a36Sopenharmony_ci				move_imm(ctx, t1, off, is32);
89762306a36Sopenharmony_ci				emit_insn(ctx, ldxhu, dst, src, t1);
89862306a36Sopenharmony_ci			}
89962306a36Sopenharmony_ci			break;
90062306a36Sopenharmony_ci		case BPF_W:
90162306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
90262306a36Sopenharmony_ci				emit_insn(ctx, ldwu, dst, src, off);
90362306a36Sopenharmony_ci			} else if (is_signed_imm14(off)) {
90462306a36Sopenharmony_ci				emit_insn(ctx, ldptrw, dst, src, off);
90562306a36Sopenharmony_ci			} else {
90662306a36Sopenharmony_ci				move_imm(ctx, t1, off, is32);
90762306a36Sopenharmony_ci				emit_insn(ctx, ldxwu, dst, src, t1);
90862306a36Sopenharmony_ci			}
90962306a36Sopenharmony_ci			break;
91062306a36Sopenharmony_ci		case BPF_DW:
91162306a36Sopenharmony_ci			move_imm(ctx, t1, off, is32);
91262306a36Sopenharmony_ci			emit_insn(ctx, ldxd, dst, src, t1);
91362306a36Sopenharmony_ci			break;
91462306a36Sopenharmony_ci		}
91562306a36Sopenharmony_ci
91662306a36Sopenharmony_ci		ret = add_exception_handler(insn, ctx, dst);
91762306a36Sopenharmony_ci		if (ret)
91862306a36Sopenharmony_ci			return ret;
91962306a36Sopenharmony_ci		break;
92062306a36Sopenharmony_ci
92162306a36Sopenharmony_ci	/* *(size *)(dst + off) = imm */
92262306a36Sopenharmony_ci	case BPF_ST | BPF_MEM | BPF_B:
92362306a36Sopenharmony_ci	case BPF_ST | BPF_MEM | BPF_H:
92462306a36Sopenharmony_ci	case BPF_ST | BPF_MEM | BPF_W:
92562306a36Sopenharmony_ci	case BPF_ST | BPF_MEM | BPF_DW:
92662306a36Sopenharmony_ci		switch (BPF_SIZE(code)) {
92762306a36Sopenharmony_ci		case BPF_B:
92862306a36Sopenharmony_ci			move_imm(ctx, t1, imm, is32);
92962306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
93062306a36Sopenharmony_ci				emit_insn(ctx, stb, t1, dst, off);
93162306a36Sopenharmony_ci			} else {
93262306a36Sopenharmony_ci				move_imm(ctx, t2, off, is32);
93362306a36Sopenharmony_ci				emit_insn(ctx, stxb, t1, dst, t2);
93462306a36Sopenharmony_ci			}
93562306a36Sopenharmony_ci			break;
93662306a36Sopenharmony_ci		case BPF_H:
93762306a36Sopenharmony_ci			move_imm(ctx, t1, imm, is32);
93862306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
93962306a36Sopenharmony_ci				emit_insn(ctx, sth, t1, dst, off);
94062306a36Sopenharmony_ci			} else {
94162306a36Sopenharmony_ci				move_imm(ctx, t2, off, is32);
94262306a36Sopenharmony_ci				emit_insn(ctx, stxh, t1, dst, t2);
94362306a36Sopenharmony_ci			}
94462306a36Sopenharmony_ci			break;
94562306a36Sopenharmony_ci		case BPF_W:
94662306a36Sopenharmony_ci			move_imm(ctx, t1, imm, is32);
94762306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
94862306a36Sopenharmony_ci				emit_insn(ctx, stw, t1, dst, off);
94962306a36Sopenharmony_ci			} else if (is_signed_imm14(off)) {
95062306a36Sopenharmony_ci				emit_insn(ctx, stptrw, t1, dst, off);
95162306a36Sopenharmony_ci			} else {
95262306a36Sopenharmony_ci				move_imm(ctx, t2, off, is32);
95362306a36Sopenharmony_ci				emit_insn(ctx, stxw, t1, dst, t2);
95462306a36Sopenharmony_ci			}
95562306a36Sopenharmony_ci			break;
95662306a36Sopenharmony_ci		case BPF_DW:
95762306a36Sopenharmony_ci			move_imm(ctx, t1, imm, is32);
95862306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
95962306a36Sopenharmony_ci				emit_insn(ctx, std, t1, dst, off);
96062306a36Sopenharmony_ci			} else if (is_signed_imm14(off)) {
96162306a36Sopenharmony_ci				emit_insn(ctx, stptrd, t1, dst, off);
96262306a36Sopenharmony_ci			} else {
96362306a36Sopenharmony_ci				move_imm(ctx, t2, off, is32);
96462306a36Sopenharmony_ci				emit_insn(ctx, stxd, t1, dst, t2);
96562306a36Sopenharmony_ci			}
96662306a36Sopenharmony_ci			break;
96762306a36Sopenharmony_ci		}
96862306a36Sopenharmony_ci		break;
96962306a36Sopenharmony_ci
97062306a36Sopenharmony_ci	/* *(size *)(dst + off) = src */
97162306a36Sopenharmony_ci	case BPF_STX | BPF_MEM | BPF_B:
97262306a36Sopenharmony_ci	case BPF_STX | BPF_MEM | BPF_H:
97362306a36Sopenharmony_ci	case BPF_STX | BPF_MEM | BPF_W:
97462306a36Sopenharmony_ci	case BPF_STX | BPF_MEM | BPF_DW:
97562306a36Sopenharmony_ci		switch (BPF_SIZE(code)) {
97662306a36Sopenharmony_ci		case BPF_B:
97762306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
97862306a36Sopenharmony_ci				emit_insn(ctx, stb, src, dst, off);
97962306a36Sopenharmony_ci			} else {
98062306a36Sopenharmony_ci				move_imm(ctx, t1, off, is32);
98162306a36Sopenharmony_ci				emit_insn(ctx, stxb, src, dst, t1);
98262306a36Sopenharmony_ci			}
98362306a36Sopenharmony_ci			break;
98462306a36Sopenharmony_ci		case BPF_H:
98562306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
98662306a36Sopenharmony_ci				emit_insn(ctx, sth, src, dst, off);
98762306a36Sopenharmony_ci			} else {
98862306a36Sopenharmony_ci				move_imm(ctx, t1, off, is32);
98962306a36Sopenharmony_ci				emit_insn(ctx, stxh, src, dst, t1);
99062306a36Sopenharmony_ci			}
99162306a36Sopenharmony_ci			break;
99262306a36Sopenharmony_ci		case BPF_W:
99362306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
99462306a36Sopenharmony_ci				emit_insn(ctx, stw, src, dst, off);
99562306a36Sopenharmony_ci			} else if (is_signed_imm14(off)) {
99662306a36Sopenharmony_ci				emit_insn(ctx, stptrw, src, dst, off);
99762306a36Sopenharmony_ci			} else {
99862306a36Sopenharmony_ci				move_imm(ctx, t1, off, is32);
99962306a36Sopenharmony_ci				emit_insn(ctx, stxw, src, dst, t1);
100062306a36Sopenharmony_ci			}
100162306a36Sopenharmony_ci			break;
100262306a36Sopenharmony_ci		case BPF_DW:
100362306a36Sopenharmony_ci			if (is_signed_imm12(off)) {
100462306a36Sopenharmony_ci				emit_insn(ctx, std, src, dst, off);
100562306a36Sopenharmony_ci			} else if (is_signed_imm14(off)) {
100662306a36Sopenharmony_ci				emit_insn(ctx, stptrd, src, dst, off);
100762306a36Sopenharmony_ci			} else {
100862306a36Sopenharmony_ci				move_imm(ctx, t1, off, is32);
100962306a36Sopenharmony_ci				emit_insn(ctx, stxd, src, dst, t1);
101062306a36Sopenharmony_ci			}
101162306a36Sopenharmony_ci			break;
101262306a36Sopenharmony_ci		}
101362306a36Sopenharmony_ci		break;
101462306a36Sopenharmony_ci
101562306a36Sopenharmony_ci	case BPF_STX | BPF_ATOMIC | BPF_W:
101662306a36Sopenharmony_ci	case BPF_STX | BPF_ATOMIC | BPF_DW:
101762306a36Sopenharmony_ci		emit_atomic(insn, ctx);
101862306a36Sopenharmony_ci		break;
101962306a36Sopenharmony_ci
102062306a36Sopenharmony_ci	/* Speculation barrier */
102162306a36Sopenharmony_ci	case BPF_ST | BPF_NOSPEC:
102262306a36Sopenharmony_ci		break;
102362306a36Sopenharmony_ci
102462306a36Sopenharmony_ci	default:
102562306a36Sopenharmony_ci		pr_err("bpf_jit: unknown opcode %02x\n", code);
102662306a36Sopenharmony_ci		return -EINVAL;
102762306a36Sopenharmony_ci	}
102862306a36Sopenharmony_ci
102962306a36Sopenharmony_ci	return 0;
103062306a36Sopenharmony_ci
103162306a36Sopenharmony_citoofar:
103262306a36Sopenharmony_ci	pr_info_once("bpf_jit: opcode %02x, jump too far\n", code);
103362306a36Sopenharmony_ci	return -E2BIG;
103462306a36Sopenharmony_ci}
103562306a36Sopenharmony_ci
103662306a36Sopenharmony_cistatic int build_body(struct jit_ctx *ctx, bool extra_pass)
103762306a36Sopenharmony_ci{
103862306a36Sopenharmony_ci	int i;
103962306a36Sopenharmony_ci	const struct bpf_prog *prog = ctx->prog;
104062306a36Sopenharmony_ci
104162306a36Sopenharmony_ci	for (i = 0; i < prog->len; i++) {
104262306a36Sopenharmony_ci		const struct bpf_insn *insn = &prog->insnsi[i];
104362306a36Sopenharmony_ci		int ret;
104462306a36Sopenharmony_ci
104562306a36Sopenharmony_ci		if (ctx->image == NULL)
104662306a36Sopenharmony_ci			ctx->offset[i] = ctx->idx;
104762306a36Sopenharmony_ci
104862306a36Sopenharmony_ci		ret = build_insn(insn, ctx, extra_pass);
104962306a36Sopenharmony_ci		if (ret > 0) {
105062306a36Sopenharmony_ci			i++;
105162306a36Sopenharmony_ci			if (ctx->image == NULL)
105262306a36Sopenharmony_ci				ctx->offset[i] = ctx->idx;
105362306a36Sopenharmony_ci			continue;
105462306a36Sopenharmony_ci		}
105562306a36Sopenharmony_ci		if (ret)
105662306a36Sopenharmony_ci			return ret;
105762306a36Sopenharmony_ci	}
105862306a36Sopenharmony_ci
105962306a36Sopenharmony_ci	if (ctx->image == NULL)
106062306a36Sopenharmony_ci		ctx->offset[i] = ctx->idx;
106162306a36Sopenharmony_ci
106262306a36Sopenharmony_ci	return 0;
106362306a36Sopenharmony_ci}
106462306a36Sopenharmony_ci
106562306a36Sopenharmony_ci/* Fill space with break instructions */
106662306a36Sopenharmony_cistatic void jit_fill_hole(void *area, unsigned int size)
106762306a36Sopenharmony_ci{
106862306a36Sopenharmony_ci	u32 *ptr;
106962306a36Sopenharmony_ci
107062306a36Sopenharmony_ci	/* We are guaranteed to have aligned memory */
107162306a36Sopenharmony_ci	for (ptr = area; size >= sizeof(u32); size -= sizeof(u32))
107262306a36Sopenharmony_ci		*ptr++ = INSN_BREAK;
107362306a36Sopenharmony_ci}
107462306a36Sopenharmony_ci
107562306a36Sopenharmony_cistatic int validate_code(struct jit_ctx *ctx)
107662306a36Sopenharmony_ci{
107762306a36Sopenharmony_ci	int i;
107862306a36Sopenharmony_ci	union loongarch_instruction insn;
107962306a36Sopenharmony_ci
108062306a36Sopenharmony_ci	for (i = 0; i < ctx->idx; i++) {
108162306a36Sopenharmony_ci		insn = ctx->image[i];
108262306a36Sopenharmony_ci		/* Check INSN_BREAK */
108362306a36Sopenharmony_ci		if (insn.word == INSN_BREAK)
108462306a36Sopenharmony_ci			return -1;
108562306a36Sopenharmony_ci	}
108662306a36Sopenharmony_ci
108762306a36Sopenharmony_ci	if (WARN_ON_ONCE(ctx->num_exentries != ctx->prog->aux->num_exentries))
108862306a36Sopenharmony_ci		return -1;
108962306a36Sopenharmony_ci
109062306a36Sopenharmony_ci	return 0;
109162306a36Sopenharmony_ci}
109262306a36Sopenharmony_ci
109362306a36Sopenharmony_cistruct bpf_prog *bpf_int_jit_compile(struct bpf_prog *prog)
109462306a36Sopenharmony_ci{
109562306a36Sopenharmony_ci	bool tmp_blinded = false, extra_pass = false;
109662306a36Sopenharmony_ci	u8 *image_ptr;
109762306a36Sopenharmony_ci	int image_size, prog_size, extable_size;
109862306a36Sopenharmony_ci	struct jit_ctx ctx;
109962306a36Sopenharmony_ci	struct jit_data *jit_data;
110062306a36Sopenharmony_ci	struct bpf_binary_header *header;
110162306a36Sopenharmony_ci	struct bpf_prog *tmp, *orig_prog = prog;
110262306a36Sopenharmony_ci
110362306a36Sopenharmony_ci	/*
110462306a36Sopenharmony_ci	 * If BPF JIT was not enabled then we must fall back to
110562306a36Sopenharmony_ci	 * the interpreter.
110662306a36Sopenharmony_ci	 */
110762306a36Sopenharmony_ci	if (!prog->jit_requested)
110862306a36Sopenharmony_ci		return orig_prog;
110962306a36Sopenharmony_ci
111062306a36Sopenharmony_ci	tmp = bpf_jit_blind_constants(prog);
111162306a36Sopenharmony_ci	/*
111262306a36Sopenharmony_ci	 * If blinding was requested and we failed during blinding,
111362306a36Sopenharmony_ci	 * we must fall back to the interpreter. Otherwise, we save
111462306a36Sopenharmony_ci	 * the new JITed code.
111562306a36Sopenharmony_ci	 */
111662306a36Sopenharmony_ci	if (IS_ERR(tmp))
111762306a36Sopenharmony_ci		return orig_prog;
111862306a36Sopenharmony_ci
111962306a36Sopenharmony_ci	if (tmp != prog) {
112062306a36Sopenharmony_ci		tmp_blinded = true;
112162306a36Sopenharmony_ci		prog = tmp;
112262306a36Sopenharmony_ci	}
112362306a36Sopenharmony_ci
112462306a36Sopenharmony_ci	jit_data = prog->aux->jit_data;
112562306a36Sopenharmony_ci	if (!jit_data) {
112662306a36Sopenharmony_ci		jit_data = kzalloc(sizeof(*jit_data), GFP_KERNEL);
112762306a36Sopenharmony_ci		if (!jit_data) {
112862306a36Sopenharmony_ci			prog = orig_prog;
112962306a36Sopenharmony_ci			goto out;
113062306a36Sopenharmony_ci		}
113162306a36Sopenharmony_ci		prog->aux->jit_data = jit_data;
113262306a36Sopenharmony_ci	}
113362306a36Sopenharmony_ci	if (jit_data->ctx.offset) {
113462306a36Sopenharmony_ci		ctx = jit_data->ctx;
113562306a36Sopenharmony_ci		image_ptr = jit_data->image;
113662306a36Sopenharmony_ci		header = jit_data->header;
113762306a36Sopenharmony_ci		extra_pass = true;
113862306a36Sopenharmony_ci		prog_size = sizeof(u32) * ctx.idx;
113962306a36Sopenharmony_ci		goto skip_init_ctx;
114062306a36Sopenharmony_ci	}
114162306a36Sopenharmony_ci
114262306a36Sopenharmony_ci	memset(&ctx, 0, sizeof(ctx));
114362306a36Sopenharmony_ci	ctx.prog = prog;
114462306a36Sopenharmony_ci
114562306a36Sopenharmony_ci	ctx.offset = kvcalloc(prog->len + 1, sizeof(u32), GFP_KERNEL);
114662306a36Sopenharmony_ci	if (ctx.offset == NULL) {
114762306a36Sopenharmony_ci		prog = orig_prog;
114862306a36Sopenharmony_ci		goto out_offset;
114962306a36Sopenharmony_ci	}
115062306a36Sopenharmony_ci
115162306a36Sopenharmony_ci	/* 1. Initial fake pass to compute ctx->idx and set ctx->flags */
115262306a36Sopenharmony_ci	build_prologue(&ctx);
115362306a36Sopenharmony_ci	if (build_body(&ctx, extra_pass)) {
115462306a36Sopenharmony_ci		prog = orig_prog;
115562306a36Sopenharmony_ci		goto out_offset;
115662306a36Sopenharmony_ci	}
115762306a36Sopenharmony_ci	ctx.epilogue_offset = ctx.idx;
115862306a36Sopenharmony_ci	build_epilogue(&ctx);
115962306a36Sopenharmony_ci
116062306a36Sopenharmony_ci	extable_size = prog->aux->num_exentries * sizeof(struct exception_table_entry);
116162306a36Sopenharmony_ci
116262306a36Sopenharmony_ci	/* Now we know the actual image size.
116362306a36Sopenharmony_ci	 * As each LoongArch instruction is of length 32bit,
116462306a36Sopenharmony_ci	 * we are translating number of JITed intructions into
116562306a36Sopenharmony_ci	 * the size required to store these JITed code.
116662306a36Sopenharmony_ci	 */
116762306a36Sopenharmony_ci	prog_size = sizeof(u32) * ctx.idx;
116862306a36Sopenharmony_ci	image_size = prog_size + extable_size;
116962306a36Sopenharmony_ci	/* Now we know the size of the structure to make */
117062306a36Sopenharmony_ci	header = bpf_jit_binary_alloc(image_size, &image_ptr,
117162306a36Sopenharmony_ci				      sizeof(u32), jit_fill_hole);
117262306a36Sopenharmony_ci	if (header == NULL) {
117362306a36Sopenharmony_ci		prog = orig_prog;
117462306a36Sopenharmony_ci		goto out_offset;
117562306a36Sopenharmony_ci	}
117662306a36Sopenharmony_ci
117762306a36Sopenharmony_ci	/* 2. Now, the actual pass to generate final JIT code */
117862306a36Sopenharmony_ci	ctx.image = (union loongarch_instruction *)image_ptr;
117962306a36Sopenharmony_ci	if (extable_size)
118062306a36Sopenharmony_ci		prog->aux->extable = (void *)image_ptr + prog_size;
118162306a36Sopenharmony_ci
118262306a36Sopenharmony_ciskip_init_ctx:
118362306a36Sopenharmony_ci	ctx.idx = 0;
118462306a36Sopenharmony_ci	ctx.num_exentries = 0;
118562306a36Sopenharmony_ci
118662306a36Sopenharmony_ci	build_prologue(&ctx);
118762306a36Sopenharmony_ci	if (build_body(&ctx, extra_pass)) {
118862306a36Sopenharmony_ci		bpf_jit_binary_free(header);
118962306a36Sopenharmony_ci		prog = orig_prog;
119062306a36Sopenharmony_ci		goto out_offset;
119162306a36Sopenharmony_ci	}
119262306a36Sopenharmony_ci	build_epilogue(&ctx);
119362306a36Sopenharmony_ci
119462306a36Sopenharmony_ci	/* 3. Extra pass to validate JITed code */
119562306a36Sopenharmony_ci	if (validate_code(&ctx)) {
119662306a36Sopenharmony_ci		bpf_jit_binary_free(header);
119762306a36Sopenharmony_ci		prog = orig_prog;
119862306a36Sopenharmony_ci		goto out_offset;
119962306a36Sopenharmony_ci	}
120062306a36Sopenharmony_ci
120162306a36Sopenharmony_ci	/* And we're done */
120262306a36Sopenharmony_ci	if (bpf_jit_enable > 1)
120362306a36Sopenharmony_ci		bpf_jit_dump(prog->len, prog_size, 2, ctx.image);
120462306a36Sopenharmony_ci
120562306a36Sopenharmony_ci	/* Update the icache */
120662306a36Sopenharmony_ci	flush_icache_range((unsigned long)header, (unsigned long)(ctx.image + ctx.idx));
120762306a36Sopenharmony_ci
120862306a36Sopenharmony_ci	if (!prog->is_func || extra_pass) {
120962306a36Sopenharmony_ci		if (extra_pass && ctx.idx != jit_data->ctx.idx) {
121062306a36Sopenharmony_ci			pr_err_once("multi-func JIT bug %d != %d\n",
121162306a36Sopenharmony_ci				    ctx.idx, jit_data->ctx.idx);
121262306a36Sopenharmony_ci			bpf_jit_binary_free(header);
121362306a36Sopenharmony_ci			prog->bpf_func = NULL;
121462306a36Sopenharmony_ci			prog->jited = 0;
121562306a36Sopenharmony_ci			prog->jited_len = 0;
121662306a36Sopenharmony_ci			goto out_offset;
121762306a36Sopenharmony_ci		}
121862306a36Sopenharmony_ci		bpf_jit_binary_lock_ro(header);
121962306a36Sopenharmony_ci	} else {
122062306a36Sopenharmony_ci		jit_data->ctx = ctx;
122162306a36Sopenharmony_ci		jit_data->image = image_ptr;
122262306a36Sopenharmony_ci		jit_data->header = header;
122362306a36Sopenharmony_ci	}
122462306a36Sopenharmony_ci	prog->jited = 1;
122562306a36Sopenharmony_ci	prog->jited_len = prog_size;
122662306a36Sopenharmony_ci	prog->bpf_func = (void *)ctx.image;
122762306a36Sopenharmony_ci
122862306a36Sopenharmony_ci	if (!prog->is_func || extra_pass) {
122962306a36Sopenharmony_ci		int i;
123062306a36Sopenharmony_ci
123162306a36Sopenharmony_ci		/* offset[prog->len] is the size of program */
123262306a36Sopenharmony_ci		for (i = 0; i <= prog->len; i++)
123362306a36Sopenharmony_ci			ctx.offset[i] *= LOONGARCH_INSN_SIZE;
123462306a36Sopenharmony_ci		bpf_prog_fill_jited_linfo(prog, ctx.offset + 1);
123562306a36Sopenharmony_ci
123662306a36Sopenharmony_ciout_offset:
123762306a36Sopenharmony_ci		kvfree(ctx.offset);
123862306a36Sopenharmony_ci		kfree(jit_data);
123962306a36Sopenharmony_ci		prog->aux->jit_data = NULL;
124062306a36Sopenharmony_ci	}
124162306a36Sopenharmony_ci
124262306a36Sopenharmony_ciout:
124362306a36Sopenharmony_ci	if (tmp_blinded)
124462306a36Sopenharmony_ci		bpf_jit_prog_release_other(prog, prog == orig_prog ? tmp : orig_prog);
124562306a36Sopenharmony_ci
124662306a36Sopenharmony_ci	out_offset = -1;
124762306a36Sopenharmony_ci
124862306a36Sopenharmony_ci	return prog;
124962306a36Sopenharmony_ci}
125062306a36Sopenharmony_ci
125162306a36Sopenharmony_ci/* Indicate the JIT backend supports mixing bpf2bpf and tailcalls. */
125262306a36Sopenharmony_cibool bpf_jit_supports_subprog_tailcalls(void)
125362306a36Sopenharmony_ci{
125462306a36Sopenharmony_ci	return true;
125562306a36Sopenharmony_ci}
1256