
generic: 5.15: copy config and patch from 5.10

Copy config and patches from kernel 5.10 to kernel 5.15

Signed-off-by: Ansuel Smith <[email protected]>
Ansuel Smith, 4 years ago
parent
commit 9a038e7fd1
100 changed files with 16250 additions and 0 deletions
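
The change itself is mechanical: the 5.10 kernel configuration and patch directories are duplicated under 5.15 names so the new kernel can start from a known-good baseline. A minimal shell sketch of that step is shown below; only the backport directory is visible in the file list that follows, the config copy is inferred from the commit title, and the exact commands the author ran are not recorded in the commit, so the paths and commands here are assumptions.

    # Hypothetical reproduction of the copy step, run from the OpenWrt tree root.
    cd target/linux/generic
    cp -a config-5.10 config-5.15          # kernel config baseline (inferred from the commit title)
    cp -a backport-5.10 backport-5.15      # backported upstream patches (listed below)
    git add config-5.15 backport-5.15

The numeric prefixes on the patch filenames (010-, 050-, 6xx-, ...) determine the order in which the OpenWrt build system applies them on top of the upstream kernel sources.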
  1. 30 0
      target/linux/generic/backport-5.15/010-Kbuild-don-t-hardcode-path-to-awk-in-scripts-ld-vers.patch
  2. 21 0
      target/linux/generic/backport-5.15/011-kbuild-export-SUBARCH.patch
  3. 27 0
      target/linux/generic/backport-5.15/026-power-reset-linkstation-poweroff-add-missing-put_dev.patch
  4. 65 0
      target/linux/generic/backport-5.15/050-v5.16-00-MIPS-uasm-Enable-muhu-opcode-for-MIPS-R6.patch
  5. 31 0
      target/linux/generic/backport-5.15/050-v5.16-01-mips-uasm-Add-workaround-for-Loongson-2F-nop-CPU-err.patch
  6. 3078 0
      target/linux/generic/backport-5.15/050-v5.16-02-mips-bpf-Add-eBPF-JIT-for-32-bit-MIPS.patch
  7. 1005 0
      target/linux/generic/backport-5.15/050-v5.16-03-mips-bpf-Add-new-eBPF-JIT-for-64-bit-MIPS.patch
  8. 120 0
      target/linux/generic/backport-5.15/050-v5.16-04-mips-bpf-Add-JIT-workarounds-for-CPU-errata.patch
  9. 61 0
      target/linux/generic/backport-5.15/050-v5.16-05-mips-bpf-Enable-eBPF-JITs.patch
  10. 387 0
      target/linux/generic/backport-5.15/050-v5.16-06-mips-bpf-Remove-old-BPF-JIT-implementations.patch
  11. 272 0
      target/linux/generic/backport-5.15/071-crypto-arm-chacha-neon-optimize-for-non-block-size-m.patch
  12. 38 0
      target/linux/generic/backport-5.15/072-crypto-arm-chacha-neon-add-missing-counter-increment.patch
  13. 42 0
      target/linux/generic/backport-5.15/080-wireguard-peer-put-frequently-used-members-above-cac.patch
  14. 52 0
      target/linux/generic/backport-5.15/081-net-next-regmap-allow-to-define-reg_update_bits-for-no-bus.patch
  15. 36 0
      target/linux/generic/backport-5.15/103-v5.13-MIPS-select-CPU_MIPS64-for-remaining-MIPS64-CPUs.patch
  16. 36 0
      target/linux/generic/backport-5.15/311-v5.11-MIPS-zboot-put-appended-dtb-into-a-section.patch
  17. 106 0
      target/linux/generic/backport-5.15/343-netfilter-nft_flow_offload-handle-netdevice-events-f.patch
  18. 324 0
      target/linux/generic/backport-5.15/401-v5.11-dt-bindings-mtd-convert-fixed-partitions-to-the-json.patch
  19. 115 0
      target/linux/generic/backport-5.15/402-v5.12-0001-dt-bindings-mtd-move-partition-binding-to-its-own-fi.patch
  20. 92 0
      target/linux/generic/backport-5.15/402-v5.12-0002-dt-bindings-mtd-add-binding-for-BCM4908-partitions.patch
  21. 654 0
      target/linux/generic/backport-5.15/403-v5.13-mtd-parsers-ofpart-support-BCM4908-fixed-partitions.patch
  22. 69 0
      target/linux/generic/backport-5.15/404-v5.13-mtd-parsers-ofpart-limit-parsing-of-deprecated-DT-sy.patch
  23. 34 0
      target/linux/generic/backport-5.15/405-v5.13-mtd-parsers-ofpart-make-symbol-bcm4908_partitions_qu.patch
  24. 38 0
      target/linux/generic/backport-5.15/406-v5.13-0001-mtd-core-add-nvmem-cells-compatible-to-parse-mtd-as-.patch
  25. 25 0
      target/linux/generic/backport-5.15/406-v5.13-0002-dt-bindings-nvmem-drop-nodename-restriction.patch
  26. 117 0
      target/linux/generic/backport-5.15/406-v5.13-0003-dt-bindings-mtd-Document-use-of-nvmem-cells-compatib.patch
  27. 98 0
      target/linux/generic/backport-5.15/407-v5.13-0001-dt-bindings-mtd-add-binding-for-Linksys-Northstar-pa.patch
  28. 156 0
      target/linux/generic/backport-5.15/407-v5.13-0002-mtd-parsers-ofpart-support-Linksys-Northstar-partiti.patch
  29. 54 0
      target/linux/generic/backport-5.15/408-v5.13-mtd-cfi_cmdset_0002-Disable-buffered-writes-for-AMD.patch
  30. 32 0
      target/linux/generic/backport-5.15/409-v5.14-0001-dt-bindings-mtd-brcm-trx-Add-brcm-trx-magic.patch
  31. 50 0
      target/linux/generic/backport-5.15/409-v5.14-0002-mtd-parsers-trx-Allow-to-specify-brcm-trx-magic-in-D.patch
  32. 25 0
      target/linux/generic/backport-5.15/409-v5.14-0003-mtd-parsers-trx-Allow-to-use-TRX-parser-on-Mediatek-.patch
  33. 33 0
      target/linux/generic/backport-5.15/410-mtd-next-mtd-parsers-trx-allow-to-use-on-MediaTek-MIPS-SoCs.patch
  34. 25 0
      target/linux/generic/backport-5.15/500-v5.13-ubifs-default-to-zstd-compression.patch
  35. 88 0
      target/linux/generic/backport-5.15/600-v5.12-net-extract-napi-poll-functionality-to-__napi_poll.patch
  36. 261 0
      target/linux/generic/backport-5.15/601-v5.12-net-implement-threaded-able-napi-poll-loop-support.patch
  37. 177 0
      target/linux/generic/backport-5.15/602-v5.12-net-add-sysfs-attribute-to-control-napi-threaded-mod.patch
  38. 93 0
      target/linux/generic/backport-5.15/603-v5.12-net-fix-race-between-napi-kthread-mode-and-busy-poll.patch
  39. 53 0
      target/linux/generic/backport-5.15/604-v5.12-net-fix-hangup-on-napi_disable-for-threaded-napi.patch
  40. 52 0
      target/linux/generic/backport-5.15/610-v5.13-00-netfilter-flowtable-add-hash-offset-field-to-tuple.patch
  41. 98 0
      target/linux/generic/backport-5.15/610-v5.13-01-netfilter-flowtable-separate-replace-destroy-and-sta.patch
  42. 22 0
      target/linux/generic/backport-5.15/610-v5.13-03-netfilter-conntrack-Remove-unused-variable-declarati.patch
  43. 291 0
      target/linux/generic/backport-5.15/610-v5.13-04-netfilter-flowtable-consolidate-skb_try_make_writabl.patch
  44. 35 0
      target/linux/generic/backport-5.15/610-v5.13-05-netfilter-flowtable-move-skb_try_make_writable-befor.patch
  45. 82 0
      target/linux/generic/backport-5.15/610-v5.13-06-netfilter-flowtable-move-FLOW_OFFLOAD_DIR_MAX-away-f.patch
  46. 394 0
      target/linux/generic/backport-5.15/610-v5.13-07-netfilter-flowtable-fast-NAT-functions-never-fail.patch
  47. 46 0
      target/linux/generic/backport-5.15/610-v5.13-08-netfilter-flowtable-call-dst_check-to-fall-back-to-c.patch
  48. 49 0
      target/linux/generic/backport-5.15/610-v5.13-09-netfilter-flowtable-refresh-timeout-after-dst-and-wr.patch
  49. 103 0
      target/linux/generic/backport-5.15/610-v5.13-10-netfilter-nftables-update-table-flags-from-the-commi.patch
  50. 170 0
      target/linux/generic/backport-5.15/610-v5.13-11-net-resolve-forwarding-path-from-virtual-netdevice-a.patch
  51. 80 0
      target/linux/generic/backport-5.15/610-v5.13-12-net-8021q-resolve-forwarding-path-for-vlan-devices.patch
  52. 62 0
      target/linux/generic/backport-5.15/610-v5.13-13-net-bridge-resolve-forwarding-path-for-bridge-device.patch
  53. 207 0
      target/linux/generic/backport-5.15/610-v5.13-14-net-bridge-resolve-forwarding-path-for-VLAN-tag-acti.patch
  54. 113 0
      target/linux/generic/backport-5.15/610-v5.13-15-net-ppp-resolve-forwarding-path-for-bridge-pppoe-dev.patch
  55. 63 0
      target/linux/generic/backport-5.15/610-v5.13-16-net-dsa-resolve-forwarding-path-for-dsa-slave-ports.patch
  56. 147 0
      target/linux/generic/backport-5.15/610-v5.13-17-netfilter-flowtable-add-xmit-path-types.patch
  57. 191 0
      target/linux/generic/backport-5.15/610-v5.13-18-netfilter-flowtable-use-dev_fill_forward_path-to-obt.patch
  58. 374 0
      target/linux/generic/backport-5.15/610-v5.13-19-netfilter-flowtable-use-dev_fill_forward_path-to-obt.patch
  59. 410 0
      target/linux/generic/backport-5.15/610-v5.13-20-netfilter-flowtable-add-vlan-support.patch
  60. 30 0
      target/linux/generic/backport-5.15/610-v5.13-21-netfilter-flowtable-add-bridge-vlan-filtering-suppor.patch
  61. 145 0
      target/linux/generic/backport-5.15/610-v5.13-22-netfilter-flowtable-add-pppoe-support.patch
  62. 32 0
      target/linux/generic/backport-5.15/610-v5.13-23-netfilter-flowtable-add-dsa-support.patch
  63. 107 0
      target/linux/generic/backport-5.15/610-v5.13-24-selftests-netfilter-flowtable-bridge-and-vlan-suppor.patch
  64. 310 0
      target/linux/generic/backport-5.15/610-v5.13-25-netfilter-flowtable-add-offload-support-for-xmit-pat.patch
  65. 114 0
      target/linux/generic/backport-5.15/610-v5.13-26-netfilter-nft_flow_offload-use-direct-xmit-if-hardwa.patch
  66. 123 0
      target/linux/generic/backport-5.15/610-v5.13-27-netfilter-flowtable-bridge-vlan-hardware-offload-and.patch
  67. 30 0
      target/linux/generic/backport-5.15/610-v5.13-28-net-flow_offload-add-FLOW_ACTION_PPPOE_PUSH.patch
  68. 35 0
      target/linux/generic/backport-5.15/610-v5.13-29-netfilter-flowtable-support-for-FLOW_ACTION_PPPOE_PU.patch
  69. 53 0
      target/linux/generic/backport-5.15/610-v5.13-30-dsa-slave-add-support-for-TC_SETUP_FT.patch
  70. 68 0
      target/linux/generic/backport-5.15/610-v5.13-31-net-ethernet-mtk_eth_soc-fix-parsing-packets-in-GDM.patch
  71. 1308 0
      target/linux/generic/backport-5.15/610-v5.13-32-net-ethernet-mtk_eth_soc-add-support-for-initializin.patch
  72. 568 0
      target/linux/generic/backport-5.15/610-v5.13-33-net-ethernet-mtk_eth_soc-add-flow-offloading-support.patch
  73. 236 0
      target/linux/generic/backport-5.15/610-v5.13-34-docs-nf_flowtable-update-documentation-with-enhancem.patch
  74. 72 0
      target/linux/generic/backport-5.15/610-v5.13-35-net-ethernet-mediatek-ppe-fix-busy-wait-loop.patch
  75. 29 0
      target/linux/generic/backport-5.15/610-v5.13-36-net-ethernet-mediatek-fix-a-typo-bug-in-flow-offload.patch
  76. 38 0
      target/linux/generic/backport-5.15/610-v5.13-38-net-ethernet-mtk_eth_soc-unmap-RX-data-before-callin.patch
  77. 38 0
      target/linux/generic/backport-5.15/610-v5.13-39-net-ethernet-mtk_eth_soc-fix-build_skb-cleanup.patch
  78. 77 0
      target/linux/generic/backport-5.15/610-v5.13-40-net-ethernet-mtk_eth_soc-use-napi_consume_skb.patch
  79. 30 0
      target/linux/generic/backport-5.15/610-v5.13-41-net-ethernet-mtk_eth_soc-reduce-MDIO-bus-access-late.patch
  80. 54 0
      target/linux/generic/backport-5.15/610-v5.13-42-net-ethernet-mtk_eth_soc-remove-unnecessary-TX-queue.patch
  81. 37 0
      target/linux/generic/backport-5.15/610-v5.13-43-net-ethernet-mtk_eth_soc-use-larger-burst-size-for-Q.patch
  82. 26 0
      target/linux/generic/backport-5.15/610-v5.13-44-net-ethernet-mtk_eth_soc-increase-DMA-ring-sizes.patch
  83. 313 0
      target/linux/generic/backport-5.15/610-v5.13-45-net-ethernet-mtk_eth_soc-implement-dynamic-interrupt.patch
  84. 73 0
      target/linux/generic/backport-5.15/610-v5.13-46-net-ethernet-mtk_eth_soc-cache-HW-pointer-of-last-fr.patch
  85. 49 0
      target/linux/generic/backport-5.15/610-v5.13-47-net-ethernet-mtk_eth_soc-only-read-the-full-RX-descr.patch
  86. 39 0
      target/linux/generic/backport-5.15/610-v5.13-48-net-ethernet-mtk_eth_soc-reduce-unnecessary-interrup.patch
  87. 110 0
      target/linux/generic/backport-5.15/610-v5.13-49-net-ethernet-mtk_eth_soc-rework-NAPI-callbacks.patch
  88. 47 0
      target/linux/generic/backport-5.15/610-v5.13-50-net-ethernet-mtk_eth_soc-set-PPE-flow-hash-as-skb-ha.patch
  89. 71 0
      target/linux/generic/backport-5.15/610-v5.13-51-net-ethernet-mtk_eth_soc-use-iopoll.h-macro-for-DMA-.patch
  90. 63 0
      target/linux/generic/backport-5.15/610-v5.13-52-net-ethernet-mtk_eth_soc-missing-mutex.patch
  91. 22 0
      target/linux/generic/backport-5.15/610-v5.13-53-net-ethernet-mtk_eth_soc-handle-VLAN-pop-action.patch
  92. 159 0
      target/linux/generic/backport-5.15/610-v5.13-54-netfilter-flowtable-dst_check-from-garbage-collector.patch
  93. 94 0
      target/linux/generic/backport-5.15/610-v5.13-55-netfilter-conntrack-Introduce-tcp-offload-timeout-co.patch
  94. 92 0
      target/linux/generic/backport-5.15/610-v5.13-56-netfilter-conntrack-Introduce-udp-offload-timeout-co.patch
  95. 134 0
      target/linux/generic/backport-5.15/610-v5.13-57-netfilter-flowtable-Set-offload-timeouts-according-t.patch
  96. 138 0
      target/linux/generic/backport-5.15/611-v5.12-net-ethernet-mediatek-support-setting-MTU.patch
  97. 108 0
      target/linux/generic/backport-5.15/705-net-phy-at803x-select-correct-page-on-config-init.patch
  98. 73 0
      target/linux/generic/backport-5.15/706-net-phy-at803x-fix-probe-error-if-copper-page-is-sel.patch
  99. 56 0
      target/linux/generic/backport-5.15/710-v5.12-net-phy-Add-100-base-x-mode.patch
  100. 40 0
      target/linux/generic/backport-5.15/711-v5.12-sfp-add-support-for-100-base-x-SFPs.patch

+ 30 - 0
target/linux/generic/backport-5.15/010-Kbuild-don-t-hardcode-path-to-awk-in-scripts-ld-vers.patch

@@ -0,0 +1,30 @@
+From 13b1ecc3401653a355798eb1dee10cc1608202f4 Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Mon, 18 Jan 2016 12:27:49 +0100
+Subject: [PATCH 33/34] Kbuild: don't hardcode path to awk in
+ scripts/ld-version.sh
+
+On some systems /usr/bin/awk does not exist, or is broken. Find it via
+$PATH instead.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+---
+ scripts/ld-version.sh | 4 +++-
+ 1 file changed, 3 insertions(+), 1 deletion(-)
+
+--- a/scripts/ld-version.sh
++++ b/scripts/ld-version.sh
+@@ -1,6 +1,7 @@
+-#!/usr/bin/awk -f
++#!/bin/sh
+ # SPDX-License-Identifier: GPL-2.0
+ # extract linker version number from stdin and turn into single number
++exec awk '
+ 	{
+ 	gsub(".*\\)", "");
+ 	gsub(".*version ", "");
+@@ -9,3 +10,4 @@
+ 	print a[1]*100000000 + a[2]*1000000 + a[3]*10000;
+ 	exit
+ 	}
++'

+ 21 - 0
target/linux/generic/backport-5.15/011-kbuild-export-SUBARCH.patch

@@ -0,0 +1,21 @@
+From 173019b66dcc9d68ad9333aa744dad1e369b5aa8 Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Sun, 9 Jul 2017 00:26:53 +0200
+Subject: [PATCH 34/34] kernel: add compile fix for linux 4.9 on x86
+
+Signed-off-by: Felix Fietkau <[email protected]>
+---
+ Makefile | 4 ++--
+ 1 file changed, 2 insertions(+), 2 deletions(-)
+
+--- a/Makefile
++++ b/Makefile
+@@ -507,7 +507,7 @@ KBUILD_LDFLAGS_MODULE :=
+ KBUILD_LDFLAGS :=
+ CLANG_FLAGS :=
+ 
+-export ARCH SRCARCH CONFIG_SHELL BASH HOSTCC KBUILD_HOSTCFLAGS CROSS_COMPILE LD CC
++export ARCH SRCARCH SUBARCH CONFIG_SHELL BASH HOSTCC KBUILD_HOSTCFLAGS CROSS_COMPILE LD CC
+ export CPP AR NM STRIP OBJCOPY OBJDUMP READELF PAHOLE RESOLVE_BTFIDS LEX YACC AWK INSTALLKERNEL
+ export PERL PYTHON PYTHON3 CHECK CHECKFLAGS MAKE UTS_MACHINE HOSTCXX
+ export KGZIP KBZIP2 KLZOP LZMA LZ4 XZ ZSTD

+ 27 - 0
target/linux/generic/backport-5.15/026-power-reset-linkstation-poweroff-add-missing-put_dev.patch

@@ -0,0 +1,27 @@
+From 1027a42c25cbf8cfc4ade6503c5110aae04866af Mon Sep 17 00:00:00 2001
+From: =?UTF-8?q?Daniel=20Gonz=C3=A1lez=20Cabanelas?= <[email protected]>
+Date: Fri, 16 Oct 2020 20:22:37 +0200
+Subject: [PATCH] power: reset: linkstation-poweroff: add missing put_device()
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+The of_mdio_find_bus() takes a reference to the underlying device
+structure, we should release that reference using a put_device() call.
+
+Signed-off-by: Daniel González Cabanelas <[email protected]>
+Signed-off-by: Sebastian Reichel <[email protected]>
+---
+ drivers/power/reset/linkstation-poweroff.c | 1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/drivers/power/reset/linkstation-poweroff.c
++++ b/drivers/power/reset/linkstation-poweroff.c
+@@ -113,6 +113,7 @@ static int __init linkstation_poweroff_i
+ 		return -EPROBE_DEFER;
+ 
+ 	phydev = phy_find_first(bus);
++	put_device(&bus->dev);
+ 	if (!phydev)
+ 		return -EPROBE_DEFER;
+ 

+ 65 - 0
target/linux/generic/backport-5.15/050-v5.16-00-MIPS-uasm-Enable-muhu-opcode-for-MIPS-R6.patch

@@ -0,0 +1,65 @@
+From: Johan Almbladh <[email protected]>
+Date: Tue, 5 Oct 2021 18:54:02 +0200
+Subject: [PATCH] MIPS: uasm: Enable muhu opcode for MIPS R6
+
+Enable the 'muhu' instruction, complementing the existing 'mulu', needed
+to implement a MIPS32 BPF JIT.
+
+Also fix a typo in the existing definition of 'dmulu'.
+
+Signed-off-by: Tony Ambardar <[email protected]>
+
+This patch is a dependency for my 32-bit MIPS eBPF JIT.
+
+Signed-off-by: Johan Almbladh <[email protected]>
+---
+
+--- a/arch/mips/include/asm/uasm.h
++++ b/arch/mips/include/asm/uasm.h
+@@ -145,6 +145,7 @@ Ip_u1(_mtlo);
+ Ip_u3u1u2(_mul);
+ Ip_u1u2(_multu);
+ Ip_u3u1u2(_mulu);
++Ip_u3u1u2(_muhu);
+ Ip_u3u1u2(_nor);
+ Ip_u3u1u2(_or);
+ Ip_u2u1u3(_ori);
+--- a/arch/mips/mm/uasm-mips.c
++++ b/arch/mips/mm/uasm-mips.c
+@@ -90,7 +90,7 @@ static const struct insn insn_table[insn
+ 				RS | RT | RD},
+ 	[insn_dmtc0]	= {M(cop0_op, dmtc_op, 0, 0, 0, 0), RT | RD | SET},
+ 	[insn_dmultu]	= {M(spec_op, 0, 0, 0, 0, dmultu_op), RS | RT},
+-	[insn_dmulu]	= {M(spec_op, 0, 0, 0, dmult_dmul_op, dmultu_op),
++	[insn_dmulu]	= {M(spec_op, 0, 0, 0, dmultu_dmulu_op, dmultu_op),
+ 				RS | RT | RD},
+ 	[insn_drotr]	= {M(spec_op, 1, 0, 0, 0, dsrl_op), RT | RD | RE},
+ 	[insn_drotr32]	= {M(spec_op, 1, 0, 0, 0, dsrl32_op), RT | RD | RE},
+@@ -150,6 +150,8 @@ static const struct insn insn_table[insn
+ 	[insn_mtlo]	= {M(spec_op, 0, 0, 0, 0, mtlo_op), RS},
+ 	[insn_mulu]	= {M(spec_op, 0, 0, 0, multu_mulu_op, multu_op),
+ 				RS | RT | RD},
++	[insn_muhu]	= {M(spec_op, 0, 0, 0, multu_muhu_op, multu_op),
++				RS | RT | RD},
+ #ifndef CONFIG_CPU_MIPSR6
+ 	[insn_mul]	= {M(spec2_op, 0, 0, 0, 0, mul_op), RS | RT | RD},
+ #else
+--- a/arch/mips/mm/uasm.c
++++ b/arch/mips/mm/uasm.c
+@@ -59,7 +59,7 @@ enum opcode {
+ 	insn_lddir, insn_ldpte, insn_ldx, insn_lh, insn_lhu, insn_ll, insn_lld,
+ 	insn_lui, insn_lw, insn_lwu, insn_lwx, insn_mfc0, insn_mfhc0, insn_mfhi,
+ 	insn_mflo, insn_modu, insn_movn, insn_movz, insn_mtc0, insn_mthc0,
+-	insn_mthi, insn_mtlo, insn_mul, insn_multu, insn_mulu, insn_nor,
++	insn_mthi, insn_mtlo, insn_mul, insn_multu, insn_mulu, insn_muhu, insn_nor,
+ 	insn_or, insn_ori, insn_pref, insn_rfe, insn_rotr, insn_sb, insn_sc,
+ 	insn_scd, insn_seleqz, insn_selnez, insn_sd, insn_sh, insn_sll,
+ 	insn_sllv, insn_slt, insn_slti, insn_sltiu, insn_sltu, insn_sra,
+@@ -344,6 +344,7 @@ I_u1(_mtlo)
+ I_u3u1u2(_mul)
+ I_u1u2(_multu)
+ I_u3u1u2(_mulu)
++I_u3u1u2(_muhu)
+ I_u3u1u2(_nor)
+ I_u3u1u2(_or)
+ I_u2u1u3(_ori)
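
Why both instructions matter: on MIPS32 R6, mulu returns the low 32 bits and muhu the high 32 bits of an unsigned 32x32-bit product, and the MIPS32 BPF JIT mentioned in the commit message needs that high word when it builds 64-bit multiplies out of 32-bit pieces. A quick numeric sanity check of the split, using 64-bit shell arithmetic as a stand-in for the two instructions (operand values are arbitrary; assumes a shell such as bash with 64-bit integer arithmetic):

    a=$(( 0xdeadbeef )); b=$(( 0x12345678 ))
    printf 'mulu  (low 32 bits):  0x%08x\n' $(( (a * b) & 0xffffffff ))
    printf 'muhu  (high 32 bits): 0x%08x\n' $(( (a * b) >> 32 ))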

+ 31 - 0
target/linux/generic/backport-5.15/050-v5.16-01-mips-uasm-Add-workaround-for-Loongson-2F-nop-CPU-err.patch

@@ -0,0 +1,31 @@
+From: Johan Almbladh <[email protected]>
+Date: Tue, 5 Oct 2021 18:54:03 +0200
+Subject: [PATCH] mips: uasm: Add workaround for Loongson-2F nop CPU errata
+
+This patch implements a workaround for the Loongson-2F nop in generated,
+code, if the existing option CONFIG_CPU_NOP_WORKAROUND is set. Before,
+the binutils option -mfix-loongson2f-nop was enabled, but no workaround
+was done when emitting MIPS code. Now, the nop pseudo instruction is
+emitted as "or ax,ax,zero" instead of the default "sll zero,zero,0". This
+is consistent with the workaround implemented by binutils.
+
+Link: https://sourceware.org/legacy-ml/binutils/2009-11/msg00387.html
+
+Signed-off-by: Johan Almbladh <[email protected]>
+Reviewed-by: Jiaxun Yang <[email protected]>
+---
+
+--- a/arch/mips/include/asm/uasm.h
++++ b/arch/mips/include/asm/uasm.h
+@@ -249,7 +249,11 @@ static inline void uasm_l##lb(struct uas
+ #define uasm_i_bnezl(buf, rs, off) uasm_i_bnel(buf, rs, 0, off)
+ #define uasm_i_ehb(buf) uasm_i_sll(buf, 0, 0, 3)
+ #define uasm_i_move(buf, a, b) UASM_i_ADDU(buf, a, 0, b)
++#ifdef CONFIG_CPU_NOP_WORKAROUNDS
++#define uasm_i_nop(buf) uasm_i_or(buf, 1, 1, 0)
++#else
+ #define uasm_i_nop(buf) uasm_i_sll(buf, 0, 0, 0)
++#endif
+ #define uasm_i_ssnop(buf) uasm_i_sll(buf, 0, 0, 1)
+ 
+ static inline void uasm_i_drotr_safe(u32 **p, unsigned int a1,

+ 3078 - 0
target/linux/generic/backport-5.15/050-v5.16-02-mips-bpf-Add-eBPF-JIT-for-32-bit-MIPS.patch

@@ -0,0 +1,3078 @@
+From: Johan Almbladh <[email protected]>
+Date: Tue, 5 Oct 2021 18:54:04 +0200
+Subject: [PATCH] mips: bpf: Add eBPF JIT for 32-bit MIPS
+
+This is an implementation of an eBPF JIT for 32-bit MIPS I-V and MIPS32.
+The implementation supports all 32-bit and 64-bit ALU and JMP operations,
+including the recently-added atomics. 64-bit div/mod and 64-bit atomics
+are implemented using function calls to math64 and atomic64 functions,
+respectively. All 32-bit operations are implemented natively by the JIT,
+except if the CPU lacks ll/sc instructions.
+
+Register mapping
+================
+All 64-bit eBPF registers are mapped to native 32-bit MIPS register pairs,
+and does not use any stack scratch space for register swapping. This means
+that all eBPF register data is kept in CPU registers all the time, and
+this simplifies the register management a lot. It also reduces the JIT's
+pressure on temporary registers since we do not have to move data around.
+
+Native register pairs are ordered according to CPU endiannes, following
+the O32 calling convention for passing 64-bit arguments and return values.
+The eBPF return value, arguments and callee-saved registers are mapped to
+their native MIPS equivalents.
+
+Since the 32 highest bits in the eBPF FP (frame pointer) register are
+always zero, only one general-purpose register is actually needed for the
+mapping. The MIPS fp register is used for this purpose. The high bits are
+mapped to MIPS register r0. This saves us one CPU register, which is much
+needed for temporaries, while still allowing us to treat the R10 (FP)
+register just like any other eBPF register in the JIT.
+
+The MIPS gp (global pointer) and at (assembler temporary) registers are
+used as internal temporary registers for constant blinding. CPU registers
+t6-t9 are used internally by the JIT when constructing more complex 64-bit
+operations. This is precisely what is needed - two registers to store an
+operand value, and two more as scratch registers when performing the
+operation.
+
+The register mapping is shown below.
+
+    R0 - $v1, $v0   return value
+    R1 - $a1, $a0   argument 1, passed in registers
+    R2 - $a3, $a2   argument 2, passed in registers
+    R3 - $t1, $t0   argument 3, passed on stack
+    R4 - $t3, $t2   argument 4, passed on stack
+    R5 - $t4, $t3   argument 5, passed on stack
+    R6 - $s1, $s0   callee-saved
+    R7 - $s3, $s2   callee-saved
+    R8 - $s5, $s4   callee-saved
+    R9 - $s7, $s6   callee-saved
+    FP - $r0, $fp   32-bit frame pointer
+    AX - $gp, $at   constant-blinding
+         $t6 - $t9  unallocated, JIT temporaries
+
+Jump offsets
+============
+The JIT tries to map all conditional JMP operations to MIPS conditional
+PC-relative branches. The MIPS branch offset field is 18 bits, in bytes,
+which is equivalent to the eBPF 16-bit instruction offset. However, since
+the JIT may emit more than one CPU instruction per eBPF instruction, the
+field width may overflow. If that happens, the JIT converts the long
+conditional jump to a short PC-relative branch with the condition
+inverted, jumping over a long unconditional absolute jmp (j).
+
+This conversion will change the instruction offset mapping used for jumps,
+and may in turn result in more branch offset overflows. The JIT therefore
+dry-runs the translation until no more branches are converted and the
+offsets do not change anymore. There is an upper bound on this of course,
+and if the JIT hits that limit, the last two iterations are run with all
+branches being converted.
+
+Tail call count
+===============
+The current tail call count is stored in the 16-byte area of the caller's
+stack frame that is reserved for the callee in the o32 ABI. The value is
+initialized in the prologue, and propagated to the tail-callee by skipping
+the initialization instructions when emitting the tail call.
+
+Signed-off-by: Johan Almbladh <[email protected]>
+---
+ create mode 100644 arch/mips/net/bpf_jit_comp.c
+ create mode 100644 arch/mips/net/bpf_jit_comp.h
+ create mode 100644 arch/mips/net/bpf_jit_comp32.c
+
+--- a/arch/mips/net/Makefile
++++ b/arch/mips/net/Makefile
+@@ -2,4 +2,9 @@
+ # MIPS networking code
+ 
+ obj-$(CONFIG_MIPS_CBPF_JIT) += bpf_jit.o bpf_jit_asm.o
+-obj-$(CONFIG_MIPS_EBPF_JIT) += ebpf_jit.o
++
++ifeq ($(CONFIG_32BIT),y)
++        obj-$(CONFIG_MIPS_EBPF_JIT) += bpf_jit_comp.o bpf_jit_comp32.o
++else
++        obj-$(CONFIG_MIPS_EBPF_JIT) += ebpf_jit.o
++endif
+--- /dev/null
++++ b/arch/mips/net/bpf_jit_comp.c
+@@ -0,0 +1,1020 @@
++// SPDX-License-Identifier: GPL-2.0-only
++/*
++ * Just-In-Time compiler for eBPF bytecode on MIPS.
++ * Implementation of JIT functions common to 32-bit and 64-bit CPUs.
++ *
++ * Copyright (c) 2021 Anyfi Networks AB.
++ * Author: Johan Almbladh <[email protected]>
++ *
++ * Based on code and ideas from
++ * Copyright (c) 2017 Cavium, Inc.
++ * Copyright (c) 2017 Shubham Bansal <[email protected]>
++ * Copyright (c) 2011 Mircea Gherzan <[email protected]>
++ */
++
++/*
++ * Code overview
++ * =============
++ *
++ * - bpf_jit_comp.h
++ *   Common definitions and utilities.
++ *
++ * - bpf_jit_comp.c
++ *   Implementation of JIT top-level logic and exported JIT API functions.
++ *   Implementation of internal operations shared by 32-bit and 64-bit code.
++ *   JMP and ALU JIT control code, register control code, shared ALU and
++ *   JMP/JMP32 JIT operations.
++ *
++ * - bpf_jit_comp32.c
++ *   Implementation of functions to JIT prologue, epilogue and a single eBPF
++ *   instruction for 32-bit MIPS CPUs. The functions use shared operations
++ *   where possible, and implement the rest for 32-bit MIPS such as ALU64
++ *   operations.
++ *
++ * - bpf_jit_comp64.c
++ *   Ditto, for 64-bit MIPS CPUs.
++ *
++ * Zero and sign extension
++ * ========================
++ * 32-bit MIPS instructions on 64-bit MIPS registers use sign extension,
++ * but the eBPF instruction set mandates zero extension. We let the verifier
++ * insert explicit zero-extensions after 32-bit ALU operations, both for
++ * 32-bit and 64-bit MIPS JITs. Conditional JMP32 operations on 64-bit MIPs
++ * are JITed with sign extensions inserted when so expected.
++ *
++ * ALU operations
++ * ==============
++ * ALU operations on 32/64-bit MIPS and ALU64 operations on 64-bit MIPS are
++ * JITed in the following steps. ALU64 operations on 32-bit MIPS are more
++ * complicated and therefore only processed by special implementations in
++ * step (3).
++ *
++ * 1) valid_alu_i:
++ *    Determine if an immediate operation can be emitted as such, or if
++ *    we must fall back to the register version.
++ *
++ * 2) rewrite_alu_i:
++ *    Convert BPF operation and immediate value to a canonical form for
++ *    JITing. In some degenerate cases this form may be a no-op.
++ *
++ * 3) emit_alu_{i,i64,r,64}:
++ *    Emit instructions for an ALU or ALU64 immediate or register operation.
++ *
++ * JMP operations
++ * ==============
++ * JMP and JMP32 operations require an JIT instruction offset table for
++ * translating the jump offset. This table is computed by dry-running the
++ * JIT without actually emitting anything. However, the computed PC-relative
++ * offset may overflow the 18-bit offset field width of the native MIPS
++ * branch instruction. In such cases, the long jump is converted into the
++ * following sequence.
++ *
++ *    <branch> !<cond> +2    Inverted PC-relative branch
++ *    nop                    Delay slot
++ *    j <offset>             Unconditional absolute long jump
++ *    nop                    Delay slot
++ *
++ * Since this converted sequence alters the offset table, all offsets must
++ * be re-calculated. This may in turn trigger new branch conversions, so
++ * the process is repeated until no further changes are made. Normally it
++ * completes in 1-2 iterations. If JIT_MAX_ITERATIONS should reached, we
++ * fall back to converting every remaining jump operation. The branch
++ * conversion is independent of how the JMP or JMP32 condition is JITed.
++ *
++ * JMP32 and JMP operations are JITed as follows.
++ *
++ * 1) setup_jmp_{i,r}:
++ *    Convert jump conditional and offset into a form that can be JITed.
++ *    This form may be a no-op, a canonical form, or an inverted PC-relative
++ *    jump if branch conversion is necessary.
++ *
++ * 2) valid_jmp_i:
++ *    Determine if an immediate operations can be emitted as such, or if
++ *    we must fall back to the register version. Applies to JMP32 for 32-bit
++ *    MIPS, and both JMP and JMP32 for 64-bit MIPS.
++ *
++ * 3) emit_jmp_{i,i64,r,r64}:
++ *    Emit instructions for an JMP or JMP32 immediate or register operation.
++ *
++ * 4) finish_jmp_{i,r}:
++ *    Emit any instructions needed to finish the jump. This includes a nop
++ *    for the delay slot if a branch was emitted, and a long absolute jump
++ *    if the branch was converted.
++ */
++
++#include <linux/limits.h>
++#include <linux/bitops.h>
++#include <linux/errno.h>
++#include <linux/filter.h>
++#include <linux/bpf.h>
++#include <linux/slab.h>
++#include <asm/bitops.h>
++#include <asm/cacheflush.h>
++#include <asm/cpu-features.h>
++#include <asm/isa-rev.h>
++#include <asm/uasm.h>
++
++#include "bpf_jit_comp.h"
++
++/* Convenience macros for descriptor access */
++#define CONVERTED(desc)	((desc) & JIT_DESC_CONVERT)
++#define INDEX(desc)	((desc) & ~JIT_DESC_CONVERT)
++
++/*
++ * Push registers on the stack, starting at a given depth from the stack
++ * pointer and increasing. The next depth to be written is returned.
++ */
++int push_regs(struct jit_context *ctx, u32 mask, u32 excl, int depth)
++{
++	int reg;
++
++	for (reg = 0; reg < BITS_PER_BYTE * sizeof(mask); reg++)
++		if (mask & BIT(reg)) {
++			if ((excl & BIT(reg)) == 0) {
++				if (sizeof(long) == 4)
++					emit(ctx, sw, reg, depth, MIPS_R_SP);
++				else /* sizeof(long) == 8 */
++					emit(ctx, sd, reg, depth, MIPS_R_SP);
++			}
++			depth += sizeof(long);
++		}
++
++	ctx->stack_used = max((int)ctx->stack_used, depth);
++	return depth;
++}
++
++/*
++ * Pop registers from the stack, starting at a given depth from the stack
++ * pointer and increasing. The next depth to be read is returned.
++ */
++int pop_regs(struct jit_context *ctx, u32 mask, u32 excl, int depth)
++{
++	int reg;
++
++	for (reg = 0; reg < BITS_PER_BYTE * sizeof(mask); reg++)
++		if (mask & BIT(reg)) {
++			if ((excl & BIT(reg)) == 0) {
++				if (sizeof(long) == 4)
++					emit(ctx, lw, reg, depth, MIPS_R_SP);
++				else /* sizeof(long) == 8 */
++					emit(ctx, ld, reg, depth, MIPS_R_SP);
++			}
++			depth += sizeof(long);
++		}
++
++	return depth;
++}
++
++/* Compute the 28-bit jump target address from a BPF program location */
++int get_target(struct jit_context *ctx, u32 loc)
++{
++	u32 index = INDEX(ctx->descriptors[loc]);
++	unsigned long pc = (unsigned long)&ctx->target[ctx->jit_index];
++	unsigned long addr = (unsigned long)&ctx->target[index];
++
++	if (!ctx->target)
++		return 0;
++
++	if ((addr ^ pc) & ~MIPS_JMP_MASK)
++		return -1;
++
++	return addr & MIPS_JMP_MASK;
++}
++
++/* Compute the PC-relative offset to relative BPF program offset */
++int get_offset(const struct jit_context *ctx, int off)
++{
++	return (INDEX(ctx->descriptors[ctx->bpf_index + off]) -
++		ctx->jit_index - 1) * sizeof(u32);
++}
++
++/* dst = imm (register width) */
++void emit_mov_i(struct jit_context *ctx, u8 dst, s32 imm)
++{
++	if (imm >= -0x8000 && imm <= 0x7fff) {
++		emit(ctx, addiu, dst, MIPS_R_ZERO, imm);
++	} else {
++		emit(ctx, lui, dst, (s16)((u32)imm >> 16));
++		emit(ctx, ori, dst, dst, (u16)(imm & 0xffff));
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* dst = src (register width) */
++void emit_mov_r(struct jit_context *ctx, u8 dst, u8 src)
++{
++	emit(ctx, ori, dst, src, 0);
++	clobber_reg(ctx, dst);
++}
++
++/* Validate ALU immediate range */
++bool valid_alu_i(u8 op, s32 imm)
++{
++	switch (BPF_OP(op)) {
++	case BPF_NEG:
++	case BPF_LSH:
++	case BPF_RSH:
++	case BPF_ARSH:
++		/* All legal eBPF values are valid */
++		return true;
++	case BPF_ADD:
++		/* imm must be 16 bits */
++		return imm >= -0x8000 && imm <= 0x7fff;
++	case BPF_SUB:
++		/* -imm must be 16 bits */
++		return imm >= -0x7fff && imm <= 0x8000;
++	case BPF_AND:
++	case BPF_OR:
++	case BPF_XOR:
++		/* imm must be 16 bits unsigned */
++		return imm >= 0 && imm <= 0xffff;
++	case BPF_MUL:
++		/* imm must be zero or a positive power of two */
++		return imm == 0 || (imm > 0 && is_power_of_2(imm));
++	case BPF_DIV:
++	case BPF_MOD:
++		/* imm must be an 17-bit power of two */
++		return (u32)imm <= 0x10000 && is_power_of_2((u32)imm);
++	}
++	return false;
++}
++
++/* Rewrite ALU immediate operation */
++bool rewrite_alu_i(u8 op, s32 imm, u8 *alu, s32 *val)
++{
++	bool act = true;
++
++	switch (BPF_OP(op)) {
++	case BPF_LSH:
++	case BPF_RSH:
++	case BPF_ARSH:
++	case BPF_ADD:
++	case BPF_SUB:
++	case BPF_OR:
++	case BPF_XOR:
++		/* imm == 0 is a no-op */
++		act = imm != 0;
++		break;
++	case BPF_MUL:
++		if (imm == 1) {
++			/* dst * 1 is a no-op */
++			act = false;
++		} else if (imm == 0) {
++			/* dst * 0 is dst & 0 */
++			op = BPF_AND;
++		} else {
++			/* dst * (1 << n) is dst << n */
++			op = BPF_LSH;
++			imm = ilog2(abs(imm));
++		}
++		break;
++	case BPF_DIV:
++		if (imm == 1) {
++			/* dst / 1 is a no-op */
++			act = false;
++		} else {
++			/* dst / (1 << n) is dst >> n */
++			op = BPF_RSH;
++			imm = ilog2(imm);
++		}
++		break;
++	case BPF_MOD:
++		/* dst % (1 << n) is dst & ((1 << n) - 1) */
++		op = BPF_AND;
++		imm--;
++		break;
++	}
++
++	*alu = op;
++	*val = imm;
++	return act;
++}
++
++/* ALU immediate operation (32-bit) */
++void emit_alu_i(struct jit_context *ctx, u8 dst, s32 imm, u8 op)
++{
++	switch (BPF_OP(op)) {
++	/* dst = -dst */
++	case BPF_NEG:
++		emit(ctx, subu, dst, MIPS_R_ZERO, dst);
++		break;
++	/* dst = dst & imm */
++	case BPF_AND:
++		emit(ctx, andi, dst, dst, (u16)imm);
++		break;
++	/* dst = dst | imm */
++	case BPF_OR:
++		emit(ctx, ori, dst, dst, (u16)imm);
++		break;
++	/* dst = dst ^ imm */
++	case BPF_XOR:
++		emit(ctx, xori, dst, dst, (u16)imm);
++		break;
++	/* dst = dst << imm */
++	case BPF_LSH:
++		emit(ctx, sll, dst, dst, imm);
++		break;
++	/* dst = dst >> imm */
++	case BPF_RSH:
++		emit(ctx, srl, dst, dst, imm);
++		break;
++	/* dst = dst >> imm (arithmetic) */
++	case BPF_ARSH:
++		emit(ctx, sra, dst, dst, imm);
++		break;
++	/* dst = dst + imm */
++	case BPF_ADD:
++		emit(ctx, addiu, dst, dst, imm);
++		break;
++	/* dst = dst - imm */
++	case BPF_SUB:
++		emit(ctx, addiu, dst, dst, -imm);
++		break;
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* ALU register operation (32-bit) */
++void emit_alu_r(struct jit_context *ctx, u8 dst, u8 src, u8 op)
++{
++	switch (BPF_OP(op)) {
++	/* dst = dst & src */
++	case BPF_AND:
++		emit(ctx, and, dst, dst, src);
++		break;
++	/* dst = dst | src */
++	case BPF_OR:
++		emit(ctx, or, dst, dst, src);
++		break;
++	/* dst = dst ^ src */
++	case BPF_XOR:
++		emit(ctx, xor, dst, dst, src);
++		break;
++	/* dst = dst << src */
++	case BPF_LSH:
++		emit(ctx, sllv, dst, dst, src);
++		break;
++	/* dst = dst >> src */
++	case BPF_RSH:
++		emit(ctx, srlv, dst, dst, src);
++		break;
++	/* dst = dst >> src (arithmetic) */
++	case BPF_ARSH:
++		emit(ctx, srav, dst, dst, src);
++		break;
++	/* dst = dst + src */
++	case BPF_ADD:
++		emit(ctx, addu, dst, dst, src);
++		break;
++	/* dst = dst - src */
++	case BPF_SUB:
++		emit(ctx, subu, dst, dst, src);
++		break;
++	/* dst = dst * src */
++	case BPF_MUL:
++		if (cpu_has_mips32r1 || cpu_has_mips32r6) {
++			emit(ctx, mul, dst, dst, src);
++		} else {
++			emit(ctx, multu, dst, src);
++			emit(ctx, mflo, dst);
++		}
++		break;
++	/* dst = dst / src */
++	case BPF_DIV:
++		if (cpu_has_mips32r6) {
++			emit(ctx, divu_r6, dst, dst, src);
++		} else {
++			emit(ctx, divu, dst, src);
++			emit(ctx, mflo, dst);
++		}
++		break;
++	/* dst = dst % src */
++	case BPF_MOD:
++		if (cpu_has_mips32r6) {
++			emit(ctx, modu, dst, dst, src);
++		} else {
++			emit(ctx, divu, dst, src);
++			emit(ctx, mfhi, dst);
++		}
++		break;
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* Atomic read-modify-write (32-bit) */
++void emit_atomic_r(struct jit_context *ctx, u8 dst, u8 src, s16 off, u8 code)
++{
++	emit(ctx, ll, MIPS_R_T9, off, dst);
++	switch (code) {
++	case BPF_ADD:
++		emit(ctx, addu, MIPS_R_T8, MIPS_R_T9, src);
++		break;
++	case BPF_AND:
++		emit(ctx, and, MIPS_R_T8, MIPS_R_T9, src);
++		break;
++	case BPF_OR:
++		emit(ctx, or, MIPS_R_T8, MIPS_R_T9, src);
++		break;
++	case BPF_XOR:
++		emit(ctx, xor, MIPS_R_T8, MIPS_R_T9, src);
++		break;
++	}
++	emit(ctx, sc, MIPS_R_T8, off, dst);
++	emit(ctx, beqz, MIPS_R_T8, -16);
++	emit(ctx, nop); /* Delay slot */
++}
++
++/* Atomic compare-and-exchange (32-bit) */
++void emit_cmpxchg_r(struct jit_context *ctx, u8 dst, u8 src, u8 res, s16 off)
++{
++	emit(ctx, ll, MIPS_R_T9, off, dst);
++	emit(ctx, bne, MIPS_R_T9, res, 12);
++	emit(ctx, move, MIPS_R_T8, src);     /* Delay slot */
++	emit(ctx, sc, MIPS_R_T8, off, dst);
++	emit(ctx, beqz, MIPS_R_T8, -20);
++	emit(ctx, move, res, MIPS_R_T9);     /* Delay slot */
++	clobber_reg(ctx, res);
++}
++
++/* Swap bytes and truncate a register word or half word */
++void emit_bswap_r(struct jit_context *ctx, u8 dst, u32 width)
++{
++	u8 tmp = MIPS_R_T8;
++	u8 msk = MIPS_R_T9;
++
++	switch (width) {
++	/* Swap bytes in a word */
++	case 32:
++		if (cpu_has_mips32r2 || cpu_has_mips32r6) {
++			emit(ctx, wsbh, dst, dst);
++			emit(ctx, rotr, dst, dst, 16);
++		} else {
++			emit(ctx, sll, tmp, dst, 16);    /* tmp  = dst << 16 */
++			emit(ctx, srl, dst, dst, 16);    /* dst = dst >> 16  */
++			emit(ctx, or, dst, dst, tmp);    /* dst = dst | tmp  */
++
++			emit(ctx, lui, msk, 0xff);       /* msk = 0x00ff0000 */
++			emit(ctx, ori, msk, msk, 0xff);  /* msk = msk | 0xff */
++
++			emit(ctx, and, tmp, dst, msk);   /* tmp = dst & msk  */
++			emit(ctx, sll, tmp, tmp, 8);     /* tmp = tmp << 8   */
++			emit(ctx, srl, dst, dst, 8);     /* dst = dst >> 8   */
++			emit(ctx, and, dst, dst, msk);   /* dst = dst & msk  */
++			emit(ctx, or, dst, dst, tmp);    /* reg = dst | tmp  */
++		}
++		break;
++	/* Swap bytes in a half word */
++	case 16:
++		if (cpu_has_mips32r2 || cpu_has_mips32r6) {
++			emit(ctx, wsbh, dst, dst);
++			emit(ctx, andi, dst, dst, 0xffff);
++		} else {
++			emit(ctx, andi, tmp, dst, 0xff00); /* t = d & 0xff00 */
++			emit(ctx, srl, tmp, tmp, 8);       /* t = t >> 8     */
++			emit(ctx, andi, dst, dst, 0x00ff); /* d = d & 0x00ff */
++			emit(ctx, sll, dst, dst, 8);       /* d = d << 8     */
++			emit(ctx, or,  dst, dst, tmp);     /* d = d | t      */
++		}
++		break;
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* Validate jump immediate range */
++bool valid_jmp_i(u8 op, s32 imm)
++{
++	switch (op) {
++	case JIT_JNOP:
++		/* Immediate value not used */
++		return true;
++	case BPF_JEQ:
++	case BPF_JNE:
++		/* No immediate operation */
++		return false;
++	case BPF_JSET:
++	case JIT_JNSET:
++		/* imm must be 16 bits unsigned */
++		return imm >= 0 && imm <= 0xffff;
++	case BPF_JGE:
++	case BPF_JLT:
++	case BPF_JSGE:
++	case BPF_JSLT:
++		/* imm must be 16 bits */
++		return imm >= -0x8000 && imm <= 0x7fff;
++	case BPF_JGT:
++	case BPF_JLE:
++	case BPF_JSGT:
++	case BPF_JSLE:
++		/* imm + 1 must be 16 bits */
++		return imm >= -0x8001 && imm <= 0x7ffe;
++	}
++	return false;
++}
++
++/* Invert a conditional jump operation */
++static u8 invert_jmp(u8 op)
++{
++	switch (op) {
++	case BPF_JA: return JIT_JNOP;
++	case BPF_JEQ: return BPF_JNE;
++	case BPF_JNE: return BPF_JEQ;
++	case BPF_JSET: return JIT_JNSET;
++	case BPF_JGT: return BPF_JLE;
++	case BPF_JGE: return BPF_JLT;
++	case BPF_JLT: return BPF_JGE;
++	case BPF_JLE: return BPF_JGT;
++	case BPF_JSGT: return BPF_JSLE;
++	case BPF_JSGE: return BPF_JSLT;
++	case BPF_JSLT: return BPF_JSGE;
++	case BPF_JSLE: return BPF_JSGT;
++	}
++	return 0;
++}
++
++/* Prepare a PC-relative jump operation */
++static void setup_jmp(struct jit_context *ctx, u8 bpf_op,
++		      s16 bpf_off, u8 *jit_op, s32 *jit_off)
++{
++	u32 *descp = &ctx->descriptors[ctx->bpf_index];
++	int op = bpf_op;
++	int offset = 0;
++
++	/* Do not compute offsets on the first pass */
++	if (INDEX(*descp) == 0)
++		goto done;
++
++	/* Skip jumps never taken */
++	if (bpf_op == JIT_JNOP)
++		goto done;
++
++	/* Convert jumps always taken */
++	if (bpf_op == BPF_JA)
++		*descp |= JIT_DESC_CONVERT;
++
++	/*
++	 * Current ctx->jit_index points to the start of the branch preamble.
++	 * Since the preamble differs among different branch conditionals,
++	 * the current index cannot be used to compute the branch offset.
++	 * Instead, we use the offset table value for the next instruction,
++	 * which gives the index immediately after the branch delay slot.
++	 */
++	if (!CONVERTED(*descp)) {
++		int target = ctx->bpf_index + bpf_off + 1;
++		int origin = ctx->bpf_index + 1;
++
++		offset = (INDEX(ctx->descriptors[target]) -
++			  INDEX(ctx->descriptors[origin]) + 1) * sizeof(u32);
++	}
++
++	/*
++	 * The PC-relative branch offset field on MIPS is 18 bits signed,
++	 * so if the computed offset is larger than this we generate a an
++	 * absolute jump that we skip with an inverted conditional branch.
++	 */
++	if (CONVERTED(*descp) || offset < -0x20000 || offset > 0x1ffff) {
++		offset = 3 * sizeof(u32);
++		op = invert_jmp(bpf_op);
++		ctx->changes += !CONVERTED(*descp);
++		*descp |= JIT_DESC_CONVERT;
++	}
++
++done:
++	*jit_off = offset;
++	*jit_op = op;
++}
++
++/* Prepare a PC-relative jump operation with immediate conditional */
++void setup_jmp_i(struct jit_context *ctx, s32 imm, u8 width,
++		 u8 bpf_op, s16 bpf_off, u8 *jit_op, s32 *jit_off)
++{
++	bool always = false;
++	bool never = false;
++
++	switch (bpf_op) {
++	case BPF_JEQ:
++	case BPF_JNE:
++		break;
++	case BPF_JSET:
++	case BPF_JLT:
++		never = imm == 0;
++		break;
++	case BPF_JGE:
++		always = imm == 0;
++		break;
++	case BPF_JGT:
++		never = (u32)imm == U32_MAX;
++		break;
++	case BPF_JLE:
++		always = (u32)imm == U32_MAX;
++		break;
++	case BPF_JSGT:
++		never = imm == S32_MAX && width == 32;
++		break;
++	case BPF_JSGE:
++		always = imm == S32_MIN && width == 32;
++		break;
++	case BPF_JSLT:
++		never = imm == S32_MIN && width == 32;
++		break;
++	case BPF_JSLE:
++		always = imm == S32_MAX && width == 32;
++		break;
++	}
++
++	if (never)
++		bpf_op = JIT_JNOP;
++	if (always)
++		bpf_op = BPF_JA;
++	setup_jmp(ctx, bpf_op, bpf_off, jit_op, jit_off);
++}
++
++/* Prepare a PC-relative jump operation with register conditional */
++void setup_jmp_r(struct jit_context *ctx, bool same_reg,
++		 u8 bpf_op, s16 bpf_off, u8 *jit_op, s32 *jit_off)
++{
++	switch (bpf_op) {
++	case BPF_JSET:
++		break;
++	case BPF_JEQ:
++	case BPF_JGE:
++	case BPF_JLE:
++	case BPF_JSGE:
++	case BPF_JSLE:
++		if (same_reg)
++			bpf_op = BPF_JA;
++		break;
++	case BPF_JNE:
++	case BPF_JLT:
++	case BPF_JGT:
++	case BPF_JSGT:
++	case BPF_JSLT:
++		if (same_reg)
++			bpf_op = JIT_JNOP;
++		break;
++	}
++	setup_jmp(ctx, bpf_op, bpf_off, jit_op, jit_off);
++}
++
++/* Finish a PC-relative jump operation */
++int finish_jmp(struct jit_context *ctx, u8 jit_op, s16 bpf_off)
++{
++	/* Emit conditional branch delay slot */
++	if (jit_op != JIT_JNOP)
++		emit(ctx, nop);
++	/*
++	 * Emit an absolute long jump with delay slot,
++	 * if the PC-relative branch was converted.
++	 */
++	if (CONVERTED(ctx->descriptors[ctx->bpf_index])) {
++		int target = get_target(ctx, ctx->bpf_index + bpf_off + 1);
++
++		if (target < 0)
++			return -1;
++		emit(ctx, j, target);
++		emit(ctx, nop);
++	}
++	return 0;
++}
++
++/* Jump immediate (32-bit) */
++void emit_jmp_i(struct jit_context *ctx, u8 dst, s32 imm, s32 off, u8 op)
++{
++	switch (op) {
++	/* No-op, used internally for branch optimization */
++	case JIT_JNOP:
++		break;
++	/* PC += off if dst & imm */
++	case BPF_JSET:
++		emit(ctx, andi, MIPS_R_T9, dst, (u16)imm);
++		emit(ctx, bnez, MIPS_R_T9, off);
++		break;
++	/* PC += off if (dst & imm) == 0 (not in BPF, used for long jumps) */
++	case JIT_JNSET:
++		emit(ctx, andi, MIPS_R_T9, dst, (u16)imm);
++		emit(ctx, beqz, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst > imm */
++	case BPF_JGT:
++		emit(ctx, sltiu, MIPS_R_T9, dst, imm + 1);
++		emit(ctx, beqz, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst >= imm */
++	case BPF_JGE:
++		emit(ctx, sltiu, MIPS_R_T9, dst, imm);
++		emit(ctx, beqz, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst < imm */
++	case BPF_JLT:
++		emit(ctx, sltiu, MIPS_R_T9, dst, imm);
++		emit(ctx, bnez, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst <= imm */
++	case BPF_JLE:
++		emit(ctx, sltiu, MIPS_R_T9, dst, imm + 1);
++		emit(ctx, bnez, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst > imm (signed) */
++	case BPF_JSGT:
++		emit(ctx, slti, MIPS_R_T9, dst, imm + 1);
++		emit(ctx, beqz, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst >= imm (signed) */
++	case BPF_JSGE:
++		emit(ctx, slti, MIPS_R_T9, dst, imm);
++		emit(ctx, beqz, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst < imm (signed) */
++	case BPF_JSLT:
++		emit(ctx, slti, MIPS_R_T9, dst, imm);
++		emit(ctx, bnez, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst <= imm (signed) */
++	case BPF_JSLE:
++		emit(ctx, slti, MIPS_R_T9, dst, imm + 1);
++		emit(ctx, bnez, MIPS_R_T9, off);
++		break;
++	}
++}
++
++/* Jump register (32-bit) */
++void emit_jmp_r(struct jit_context *ctx, u8 dst, u8 src, s32 off, u8 op)
++{
++	switch (op) {
++	/* No-op, used internally for branch optimization */
++	case JIT_JNOP:
++		break;
++	/* PC += off if dst == src */
++	case BPF_JEQ:
++		emit(ctx, beq, dst, src, off);
++		break;
++	/* PC += off if dst != src */
++	case BPF_JNE:
++		emit(ctx, bne, dst, src, off);
++		break;
++	/* PC += off if dst & src */
++	case BPF_JSET:
++		emit(ctx, and, MIPS_R_T9, dst, src);
++		emit(ctx, bnez, MIPS_R_T9, off);
++		break;
++	/* PC += off if (dst & imm) == 0 (not in BPF, used for long jumps) */
++	case JIT_JNSET:
++		emit(ctx, and, MIPS_R_T9, dst, src);
++		emit(ctx, beqz, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst > src */
++	case BPF_JGT:
++		emit(ctx, sltu, MIPS_R_T9, src, dst);
++		emit(ctx, bnez, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst >= src */
++	case BPF_JGE:
++		emit(ctx, sltu, MIPS_R_T9, dst, src);
++		emit(ctx, beqz, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst < src */
++	case BPF_JLT:
++		emit(ctx, sltu, MIPS_R_T9, dst, src);
++		emit(ctx, bnez, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst <= src */
++	case BPF_JLE:
++		emit(ctx, sltu, MIPS_R_T9, src, dst);
++		emit(ctx, beqz, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst > src (signed) */
++	case BPF_JSGT:
++		emit(ctx, slt, MIPS_R_T9, src, dst);
++		emit(ctx, bnez, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst >= src (signed) */
++	case BPF_JSGE:
++		emit(ctx, slt, MIPS_R_T9, dst, src);
++		emit(ctx, beqz, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst < src (signed) */
++	case BPF_JSLT:
++		emit(ctx, slt, MIPS_R_T9, dst, src);
++		emit(ctx, bnez, MIPS_R_T9, off);
++		break;
++	/* PC += off if dst <= src (signed) */
++	case BPF_JSLE:
++		emit(ctx, slt, MIPS_R_T9, src, dst);
++		emit(ctx, beqz, MIPS_R_T9, off);
++		break;
++	}
++}
++
++/* Jump always */
++int emit_ja(struct jit_context *ctx, s16 off)
++{
++	int target = get_target(ctx, ctx->bpf_index + off + 1);
++
++	if (target < 0)
++		return -1;
++	emit(ctx, j, target);
++	emit(ctx, nop);
++	return 0;
++}
++
++/* Jump to epilogue */
++int emit_exit(struct jit_context *ctx)
++{
++	int target = get_target(ctx, ctx->program->len);
++
++	if (target < 0)
++		return -1;
++	emit(ctx, j, target);
++	emit(ctx, nop);
++	return 0;
++}
++
++/* Build the program body from eBPF bytecode */
++static int build_body(struct jit_context *ctx)
++{
++	const struct bpf_prog *prog = ctx->program;
++	unsigned int i;
++
++	ctx->stack_used = 0;
++	for (i = 0; i < prog->len; i++) {
++		const struct bpf_insn *insn = &prog->insnsi[i];
++		u32 *descp = &ctx->descriptors[i];
++		int ret;
++
++		access_reg(ctx, insn->src_reg);
++		access_reg(ctx, insn->dst_reg);
++
++		ctx->bpf_index = i;
++		if (ctx->target == NULL) {
++			ctx->changes += INDEX(*descp) != ctx->jit_index;
++			*descp &= JIT_DESC_CONVERT;
++			*descp |= ctx->jit_index;
++		}
++
++		ret = build_insn(insn, ctx);
++		if (ret < 0)
++			return ret;
++
++		if (ret > 0) {
++			i++;
++			if (ctx->target == NULL)
++				descp[1] = ctx->jit_index;
++		}
++	}
++
++	/* Store the end offset, where the epilogue begins */
++	ctx->descriptors[prog->len] = ctx->jit_index;
++	return 0;
++}
++
++/* Set the branch conversion flag on all instructions */
++static void set_convert_flag(struct jit_context *ctx, bool enable)
++{
++	const struct bpf_prog *prog = ctx->program;
++	u32 flag = enable ? JIT_DESC_CONVERT : 0;
++	unsigned int i;
++
++	for (i = 0; i <= prog->len; i++)
++		ctx->descriptors[i] = INDEX(ctx->descriptors[i]) | flag;
++}
++
++static void jit_fill_hole(void *area, unsigned int size)
++{
++	u32 *p;
++
++	/* We are guaranteed to have aligned memory. */
++	for (p = area; size >= sizeof(u32); size -= sizeof(u32))
++		uasm_i_break(&p, BRK_BUG); /* Increments p */
++}
++
++bool bpf_jit_needs_zext(void)
++{
++	return true;
++}
++
++struct bpf_prog *bpf_int_jit_compile(struct bpf_prog *prog)
++{
++	struct bpf_prog *tmp, *orig_prog = prog;
++	struct bpf_binary_header *header = NULL;
++	struct jit_context ctx;
++	bool tmp_blinded = false;
++	unsigned int tmp_idx;
++	unsigned int image_size;
++	u8 *image_ptr;
++	int tries;
++
++	/*
++	 * If BPF JIT was not enabled then we must fall back to
++	 * the interpreter.
++	 */
++	if (!prog->jit_requested)
++		return orig_prog;
++	/*
++	 * If constant blinding was enabled and we failed during blinding
++	 * then we must fall back to the interpreter. Otherwise, we save
++	 * the new JITed code.
++	 */
++	tmp = bpf_jit_blind_constants(prog);
++	if (IS_ERR(tmp))
++		return orig_prog;
++	if (tmp != prog) {
++		tmp_blinded = true;
++		prog = tmp;
++	}
++
++	memset(&ctx, 0, sizeof(ctx));
++	ctx.program = prog;
++
++	/*
++	 * Not able to allocate memory for descriptors[], then
++	 * we must fall back to the interpreter
++	 */
++	ctx.descriptors = kcalloc(prog->len + 1, sizeof(*ctx.descriptors),
++				  GFP_KERNEL);
++	if (ctx.descriptors == NULL)
++		goto out_err;
++
++	/* First pass discovers used resources */
++	if (build_body(&ctx) < 0)
++		goto out_err;
++	/*
++	 * Second pass computes instruction offsets.
++	 * If any PC-relative branches are out of range, a sequence of
++	 * a PC-relative branch + a jump is generated, and we have to
++	 * try again from the beginning to generate the new offsets.
++	 * This is done until no additional conversions are necessary.
++	 * The last two iterations are done with all branches being
++	 * converted, to guarantee offset table convergence within a
++	 * fixed number of iterations.
++	 */
++	ctx.jit_index = 0;
++	build_prologue(&ctx);
++	tmp_idx = ctx.jit_index;
++
++	tries = JIT_MAX_ITERATIONS;
++	do {
++		ctx.jit_index = tmp_idx;
++		ctx.changes = 0;
++		if (tries == 2)
++			set_convert_flag(&ctx, true);
++		if (build_body(&ctx) < 0)
++			goto out_err;
++	} while (ctx.changes > 0 && --tries > 0);
++
++	if (WARN_ONCE(ctx.changes > 0, "JIT offsets failed to converge"))
++		goto out_err;
++
++	build_epilogue(&ctx, MIPS_R_RA);
++
++	/* Now we know the size of the structure to make */
++	image_size = sizeof(u32) * ctx.jit_index;
++	header = bpf_jit_binary_alloc(image_size, &image_ptr,
++				      sizeof(u32), jit_fill_hole);
++	/*
++	 * Not able to allocate memory for the structure then
++	 * we must fall back to the interpretation
++	 */
++	if (header == NULL)
++		goto out_err;
++
++	/* Actual pass to generate final JIT code */
++	ctx.target = (u32 *)image_ptr;
++	ctx.jit_index = 0;
++
++	/*
++	 * If building the JITed code fails somehow,
++	 * we fall back to the interpretation.
++	 */
++	build_prologue(&ctx);
++	if (build_body(&ctx) < 0)
++		goto out_err;
++	build_epilogue(&ctx, MIPS_R_RA);
++
++	/* Populate line info meta data */
++	set_convert_flag(&ctx, false);
++	bpf_prog_fill_jited_linfo(prog, &ctx.descriptors[1]);
++
++	/* Set as read-only exec and flush instruction cache */
++	bpf_jit_binary_lock_ro(header);
++	flush_icache_range((unsigned long)header,
++			   (unsigned long)&ctx.target[ctx.jit_index]);
++
++	if (bpf_jit_enable > 1)
++		bpf_jit_dump(prog->len, image_size, 2, ctx.target);
++
++	prog->bpf_func = (void *)ctx.target;
++	prog->jited = 1;
++	prog->jited_len = image_size;
++
++out:
++	if (tmp_blinded)
++		bpf_jit_prog_release_other(prog, prog == orig_prog ?
++					   tmp : orig_prog);
++	kfree(ctx.descriptors);
++	return prog;
++
++out_err:
++	prog = orig_prog;
++	if (header)
++		bpf_jit_binary_free(header);
++	goto out;
++}
+--- /dev/null
++++ b/arch/mips/net/bpf_jit_comp.h
+@@ -0,0 +1,211 @@
++/* SPDX-License-Identifier: GPL-2.0-only */
++/*
++ * Just-In-Time compiler for eBPF bytecode on 32-bit and 64-bit MIPS.
++ *
++ * Copyright (c) 2021 Anyfi Networks AB.
++ * Author: Johan Almbladh <[email protected]>
++ *
++ * Based on code and ideas from
++ * Copyright (c) 2017 Cavium, Inc.
++ * Copyright (c) 2017 Shubham Bansal <[email protected]>
++ * Copyright (c) 2011 Mircea Gherzan <[email protected]>
++ */
++
++#ifndef _BPF_JIT_COMP_H
++#define _BPF_JIT_COMP_H
++
++/* MIPS registers */
++#define MIPS_R_ZERO	0   /* Const zero */
++#define MIPS_R_AT	1   /* Asm temp   */
++#define MIPS_R_V0	2   /* Result     */
++#define MIPS_R_V1	3   /* Result     */
++#define MIPS_R_A0	4   /* Argument   */
++#define MIPS_R_A1	5   /* Argument   */
++#define MIPS_R_A2	6   /* Argument   */
++#define MIPS_R_A3	7   /* Argument   */
++#define MIPS_R_A4	8   /* Arg (n64)  */
++#define MIPS_R_A5	9   /* Arg (n64)  */
++#define MIPS_R_A6	10  /* Arg (n64)  */
++#define MIPS_R_A7	11  /* Arg (n64)  */
++#define MIPS_R_T0	8   /* Temp (o32) */
++#define MIPS_R_T1	9   /* Temp (o32) */
++#define MIPS_R_T2	10  /* Temp (o32) */
++#define MIPS_R_T3	11  /* Temp (o32) */
++#define MIPS_R_T4	12  /* Temporary  */
++#define MIPS_R_T5	13  /* Temporary  */
++#define MIPS_R_T6	14  /* Temporary  */
++#define MIPS_R_T7	15  /* Temporary  */
++#define MIPS_R_S0	16  /* Saved      */
++#define MIPS_R_S1	17  /* Saved      */
++#define MIPS_R_S2	18  /* Saved      */
++#define MIPS_R_S3	19  /* Saved      */
++#define MIPS_R_S4	20  /* Saved      */
++#define MIPS_R_S5	21  /* Saved      */
++#define MIPS_R_S6	22  /* Saved      */
++#define MIPS_R_S7	23  /* Saved      */
++#define MIPS_R_T8	24  /* Temporary  */
++#define MIPS_R_T9	25  /* Temporary  */
++/*      MIPS_R_K0	26     Reserved   */
++/*      MIPS_R_K1	27     Reserved   */
++#define MIPS_R_GP	28  /* Global ptr */
++#define MIPS_R_SP	29  /* Stack ptr  */
++#define MIPS_R_FP	30  /* Frame ptr  */
++#define MIPS_R_RA	31  /* Return     */
++
++/*
++ * Jump address mask for immediate jumps. The four most significant bits
++ * must be equal to PC.
++ */
++#define MIPS_JMP_MASK	0x0fffffffUL
++
++/* Maximum number of iterations in offset table computation */
++#define JIT_MAX_ITERATIONS	8
++
++/*
++ * Jump pseudo-instructions used internally
++ * for branch conversion and branch optimization.
++ */
++#define JIT_JNSET	0xe0
++#define JIT_JNOP	0xf0
++
++/* Descriptor flag for PC-relative branch conversion */
++#define JIT_DESC_CONVERT	BIT(31)
++
++/* JIT context for an eBPF program */
++struct jit_context {
++	struct bpf_prog *program;     /* The eBPF program being JITed        */
++	u32 *descriptors;             /* eBPF to JITed CPU insn descriptors  */
++	u32 *target;                  /* JITed code buffer                   */
++	u32 bpf_index;                /* Index of current BPF program insn   */
++	u32 jit_index;                /* Index of current JIT target insn    */
++	u32 changes;                  /* Number of PC-relative branch conv   */
++	u32 accessed;                 /* Bit mask of read eBPF registers     */
++	u32 clobbered;                /* Bit mask of modified CPU registers  */
++	u32 stack_size;               /* Total allocated stack size in bytes */
++	u32 saved_size;               /* Size of callee-saved registers      */
++	u32 stack_used;               /* Stack size used for function calls  */
++};
++
++/* Emit the instruction if the JIT memory space has been allocated */
++#define emit(ctx, func, ...)					\
++do {								\
++	if ((ctx)->target != NULL) {				\
++		u32 *p = &(ctx)->target[ctx->jit_index];	\
++		uasm_i_##func(&p, ##__VA_ARGS__);		\
++	}							\
++	(ctx)->jit_index++;					\
++} while (0)
++
++/*
++ * Mark a BPF register as accessed, it needs to be
++ * initialized by the program if expected, e.g. FP.
++ */
++static inline void access_reg(struct jit_context *ctx, u8 reg)
++{
++	ctx->accessed |= BIT(reg);
++}
++
++/*
++ * Mark a CPU register as clobbered, it needs to be
++ * saved/restored by the program if callee-saved.
++ */
++static inline void clobber_reg(struct jit_context *ctx, u8 reg)
++{
++	ctx->clobbered |= BIT(reg);
++}
++
++/*
++ * Push registers on the stack, starting at a given depth from the stack
++ * pointer and increasing. The next depth to be written is returned.
++ */
++int push_regs(struct jit_context *ctx, u32 mask, u32 excl, int depth);
++
++/*
++ * Pop registers from the stack, starting at a given depth from the stack
++ * pointer and increasing. The next depth to be read is returned.
++ */
++int pop_regs(struct jit_context *ctx, u32 mask, u32 excl, int depth);
++
++/* Compute the 28-bit jump target address from a BPF program location */
++int get_target(struct jit_context *ctx, u32 loc);
++
++/* Compute the PC-relative offset corresponding to a relative BPF program offset */
++int get_offset(const struct jit_context *ctx, int off);
++
++/* dst = imm (32-bit) */
++void emit_mov_i(struct jit_context *ctx, u8 dst, s32 imm);
++
++/* dst = src (32-bit) */
++void emit_mov_r(struct jit_context *ctx, u8 dst, u8 src);
++
++/* Validate ALU/ALU64 immediate range */
++bool valid_alu_i(u8 op, s32 imm);
++
++/* Rewrite ALU/ALU64 immediate operation */
++bool rewrite_alu_i(u8 op, s32 imm, u8 *alu, s32 *val);
++
++/* ALU immediate operation (32-bit) */
++void emit_alu_i(struct jit_context *ctx, u8 dst, s32 imm, u8 op);
++
++/* ALU register operation (32-bit) */
++void emit_alu_r(struct jit_context *ctx, u8 dst, u8 src, u8 op);
++
++/* Atomic read-modify-write (32-bit) */
++void emit_atomic_r(struct jit_context *ctx, u8 dst, u8 src, s16 off, u8 code);
++
++/* Atomic compare-and-exchange (32-bit) */
++void emit_cmpxchg_r(struct jit_context *ctx, u8 dst, u8 src, u8 res, s16 off);
++
++/* Swap bytes and truncate a register word or half word */
++void emit_bswap_r(struct jit_context *ctx, u8 dst, u32 width);
++
++/* Validate JMP/JMP32 immediate range */
++bool valid_jmp_i(u8 op, s32 imm);
++
++/* Prepare a PC-relative jump operation with immediate conditional */
++void setup_jmp_i(struct jit_context *ctx, s32 imm, u8 width,
++		 u8 bpf_op, s16 bpf_off, u8 *jit_op, s32 *jit_off);
++
++/* Prepare a PC-relative jump operation with register conditional */
++void setup_jmp_r(struct jit_context *ctx, bool same_reg,
++		 u8 bpf_op, s16 bpf_off, u8 *jit_op, s32 *jit_off);
++
++/* Finish a PC-relative jump operation */
++int finish_jmp(struct jit_context *ctx, u8 jit_op, s16 bpf_off);
++
++/* Conditional JMP/JMP32 immediate */
++void emit_jmp_i(struct jit_context *ctx, u8 dst, s32 imm, s32 off, u8 op);
++
++/* Conditional JMP/JMP32 register */
++void emit_jmp_r(struct jit_context *ctx, u8 dst, u8 src, s32 off, u8 op);
++
++/* Jump always */
++int emit_ja(struct jit_context *ctx, s16 off);
++
++/* Jump to epilogue */
++int emit_exit(struct jit_context *ctx);
++
++/*
++ * Build program prologue to set up the stack and registers.
++ * This function is implemented separately for 32-bit and 64-bit JITs.
++ */
++void build_prologue(struct jit_context *ctx);
++
++/*
++ * Build the program epilogue to restore the stack and registers.
++ * This function is implemented separately for 32-bit and 64-bit JITs.
++ */
++void build_epilogue(struct jit_context *ctx, int dest_reg);
++
++/*
++ * Convert an eBPF instruction to a native instruction, i.e.
++ * JIT one eBPF instruction.
++ * Returns:
++ *	0  - Successfully JITed an 8-byte eBPF instruction
++ *	>0 - Successfully JITed a 16-byte eBPF instruction
++ *	<0 - Failed to JIT.
++ * This function is implemented separately for 32-bit and 64-bit JITs.
++ */
++int build_insn(const struct bpf_insn *insn, struct jit_context *ctx);
++
++#endif /* _BPF_JIT_COMP_H */
+--- /dev/null
++++ b/arch/mips/net/bpf_jit_comp32.c
+@@ -0,0 +1,1741 @@
++// SPDX-License-Identifier: GPL-2.0-only
++/*
++ * Just-In-Time compiler for eBPF bytecode on MIPS.
++ * Implementation of JIT functions for 32-bit CPUs.
++ *
++ * Copyright (c) 2021 Anyfi Networks AB.
++ * Author: Johan Almbladh <[email protected]>
++ *
++ * Based on code and ideas from
++ * Copyright (c) 2017 Cavium, Inc.
++ * Copyright (c) 2017 Shubham Bansal <[email protected]>
++ * Copyright (c) 2011 Mircea Gherzan <[email protected]>
++ */
++
++#include <linux/math64.h>
++#include <linux/errno.h>
++#include <linux/filter.h>
++#include <linux/bpf.h>
++#include <asm/cpu-features.h>
++#include <asm/isa-rev.h>
++#include <asm/uasm.h>
++
++#include "bpf_jit_comp.h"
++
++/* MIPS a4-a7 are not available in the o32 ABI */
++#undef MIPS_R_A4
++#undef MIPS_R_A5
++#undef MIPS_R_A6
++#undef MIPS_R_A7
++
++/* Stack is 8-byte aligned in o32 ABI */
++#define MIPS_STACK_ALIGNMENT 8
++
++/*
++ * The top 16 bytes of a stack frame is reserved for the callee in O32 ABI.
++ * This corresponds to stack space for register arguments a0-a3.
++ */
++#define JIT_RESERVED_STACK 16
++
++/* Temporary 64-bit register used by JIT */
++#define JIT_REG_TMP MAX_BPF_JIT_REG
++
++/*
++ * Number of prologue bytes to skip when doing a tail call.
++ * Tail call count (TCC) initialization (8 bytes) always, plus
++ * the a0-to-R1 context move (4 bytes) if big endian.
++ */
++#ifdef __BIG_ENDIAN
++#define JIT_TCALL_SKIP 12
++#else
++#define JIT_TCALL_SKIP 8
++#endif
++
++/* CPU registers holding the callee return value */
++#define JIT_RETURN_REGS	  \
++	(BIT(MIPS_R_V0) | \
++	 BIT(MIPS_R_V1))
++
++/* CPU registers arguments passed to callee directly */
++#define JIT_ARG_REGS      \
++	(BIT(MIPS_R_A0) | \
++	 BIT(MIPS_R_A1) | \
++	 BIT(MIPS_R_A2) | \
++	 BIT(MIPS_R_A3))
++
++/* CPU register arguments passed to callee on stack */
++#define JIT_STACK_REGS    \
++	(BIT(MIPS_R_T0) | \
++	 BIT(MIPS_R_T1) | \
++	 BIT(MIPS_R_T2) | \
++	 BIT(MIPS_R_T3) | \
++	 BIT(MIPS_R_T4) | \
++	 BIT(MIPS_R_T5))
++
++/* Caller-saved CPU registers */
++#define JIT_CALLER_REGS    \
++	(JIT_RETURN_REGS | \
++	 JIT_ARG_REGS    | \
++	 JIT_STACK_REGS)
++
++/* Callee-saved CPU registers */
++#define JIT_CALLEE_REGS   \
++	(BIT(MIPS_R_S0) | \
++	 BIT(MIPS_R_S1) | \
++	 BIT(MIPS_R_S2) | \
++	 BIT(MIPS_R_S3) | \
++	 BIT(MIPS_R_S4) | \
++	 BIT(MIPS_R_S5) | \
++	 BIT(MIPS_R_S6) | \
++	 BIT(MIPS_R_S7) | \
++	 BIT(MIPS_R_GP) | \
++	 BIT(MIPS_R_FP) | \
++	 BIT(MIPS_R_RA))
++
++/*
++ * Mapping of 64-bit eBPF registers to 32-bit native MIPS registers.
++ *
++ * 1) Native register pairs are ordered according to CPU endianness, following
++ *    the MIPS convention for passing 64-bit arguments and return values.
++ * 2) The eBPF return value, arguments and callee-saved registers are mapped
++ *    to their native MIPS equivalents.
++ * 3) Since the 32 highest bits in the eBPF FP register are always zero,
++ *    only one general-purpose register is actually needed for the mapping.
++ *    We use the fp register for this purpose, and map the highest bits to
++ *    the MIPS register r0 (zero).
++ * 4) We use the MIPS gp and at registers as internal temporary registers
++ *    for constant blinding. The gp register is callee-saved.
++ * 5) One 64-bit temporary register is mapped for use when sign-extending
++ *    immediate operands. MIPS registers t6-t9 are available to the JIT
++ *    as temporaries when implementing complex 64-bit operations.
++ *
++ * With this scheme, all eBPF registers are mapped to native MIPS
++ * registers without having to use any stack scratch space. The direct
++ * register mapping (2) simplifies the handling of function calls.
++ */
++static const u8 bpf2mips32[][2] = {
++	/* Return value from in-kernel function, and exit value from eBPF */
++	[BPF_REG_0] = {MIPS_R_V1, MIPS_R_V0},
++	/* Arguments from eBPF program to in-kernel function */
++	[BPF_REG_1] = {MIPS_R_A1, MIPS_R_A0},
++	[BPF_REG_2] = {MIPS_R_A3, MIPS_R_A2},
++	/* Remaining arguments, to be passed on the stack per O32 ABI */
++	[BPF_REG_3] = {MIPS_R_T1, MIPS_R_T0},
++	[BPF_REG_4] = {MIPS_R_T3, MIPS_R_T2},
++	[BPF_REG_5] = {MIPS_R_T5, MIPS_R_T4},
++	/* Callee-saved registers that in-kernel function will preserve */
++	[BPF_REG_6] = {MIPS_R_S1, MIPS_R_S0},
++	[BPF_REG_7] = {MIPS_R_S3, MIPS_R_S2},
++	[BPF_REG_8] = {MIPS_R_S5, MIPS_R_S4},
++	[BPF_REG_9] = {MIPS_R_S7, MIPS_R_S6},
++	/* Read-only frame pointer to access the eBPF stack */
++#ifdef __BIG_ENDIAN
++	[BPF_REG_FP] = {MIPS_R_FP, MIPS_R_ZERO},
++#else
++	[BPF_REG_FP] = {MIPS_R_ZERO, MIPS_R_FP},
++#endif
++	/* Temporary register for blinding constants */
++	[BPF_REG_AX] = {MIPS_R_GP, MIPS_R_AT},
++	/* Temporary register for internal JIT use */
++	[JIT_REG_TMP] = {MIPS_R_T7, MIPS_R_T6},
++};
++
++/* Get low CPU register for a 64-bit eBPF register mapping */
++static inline u8 lo(const u8 reg[])
++{
++#ifdef __BIG_ENDIAN
++	return reg[0];
++#else
++	return reg[1];
++#endif
++}
++
++/* Get high CPU register for a 64-bit eBPF register mapping */
++static inline u8 hi(const u8 reg[])
++{
++#ifdef __BIG_ENDIAN
++	return reg[1];
++#else
++	return reg[0];
++#endif
++}
++
++/*
++ * Mark a 64-bit CPU register pair as clobbered; if callee-saved,
++ * the prologue/epilogue must save and restore it.
++ */
++static void clobber_reg64(struct jit_context *ctx, const u8 reg[])
++{
++	clobber_reg(ctx, reg[0]);
++	clobber_reg(ctx, reg[1]);
++}
++
++/* dst = imm (sign-extended) */
++static void emit_mov_se_i64(struct jit_context *ctx, const u8 dst[], s32 imm)
++{
++	emit_mov_i(ctx, lo(dst), imm);
++	if (imm < 0)
++		emit(ctx, addiu, hi(dst), MIPS_R_ZERO, -1);
++	else
++		emit(ctx, move, hi(dst), MIPS_R_ZERO);
++	clobber_reg64(ctx, dst);
++}
++
++/* Zero extension, if verifier does not do it for us  */
++static void emit_zext_ver(struct jit_context *ctx, const u8 dst[])
++{
++	if (!ctx->program->aux->verifier_zext) {
++		emit(ctx, move, hi(dst), MIPS_R_ZERO);
++		clobber_reg(ctx, hi(dst));
++	}
++}
++
++/* Load delay slot, if ISA mandates it */
++static void emit_load_delay(struct jit_context *ctx)
++{
++	if (!cpu_has_mips_2_3_4_5_r)
++		emit(ctx, nop);
++}
++
++/* ALU immediate operation (64-bit) */
++static void emit_alu_i64(struct jit_context *ctx,
++			 const u8 dst[], s32 imm, u8 op)
++{
++	u8 src = MIPS_R_T6;
++
++	/*
++	 * ADD/SUB with all but the max negative imm can be handled by
++	 * inverting the operation and the imm value, saving one insn.
++	 */
++	if (imm > S32_MIN && imm < 0)
++		switch (op) {
++		case BPF_ADD:
++			op = BPF_SUB;
++			imm = -imm;
++			break;
++		case BPF_SUB:
++			op = BPF_ADD;
++			imm = -imm;
++			break;
++		}
++
++	/* Move immediate to temporary register */
++	emit_mov_i(ctx, src, imm);
++
++	switch (op) {
++	/* dst = dst + imm */
++	case BPF_ADD:
++		emit(ctx, addu, lo(dst), lo(dst), src);
++		emit(ctx, sltu, MIPS_R_T9, lo(dst), src);
++		emit(ctx, addu, hi(dst), hi(dst), MIPS_R_T9);
++		if (imm < 0)
++			emit(ctx, addiu, hi(dst), hi(dst), -1);
++		break;
++	/* dst = dst - imm */
++	case BPF_SUB:
++		emit(ctx, sltu, MIPS_R_T9, lo(dst), src);
++		emit(ctx, subu, lo(dst), lo(dst), src);
++		emit(ctx, subu, hi(dst), hi(dst), MIPS_R_T9);
++		if (imm < 0)
++			emit(ctx, addiu, hi(dst), hi(dst), 1);
++		break;
++	/* dst = dst | imm */
++	case BPF_OR:
++		emit(ctx, or, lo(dst), lo(dst), src);
++		if (imm < 0)
++			emit(ctx, addiu, hi(dst), MIPS_R_ZERO, -1);
++		break;
++	/* dst = dst & imm */
++	case BPF_AND:
++		emit(ctx, and, lo(dst), lo(dst), src);
++		if (imm >= 0)
++			emit(ctx, move, hi(dst), MIPS_R_ZERO);
++		break;
++	/* dst = dst ^ imm */
++	case BPF_XOR:
++		emit(ctx, xor, lo(dst), lo(dst), src);
++		if (imm < 0) {
++			emit(ctx, subu, hi(dst), MIPS_R_ZERO, hi(dst));
++			emit(ctx, addiu, hi(dst), hi(dst), -1);
++		}
++		break;
++	}
++	clobber_reg64(ctx, dst);
++}
++
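The BPF_ADD case above implements 64-bit addition of a sign-extended immediate on 32-bit halves: the carry out of the low word is recovered with an unsigned compare, and a negative immediate additionally subtracts one from the high word for its sign extension. A plain-C restatement of that scheme (illustration only, not part of the emitted code; u32/s32 are the usual kernel types):

/* 64-bit "dst += imm" on 32-bit halves, as in the BPF_ADD case above */
static void add64_imm(u32 *dst_lo, u32 *dst_hi, s32 imm)
{
	u32 src = (u32)imm;

	*dst_lo += src;
	*dst_hi += (*dst_lo < src);	/* carry out of the low word */
	if (imm < 0)
		*dst_hi -= 1;		/* high word of the sign-extended imm */
}
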
++/* ALU register operation (64-bit) */
++static void emit_alu_r64(struct jit_context *ctx,
++			 const u8 dst[], const u8 src[], u8 op)
++{
++	switch (BPF_OP(op)) {
++	/* dst = dst + src */
++	case BPF_ADD:
++		if (src == dst) {
++			emit(ctx, srl, MIPS_R_T9, lo(dst), 31);
++			emit(ctx, addu, lo(dst), lo(dst), lo(dst));
++		} else {
++			emit(ctx, addu, lo(dst), lo(dst), lo(src));
++			emit(ctx, sltu, MIPS_R_T9, lo(dst), lo(src));
++		}
++		emit(ctx, addu, hi(dst), hi(dst), hi(src));
++		emit(ctx, addu, hi(dst), hi(dst), MIPS_R_T9);
++		break;
++	/* dst = dst - src */
++	case BPF_SUB:
++		emit(ctx, sltu, MIPS_R_T9, lo(dst), lo(src));
++		emit(ctx, subu, lo(dst), lo(dst), lo(src));
++		emit(ctx, subu, hi(dst), hi(dst), hi(src));
++		emit(ctx, subu, hi(dst), hi(dst), MIPS_R_T9);
++		break;
++	/* dst = dst | src */
++	case BPF_OR:
++		emit(ctx, or, lo(dst), lo(dst), lo(src));
++		emit(ctx, or, hi(dst), hi(dst), hi(src));
++		break;
++	/* dst = dst & src */
++	case BPF_AND:
++		emit(ctx, and, lo(dst), lo(dst), lo(src));
++		emit(ctx, and, hi(dst), hi(dst), hi(src));
++		break;
++	/* dst = dst ^ src */
++	case BPF_XOR:
++		emit(ctx, xor, lo(dst), lo(dst), lo(src));
++		emit(ctx, xor, hi(dst), hi(dst), hi(src));
++		break;
++	}
++	clobber_reg64(ctx, dst);
++}
++
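The register-register BPF_SUB case uses the same idea with a borrow instead of a carry, which is why the unsigned compare is emitted before the low-word subtraction. Equivalent C (illustration only):

/* 64-bit "dst -= src" on 32-bit halves, mirroring the BPF_SUB case above */
static void sub64(u32 *dst_lo, u32 *dst_hi, u32 src_lo, u32 src_hi)
{
	u32 borrow = (*dst_lo < src_lo);	/* taken before the subtraction */

	*dst_lo -= src_lo;
	*dst_hi -= src_hi;
	*dst_hi -= borrow;
}
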
++/* ALU invert (64-bit) */
++static void emit_neg_i64(struct jit_context *ctx, const u8 dst[])
++{
++	emit(ctx, sltu, MIPS_R_T9, MIPS_R_ZERO, lo(dst));
++	emit(ctx, subu, lo(dst), MIPS_R_ZERO, lo(dst));
++	emit(ctx, subu, hi(dst), MIPS_R_ZERO, hi(dst));
++	emit(ctx, subu, hi(dst), hi(dst), MIPS_R_T9);
++
++	clobber_reg64(ctx, dst);
++}
++
++/* ALU shift immediate (64-bit) */
++static void emit_shift_i64(struct jit_context *ctx,
++			   const u8 dst[], u32 imm, u8 op)
++{
++	switch (BPF_OP(op)) {
++	/* dst = dst << imm */
++	case BPF_LSH:
++		if (imm < 32) {
++			emit(ctx, srl, MIPS_R_T9, lo(dst), 32 - imm);
++			emit(ctx, sll, lo(dst), lo(dst), imm);
++			emit(ctx, sll, hi(dst), hi(dst), imm);
++			emit(ctx, or, hi(dst), hi(dst), MIPS_R_T9);
++		} else {
++			emit(ctx, sll, hi(dst), lo(dst), imm - 32);
++			emit(ctx, move, lo(dst), MIPS_R_ZERO);
++		}
++		break;
++	/* dst = dst >> imm */
++	case BPF_RSH:
++		if (imm < 32) {
++			emit(ctx, sll, MIPS_R_T9, hi(dst), 32 - imm);
++			emit(ctx, srl, lo(dst), lo(dst), imm);
++			emit(ctx, srl, hi(dst), hi(dst), imm);
++			emit(ctx, or, lo(dst), lo(dst), MIPS_R_T9);
++		} else {
++			emit(ctx, srl, lo(dst), hi(dst), imm - 32);
++			emit(ctx, move, hi(dst), MIPS_R_ZERO);
++		}
++		break;
++	/* dst = dst >> imm (arithmetic) */
++	case BPF_ARSH:
++		if (imm < 32) {
++			emit(ctx, sll, MIPS_R_T9, hi(dst), 32 - imm);
++			emit(ctx, srl, lo(dst), lo(dst), imm);
++			emit(ctx, sra, hi(dst), hi(dst), imm);
++			emit(ctx, or, lo(dst), lo(dst), MIPS_R_T9);
++		} else {
++			emit(ctx, sra, lo(dst), hi(dst), imm - 32);
++			emit(ctx, sra, hi(dst), hi(dst), 31);
++		}
++		break;
++	}
++	clobber_reg64(ctx, dst);
++}
++
++/* ALU shift register (64-bit) */
++static void emit_shift_r64(struct jit_context *ctx,
++			   const u8 dst[], u8 src, u8 op)
++{
++	u8 t1 = MIPS_R_T8;
++	u8 t2 = MIPS_R_T9;
++
++	emit(ctx, andi, t1, src, 32);              /* t1 = src & 32          */
++	emit(ctx, beqz, t1, 16);                   /* PC += 16 if t1 == 0    */
++	emit(ctx, nor, t2, src, MIPS_R_ZERO);      /* t2 = ~src (delay slot) */
++
++	switch (BPF_OP(op)) {
++	/* dst = dst << src */
++	case BPF_LSH:
++		/* Next: shift >= 32 */
++		emit(ctx, sllv, hi(dst), lo(dst), src);    /* dh = dl << src */
++		emit(ctx, move, lo(dst), MIPS_R_ZERO);     /* dl = 0         */
++		emit(ctx, b, 20);                          /* PC += 20       */
++		/* +16: shift < 32 */
++		emit(ctx, srl, t1, lo(dst), 1);            /* t1 = dl >> 1   */
++		emit(ctx, srlv, t1, t1, t2);               /* t1 = t1 >> t2  */
++		emit(ctx, sllv, lo(dst), lo(dst), src);    /* dl = dl << src */
++		emit(ctx, sllv, hi(dst), hi(dst), src);    /* dh = dh << src */
++		emit(ctx, or, hi(dst), hi(dst), t1);       /* dh = dh | t1   */
++		break;
++	/* dst = dst >> src */
++	case BPF_RSH:
++		/* Next: shift >= 32 */
++		emit(ctx, srlv, lo(dst), hi(dst), src);    /* dl = dh >> src */
++		emit(ctx, move, hi(dst), MIPS_R_ZERO);     /* dh = 0         */
++		emit(ctx, b, 20);                          /* PC += 20       */
++		/* +16: shift < 32 */
++		emit(ctx, sll, t1, hi(dst), 1);            /* t1 = dh << 1   */
++		emit(ctx, sllv, t1, t1, t2);               /* t1 = t1 << t2  */
++		emit(ctx, srlv, lo(dst), lo(dst), src);    /* dl = dl >> src */
++		emit(ctx, srlv, hi(dst), hi(dst), src);    /* dh = dh >> src */
++		emit(ctx, or, lo(dst), lo(dst), t1);       /* dl = dl | t1   */
++		break;
++	/* dst = dst >> src (arithmetic) */
++	case BPF_ARSH:
++		/* Next: shift >= 32 */
++		emit(ctx, srav, lo(dst), hi(dst), src);   /* dl = dh >>a src */
++		emit(ctx, sra, hi(dst), hi(dst), 31);     /* dh = dh >>a 31  */
++		emit(ctx, b, 20);                         /* PC += 20        */
++		/* +16: shift < 32 */
++		emit(ctx, sll, t1, hi(dst), 1);           /* t1 = dh << 1    */
++		emit(ctx, sllv, t1, t1, t2);              /* t1 = t1 << t2   */
++		emit(ctx, srlv, lo(dst), lo(dst), src);   /* dl = dl >> src  */
++		emit(ctx, srav, hi(dst), hi(dst), src);   /* dh = dh >>a src */
++		emit(ctx, or, lo(dst), lo(dst), t1);      /* dl = dl | t1    */
++		break;
++	}
++
++	/* +20: Done */
++	clobber_reg64(ctx, dst);
++}
++
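emit_shift_r64() branches at run time on bit 5 of the shift amount, since MIPS variable shifts only use the low five bits. The t2 = ~src value lets the spill term be computed as (dl >> 1) >> (31 - src) without ever shifting by 32. The BPF_LSH path restated in C (illustration only):

/* 64-bit "dst <<= src" on 32-bit halves, as in the BPF_LSH case above */
static void lsh64(u32 *dst_lo, u32 *dst_hi, u32 src)
{
	src &= 63;
	if (src & 32) {				/* shift >= 32 */
		*dst_hi = *dst_lo << (src & 31);
		*dst_lo = 0;
	} else {				/* shift < 32 */
		u32 spill = (*dst_lo >> 1) >> (31 - src);

		*dst_hi = (*dst_hi << src) | spill;
		*dst_lo <<= src;
	}
}
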
++/* ALU mul immediate (64x32-bit) */
++static void emit_mul_i64(struct jit_context *ctx, const u8 dst[], s32 imm)
++{
++	u8 src = MIPS_R_T6;
++	u8 tmp = MIPS_R_T9;
++
++	switch (imm) {
++	/* dst = dst * 1 is a no-op */
++	case 1:
++		break;
++	/* dst = dst * -1 */
++	case -1:
++		emit_neg_i64(ctx, dst);
++		break;
++	case 0:
++		emit_mov_r(ctx, lo(dst), MIPS_R_ZERO);
++		emit_mov_r(ctx, hi(dst), MIPS_R_ZERO);
++		break;
++	/* Full 64x32 multiply */
++	default:
++		/* hi(dst) = hi(dst) * src(imm) */
++		emit_mov_i(ctx, src, imm);
++		if (cpu_has_mips32r1 || cpu_has_mips32r6) {
++			emit(ctx, mul, hi(dst), hi(dst), src);
++		} else {
++			emit(ctx, multu, hi(dst), src);
++			emit(ctx, mflo, hi(dst));
++		}
++
++		/* hi(dst) = hi(dst) - lo(dst) */
++		if (imm < 0)
++			emit(ctx, subu, hi(dst), hi(dst), lo(dst));
++
++		/* tmp = lo(dst) * src(imm) >> 32 */
++		/* lo(dst) = lo(dst) * src(imm) */
++		if (cpu_has_mips32r6) {
++			emit(ctx, muhu, tmp, lo(dst), src);
++			emit(ctx, mulu, lo(dst), lo(dst), src);
++		} else {
++			emit(ctx, multu, lo(dst), src);
++			emit(ctx, mflo, lo(dst));
++			emit(ctx, mfhi, tmp);
++		}
++
++		/* hi(dst) += tmp */
++		emit(ctx, addu, hi(dst), hi(dst), tmp);
++		clobber_reg64(ctx, dst);
++		break;
++	}
++}
++
++/* ALU mul register (64x64-bit) */
++static void emit_mul_r64(struct jit_context *ctx,
++			 const u8 dst[], const u8 src[])
++{
++	u8 acc = MIPS_R_T8;
++	u8 tmp = MIPS_R_T9;
++
++	/* acc = hi(dst) * lo(src) */
++	if (cpu_has_mips32r1 || cpu_has_mips32r6) {
++		emit(ctx, mul, acc, hi(dst), lo(src));
++	} else {
++		emit(ctx, multu, hi(dst), lo(src));
++		emit(ctx, mflo, acc);
++	}
++
++	/* tmp = lo(dst) * hi(src) */
++	if (cpu_has_mips32r1 || cpu_has_mips32r6) {
++		emit(ctx, mul, tmp, lo(dst), hi(src));
++	} else {
++		emit(ctx, multu, lo(dst), hi(src));
++		emit(ctx, mflo, tmp);
++	}
++
++	/* acc += tmp */
++	emit(ctx, addu, acc, acc, tmp);
++
++	/* tmp = lo(dst) * lo(src) >> 32 */
++	/* lo(dst) = lo(dst) * lo(src) */
++	if (cpu_has_mips32r6) {
++		emit(ctx, muhu, tmp, lo(dst), lo(src));
++		emit(ctx, mulu, lo(dst), lo(dst), lo(src));
++	} else {
++		emit(ctx, multu, lo(dst), lo(src));
++		emit(ctx, mflo, lo(dst));
++		emit(ctx, mfhi, tmp);
++	}
++
++	/* hi(dst) = acc + tmp */
++	emit(ctx, addu, hi(dst), acc, tmp);
++	clobber_reg64(ctx, dst);
++}
++
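emit_mul_r64() only needs the low 64 bits of the product, so the two 32x32 cross terms go straight into the high word and the carry from the low product is its upper 32 bits. Equivalent C (illustration only):

/* Low 64 bits of a 64x64 multiply from 32-bit partial products */
static void mul64(u32 *dst_lo, u32 *dst_hi, u32 src_lo, u32 src_hi)
{
	u32 cross = *dst_hi * src_lo + *dst_lo * src_hi;	/* mod 2^32 */
	u64 prod = (u64)*dst_lo * src_lo;			/* full low product */

	*dst_hi = cross + (u32)(prod >> 32);
	*dst_lo = (u32)prod;
}
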
++/* Helper function for 64-bit modulo */
++static u64 jit_mod64(u64 a, u64 b)
++{
++	u64 rem;
++
++	div64_u64_rem(a, b, &rem);
++	return rem;
++}
++
++/* ALU div/mod register (64-bit) */
++static void emit_divmod_r64(struct jit_context *ctx,
++			    const u8 dst[], const u8 src[], u8 op)
++{
++	const u8 *r0 = bpf2mips32[BPF_REG_0]; /* Mapped to v0-v1 */
++	const u8 *r1 = bpf2mips32[BPF_REG_1]; /* Mapped to a0-a1 */
++	const u8 *r2 = bpf2mips32[BPF_REG_2]; /* Mapped to a2-a3 */
++	int exclude, k;
++	u32 addr = 0;
++
++	/* Push caller-saved registers on stack */
++	push_regs(ctx, ctx->clobbered & JIT_CALLER_REGS,
++		  0, JIT_RESERVED_STACK);
++
++	/* Put 64-bit arguments 1 and 2 in registers a0-a3 */
++	for (k = 0; k < 2; k++) {
++		emit(ctx, move, MIPS_R_T9, src[k]);
++		emit(ctx, move, r1[k], dst[k]);
++		emit(ctx, move, r2[k], MIPS_R_T9);
++	}
++
++	/* Emit function call */
++	switch (BPF_OP(op)) {
++	/* dst = dst / src */
++	case BPF_DIV:
++		addr = (u32)&div64_u64;
++		break;
++	/* dst = dst % src */
++	case BPF_MOD:
++		addr = (u32)&jit_mod64;
++		break;
++	}
++	emit_mov_i(ctx, MIPS_R_T9, addr);
++	emit(ctx, jalr, MIPS_R_RA, MIPS_R_T9);
++	emit(ctx, nop); /* Delay slot */
++
++	/* Store the 64-bit result in dst */
++	emit(ctx, move, dst[0], r0[0]);
++	emit(ctx, move, dst[1], r0[1]);
++
++	/* Restore caller-saved registers, excluding the computed result */
++	exclude = BIT(lo(dst)) | BIT(hi(dst));
++	pop_regs(ctx, ctx->clobbered & JIT_CALLER_REGS,
++		 exclude, JIT_RESERVED_STACK);
++	emit_load_delay(ctx);
++
++	clobber_reg64(ctx, dst);
++	clobber_reg(ctx, MIPS_R_V0);
++	clobber_reg(ctx, MIPS_R_V1);
++	clobber_reg(ctx, MIPS_R_RA);
++}
++
++/* Swap bytes in a register word */
++static void emit_swap8_r(struct jit_context *ctx, u8 dst, u8 src, u8 mask)
++{
++	u8 tmp = MIPS_R_T9;
++
++	emit(ctx, and, tmp, src, mask); /* tmp = src & 0x00ff00ff */
++	emit(ctx, sll, tmp, tmp, 8);    /* tmp = tmp << 8         */
++	emit(ctx, srl, dst, src, 8);    /* dst = src >> 8         */
++	emit(ctx, and, dst, dst, mask); /* dst = dst & 0x00ff00ff */
++	emit(ctx, or,  dst, dst, tmp);  /* dst = dst | tmp        */
++}
++
++/* Swap half words in a register word */
++static void emit_swap16_r(struct jit_context *ctx, u8 dst, u8 src)
++{
++	u8 tmp = MIPS_R_T9;
++
++	emit(ctx, sll, tmp, src, 16);  /* tmp = src << 16 */
++	emit(ctx, srl, dst, src, 16);  /* dst = src >> 16 */
++	emit(ctx, or,  dst, dst, tmp); /* dst = dst | tmp */
++}
++
++/* Swap bytes and truncate a register double word, word or half word */
++static void emit_bswap_r64(struct jit_context *ctx, const u8 dst[], u32 width)
++{
++	u8 tmp = MIPS_R_T8;
++
++	switch (width) {
++	/* Swap bytes in a double word */
++	case 64:
++		if (cpu_has_mips32r2 || cpu_has_mips32r6) {
++			emit(ctx, rotr, tmp, hi(dst), 16);
++			emit(ctx, rotr, hi(dst), lo(dst), 16);
++			emit(ctx, wsbh, lo(dst), tmp);
++			emit(ctx, wsbh, hi(dst), hi(dst));
++		} else {
++			emit_swap16_r(ctx, tmp, lo(dst));
++			emit_swap16_r(ctx, lo(dst), hi(dst));
++			emit(ctx, move, hi(dst), tmp);
++
++			emit(ctx, lui, tmp, 0xff);      /* tmp = 0x00ff0000 */
++			emit(ctx, ori, tmp, tmp, 0xff); /* tmp = 0x00ff00ff */
++			emit_swap8_r(ctx, lo(dst), lo(dst), tmp);
++			emit_swap8_r(ctx, hi(dst), hi(dst), tmp);
++		}
++		break;
++	/* Swap bytes in a word */
++	/* Swap bytes in a half word */
++	case 32:
++	case 16:
++		emit_bswap_r(ctx, lo(dst), width);
++		emit(ctx, move, hi(dst), MIPS_R_ZERO);
++		break;
++	}
++	clobber_reg64(ctx, dst);
++}
++
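On CPUs without wsbh/rotr, the fallback above swaps the half words first and then the bytes within each half word using the 0x00ff00ff mask. The 32-bit version of that sequence in plain C (illustration only):

/* 32-bit byte swap using only shifts, masks and OR */
static u32 swap32(u32 x)
{
	x = (x << 16) | (x >> 16);				/* swap half words */
	x = ((x & 0x00ff00ff) << 8) | ((x >> 8) & 0x00ff00ff);	/* swap bytes */
	return x;
}
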
++/* Truncate a register double word, word or half word */
++static void emit_trunc_r64(struct jit_context *ctx, const u8 dst[], u32 width)
++{
++	switch (width) {
++	case 64:
++		break;
++	/* Zero-extend a word */
++	case 32:
++		emit(ctx, move, hi(dst), MIPS_R_ZERO);
++		clobber_reg(ctx, hi(dst));
++		break;
++	/* Zero-extend a half word */
++	case 16:
++		emit(ctx, move, hi(dst), MIPS_R_ZERO);
++		emit(ctx, andi, lo(dst), lo(dst), 0xffff);
++		clobber_reg64(ctx, dst);
++		break;
++	}
++}
++
++/* Load operation: dst = *(size*)(src + off) */
++static void emit_ldx(struct jit_context *ctx,
++		     const u8 dst[], u8 src, s16 off, u8 size)
++{
++	switch (size) {
++	/* Load a byte */
++	case BPF_B:
++		emit(ctx, lbu, lo(dst), off, src);
++		emit(ctx, move, hi(dst), MIPS_R_ZERO);
++		break;
++	/* Load a half word */
++	case BPF_H:
++		emit(ctx, lhu, lo(dst), off, src);
++		emit(ctx, move, hi(dst), MIPS_R_ZERO);
++		break;
++	/* Load a word */
++	case BPF_W:
++		emit(ctx, lw, lo(dst), off, src);
++		emit(ctx, move, hi(dst), MIPS_R_ZERO);
++		break;
++	/* Load a double word */
++	case BPF_DW:
++		if (dst[1] == src) {
++			emit(ctx, lw, dst[0], off + 4, src);
++			emit(ctx, lw, dst[1], off, src);
++		} else {
++			emit(ctx, lw, dst[1], off, src);
++			emit(ctx, lw, dst[0], off + 4, src);
++		}
++		emit_load_delay(ctx);
++		break;
++	}
++	clobber_reg64(ctx, dst);
++}
++
++/* Store operation: *(size *)(dst + off) = src */
++static void emit_stx(struct jit_context *ctx,
++		     const u8 dst, const u8 src[], s16 off, u8 size)
++{
++	switch (size) {
++	/* Store a byte */
++	case BPF_B:
++		emit(ctx, sb, lo(src), off, dst);
++		break;
++	/* Store a half word */
++	case BPF_H:
++		emit(ctx, sh, lo(src), off, dst);
++		break;
++	/* Store a word */
++	case BPF_W:
++		emit(ctx, sw, lo(src), off, dst);
++		break;
++	/* Store a double word */
++	case BPF_DW:
++		emit(ctx, sw, src[1], off, dst);
++		emit(ctx, sw, src[0], off + 4, dst);
++		break;
++	}
++}
++
++/* Atomic read-modify-write (32-bit, non-ll/sc fallback) */
++static void emit_atomic_r32(struct jit_context *ctx,
++			    u8 dst, u8 src, s16 off, u8 code)
++{
++	u32 exclude = 0;
++	u32 addr = 0;
++
++	/* Push caller-saved registers on stack */
++	push_regs(ctx, ctx->clobbered & JIT_CALLER_REGS,
++		  0, JIT_RESERVED_STACK);
++	/*
++	 * Argument 1: dst+off if xchg, otherwise src, passed in register a0
++	 * Argument 2: src if xchg, otherwise dst+off, passed in register a1
++	 */
++	emit(ctx, move, MIPS_R_T9, dst);
++	emit(ctx, move, MIPS_R_A0, src);
++	emit(ctx, addiu, MIPS_R_A1, MIPS_R_T9, off);
++
++	/* Emit function call */
++	switch (code) {
++	case BPF_ADD:
++		addr = (u32)&atomic_add;
++		break;
++	case BPF_SUB:
++		addr = (u32)&atomic_sub;
++		break;
++	case BPF_OR:
++		addr = (u32)&atomic_or;
++		break;
++	case BPF_AND:
++		addr = (u32)&atomic_and;
++		break;
++	case BPF_XOR:
++		addr = (u32)&atomic_xor;
++		break;
++	}
++	emit_mov_i(ctx, MIPS_R_T9, addr);
++	emit(ctx, jalr, MIPS_R_RA, MIPS_R_T9);
++	emit(ctx, nop); /* Delay slot */
++
++	/* Restore caller-saved registers, except any fetched value */
++	pop_regs(ctx, ctx->clobbered & JIT_CALLER_REGS,
++		 exclude, JIT_RESERVED_STACK);
++	emit_load_delay(ctx);
++	clobber_reg(ctx, MIPS_R_RA);
++}
++
++/* Atomic read-modify-write (64-bit) */
++static void emit_atomic_r64(struct jit_context *ctx,
++			    u8 dst, const u8 src[], s16 off, u8 code)
++{
++	const u8 *r1 = bpf2mips32[BPF_REG_1]; /* Mapped to a0-a1 */
++	u32 exclude = 0;
++	u32 addr = 0;
++
++	/* Push caller-saved registers on stack */
++	push_regs(ctx, ctx->clobbered & JIT_CALLER_REGS,
++		  0, JIT_RESERVED_STACK);
++	/*
++	 * Argument 1: 64-bit src, passed in registers a0-a1
++	 * Argument 2: 32-bit dst+off, passed in register a2
++	 */
++	emit(ctx, move, MIPS_R_T9, dst);
++	emit(ctx, move, r1[0], src[0]);
++	emit(ctx, move, r1[1], src[1]);
++	emit(ctx, addiu, MIPS_R_A2, MIPS_R_T9, off);
++
++	/* Emit function call */
++	switch (code) {
++	case BPF_ADD:
++		addr = (u32)&atomic64_add;
++		break;
++	case BPF_SUB:
++		addr = (u32)&atomic64_sub;
++		break;
++	case BPF_OR:
++		addr = (u32)&atomic64_or;
++		break;
++	case BPF_AND:
++		addr = (u32)&atomic64_and;
++		break;
++	case BPF_XOR:
++		addr = (u32)&atomic64_xor;
++		break;
++	}
++	emit_mov_i(ctx, MIPS_R_T9, addr);
++	emit(ctx, jalr, MIPS_R_RA, MIPS_R_T9);
++	emit(ctx, nop); /* Delay slot */
++
++	/* Restore caller-saved registers, except any fetched value */
++	pop_regs(ctx, ctx->clobbered & JIT_CALLER_REGS,
++		 exclude, JIT_RESERVED_STACK);
++	emit_load_delay(ctx);
++	clobber_reg(ctx, MIPS_R_RA);
++}
++
++/*
++ * Conditional movz or an emulated equivalent.
++ * Note that the rs register may be modified.
++ */
++static void emit_movz_r(struct jit_context *ctx, u8 rd, u8 rs, u8 rt)
++{
++	if (cpu_has_mips_2) {
++		emit(ctx, movz, rd, rs, rt);           /* rd = rt ? rd : rs  */
++	} else if (cpu_has_mips32r6) {
++		if (rs != MIPS_R_ZERO)
++			emit(ctx, seleqz, rs, rs, rt); /* rs = 0 if rt != 0  */
++		emit(ctx, selnez, rd, rd, rt);         /* rd = 0 if rt == 0  */
++		if (rs != MIPS_R_ZERO)
++			emit(ctx, or, rd, rd, rs);     /* rd = rd | rs       */
++	} else {
++		emit(ctx, bnez, rt, 8);                /* PC += 8 if rt != 0 */
++		emit(ctx, nop);                        /* +0: delay slot     */
++		emit(ctx, or, rd, rs, MIPS_R_ZERO);    /* +4: rd = rs        */
++	}
++	clobber_reg(ctx, rd);
++	clobber_reg(ctx, rs);
++}
++
++/*
++ * Conditional movn or an emulated equivalent.
++ * Note that the rs register may be modified.
++ */
++static void emit_movn_r(struct jit_context *ctx, u8 rd, u8 rs, u8 rt)
++{
++	if (cpu_has_mips_2) {
++		emit(ctx, movn, rd, rs, rt);           /* rd = rt ? rs : rd  */
++	} else if (cpu_has_mips32r6) {
++		if (rs != MIPS_R_ZERO)
++			emit(ctx, selnez, rs, rs, rt); /* rs = 0 if rt == 0  */
++		emit(ctx, seleqz, rd, rd, rt);         /* rd = 0 if rt != 0  */
++		if (rs != MIPS_R_ZERO)
++			emit(ctx, or, rd, rd, rs);     /* rd = rd | rs       */
++	} else {
++		emit(ctx, beqz, rt, 8);                /* PC += 8 if rt == 0 */
++		emit(ctx, nop);                        /* +0: delay slot     */
++		emit(ctx, or, rd, rs, MIPS_R_ZERO);    /* +4: rd = rs        */
++	}
++	clobber_reg(ctx, rd);
++	clobber_reg(ctx, rs);
++}
++
++/* Emulation of 64-bit sltiu rd, rs, imm, where imm may be S32_MAX + 1 */
++static void emit_sltiu_r64(struct jit_context *ctx, u8 rd,
++			   const u8 rs[], s64 imm)
++{
++	u8 tmp = MIPS_R_T9;
++
++	if (imm < 0) {
++		emit_mov_i(ctx, rd, imm);                 /* rd = imm        */
++		emit(ctx, sltu, rd, lo(rs), rd);          /* rd = rsl < rd   */
++		emit(ctx, sltiu, tmp, hi(rs), -1);        /* tmp = rsh < ~0U */
++		emit(ctx, or, rd, rd, tmp);               /* rd = rd | tmp   */
++	} else { /* imm >= 0 */
++		if (imm > 0x7fff) {
++			emit_mov_i(ctx, rd, (s32)imm);     /* rd = imm       */
++			emit(ctx, sltu, rd, lo(rs), rd);   /* rd = rsl < rd  */
++		} else {
++			emit(ctx, sltiu, rd, lo(rs), imm); /* rd = rsl < imm */
++		}
++		emit_movn_r(ctx, rd, MIPS_R_ZERO, hi(rs)); /* rd = 0 if rsh  */
++	}
++}
++
++/* Emulation of 64-bit sltu rd, rs, rt */
++static void emit_sltu_r64(struct jit_context *ctx, u8 rd,
++			  const u8 rs[], const u8 rt[])
++{
++	u8 tmp = MIPS_R_T9;
++
++	emit(ctx, sltu, rd, lo(rs), lo(rt));           /* rd = rsl < rtl     */
++	emit(ctx, subu, tmp, hi(rs), hi(rt));          /* tmp = rsh - rth    */
++	emit_movn_r(ctx, rd, MIPS_R_ZERO, tmp);        /* rd = 0 if tmp != 0 */
++	emit(ctx, sltu, tmp, hi(rs), hi(rt));          /* tmp = rsh < rth    */
++	emit(ctx, or, rd, rd, tmp);                    /* rd = rd | tmp      */
++}
++
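emit_sltu_r64() reduces a 64-bit unsigned compare to two 32-bit compares: the high words decide the result unless they are equal, in which case the low-word compare is used. Equivalent C (illustration only):

/* 64-bit unsigned "rs < rt" from 32-bit compares */
static u32 sltu64(u32 rs_lo, u32 rs_hi, u32 rt_lo, u32 rt_hi)
{
	if (rs_hi != rt_hi)
		return rs_hi < rt_hi;
	return rs_lo < rt_lo;
}
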
++/* Emulation of 64-bit slti rd, rs, imm, where imm may be S32_MAX + 1 */
++static void emit_slti_r64(struct jit_context *ctx, u8 rd,
++			  const u8 rs[], s64 imm)
++{
++	u8 t1 = MIPS_R_T8;
++	u8 t2 = MIPS_R_T9;
++	u8 cmp;
++
++	/*
++	 * if ((rs < 0) ^ (imm < 0)) t1 = imm >u rsl
++	 * else                      t1 = rsl <u imm
++	 */
++	emit_mov_i(ctx, rd, (s32)imm);
++	emit(ctx, sltu, t1, lo(rs), rd);               /* t1 = rsl <u imm   */
++	emit(ctx, sltu, t2, rd, lo(rs));               /* t2 = imm <u rsl   */
++	emit(ctx, srl, rd, hi(rs), 31);                /* rd = rsh >> 31    */
++	if (imm < 0)
++		emit_movz_r(ctx, t1, t2, rd);          /* t1 = rd ? t1 : t2 */
++	else
++		emit_movn_r(ctx, t1, t2, rd);          /* t1 = rd ? t2 : t1 */
++	/*
++	 * if ((imm < 0 && rsh != 0xffffffff) ||
++	 *     (imm >= 0 && rsh != 0))
++	 *      t1 = 0
++	 */
++	if (imm < 0) {
++		emit(ctx, addiu, rd, hi(rs), 1);       /* rd = rsh + 1 */
++		cmp = rd;
++	} else { /* imm >= 0 */
++		cmp = hi(rs);
++	}
++	emit_movn_r(ctx, t1, MIPS_R_ZERO, cmp);        /* t1 = 0 if cmp != 0 */
++
++	/*
++	 * if (imm < 0) rd = rsh < -1
++	 * else         rd = rsh != 0
++	 * rd = rd | t1
++	 */
++	emit(ctx, slti, rd, hi(rs), imm < 0 ? -1 : 0); /* rd = rsh < hi(imm) */
++	emit(ctx, or, rd, rd, t1);                     /* rd = rd | t1       */
++}
++
++/* Emulation of 64-bit slt rd, rs, rt */
++static void emit_slt_r64(struct jit_context *ctx, u8 rd,
++			 const u8 rs[], const u8 rt[])
++{
++	u8 t1 = MIPS_R_T7;
++	u8 t2 = MIPS_R_T8;
++	u8 t3 = MIPS_R_T9;
++
++	/*
++	 * if ((rs < 0) ^ (rt < 0)) t1 = rtl <u rsl
++	 * else                     t1 = rsl <u rtl
++	 * if (rsh == rth)          t1 = 0
++	 */
++	emit(ctx, sltu, t1, lo(rs), lo(rt));           /* t1 = rsl <u rtl   */
++	emit(ctx, sltu, t2, lo(rt), lo(rs));           /* t2 = rtl <u rsl   */
++	emit(ctx, xor, t3, hi(rs), hi(rt));            /* t3 = rsh ^ rth    */
++	emit(ctx, srl, rd, t3, 31);                    /* rd = t3 >> 31     */
++	emit_movn_r(ctx, t1, t2, rd);                  /* t1 = rd ? t2 : t1 */
++	emit_movn_r(ctx, t1, MIPS_R_ZERO, t3);         /* t1 = 0 if t3 != 0 */
++
++	/* rd = (rsh < rth) | t1 */
++	emit(ctx, slt, rd, hi(rs), hi(rt));            /* rd = rsh <s rth   */
++	emit(ctx, or, rd, rd, t1);                     /* rd = rd | t1      */
++}
++
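The signed variant above differs only in the high-word compare, which is signed while the low words are still compared as unsigned. Equivalent C (illustration only):

/* 64-bit signed "rs < rt" from 32-bit compares */
static u32 slt64(u32 rs_lo, s32 rs_hi, u32 rt_lo, s32 rt_hi)
{
	if (rs_hi != rt_hi)
		return rs_hi < rt_hi;
	return rs_lo < rt_lo;
}
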
++/* Jump immediate (64-bit) */
++static void emit_jmp_i64(struct jit_context *ctx,
++			 const u8 dst[], s32 imm, s32 off, u8 op)
++{
++	u8 tmp = MIPS_R_T6;
++
++	switch (op) {
++	/* No-op, used internally for branch optimization */
++	case JIT_JNOP:
++		break;
++	/* PC += off if dst == imm */
++	/* PC += off if dst != imm */
++	case BPF_JEQ:
++	case BPF_JNE:
++		if (imm >= -0x7fff && imm <= 0x8000) {
++			emit(ctx, addiu, tmp, lo(dst), -imm);
++		} else if ((u32)imm <= 0xffff) {
++			emit(ctx, xori, tmp, lo(dst), imm);
++		} else {       /* Register fallback */
++			emit_mov_i(ctx, tmp, imm);
++			emit(ctx, xor, tmp, lo(dst), tmp);
++		}
++		if (imm < 0) { /* Compare sign extension */
++			emit(ctx, addu, MIPS_R_T9, hi(dst), 1);
++			emit(ctx, or, tmp, tmp, MIPS_R_T9);
++		} else {       /* Compare zero extension */
++			emit(ctx, or, tmp, tmp, hi(dst));
++		}
++		if (op == BPF_JEQ)
++			emit(ctx, beqz, tmp, off);
++		else   /* BPF_JNE */
++			emit(ctx, bnez, tmp, off);
++		break;
++	/* PC += off if dst & imm */
++	/* PC += off if (dst & imm) == 0 (not in BPF, used for long jumps) */
++	case BPF_JSET:
++	case JIT_JNSET:
++		if ((u32)imm <= 0xffff) {
++			emit(ctx, andi, tmp, lo(dst), imm);
++		} else {     /* Register fallback */
++			emit_mov_i(ctx, tmp, imm);
++			emit(ctx, and, tmp, lo(dst), tmp);
++		}
++		if (imm < 0) /* Sign-extension pulls in high word */
++			emit(ctx, or, tmp, tmp, hi(dst));
++		if (op == BPF_JSET)
++			emit(ctx, bnez, tmp, off);
++		else   /* JIT_JNSET */
++			emit(ctx, beqz, tmp, off);
++		break;
++	/* PC += off if dst > imm */
++	case BPF_JGT:
++		emit_sltiu_r64(ctx, tmp, dst, (s64)imm + 1);
++		emit(ctx, beqz, tmp, off);
++		break;
++	/* PC += off if dst >= imm */
++	case BPF_JGE:
++		emit_sltiu_r64(ctx, tmp, dst, imm);
++		emit(ctx, beqz, tmp, off);
++		break;
++	/* PC += off if dst < imm */
++	case BPF_JLT:
++		emit_sltiu_r64(ctx, tmp, dst, imm);
++		emit(ctx, bnez, tmp, off);
++		break;
++	/* PC += off if dst <= imm */
++	case BPF_JLE:
++		emit_sltiu_r64(ctx, tmp, dst, (s64)imm + 1);
++		emit(ctx, bnez, tmp, off);
++		break;
++	/* PC += off if dst > imm (signed) */
++	case BPF_JSGT:
++		emit_slti_r64(ctx, tmp, dst, (s64)imm + 1);
++		emit(ctx, beqz, tmp, off);
++		break;
++	/* PC += off if dst >= imm (signed) */
++	case BPF_JSGE:
++		emit_slti_r64(ctx, tmp, dst, imm);
++		emit(ctx, beqz, tmp, off);
++		break;
++	/* PC += off if dst < imm (signed) */
++	case BPF_JSLT:
++		emit_slti_r64(ctx, tmp, dst, imm);
++		emit(ctx, bnez, tmp, off);
++		break;
++	/* PC += off if dst <= imm (signed) */
++	case BPF_JSLE:
++		emit_slti_r64(ctx, tmp, dst, (s64)imm + 1);
++		emit(ctx, bnez, tmp, off);
++		break;
++	}
++}
++
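The BPF_JEQ/BPF_JNE cases above compare a 64-bit register against a sign-extended 32-bit immediate by combining a low-word difference with a check that the high word equals the immediate's sign extension. The test they implement, restated in C (illustration only):

/* 64-bit "dst == (s64)imm" test as used by the JEQ/JNE cases above */
static int eq64_imm(u32 dst_lo, u32 dst_hi, s32 imm)
{
	u32 hi_expect = imm < 0 ? 0xffffffff : 0;

	return ((dst_lo ^ (u32)imm) | (dst_hi ^ hi_expect)) == 0;
}
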
++/* Jump register (64-bit) */
++static void emit_jmp_r64(struct jit_context *ctx,
++			 const u8 dst[], const u8 src[], s32 off, u8 op)
++{
++	u8 t1 = MIPS_R_T6;
++	u8 t2 = MIPS_R_T7;
++
++	switch (op) {
++	/* No-op, used internally for branch optimization */
++	case JIT_JNOP:
++		break;
++	/* PC += off if dst == src */
++	/* PC += off if dst != src */
++	case BPF_JEQ:
++	case BPF_JNE:
++		emit(ctx, subu, t1, lo(dst), lo(src));
++		emit(ctx, subu, t2, hi(dst), hi(src));
++		emit(ctx, or, t1, t1, t2);
++		if (op == BPF_JEQ)
++			emit(ctx, beqz, t1, off);
++		else   /* BPF_JNE */
++			emit(ctx, bnez, t1, off);
++		break;
++	/* PC += off if dst & src */
++	/* PC += off if (dst & src) == 0 (not in BPF, used for long jumps) */
++	case BPF_JSET:
++	case JIT_JNSET:
++		emit(ctx, and, t1, lo(dst), lo(src));
++		emit(ctx, and, t2, hi(dst), hi(src));
++		emit(ctx, or, t1, t1, t2);
++		if (op == BPF_JSET)
++			emit(ctx, bnez, t1, off);
++		else   /* JIT_JNSET */
++			emit(ctx, beqz, t1, off);
++		break;
++	/* PC += off if dst > src */
++	case BPF_JGT:
++		emit_sltu_r64(ctx, t1, src, dst);
++		emit(ctx, bnez, t1, off);
++		break;
++	/* PC += off if dst >= src */
++	case BPF_JGE:
++		emit_sltu_r64(ctx, t1, dst, src);
++		emit(ctx, beqz, t1, off);
++		break;
++	/* PC += off if dst < src */
++	case BPF_JLT:
++		emit_sltu_r64(ctx, t1, dst, src);
++		emit(ctx, bnez, t1, off);
++		break;
++	/* PC += off if dst <= src */
++	case BPF_JLE:
++		emit_sltu_r64(ctx, t1, src, dst);
++		emit(ctx, beqz, t1, off);
++		break;
++	/* PC += off if dst > src (signed) */
++	case BPF_JSGT:
++		emit_slt_r64(ctx, t1, src, dst);
++		emit(ctx, bnez, t1, off);
++		break;
++	/* PC += off if dst >= src (signed) */
++	case BPF_JSGE:
++		emit_slt_r64(ctx, t1, dst, src);
++		emit(ctx, beqz, t1, off);
++		break;
++	/* PC += off if dst < src (signed) */
++	case BPF_JSLT:
++		emit_slt_r64(ctx, t1, dst, src);
++		emit(ctx, bnez, t1, off);
++		break;
++	/* PC += off if dst <= src (signed) */
++	case BPF_JSLE:
++		emit_slt_r64(ctx, t1, src, dst);
++		emit(ctx, beqz, t1, off);
++		break;
++	}
++}
++
++/* Function call */
++static int emit_call(struct jit_context *ctx, const struct bpf_insn *insn)
++{
++	bool fixed;
++	u64 addr;
++
++	/* Decode the call address */
++	if (bpf_jit_get_func_addr(ctx->program, insn, false,
++				  &addr, &fixed) < 0)
++		return -1;
++	if (!fixed)
++		return -1;
++
++	/* Push stack arguments */
++	push_regs(ctx, JIT_STACK_REGS, 0, JIT_RESERVED_STACK);
++
++	/* Emit function call */
++	emit_mov_i(ctx, MIPS_R_T9, addr);
++	emit(ctx, jalr, MIPS_R_RA, MIPS_R_T9);
++	emit(ctx, nop); /* Delay slot */
++
++	clobber_reg(ctx, MIPS_R_RA);
++	clobber_reg(ctx, MIPS_R_V0);
++	clobber_reg(ctx, MIPS_R_V1);
++	return 0;
++}
++
++/* Function tail call */
++static int emit_tail_call(struct jit_context *ctx)
++{
++	u8 ary = lo(bpf2mips32[BPF_REG_2]);
++	u8 ind = lo(bpf2mips32[BPF_REG_3]);
++	u8 t1 = MIPS_R_T8;
++	u8 t2 = MIPS_R_T9;
++	int off;
++
++	/*
++	 * Tail call:
++	 * eBPF R1   - function argument (context ptr), passed in a0-a1
++	 * eBPF R2   - ptr to object with array of function entry points
++	 * eBPF R3   - array index of function to be called
++	 * stack[sz] - remaining tail call count, initialized in prologue
++	 */
++
++	/* if (ind >= ary->map.max_entries) goto out */
++	off = offsetof(struct bpf_array, map.max_entries);
++	if (off > 0x7fff)
++		return -1;
++	emit(ctx, lw, t1, off, ary);             /* t1 = ary->map.max_entries*/
++	emit_load_delay(ctx);                    /* Load delay slot          */
++	emit(ctx, sltu, t1, ind, t1);            /* t1 = ind < t1            */
++	emit(ctx, beqz, t1, get_offset(ctx, 1)); /* PC += off(1) if t1 == 0  */
++						 /* (next insn delay slot)   */
++	/* if (TCC-- <= 0) goto out */
++	emit(ctx, lw, t2, ctx->stack_size, MIPS_R_SP);  /* t2 = *(SP + size) */
++	emit_load_delay(ctx);                     /* Load delay slot         */
++	emit(ctx, blez, t2, get_offset(ctx, 1));  /* PC += off(1) if t2 <= 0 */
++	emit(ctx, addiu, t2, t2, -1);             /* t2-- (delay slot)       */
++	emit(ctx, sw, t2, ctx->stack_size, MIPS_R_SP);  /* *(SP + size) = t2 */
++
++	/* prog = ary->ptrs[ind] */
++	off = offsetof(struct bpf_array, ptrs);
++	if (off > 0x7fff)
++		return -1;
++	emit(ctx, sll, t1, ind, 2);               /* t1 = ind << 2           */
++	emit(ctx, addu, t1, t1, ary);             /* t1 += ary               */
++	emit(ctx, lw, t2, off, t1);               /* t2 = *(t1 + off)        */
++	emit_load_delay(ctx);                     /* Load delay slot         */
++
++	/* if (prog == 0) goto out */
++	emit(ctx, beqz, t2, get_offset(ctx, 1));  /* PC += off(1) if t2 == 0 */
++	emit(ctx, nop);                           /* Delay slot              */
++
++	/* func = prog->bpf_func + 8 (prologue skip offset) */
++	off = offsetof(struct bpf_prog, bpf_func);
++	if (off > 0x7fff)
++		return -1;
++	emit(ctx, lw, t1, off, t2);                /* t1 = *(t2 + off)       */
++	emit_load_delay(ctx);                      /* Load delay slot        */
++	emit(ctx, addiu, t1, t1, JIT_TCALL_SKIP);  /* t1 += skip (8 or 12)   */
++
++	/* goto func */
++	build_epilogue(ctx, t1);
++	return 0;
++}
++
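The run-time checks performed by the emitted tail call can be summarized in C as below (illustration only; tcc stands for the count kept in the reserved stack slot, and the JIT of course jumps to the returned address instead of returning it):

/* Checks performed by the emitted tail call */
static unsigned long tail_call_target(struct bpf_array *ary, u32 ind, int *tcc)
{
	struct bpf_prog *prog;

	if (ind >= ary->map.max_entries)
		return 0;			/* fall through to the next insn */
	if ((*tcc)-- <= 0)
		return 0;
	prog = ary->ptrs[ind];
	if (!prog)
		return 0;
	/* Enter the callee past its own TCC setup in the prologue */
	return (unsigned long)prog->bpf_func + JIT_TCALL_SKIP;
}
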
++/*
++ * Stack frame layout for a JITed program (stack grows down).
++ *
++ * Higher address  : Caller's stack frame       :
++ *                 :----------------------------:
++ *                 : 64-bit eBPF args r3-r5     :
++ *                 :----------------------------:
++ *                 : Reserved / tail call count :
++ *                 +============================+  <--- MIPS sp before call
++ *                 | Callee-saved registers,    |
++ *                 | including RA and FP        |
++ *                 +----------------------------+  <--- eBPF FP (MIPS zero,fp)
++ *                 | Local eBPF variables       |
++ *                 | allocated by program       |
++ *                 +----------------------------+
++ *                 | Reserved for caller-saved  |
++ *                 | registers                  |
++ *                 +----------------------------+
++ *                 | Reserved for 64-bit eBPF   |
++ *                 | args r3-r5 & args passed   |
++ *                 | on stack in kernel calls   |
++ * Lower address   +============================+  <--- MIPS sp
++ */
++
++/* Build program prologue to set up the stack and registers */
++void build_prologue(struct jit_context *ctx)
++{
++	const u8 *r1 = bpf2mips32[BPF_REG_1];
++	const u8 *fp = bpf2mips32[BPF_REG_FP];
++	int stack, saved, locals, reserved;
++
++	/*
++	 * The first two instructions initialize TCC in the reserved (for us)
++	 * 16-byte area in the parent's stack frame. On a tail call, the
++	 * calling function jumps into the prologue after these instructions.
++	 */
++	emit(ctx, ori, MIPS_R_T9, MIPS_R_ZERO,
++	     min(MAX_TAIL_CALL_CNT + 1, 0xffff));
++	emit(ctx, sw, MIPS_R_T9, 0, MIPS_R_SP);
++
++	/*
++	 * Register eBPF R1 contains the 32-bit context pointer argument.
++	 * A 32-bit argument is always passed in MIPS register a0, regardless
++	 * of CPU endianness. Initialize R1 accordingly and zero-extend.
++	 */
++#ifdef __BIG_ENDIAN
++	emit(ctx, move, lo(r1), MIPS_R_A0);
++#endif
++
++	/* === Entry-point for tail calls === */
++
++	/* Zero-extend the 32-bit argument */
++	emit(ctx, move, hi(r1), MIPS_R_ZERO);
++
++	/* If the eBPF frame pointer was accessed it must be saved */
++	if (ctx->accessed & BIT(BPF_REG_FP))
++		clobber_reg64(ctx, fp);
++
++	/* Compute the stack space needed for callee-saved registers */
++	saved = hweight32(ctx->clobbered & JIT_CALLEE_REGS) * sizeof(u32);
++	saved = ALIGN(saved, MIPS_STACK_ALIGNMENT);
++
++	/* Stack space used by eBPF program local data */
++	locals = ALIGN(ctx->program->aux->stack_depth, MIPS_STACK_ALIGNMENT);
++
++	/*
++	 * If we are emitting function calls, reserve extra stack space for
++	 * caller-saved registers and function arguments passed on the stack.
++	 * The required space is computed automatically during resource
++	 * usage discovery (pass 1).
++	 */
++	reserved = ctx->stack_used;
++
++	/* Allocate the stack frame */
++	stack = ALIGN(saved + locals + reserved, MIPS_STACK_ALIGNMENT);
++	emit(ctx, addiu, MIPS_R_SP, MIPS_R_SP, -stack);
++
++	/* Store callee-saved registers on stack */
++	push_regs(ctx, ctx->clobbered & JIT_CALLEE_REGS, 0, stack - saved);
++
++	/* Initialize the eBPF frame pointer if accessed */
++	if (ctx->accessed & BIT(BPF_REG_FP))
++		emit(ctx, addiu, lo(fp), MIPS_R_SP, stack - saved);
++
++	ctx->saved_size = saved;
++	ctx->stack_size = stack;
++}
++
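The frame allocated by the prologue is the sum of three aligned areas. As a worked example with the o32 alignment of 8 bytes: six clobbered callee-saved registers give saved = 24, an eBPF stack_depth of 100 rounds up to locals = 104, and stack_used = 24 for kernel calls yields a 152-byte frame, with the eBPF frame pointer set to SP + 128, the boundary between the locals and the callee-saved area. The computation restated in C (illustration only):

/* Frame size as computed in build_prologue() above */
static u32 frame_size(u32 num_saved, u32 stack_depth, u32 stack_used)
{
	u32 saved  = ALIGN(num_saved * sizeof(u32), MIPS_STACK_ALIGNMENT);
	u32 locals = ALIGN(stack_depth, MIPS_STACK_ALIGNMENT);

	return ALIGN(saved + locals + stack_used, MIPS_STACK_ALIGNMENT);
}
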
++/* Build the program epilogue to restore the stack and registers */
++void build_epilogue(struct jit_context *ctx, int dest_reg)
++{
++	/* Restore callee-saved registers from stack */
++	pop_regs(ctx, ctx->clobbered & JIT_CALLEE_REGS, 0,
++		 ctx->stack_size - ctx->saved_size);
++	/*
++	 * A 32-bit return value is always passed in MIPS register v0,
++	 * but on big-endian targets the low part of R0 is mapped to v1.
++	 */
++#ifdef __BIG_ENDIAN
++	emit(ctx, move, MIPS_R_V0, MIPS_R_V1);
++#endif
++
++	/* Jump to the return address and adjust the stack pointer */
++	emit(ctx, jr, dest_reg);
++	emit(ctx, addiu, MIPS_R_SP, MIPS_R_SP, ctx->stack_size);
++}
++
++/* Build one eBPF instruction */
++int build_insn(const struct bpf_insn *insn, struct jit_context *ctx)
++{
++	const u8 *dst = bpf2mips32[insn->dst_reg];
++	const u8 *src = bpf2mips32[insn->src_reg];
++	const u8 *tmp = bpf2mips32[JIT_REG_TMP];
++	u8 code = insn->code;
++	s16 off = insn->off;
++	s32 imm = insn->imm;
++	s32 val, rel;
++	u8 alu, jmp;
++
++	switch (code) {
++	/* ALU operations */
++	/* dst = imm */
++	case BPF_ALU | BPF_MOV | BPF_K:
++		emit_mov_i(ctx, lo(dst), imm);
++		emit_zext_ver(ctx, dst);
++		break;
++	/* dst = src */
++	case BPF_ALU | BPF_MOV | BPF_X:
++		if (imm == 1) {
++			/* Special mov32 for zext */
++			emit_mov_i(ctx, hi(dst), 0);
++		} else {
++			emit_mov_r(ctx, lo(dst), lo(src));
++			emit_zext_ver(ctx, dst);
++		}
++		break;
++	/* dst = -dst */
++	case BPF_ALU | BPF_NEG:
++		emit_alu_i(ctx, lo(dst), 0, BPF_NEG);
++		emit_zext_ver(ctx, dst);
++		break;
++	/* dst = dst & imm */
++	/* dst = dst | imm */
++	/* dst = dst ^ imm */
++	/* dst = dst << imm */
++	/* dst = dst >> imm */
++	/* dst = dst >> imm (arithmetic) */
++	/* dst = dst + imm */
++	/* dst = dst - imm */
++	/* dst = dst * imm */
++	/* dst = dst / imm */
++	/* dst = dst % imm */
++	case BPF_ALU | BPF_OR | BPF_K:
++	case BPF_ALU | BPF_AND | BPF_K:
++	case BPF_ALU | BPF_XOR | BPF_K:
++	case BPF_ALU | BPF_LSH | BPF_K:
++	case BPF_ALU | BPF_RSH | BPF_K:
++	case BPF_ALU | BPF_ARSH | BPF_K:
++	case BPF_ALU | BPF_ADD | BPF_K:
++	case BPF_ALU | BPF_SUB | BPF_K:
++	case BPF_ALU | BPF_MUL | BPF_K:
++	case BPF_ALU | BPF_DIV | BPF_K:
++	case BPF_ALU | BPF_MOD | BPF_K:
++		if (!valid_alu_i(BPF_OP(code), imm)) {
++			emit_mov_i(ctx, MIPS_R_T6, imm);
++			emit_alu_r(ctx, lo(dst), MIPS_R_T6, BPF_OP(code));
++		} else if (rewrite_alu_i(BPF_OP(code), imm, &alu, &val)) {
++			emit_alu_i(ctx, lo(dst), val, alu);
++		}
++		emit_zext_ver(ctx, dst);
++		break;
++	/* dst = dst & src */
++	/* dst = dst | src */
++	/* dst = dst ^ src */
++	/* dst = dst << src */
++	/* dst = dst >> src */
++	/* dst = dst >> src (arithmetic) */
++	/* dst = dst + src */
++	/* dst = dst - src */
++	/* dst = dst * src */
++	/* dst = dst / src */
++	/* dst = dst % src */
++	case BPF_ALU | BPF_AND | BPF_X:
++	case BPF_ALU | BPF_OR | BPF_X:
++	case BPF_ALU | BPF_XOR | BPF_X:
++	case BPF_ALU | BPF_LSH | BPF_X:
++	case BPF_ALU | BPF_RSH | BPF_X:
++	case BPF_ALU | BPF_ARSH | BPF_X:
++	case BPF_ALU | BPF_ADD | BPF_X:
++	case BPF_ALU | BPF_SUB | BPF_X:
++	case BPF_ALU | BPF_MUL | BPF_X:
++	case BPF_ALU | BPF_DIV | BPF_X:
++	case BPF_ALU | BPF_MOD | BPF_X:
++		emit_alu_r(ctx, lo(dst), lo(src), BPF_OP(code));
++		emit_zext_ver(ctx, dst);
++		break;
++	/* dst = imm (64-bit) */
++	case BPF_ALU64 | BPF_MOV | BPF_K:
++		emit_mov_se_i64(ctx, dst, imm);
++		break;
++	/* dst = src (64-bit) */
++	case BPF_ALU64 | BPF_MOV | BPF_X:
++		emit_mov_r(ctx, lo(dst), lo(src));
++		emit_mov_r(ctx, hi(dst), hi(src));
++		break;
++	/* dst = -dst (64-bit) */
++	case BPF_ALU64 | BPF_NEG:
++		emit_neg_i64(ctx, dst);
++		break;
++	/* dst = dst & imm (64-bit) */
++	case BPF_ALU64 | BPF_AND | BPF_K:
++		emit_alu_i64(ctx, dst, imm, BPF_OP(code));
++		break;
++	/* dst = dst | imm (64-bit) */
++	/* dst = dst ^ imm (64-bit) */
++	/* dst = dst + imm (64-bit) */
++	/* dst = dst - imm (64-bit) */
++	case BPF_ALU64 | BPF_OR | BPF_K:
++	case BPF_ALU64 | BPF_XOR | BPF_K:
++	case BPF_ALU64 | BPF_ADD | BPF_K:
++	case BPF_ALU64 | BPF_SUB | BPF_K:
++		if (imm)
++			emit_alu_i64(ctx, dst, imm, BPF_OP(code));
++		break;
++	/* dst = dst << imm (64-bit) */
++	/* dst = dst >> imm (64-bit) */
++	/* dst = dst >> imm (64-bit, arithmetic) */
++	case BPF_ALU64 | BPF_LSH | BPF_K:
++	case BPF_ALU64 | BPF_RSH | BPF_K:
++	case BPF_ALU64 | BPF_ARSH | BPF_K:
++		if (imm)
++			emit_shift_i64(ctx, dst, imm, BPF_OP(code));
++		break;
++	/* dst = dst * imm (64-bit) */
++	case BPF_ALU64 | BPF_MUL | BPF_K:
++		emit_mul_i64(ctx, dst, imm);
++		break;
++	/* dst = dst / imm (64-bit) */
++	/* dst = dst % imm (64-bit) */
++	case BPF_ALU64 | BPF_DIV | BPF_K:
++	case BPF_ALU64 | BPF_MOD | BPF_K:
++		/*
++		 * Sign-extend the immediate value into a temporary register,
++		 * and then do the operation on this register.
++		 */
++		emit_mov_se_i64(ctx, tmp, imm);
++		emit_divmod_r64(ctx, dst, tmp, BPF_OP(code));
++		break;
++	/* dst = dst & src (64-bit) */
++	/* dst = dst | src (64-bit) */
++	/* dst = dst ^ src (64-bit) */
++	/* dst = dst + src (64-bit) */
++	/* dst = dst - src (64-bit) */
++	case BPF_ALU64 | BPF_AND | BPF_X:
++	case BPF_ALU64 | BPF_OR | BPF_X:
++	case BPF_ALU64 | BPF_XOR | BPF_X:
++	case BPF_ALU64 | BPF_ADD | BPF_X:
++	case BPF_ALU64 | BPF_SUB | BPF_X:
++		emit_alu_r64(ctx, dst, src, BPF_OP(code));
++		break;
++	/* dst = dst << src (64-bit) */
++	/* dst = dst >> src (64-bit) */
++	/* dst = dst >> src (64-bit, arithmetic) */
++	case BPF_ALU64 | BPF_LSH | BPF_X:
++	case BPF_ALU64 | BPF_RSH | BPF_X:
++	case BPF_ALU64 | BPF_ARSH | BPF_X:
++		emit_shift_r64(ctx, dst, lo(src), BPF_OP(code));
++		break;
++	/* dst = dst * src (64-bit) */
++	case BPF_ALU64 | BPF_MUL | BPF_X:
++		emit_mul_r64(ctx, dst, src);
++		break;
++	/* dst = dst / src (64-bit) */
++	/* dst = dst % src (64-bit) */
++	case BPF_ALU64 | BPF_DIV | BPF_X:
++	case BPF_ALU64 | BPF_MOD | BPF_X:
++		emit_divmod_r64(ctx, dst, src, BPF_OP(code));
++		break;
++	/* dst = htole(dst) */
++	/* dst = htobe(dst) */
++	case BPF_ALU | BPF_END | BPF_FROM_LE:
++	case BPF_ALU | BPF_END | BPF_FROM_BE:
++		if (BPF_SRC(code) ==
++#ifdef __BIG_ENDIAN
++		    BPF_FROM_LE
++#else
++		    BPF_FROM_BE
++#endif
++		    )
++			emit_bswap_r64(ctx, dst, imm);
++		else
++			emit_trunc_r64(ctx, dst, imm);
++		break;
++	/* dst = imm64 */
++	case BPF_LD | BPF_IMM | BPF_DW:
++		emit_mov_i(ctx, lo(dst), imm);
++		emit_mov_i(ctx, hi(dst), insn[1].imm);
++		return 1;
++	/* LDX: dst = *(size *)(src + off) */
++	case BPF_LDX | BPF_MEM | BPF_W:
++	case BPF_LDX | BPF_MEM | BPF_H:
++	case BPF_LDX | BPF_MEM | BPF_B:
++	case BPF_LDX | BPF_MEM | BPF_DW:
++		emit_ldx(ctx, dst, lo(src), off, BPF_SIZE(code));
++		break;
++	/* ST: *(size *)(dst + off) = imm */
++	case BPF_ST | BPF_MEM | BPF_W:
++	case BPF_ST | BPF_MEM | BPF_H:
++	case BPF_ST | BPF_MEM | BPF_B:
++	case BPF_ST | BPF_MEM | BPF_DW:
++		switch (BPF_SIZE(code)) {
++		case BPF_DW:
++			/* Sign-extend immediate value into temporary reg */
++			emit_mov_se_i64(ctx, tmp, imm);
++			break;
++		case BPF_W:
++		case BPF_H:
++		case BPF_B:
++			emit_mov_i(ctx, lo(tmp), imm);
++			break;
++		}
++		emit_stx(ctx, lo(dst), tmp, off, BPF_SIZE(code));
++		break;
++	/* STX: *(size *)(dst + off) = src */
++	case BPF_STX | BPF_MEM | BPF_W:
++	case BPF_STX | BPF_MEM | BPF_H:
++	case BPF_STX | BPF_MEM | BPF_B:
++	case BPF_STX | BPF_MEM | BPF_DW:
++		emit_stx(ctx, lo(dst), src, off, BPF_SIZE(code));
++		break;
++	/* Speculation barrier */
++	case BPF_ST | BPF_NOSPEC:
++		break;
++	/* Atomics */
++	case BPF_STX | BPF_XADD | BPF_W:
++		switch (imm) {
++		case BPF_ADD:
++		case BPF_AND:
++		case BPF_OR:
++		case BPF_XOR:
++			if (cpu_has_llsc)
++				emit_atomic_r(ctx, lo(dst), lo(src), off, imm);
++			else /* Non-ll/sc fallback */
++				emit_atomic_r32(ctx, lo(dst), lo(src),
++						off, imm);
++			break;
++		default:
++			goto notyet;
++		}
++		break;
++	/* Atomics (64-bit) */
++	case BPF_STX | BPF_XADD | BPF_DW:
++		switch (imm) {
++		case BPF_ADD:
++		case BPF_AND:
++		case BPF_OR:
++		case BPF_XOR:
++			emit_atomic_r64(ctx, lo(dst), src, off, imm);
++			break;
++		default:
++			goto notyet;
++		}
++		break;
++	/* PC += off if dst == src */
++	/* PC += off if dst != src */
++	/* PC += off if dst & src */
++	/* PC += off if dst > src */
++	/* PC += off if dst >= src */
++	/* PC += off if dst < src */
++	/* PC += off if dst <= src */
++	/* PC += off if dst > src (signed) */
++	/* PC += off if dst >= src (signed) */
++	/* PC += off if dst < src (signed) */
++	/* PC += off if dst <= src (signed) */
++	case BPF_JMP32 | BPF_JEQ | BPF_X:
++	case BPF_JMP32 | BPF_JNE | BPF_X:
++	case BPF_JMP32 | BPF_JSET | BPF_X:
++	case BPF_JMP32 | BPF_JGT | BPF_X:
++	case BPF_JMP32 | BPF_JGE | BPF_X:
++	case BPF_JMP32 | BPF_JLT | BPF_X:
++	case BPF_JMP32 | BPF_JLE | BPF_X:
++	case BPF_JMP32 | BPF_JSGT | BPF_X:
++	case BPF_JMP32 | BPF_JSGE | BPF_X:
++	case BPF_JMP32 | BPF_JSLT | BPF_X:
++	case BPF_JMP32 | BPF_JSLE | BPF_X:
++		if (off == 0)
++			break;
++		setup_jmp_r(ctx, dst == src, BPF_OP(code), off, &jmp, &rel);
++		emit_jmp_r(ctx, lo(dst), lo(src), rel, jmp);
++		if (finish_jmp(ctx, jmp, off) < 0)
++			goto toofar;
++		break;
++	/* PC += off if dst == imm */
++	/* PC += off if dst != imm */
++	/* PC += off if dst & imm */
++	/* PC += off if dst > imm */
++	/* PC += off if dst >= imm */
++	/* PC += off if dst < imm */
++	/* PC += off if dst <= imm */
++	/* PC += off if dst > imm (signed) */
++	/* PC += off if dst >= imm (signed) */
++	/* PC += off if dst < imm (signed) */
++	/* PC += off if dst <= imm (signed) */
++	case BPF_JMP32 | BPF_JEQ | BPF_K:
++	case BPF_JMP32 | BPF_JNE | BPF_K:
++	case BPF_JMP32 | BPF_JSET | BPF_K:
++	case BPF_JMP32 | BPF_JGT | BPF_K:
++	case BPF_JMP32 | BPF_JGE | BPF_K:
++	case BPF_JMP32 | BPF_JLT | BPF_K:
++	case BPF_JMP32 | BPF_JLE | BPF_K:
++	case BPF_JMP32 | BPF_JSGT | BPF_K:
++	case BPF_JMP32 | BPF_JSGE | BPF_K:
++	case BPF_JMP32 | BPF_JSLT | BPF_K:
++	case BPF_JMP32 | BPF_JSLE | BPF_K:
++		if (off == 0)
++			break;
++		setup_jmp_i(ctx, imm, 32, BPF_OP(code), off, &jmp, &rel);
++		if (valid_jmp_i(jmp, imm)) {
++			emit_jmp_i(ctx, lo(dst), imm, rel, jmp);
++		} else {
++			/* Move large immediate to register */
++			emit_mov_i(ctx, MIPS_R_T6, imm);
++			emit_jmp_r(ctx, lo(dst), MIPS_R_T6, rel, jmp);
++		}
++		if (finish_jmp(ctx, jmp, off) < 0)
++			goto toofar;
++		break;
++	/* PC += off if dst == src */
++	/* PC += off if dst != src */
++	/* PC += off if dst & src */
++	/* PC += off if dst > src */
++	/* PC += off if dst >= src */
++	/* PC += off if dst < src */
++	/* PC += off if dst <= src */
++	/* PC += off if dst > src (signed) */
++	/* PC += off if dst >= src (signed) */
++	/* PC += off if dst < src (signed) */
++	/* PC += off if dst <= src (signed) */
++	case BPF_JMP | BPF_JEQ | BPF_X:
++	case BPF_JMP | BPF_JNE | BPF_X:
++	case BPF_JMP | BPF_JSET | BPF_X:
++	case BPF_JMP | BPF_JGT | BPF_X:
++	case BPF_JMP | BPF_JGE | BPF_X:
++	case BPF_JMP | BPF_JLT | BPF_X:
++	case BPF_JMP | BPF_JLE | BPF_X:
++	case BPF_JMP | BPF_JSGT | BPF_X:
++	case BPF_JMP | BPF_JSGE | BPF_X:
++	case BPF_JMP | BPF_JSLT | BPF_X:
++	case BPF_JMP | BPF_JSLE | BPF_X:
++		if (off == 0)
++			break;
++		setup_jmp_r(ctx, dst == src, BPF_OP(code), off, &jmp, &rel);
++		emit_jmp_r64(ctx, dst, src, rel, jmp);
++		if (finish_jmp(ctx, jmp, off) < 0)
++			goto toofar;
++		break;
++	/* PC += off if dst == imm */
++	/* PC += off if dst != imm */
++	/* PC += off if dst & imm */
++	/* PC += off if dst > imm */
++	/* PC += off if dst >= imm */
++	/* PC += off if dst < imm */
++	/* PC += off if dst <= imm */
++	/* PC += off if dst > imm (signed) */
++	/* PC += off if dst >= imm (signed) */
++	/* PC += off if dst < imm (signed) */
++	/* PC += off if dst <= imm (signed) */
++	case BPF_JMP | BPF_JEQ | BPF_K:
++	case BPF_JMP | BPF_JNE | BPF_K:
++	case BPF_JMP | BPF_JSET | BPF_K:
++	case BPF_JMP | BPF_JGT | BPF_K:
++	case BPF_JMP | BPF_JGE | BPF_K:
++	case BPF_JMP | BPF_JLT | BPF_K:
++	case BPF_JMP | BPF_JLE | BPF_K:
++	case BPF_JMP | BPF_JSGT | BPF_K:
++	case BPF_JMP | BPF_JSGE | BPF_K:
++	case BPF_JMP | BPF_JSLT | BPF_K:
++	case BPF_JMP | BPF_JSLE | BPF_K:
++		if (off == 0)
++			break;
++		setup_jmp_i(ctx, imm, 64, BPF_OP(code), off, &jmp, &rel);
++		emit_jmp_i64(ctx, dst, imm, rel, jmp);
++		if (finish_jmp(ctx, jmp, off) < 0)
++			goto toofar;
++		break;
++	/* PC += off */
++	case BPF_JMP | BPF_JA:
++		if (off == 0)
++			break;
++		if (emit_ja(ctx, off) < 0)
++			goto toofar;
++		break;
++	/* Tail call */
++	case BPF_JMP | BPF_TAIL_CALL:
++		if (emit_tail_call(ctx) < 0)
++			goto invalid;
++		break;
++	/* Function call */
++	case BPF_JMP | BPF_CALL:
++		if (emit_call(ctx, insn) < 0)
++			goto invalid;
++		break;
++	/* Function return */
++	case BPF_JMP | BPF_EXIT:
++		/*
++		 * Optimization: when last instruction is EXIT
++		 * simply continue to epilogue.
++		 */
++		if (ctx->bpf_index == ctx->program->len - 1)
++			break;
++		if (emit_exit(ctx) < 0)
++			goto toofar;
++		break;
++
++	default:
++invalid:
++		pr_err_once("unknown opcode %02x\n", code);
++		return -EINVAL;
++notyet:
++		pr_info_once("*** NOT YET: opcode %02x ***\n", code);
++		return -EFAULT;
++toofar:
++		pr_info_once("*** TOO FAR: jump at %u opcode %02x ***\n",
++			     ctx->bpf_index, code);
++		return -E2BIG;
++	}
++	return 0;
++}

+ 1005 - 0
target/linux/generic/backport-5.15/050-v5.16-03-mips-bpf-Add-new-eBPF-JIT-for-64-bit-MIPS.patch

@@ -0,0 +1,1005 @@
+From: Johan Almbladh <[email protected]>
+Date: Tue, 5 Oct 2021 18:54:05 +0200
+Subject: [PATCH] mips: bpf: Add new eBPF JIT for 64-bit MIPS
+
+This is an implementation of an eBPF JIT for 64-bit MIPS III-V and
+MIPS64r1-r6. It uses the same framework introduced by the 32-bit JIT.
+
+Signed-off-by: Johan Almbladh <[email protected]>
+---
+ create mode 100644 arch/mips/net/bpf_jit_comp64.c
+
+--- /dev/null
++++ b/arch/mips/net/bpf_jit_comp64.c
+@@ -0,0 +1,991 @@
++// SPDX-License-Identifier: GPL-2.0-only
++/*
++ * Just-In-Time compiler for eBPF bytecode on MIPS.
++ * Implementation of JIT functions for 64-bit CPUs.
++ *
++ * Copyright (c) 2021 Anyfi Networks AB.
++ * Author: Johan Almbladh <[email protected]>
++ *
++ * Based on code and ideas from
++ * Copyright (c) 2017 Cavium, Inc.
++ * Copyright (c) 2017 Shubham Bansal <[email protected]>
++ * Copyright (c) 2011 Mircea Gherzan <[email protected]>
++ */
++
++#include <linux/errno.h>
++#include <linux/filter.h>
++#include <linux/bpf.h>
++#include <asm/cpu-features.h>
++#include <asm/isa-rev.h>
++#include <asm/uasm.h>
++
++#include "bpf_jit_comp.h"
++
++/* MIPS t0-t3 are not available in the n64 ABI */
++#undef MIPS_R_T0
++#undef MIPS_R_T1
++#undef MIPS_R_T2
++#undef MIPS_R_T3
++
++/* Stack is 16-byte aligned in n64 ABI */
++#define MIPS_STACK_ALIGNMENT 16
++
++/* Extra 64-bit eBPF registers used by JIT */
++#define JIT_REG_TC (MAX_BPF_JIT_REG + 0)
++#define JIT_REG_ZX (MAX_BPF_JIT_REG + 1)
++
++/* Number of prologue bytes to skip when doing a tail call */
++#define JIT_TCALL_SKIP 4
++
++/* Callee-saved CPU registers that the JIT must preserve */
++#define JIT_CALLEE_REGS   \
++	(BIT(MIPS_R_S0) | \
++	 BIT(MIPS_R_S1) | \
++	 BIT(MIPS_R_S2) | \
++	 BIT(MIPS_R_S3) | \
++	 BIT(MIPS_R_S4) | \
++	 BIT(MIPS_R_S5) | \
++	 BIT(MIPS_R_S6) | \
++	 BIT(MIPS_R_S7) | \
++	 BIT(MIPS_R_GP) | \
++	 BIT(MIPS_R_FP) | \
++	 BIT(MIPS_R_RA))
++
++/* Caller-saved CPU registers available for JIT use */
++#define JIT_CALLER_REGS	  \
++	(BIT(MIPS_R_A5) | \
++	 BIT(MIPS_R_A6) | \
++	 BIT(MIPS_R_A7))
++/*
++ * Mapping of 64-bit eBPF registers to 64-bit native MIPS registers.
++ * MIPS registers t4 - t7 may be used by the JIT as temporary registers.
++ * MIPS registers t8 - t9 are reserved for single-register common functions.
++ */
++static const u8 bpf2mips64[] = {
++	/* Return value from in-kernel function, and exit value from eBPF */
++	[BPF_REG_0] = MIPS_R_V0,
++	/* Arguments from eBPF program to in-kernel function */
++	[BPF_REG_1] = MIPS_R_A0,
++	[BPF_REG_2] = MIPS_R_A1,
++	[BPF_REG_3] = MIPS_R_A2,
++	[BPF_REG_4] = MIPS_R_A3,
++	[BPF_REG_5] = MIPS_R_A4,
++	/* Callee-saved registers that in-kernel function will preserve */
++	[BPF_REG_6] = MIPS_R_S0,
++	[BPF_REG_7] = MIPS_R_S1,
++	[BPF_REG_8] = MIPS_R_S2,
++	[BPF_REG_9] = MIPS_R_S3,
++	/* Read-only frame pointer to access the eBPF stack */
++	[BPF_REG_FP] = MIPS_R_FP,
++	/* Temporary register for blinding constants */
++	[BPF_REG_AX] = MIPS_R_AT,
++	/* Tail call count register, caller-saved */
++	[JIT_REG_TC] = MIPS_R_A5,
++	/* Constant for register zero-extension */
++	[JIT_REG_ZX] = MIPS_R_V1,
++};
++
++/*
++ * MIPS 32-bit operations on 64-bit registers generate a sign-extended
++ * result. However, the eBPF ISA mandates zero-extension, so we rely on the
++ * verifier to add that for us (emit_zext_ver). In addition, ALU arithmetic
++ * operations, right shift and byte swap require properly sign-extended
++ * operands or the result is unpredictable. We emit explicit sign-extensions
++ * in those cases.
++ */
++
++/* Sign extension */
++static void emit_sext(struct jit_context *ctx, u8 dst, u8 src)
++{
++	emit(ctx, sll, dst, src, 0);
++	clobber_reg(ctx, dst);
++}
++
++/* Zero extension */
++static void emit_zext(struct jit_context *ctx, u8 dst)
++{
++	if (cpu_has_mips64r2 || cpu_has_mips64r6) {
++		emit(ctx, dinsu, dst, MIPS_R_ZERO, 32, 32);
++	} else {
++		emit(ctx, and, dst, dst, bpf2mips64[JIT_REG_ZX]);
++		access_reg(ctx, JIT_REG_ZX); /* We need the ZX register */
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* Zero extension, if verifier does not do it for us  */
++static void emit_zext_ver(struct jit_context *ctx, u8 dst)
++{
++	if (!ctx->program->aux->verifier_zext)
++		emit_zext(ctx, dst);
++}
++
++/* dst = imm (64-bit) */
++static void emit_mov_i64(struct jit_context *ctx, u8 dst, u64 imm64)
++{
++	if (imm64 >= 0xffffffffffff8000ULL || imm64 < 0x8000ULL) {
++		emit(ctx, daddiu, dst, MIPS_R_ZERO, (s16)imm64);
++	} else if (imm64 >= 0xffffffff80000000ULL ||
++		   (imm64 < 0x80000000 && imm64 > 0xffff)) {
++		emit(ctx, lui, dst, (s16)(imm64 >> 16));
++		emit(ctx, ori, dst, dst, (u16)imm64 & 0xffff);
++	} else {
++		u8 acc = MIPS_R_ZERO;
++		int k;
++
++		for (k = 0; k < 4; k++) {
++			u16 half = imm64 >> (48 - 16 * k);
++
++			if (acc == dst)
++				emit(ctx, dsll, dst, dst, 16);
++
++			if (half) {
++				emit(ctx, ori, dst, acc, half);
++				acc = dst;
++			}
++		}
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* ALU immediate operation (64-bit) */
++static void emit_alu_i64(struct jit_context *ctx, u8 dst, s32 imm, u8 op)
++{
++	switch (BPF_OP(op)) {
++	/* dst = dst | imm */
++	case BPF_OR:
++		emit(ctx, ori, dst, dst, (u16)imm);
++		break;
++	/* dst = dst ^ imm */
++	case BPF_XOR:
++		emit(ctx, xori, dst, dst, (u16)imm);
++		break;
++	/* dst = -dst */
++	case BPF_NEG:
++		emit(ctx, dsubu, dst, MIPS_R_ZERO, dst);
++		break;
++	/* dst = dst << imm */
++	case BPF_LSH:
++		emit(ctx, dsll_safe, dst, dst, imm);
++		break;
++	/* dst = dst >> imm */
++	case BPF_RSH:
++		emit(ctx, dsrl_safe, dst, dst, imm);
++		break;
++	/* dst = dst >> imm (arithmetic) */
++	case BPF_ARSH:
++		emit(ctx, dsra_safe, dst, dst, imm);
++		break;
++	/* dst = dst + imm */
++	case BPF_ADD:
++		emit(ctx, daddiu, dst, dst, imm);
++		break;
++	/* dst = dst - imm */
++	case BPF_SUB:
++		emit(ctx, daddiu, dst, dst, -imm);
++		break;
++	default:
++		/* Width-generic operations */
++		emit_alu_i(ctx, dst, imm, op);
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* ALU register operation (64-bit) */
++static void emit_alu_r64(struct jit_context *ctx, u8 dst, u8 src, u8 op)
++{
++	switch (BPF_OP(op)) {
++	/* dst = dst << src */
++	case BPF_LSH:
++		emit(ctx, dsllv, dst, dst, src);
++		break;
++	/* dst = dst >> src */
++	case BPF_RSH:
++		emit(ctx, dsrlv, dst, dst, src);
++		break;
++	/* dst = dst >> src (arithmetic) */
++	case BPF_ARSH:
++		emit(ctx, dsrav, dst, dst, src);
++		break;
++	/* dst = dst + src */
++	case BPF_ADD:
++		emit(ctx, daddu, dst, dst, src);
++		break;
++	/* dst = dst - src */
++	case BPF_SUB:
++		emit(ctx, dsubu, dst, dst, src);
++		break;
++	/* dst = dst * src */
++	case BPF_MUL:
++		if (cpu_has_mips64r6) {
++			emit(ctx, dmulu, dst, dst, src);
++		} else {
++			emit(ctx, dmultu, dst, src);
++			emit(ctx, mflo, dst);
++		}
++		break;
++	/* dst = dst / src */
++	case BPF_DIV:
++		if (cpu_has_mips64r6) {
++			emit(ctx, ddivu_r6, dst, dst, src);
++		} else {
++			emit(ctx, ddivu, dst, src);
++			emit(ctx, mflo, dst);
++		}
++		break;
++	/* dst = dst % src */
++	case BPF_MOD:
++		if (cpu_has_mips64r6) {
++			emit(ctx, dmodu, dst, dst, src);
++		} else {
++			emit(ctx, ddivu, dst, src);
++			emit(ctx, mfhi, dst);
++		}
++		break;
++	default:
++		/* Width-generic operations */
++		emit_alu_r(ctx, dst, src, op);
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* Swap sub words in a register double word */
++static void emit_swap_r64(struct jit_context *ctx, u8 dst, u8 mask, u32 bits)
++{
++	u8 tmp = MIPS_R_T9;
++
++	emit(ctx, and, tmp, dst, mask);  /* tmp = dst & mask  */
++	emit(ctx, dsll, tmp, tmp, bits); /* tmp = tmp << bits */
++	emit(ctx, dsrl, dst, dst, bits); /* dst = dst >> bits */
++	emit(ctx, and, dst, dst, mask);  /* dst = dst & mask  */
++	emit(ctx, or, dst, dst, tmp);    /* dst = dst | tmp   */
++}
++
++/* Swap bytes and truncate a register double word, word or half word */
++static void emit_bswap_r64(struct jit_context *ctx, u8 dst, u32 width)
++{
++	switch (width) {
++	/* Swap bytes in a double word */
++	case 64:
++		if (cpu_has_mips64r2 || cpu_has_mips64r6) {
++			emit(ctx, dsbh, dst, dst);
++			emit(ctx, dshd, dst, dst);
++		} else {
++			u8 t1 = MIPS_R_T6;
++			u8 t2 = MIPS_R_T7;
++
++			emit(ctx, dsll32, t2, dst, 0);  /* t2 = dst << 32    */
++			emit(ctx, dsrl32, dst, dst, 0); /* dst = dst >> 32   */
++			emit(ctx, or, dst, dst, t2);    /* dst = dst | t2    */
++
++			emit(ctx, ori, t2, MIPS_R_ZERO, 0xffff);
++			emit(ctx, dsll32, t1, t2, 0);   /* t1 = t2 << 32     */
++			emit(ctx, or, t1, t1, t2);      /* t1 = t1 | t2      */
++			emit_swap_r64(ctx, dst, t1, 16);/* dst = swap16(dst) */
++
++			emit(ctx, lui, t2, 0xff);       /* t2 = 0x00ff0000   */
++			emit(ctx, ori, t2, t2, 0xff);   /* t2 = t2 | 0x00ff  */
++			emit(ctx, dsll32, t1, t2, 0);   /* t1 = t2 << 32     */
++			emit(ctx, or, t1, t1, t2);      /* t1 = t1 | t2      */
++			emit_swap_r64(ctx, dst, t1, 8); /* dst = swap8(dst)  */
++		}
++		break;
++	/* Swap bytes in a half word */
++	/* Swap bytes in a word */
++	case 32:
++	case 16:
++		emit_sext(ctx, dst, dst);
++		emit_bswap_r(ctx, dst, width);
++		if (cpu_has_mips64r2 || cpu_has_mips64r6)
++			emit_zext(ctx, dst);
++		break;
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* Truncate a register double word, word or half word */
++static void emit_trunc_r64(struct jit_context *ctx, u8 dst, u32 width)
++{
++	switch (width) {
++	case 64:
++		break;
++	/* Zero-extend a word */
++	case 32:
++		emit_zext(ctx, dst);
++		break;
++	/* Zero-extend a half word */
++	case 16:
++		emit(ctx, andi, dst, dst, 0xffff);
++		break;
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* Load operation: dst = *(size*)(src + off) */
++static void emit_ldx(struct jit_context *ctx, u8 dst, u8 src, s16 off, u8 size)
++{
++	switch (size) {
++	/* Load a byte */
++	case BPF_B:
++		emit(ctx, lbu, dst, off, src);
++		break;
++	/* Load a half word */
++	case BPF_H:
++		emit(ctx, lhu, dst, off, src);
++		break;
++	/* Load a word */
++	case BPF_W:
++		emit(ctx, lwu, dst, off, src);
++		break;
++	/* Load a double word */
++	case BPF_DW:
++		emit(ctx, ld, dst, off, src);
++		break;
++	}
++	clobber_reg(ctx, dst);
++}
++
++/* Store operation: *(size *)(dst + off) = src */
++static void emit_stx(struct jit_context *ctx, u8 dst, u8 src, s16 off, u8 size)
++{
++	switch (size) {
++	/* Store a byte */
++	case BPF_B:
++		emit(ctx, sb, src, off, dst);
++		break;
++	/* Store a half word */
++	case BPF_H:
++		emit(ctx, sh, src, off, dst);
++		break;
++	/* Store a word */
++	case BPF_W:
++		emit(ctx, sw, src, off, dst);
++		break;
++	/* Store a double word */
++	case BPF_DW:
++		emit(ctx, sd, src, off, dst);
++		break;
++	}
++}
++
++/* Atomic read-modify-write */
++static void emit_atomic_r64(struct jit_context *ctx,
++			    u8 dst, u8 src, s16 off, u8 code)
++{
++	u8 t1 = MIPS_R_T6;
++	u8 t2 = MIPS_R_T7;
++
++	emit(ctx, lld, t1, off, dst);
++	switch (code) {
++	case BPF_ADD:
++		emit(ctx, daddu, t2, t1, src);
++		break;
++	case BPF_AND:
++		emit(ctx, and, t2, t1, src);
++		break;
++	case BPF_OR:
++		emit(ctx, or, t2, t1, src);
++		break;
++	case BPF_XOR:
++		emit(ctx, xor, t2, t1, src);
++		break;
++	}
++	emit(ctx, scd, t2, off, dst);
++	emit(ctx, beqz, t2, -16);
++	emit(ctx, nop); /* Delay slot */
++}
++
++/* Function call */
++static int emit_call(struct jit_context *ctx, const struct bpf_insn *insn)
++{
++	u8 zx = bpf2mips64[JIT_REG_ZX];
++	u8 tmp = MIPS_R_T6;
++	bool fixed;
++	u64 addr;
++
++	/* Decode the call address */
++	if (bpf_jit_get_func_addr(ctx->program, insn, false,
++				  &addr, &fixed) < 0)
++		return -1;
++	if (!fixed)
++		return -1;
++
++	/* Push caller-saved registers on stack */
++	push_regs(ctx, ctx->clobbered & JIT_CALLER_REGS, 0, 0);
++
++	/* Emit function call */
++	emit_mov_i64(ctx, tmp, addr);
++	emit(ctx, jalr, MIPS_R_RA, tmp);
++	emit(ctx, nop); /* Delay slot */
++
++	/* Restore caller-saved registers */
++	pop_regs(ctx, ctx->clobbered & JIT_CALLER_REGS, 0, 0);
++
++	/* Re-initialize the JIT zero-extension register if accessed */
++	if (ctx->accessed & BIT(JIT_REG_ZX)) {
++		emit(ctx, daddiu, zx, MIPS_R_ZERO, -1);
++		emit(ctx, dsrl32, zx, zx, 0);
++	}
++
++	clobber_reg(ctx, MIPS_R_RA);
++	clobber_reg(ctx, MIPS_R_V0);
++	clobber_reg(ctx, MIPS_R_V1);
++	return 0;
++}
++
++/* Function tail call */
++static int emit_tail_call(struct jit_context *ctx)
++{
++	u8 ary = bpf2mips64[BPF_REG_2];
++	u8 ind = bpf2mips64[BPF_REG_3];
++	u8 tcc = bpf2mips64[JIT_REG_TC];
++	u8 tmp = MIPS_R_T6;
++	int off;
++
++	/*
++	 * Tail call:
++	 * eBPF R1 - function argument (context ptr), passed in a0-a1
++	 * eBPF R2 - ptr to object with array of function entry points
++	 * eBPF R3 - array index of function to be called
++	 */
++
++	/* if (ind >= ary->map.max_entries) goto out */
++	off = offsetof(struct bpf_array, map.max_entries);
++	if (off > 0x7fff)
++		return -1;
++	emit(ctx, lwu, tmp, off, ary);            /* tmp = ary->map.max_entrs*/
++	emit(ctx, sltu, tmp, ind, tmp);           /* tmp = ind < t1          */
++	emit(ctx, beqz, tmp, get_offset(ctx, 1)); /* PC += off(1) if tmp == 0*/
++
++	/* if (--TCC < 0) goto out */
++	emit(ctx, daddiu, tcc, tcc, -1);          /* tcc-- (delay slot)      */
++	emit(ctx, bltz, tcc, get_offset(ctx, 1)); /* PC += off(1) if tcc < 0 */
++						  /* (next insn delay slot)  */
++	/* prog = ary->ptrs[ind] */
++	off = offsetof(struct bpf_array, ptrs);
++	if (off > 0x7fff)
++		return -1;
++	emit(ctx, dsll, tmp, ind, 3);             /* tmp = ind << 3          */
++	emit(ctx, daddu, tmp, tmp, ary);          /* tmp += ary              */
++	emit(ctx, ld, tmp, off, tmp);             /* tmp = *(tmp + off)      */
++
++	/* if (prog == 0) goto out */
++	emit(ctx, beqz, tmp, get_offset(ctx, 1)); /* PC += off(1) if tmp == 0*/
++	emit(ctx, nop);                           /* Delay slot              */
++
++	/* func = prog->bpf_func + 8 (prologue skip offset) */
++	off = offsetof(struct bpf_prog, bpf_func);
++	if (off > 0x7fff)
++		return -1;
++	emit(ctx, ld, tmp, off, tmp);                /* tmp = *(tmp + off)   */
++	emit(ctx, daddiu, tmp, tmp, JIT_TCALL_SKIP); /* tmp += skip (4)      */
++
++	/* goto func */
++	build_epilogue(ctx, tmp);
++	access_reg(ctx, JIT_REG_TC);
++	return 0;
++}
++
++/*
++ * Stack frame layout for a JITed program (stack grows down).
++ *
++ * Higher address  : Previous stack frame      :
++ *                 +===========================+  <--- MIPS sp before call
++ *                 | Callee-saved registers,   |
++ *                 | including RA and FP       |
++ *                 +---------------------------+  <--- eBPF FP (MIPS fp)
++ *                 | Local eBPF variables      |
++ *                 | allocated by program      |
++ *                 +---------------------------+
++ *                 | Reserved for caller-saved |
++ *                 | registers                 |
++ * Lower address   +===========================+  <--- MIPS sp
++ */
++
++/* Build program prologue to set up the stack and registers */
++void build_prologue(struct jit_context *ctx)
++{
++	u8 fp = bpf2mips64[BPF_REG_FP];
++	u8 tc = bpf2mips64[JIT_REG_TC];
++	u8 zx = bpf2mips64[JIT_REG_ZX];
++	int stack, saved, locals, reserved;
++
++	/*
++	 * The first instruction initializes the tail call count register.
++	 * On a tail call, the calling function jumps into the prologue
++	 * after this instruction.
++	 */
++	emit(ctx, addiu, tc, MIPS_R_ZERO, min(MAX_TAIL_CALL_CNT + 1, 0xffff));
++
++	/* === Entry-point for tail calls === */
++
++	/*
++	 * If the eBPF frame pointer and tail call count registers were
++	 * accessed they must be preserved. Mark them as clobbered here
++	 * to save and restore them on the stack as needed.
++	 */
++	if (ctx->accessed & BIT(BPF_REG_FP))
++		clobber_reg(ctx, fp);
++	if (ctx->accessed & BIT(JIT_REG_TC))
++		clobber_reg(ctx, tc);
++	if (ctx->accessed & BIT(JIT_REG_ZX))
++		clobber_reg(ctx, zx);
++
++	/* Compute the stack space needed for callee-saved registers */
++	saved = hweight32(ctx->clobbered & JIT_CALLEE_REGS) * sizeof(u64);
++	saved = ALIGN(saved, MIPS_STACK_ALIGNMENT);
++
++	/* Stack space used by eBPF program local data */
++	locals = ALIGN(ctx->program->aux->stack_depth, MIPS_STACK_ALIGNMENT);
++
++	/*
++	 * If we are emitting function calls, reserve extra stack space for
++	 * caller-saved registers needed by the JIT. The required space is
++	 * computed automatically during resource usage discovery (pass 1).
++	 */
++	reserved = ctx->stack_used;
++
++	/* Allocate the stack frame */
++	stack = ALIGN(saved + locals + reserved, MIPS_STACK_ALIGNMENT);
++	if (stack)
++		emit(ctx, daddiu, MIPS_R_SP, MIPS_R_SP, -stack);
++
++	/* Store callee-saved registers on stack */
++	push_regs(ctx, ctx->clobbered & JIT_CALLEE_REGS, 0, stack - saved);
++
++	/* Initialize the eBPF frame pointer if accessed */
++	if (ctx->accessed & BIT(BPF_REG_FP))
++		emit(ctx, daddiu, fp, MIPS_R_SP, stack - saved);
++
++	/* Initialize the ePF JIT zero-extension register if accessed */
++	if (ctx->accessed & BIT(JIT_REG_ZX)) {
++		emit(ctx, daddiu, zx, MIPS_R_ZERO, -1);
++		emit(ctx, dsrl32, zx, zx, 0);
++	}
++
++	ctx->saved_size = saved;
++	ctx->stack_size = stack;
++}
++
++/* Build the program epilogue to restore the stack and registers */
++void build_epilogue(struct jit_context *ctx, int dest_reg)
++{
++	/* Restore callee-saved registers from stack */
++	pop_regs(ctx, ctx->clobbered & JIT_CALLEE_REGS, 0,
++		 ctx->stack_size - ctx->saved_size);
++
++	/* Release the stack frame */
++	if (ctx->stack_size)
++		emit(ctx, daddiu, MIPS_R_SP, MIPS_R_SP, ctx->stack_size);
++
++	/* Jump to return address and sign-extend the 32-bit return value */
++	emit(ctx, jr, dest_reg);
++	emit(ctx, sll, MIPS_R_V0, MIPS_R_V0, 0); /* Delay slot */
++}
++
++/* Build one eBPF instruction */
++int build_insn(const struct bpf_insn *insn, struct jit_context *ctx)
++{
++	u8 dst = bpf2mips64[insn->dst_reg];
++	u8 src = bpf2mips64[insn->src_reg];
++	u8 code = insn->code;
++	s16 off = insn->off;
++	s32 imm = insn->imm;
++	s32 val, rel;
++	u8 alu, jmp;
++
++	switch (code) {
++	/* ALU operations */
++	/* dst = imm */
++	case BPF_ALU | BPF_MOV | BPF_K:
++		emit_mov_i(ctx, dst, imm);
++		emit_zext_ver(ctx, dst);
++		break;
++	/* dst = src */
++	case BPF_ALU | BPF_MOV | BPF_X:
++		if (imm == 1) {
++			/* Special mov32 for zext */
++			emit_zext(ctx, dst);
++		} else {
++			emit_mov_r(ctx, dst, src);
++			emit_zext_ver(ctx, dst);
++		}
++		break;
++	/* dst = -dst */
++	case BPF_ALU | BPF_NEG:
++		emit_sext(ctx, dst, dst);
++		emit_alu_i(ctx, dst, 0, BPF_NEG);
++		emit_zext_ver(ctx, dst);
++		break;
++	/* dst = dst & imm */
++	/* dst = dst | imm */
++	/* dst = dst ^ imm */
++	/* dst = dst << imm */
++	case BPF_ALU | BPF_OR | BPF_K:
++	case BPF_ALU | BPF_AND | BPF_K:
++	case BPF_ALU | BPF_XOR | BPF_K:
++	case BPF_ALU | BPF_LSH | BPF_K:
++		if (!valid_alu_i(BPF_OP(code), imm)) {
++			emit_mov_i(ctx, MIPS_R_T4, imm);
++			emit_alu_r(ctx, dst, MIPS_R_T4, BPF_OP(code));
++		} else if (rewrite_alu_i(BPF_OP(code), imm, &alu, &val)) {
++			emit_alu_i(ctx, dst, val, alu);
++		}
++		emit_zext_ver(ctx, dst);
++		break;
++	/* dst = dst >> imm */
++	/* dst = dst >> imm (arithmetic) */
++	/* dst = dst + imm */
++	/* dst = dst - imm */
++	/* dst = dst * imm */
++	/* dst = dst / imm */
++	/* dst = dst % imm */
++	case BPF_ALU | BPF_RSH | BPF_K:
++	case BPF_ALU | BPF_ARSH | BPF_K:
++	case BPF_ALU | BPF_ADD | BPF_K:
++	case BPF_ALU | BPF_SUB | BPF_K:
++	case BPF_ALU | BPF_MUL | BPF_K:
++	case BPF_ALU | BPF_DIV | BPF_K:
++	case BPF_ALU | BPF_MOD | BPF_K:
++		if (!valid_alu_i(BPF_OP(code), imm)) {
++			emit_sext(ctx, dst, dst);
++			emit_mov_i(ctx, MIPS_R_T4, imm);
++			emit_alu_r(ctx, dst, MIPS_R_T4, BPF_OP(code));
++		} else if (rewrite_alu_i(BPF_OP(code), imm, &alu, &val)) {
++			emit_sext(ctx, dst, dst);
++			emit_alu_i(ctx, dst, val, alu);
++		}
++		emit_zext_ver(ctx, dst);
++		break;
++	/* dst = dst & src */
++	/* dst = dst | src */
++	/* dst = dst ^ src */
++	/* dst = dst << src */
++	case BPF_ALU | BPF_AND | BPF_X:
++	case BPF_ALU | BPF_OR | BPF_X:
++	case BPF_ALU | BPF_XOR | BPF_X:
++	case BPF_ALU | BPF_LSH | BPF_X:
++		emit_alu_r(ctx, dst, src, BPF_OP(code));
++		emit_zext_ver(ctx, dst);
++		break;
++	/* dst = dst >> src */
++	/* dst = dst >> src (arithmetic) */
++	/* dst = dst + src */
++	/* dst = dst - src */
++	/* dst = dst * src */
++	/* dst = dst / src */
++	/* dst = dst % src */
++	case BPF_ALU | BPF_RSH | BPF_X:
++	case BPF_ALU | BPF_ARSH | BPF_X:
++	case BPF_ALU | BPF_ADD | BPF_X:
++	case BPF_ALU | BPF_SUB | BPF_X:
++	case BPF_ALU | BPF_MUL | BPF_X:
++	case BPF_ALU | BPF_DIV | BPF_X:
++	case BPF_ALU | BPF_MOD | BPF_X:
++		emit_sext(ctx, dst, dst);
++		emit_sext(ctx, MIPS_R_T4, src);
++		emit_alu_r(ctx, dst, MIPS_R_T4, BPF_OP(code));
++		emit_zext_ver(ctx, dst);
++		break;
++	/* dst = imm (64-bit) */
++	case BPF_ALU64 | BPF_MOV | BPF_K:
++		emit_mov_i(ctx, dst, imm);
++		break;
++	/* dst = src (64-bit) */
++	case BPF_ALU64 | BPF_MOV | BPF_X:
++		emit_mov_r(ctx, dst, src);
++		break;
++	/* dst = -dst (64-bit) */
++	case BPF_ALU64 | BPF_NEG:
++		emit_alu_i64(ctx, dst, 0, BPF_NEG);
++		break;
++	/* dst = dst & imm (64-bit) */
++	/* dst = dst | imm (64-bit) */
++	/* dst = dst ^ imm (64-bit) */
++	/* dst = dst << imm (64-bit) */
++	/* dst = dst >> imm (64-bit) */
++	/* dst = dst >> imm ((64-bit, arithmetic) */
++	/* dst = dst + imm (64-bit) */
++	/* dst = dst - imm (64-bit) */
++	/* dst = dst * imm (64-bit) */
++	/* dst = dst / imm (64-bit) */
++	/* dst = dst % imm (64-bit) */
++	case BPF_ALU64 | BPF_AND | BPF_K:
++	case BPF_ALU64 | BPF_OR | BPF_K:
++	case BPF_ALU64 | BPF_XOR | BPF_K:
++	case BPF_ALU64 | BPF_LSH | BPF_K:
++	case BPF_ALU64 | BPF_RSH | BPF_K:
++	case BPF_ALU64 | BPF_ARSH | BPF_K:
++	case BPF_ALU64 | BPF_ADD | BPF_K:
++	case BPF_ALU64 | BPF_SUB | BPF_K:
++	case BPF_ALU64 | BPF_MUL | BPF_K:
++	case BPF_ALU64 | BPF_DIV | BPF_K:
++	case BPF_ALU64 | BPF_MOD | BPF_K:
++		if (!valid_alu_i(BPF_OP(code), imm)) {
++			emit_mov_i(ctx, MIPS_R_T4, imm);
++			emit_alu_r64(ctx, dst, MIPS_R_T4, BPF_OP(code));
++		} else if (rewrite_alu_i(BPF_OP(code), imm, &alu, &val)) {
++			emit_alu_i64(ctx, dst, val, alu);
++		}
++		break;
++	/* dst = dst & src (64-bit) */
++	/* dst = dst | src (64-bit) */
++	/* dst = dst ^ src (64-bit) */
++	/* dst = dst << src (64-bit) */
++	/* dst = dst >> src (64-bit) */
++	/* dst = dst >> src (64-bit, arithmetic) */
++	/* dst = dst + src (64-bit) */
++	/* dst = dst - src (64-bit) */
++	/* dst = dst * src (64-bit) */
++	/* dst = dst / src (64-bit) */
++	/* dst = dst % src (64-bit) */
++	case BPF_ALU64 | BPF_AND | BPF_X:
++	case BPF_ALU64 | BPF_OR | BPF_X:
++	case BPF_ALU64 | BPF_XOR | BPF_X:
++	case BPF_ALU64 | BPF_LSH | BPF_X:
++	case BPF_ALU64 | BPF_RSH | BPF_X:
++	case BPF_ALU64 | BPF_ARSH | BPF_X:
++	case BPF_ALU64 | BPF_ADD | BPF_X:
++	case BPF_ALU64 | BPF_SUB | BPF_X:
++	case BPF_ALU64 | BPF_MUL | BPF_X:
++	case BPF_ALU64 | BPF_DIV | BPF_X:
++	case BPF_ALU64 | BPF_MOD | BPF_X:
++		emit_alu_r64(ctx, dst, src, BPF_OP(code));
++		break;
++	/* dst = htole(dst) */
++	/* dst = htobe(dst) */
++	case BPF_ALU | BPF_END | BPF_FROM_LE:
++	case BPF_ALU | BPF_END | BPF_FROM_BE:
++		if (BPF_SRC(code) ==
++#ifdef __BIG_ENDIAN
++		    BPF_FROM_LE
++#else
++		    BPF_FROM_BE
++#endif
++		    )
++			emit_bswap_r64(ctx, dst, imm);
++		else
++			emit_trunc_r64(ctx, dst, imm);
++		break;
++	/* dst = imm64 */
++	case BPF_LD | BPF_IMM | BPF_DW:
++		emit_mov_i64(ctx, dst, (u32)imm | ((u64)insn[1].imm << 32));
++		return 1;
++	/* LDX: dst = *(size *)(src + off) */
++	case BPF_LDX | BPF_MEM | BPF_W:
++	case BPF_LDX | BPF_MEM | BPF_H:
++	case BPF_LDX | BPF_MEM | BPF_B:
++	case BPF_LDX | BPF_MEM | BPF_DW:
++		emit_ldx(ctx, dst, src, off, BPF_SIZE(code));
++		break;
++	/* ST: *(size *)(dst + off) = imm */
++	case BPF_ST | BPF_MEM | BPF_W:
++	case BPF_ST | BPF_MEM | BPF_H:
++	case BPF_ST | BPF_MEM | BPF_B:
++	case BPF_ST | BPF_MEM | BPF_DW:
++		emit_mov_i(ctx, MIPS_R_T4, imm);
++		emit_stx(ctx, dst, MIPS_R_T4, off, BPF_SIZE(code));
++		break;
++	/* STX: *(size *)(dst + off) = src */
++	case BPF_STX | BPF_MEM | BPF_W:
++	case BPF_STX | BPF_MEM | BPF_H:
++	case BPF_STX | BPF_MEM | BPF_B:
++	case BPF_STX | BPF_MEM | BPF_DW:
++		emit_stx(ctx, dst, src, off, BPF_SIZE(code));
++		break;
++	/* Speculation barrier */
++	case BPF_ST | BPF_NOSPEC:
++		break;
++	/* Atomics */
++	case BPF_STX | BPF_XADD | BPF_W:
++	case BPF_STX | BPF_XADD | BPF_DW:
++		switch (imm) {
++		case BPF_ADD:
++		case BPF_AND:
++		case BPF_OR:
++		case BPF_XOR:
++			if (BPF_SIZE(code) == BPF_DW) {
++				emit_atomic_r64(ctx, dst, src, off, imm);
++			} else { /* 32-bit, no fetch */
++				emit_sext(ctx, MIPS_R_T4, src);
++				emit_atomic_r(ctx, dst, MIPS_R_T4, off, imm);
++			}
++			break;
++		default:
++			goto notyet;
++		}
++		break;
++	/* PC += off if dst == src */
++	/* PC += off if dst != src */
++	/* PC += off if dst & src */
++	/* PC += off if dst > src */
++	/* PC += off if dst >= src */
++	/* PC += off if dst < src */
++	/* PC += off if dst <= src */
++	/* PC += off if dst > src (signed) */
++	/* PC += off if dst >= src (signed) */
++	/* PC += off if dst < src (signed) */
++	/* PC += off if dst <= src (signed) */
++	case BPF_JMP32 | BPF_JEQ | BPF_X:
++	case BPF_JMP32 | BPF_JNE | BPF_X:
++	case BPF_JMP32 | BPF_JSET | BPF_X:
++	case BPF_JMP32 | BPF_JGT | BPF_X:
++	case BPF_JMP32 | BPF_JGE | BPF_X:
++	case BPF_JMP32 | BPF_JLT | BPF_X:
++	case BPF_JMP32 | BPF_JLE | BPF_X:
++	case BPF_JMP32 | BPF_JSGT | BPF_X:
++	case BPF_JMP32 | BPF_JSGE | BPF_X:
++	case BPF_JMP32 | BPF_JSLT | BPF_X:
++	case BPF_JMP32 | BPF_JSLE | BPF_X:
++		if (off == 0)
++			break;
++		setup_jmp_r(ctx, dst == src, BPF_OP(code), off, &jmp, &rel);
++		emit_sext(ctx, MIPS_R_T4, dst); /* Sign-extended dst */
++		emit_sext(ctx, MIPS_R_T5, src); /* Sign-extended src */
++		emit_jmp_r(ctx, MIPS_R_T4, MIPS_R_T5, rel, jmp);
++		if (finish_jmp(ctx, jmp, off) < 0)
++			goto toofar;
++		break;
++	/* PC += off if dst == imm */
++	/* PC += off if dst != imm */
++	/* PC += off if dst & imm */
++	/* PC += off if dst > imm */
++	/* PC += off if dst >= imm */
++	/* PC += off if dst < imm */
++	/* PC += off if dst <= imm */
++	/* PC += off if dst > imm (signed) */
++	/* PC += off if dst >= imm (signed) */
++	/* PC += off if dst < imm (signed) */
++	/* PC += off if dst <= imm (signed) */
++	case BPF_JMP32 | BPF_JEQ | BPF_K:
++	case BPF_JMP32 | BPF_JNE | BPF_K:
++	case BPF_JMP32 | BPF_JSET | BPF_K:
++	case BPF_JMP32 | BPF_JGT | BPF_K:
++	case BPF_JMP32 | BPF_JGE | BPF_K:
++	case BPF_JMP32 | BPF_JLT | BPF_K:
++	case BPF_JMP32 | BPF_JLE | BPF_K:
++	case BPF_JMP32 | BPF_JSGT | BPF_K:
++	case BPF_JMP32 | BPF_JSGE | BPF_K:
++	case BPF_JMP32 | BPF_JSLT | BPF_K:
++	case BPF_JMP32 | BPF_JSLE | BPF_K:
++		if (off == 0)
++			break;
++		setup_jmp_i(ctx, imm, 32, BPF_OP(code), off, &jmp, &rel);
++		emit_sext(ctx, MIPS_R_T4, dst); /* Sign-extended dst */
++		if (valid_jmp_i(jmp, imm)) {
++			emit_jmp_i(ctx, MIPS_R_T4, imm, rel, jmp);
++		} else {
++			/* Move large immediate to register, sign-extended */
++			emit_mov_i(ctx, MIPS_R_T5, imm);
++			emit_jmp_r(ctx, MIPS_R_T4, MIPS_R_T5, rel, jmp);
++		}
++		if (finish_jmp(ctx, jmp, off) < 0)
++			goto toofar;
++		break;
++	/* PC += off if dst == src */
++	/* PC += off if dst != src */
++	/* PC += off if dst & src */
++	/* PC += off if dst > src */
++	/* PC += off if dst >= src */
++	/* PC += off if dst < src */
++	/* PC += off if dst <= src */
++	/* PC += off if dst > src (signed) */
++	/* PC += off if dst >= src (signed) */
++	/* PC += off if dst < src (signed) */
++	/* PC += off if dst <= src (signed) */
++	case BPF_JMP | BPF_JEQ | BPF_X:
++	case BPF_JMP | BPF_JNE | BPF_X:
++	case BPF_JMP | BPF_JSET | BPF_X:
++	case BPF_JMP | BPF_JGT | BPF_X:
++	case BPF_JMP | BPF_JGE | BPF_X:
++	case BPF_JMP | BPF_JLT | BPF_X:
++	case BPF_JMP | BPF_JLE | BPF_X:
++	case BPF_JMP | BPF_JSGT | BPF_X:
++	case BPF_JMP | BPF_JSGE | BPF_X:
++	case BPF_JMP | BPF_JSLT | BPF_X:
++	case BPF_JMP | BPF_JSLE | BPF_X:
++		if (off == 0)
++			break;
++		setup_jmp_r(ctx, dst == src, BPF_OP(code), off, &jmp, &rel);
++		emit_jmp_r(ctx, dst, src, rel, jmp);
++		if (finish_jmp(ctx, jmp, off) < 0)
++			goto toofar;
++		break;
++	/* PC += off if dst == imm */
++	/* PC += off if dst != imm */
++	/* PC += off if dst & imm */
++	/* PC += off if dst > imm */
++	/* PC += off if dst >= imm */
++	/* PC += off if dst < imm */
++	/* PC += off if dst <= imm */
++	/* PC += off if dst > imm (signed) */
++	/* PC += off if dst >= imm (signed) */
++	/* PC += off if dst < imm (signed) */
++	/* PC += off if dst <= imm (signed) */
++	case BPF_JMP | BPF_JEQ | BPF_K:
++	case BPF_JMP | BPF_JNE | BPF_K:
++	case BPF_JMP | BPF_JSET | BPF_K:
++	case BPF_JMP | BPF_JGT | BPF_K:
++	case BPF_JMP | BPF_JGE | BPF_K:
++	case BPF_JMP | BPF_JLT | BPF_K:
++	case BPF_JMP | BPF_JLE | BPF_K:
++	case BPF_JMP | BPF_JSGT | BPF_K:
++	case BPF_JMP | BPF_JSGE | BPF_K:
++	case BPF_JMP | BPF_JSLT | BPF_K:
++	case BPF_JMP | BPF_JSLE | BPF_K:
++		if (off == 0)
++			break;
++		setup_jmp_i(ctx, imm, 64, BPF_OP(code), off, &jmp, &rel);
++		if (valid_jmp_i(jmp, imm)) {
++			emit_jmp_i(ctx, dst, imm, rel, jmp);
++		} else {
++			/* Move large immediate to register */
++			emit_mov_i(ctx, MIPS_R_T4, imm);
++			emit_jmp_r(ctx, dst, MIPS_R_T4, rel, jmp);
++		}
++		if (finish_jmp(ctx, jmp, off) < 0)
++			goto toofar;
++		break;
++	/* PC += off */
++	case BPF_JMP | BPF_JA:
++		if (off == 0)
++			break;
++		if (emit_ja(ctx, off) < 0)
++			goto toofar;
++		break;
++	/* Tail call */
++	case BPF_JMP | BPF_TAIL_CALL:
++		if (emit_tail_call(ctx) < 0)
++			goto invalid;
++		break;
++	/* Function call */
++	case BPF_JMP | BPF_CALL:
++		if (emit_call(ctx, insn) < 0)
++			goto invalid;
++		break;
++	/* Function return */
++	case BPF_JMP | BPF_EXIT:
++		/*
++		 * Optimization: when last instruction is EXIT
++		 * simply continue to epilogue.
++		 */
++		if (ctx->bpf_index == ctx->program->len - 1)
++			break;
++		if (emit_exit(ctx) < 0)
++			goto toofar;
++		break;
++
++	default:
++invalid:
++		pr_err_once("unknown opcode %02x\n", code);
++		return -EINVAL;
++notyet:
++		pr_info_once("*** NOT YET: opcode %02x ***\n", code);
++		return -EFAULT;
++toofar:
++		pr_info_once("*** TOO FAR: jump at %u opcode %02x ***\n",
++			     ctx->bpf_index, code);
++		return -E2BIG;
++	}
++	return 0;
++}
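
The comment block near the top of this file explains why explicit sign- and
zero-extensions are emitted: 32-bit MIPS operations on 64-bit registers
sign-extend their result, while eBPF ALU32 semantics require zero-extension.
When dinsu is not available, emit_zext() ANDs with a constant kept in
JIT_REG_ZX, which the prologue builds from -1 shifted right by 32 bits. A
small user-space sketch of that same trick (plain C, nothing below is kernel
API, and the 0x80000000 input is just an example value):

	#include <stdint.h>
	#include <stdio.h>

	int main(void)
	{
		/* daddiu zx, zero, -1: all ones */
		uint64_t zx = (uint64_t)-1;

		/* dsrl32 zx, zx, 0: keep only the low 32 bits set */
		zx >>= 32;

		/* What a 32-bit MIPS op leaves in a 64-bit reg for 0x80000000 */
		uint64_t sign_extended = 0xffffffff80000000ull;

		/* Masking with zx restores the zero-extended value */
		uint64_t zero_extended = sign_extended & zx;

		printf("mask          = %#018llx\n", (unsigned long long)zx);
		printf("sign-extended = %#018llx\n", (unsigned long long)sign_extended);
		printf("zero-extended = %#018llx\n", (unsigned long long)zero_extended);
		return 0;
	}

Keeping the mask in a register makes zero-extension a single AND on pre-r2
cores; because the chosen register (v1) is clobbered by calls, emit_call()
rebuilds it after returning from a helper.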

+ 120 - 0
target/linux/generic/backport-5.15/050-v5.16-04-mips-bpf-Add-JIT-workarounds-for-CPU-errata.patch

@@ -0,0 +1,120 @@
+From: Johan Almbladh <[email protected]>
+Date: Tue, 5 Oct 2021 18:54:06 +0200
+Subject: [PATCH] mips: bpf: Add JIT workarounds for CPU errata
+
+This patch adds workarounds for the following CPU errata to the MIPS
+eBPF JIT, if enabled in the kernel configuration.
+
+  - R10000 ll/sc weak ordering
+  - Loongson-3 ll/sc weak ordering
+  - Loongson-2F jump hang
+
+The Loongson-2F nop errata is implemented in uasm, which the JIT uses,
+so no additional mitigations are needed for that.
+
+Signed-off-by: Johan Almbladh <[email protected]>
+Reviewed-by: Jiaxun Yang <[email protected]>
+---
+
+--- a/arch/mips/net/bpf_jit_comp.c
++++ b/arch/mips/net/bpf_jit_comp.c
+@@ -404,6 +404,7 @@ void emit_alu_r(struct jit_context *ctx,
+ /* Atomic read-modify-write (32-bit) */
+ void emit_atomic_r(struct jit_context *ctx, u8 dst, u8 src, s16 off, u8 code)
+ {
++	LLSC_sync(ctx);
+ 	emit(ctx, ll, MIPS_R_T9, off, dst);
+ 	switch (code) {
+ 	case BPF_ADD:
+@@ -420,18 +421,19 @@ void emit_atomic_r(struct jit_context *c
+ 		break;
+ 	}
+ 	emit(ctx, sc, MIPS_R_T8, off, dst);
+-	emit(ctx, beqz, MIPS_R_T8, -16);
++	emit(ctx, LLSC_beqz, MIPS_R_T8, -16 - LLSC_offset);
+ 	emit(ctx, nop); /* Delay slot */
+ }
+ 
+ /* Atomic compare-and-exchange (32-bit) */
+ void emit_cmpxchg_r(struct jit_context *ctx, u8 dst, u8 src, u8 res, s16 off)
+ {
++	LLSC_sync(ctx);
+ 	emit(ctx, ll, MIPS_R_T9, off, dst);
+ 	emit(ctx, bne, MIPS_R_T9, res, 12);
+ 	emit(ctx, move, MIPS_R_T8, src);     /* Delay slot */
+ 	emit(ctx, sc, MIPS_R_T8, off, dst);
+-	emit(ctx, beqz, MIPS_R_T8, -20);
++	emit(ctx, LLSC_beqz, MIPS_R_T8, -20 - LLSC_offset);
+ 	emit(ctx, move, res, MIPS_R_T9);     /* Delay slot */
+ 	clobber_reg(ctx, res);
+ }
+--- a/arch/mips/net/bpf_jit_comp.h
++++ b/arch/mips/net/bpf_jit_comp.h
+@@ -87,7 +87,7 @@ struct jit_context {
+ };
+ 
+ /* Emit the instruction if the JIT memory space has been allocated */
+-#define emit(ctx, func, ...)					\
++#define __emit(ctx, func, ...)					\
+ do {								\
+ 	if ((ctx)->target != NULL) {				\
+ 		u32 *p = &(ctx)->target[ctx->jit_index];	\
+@@ -95,6 +95,30 @@ do {								\
+ 	}							\
+ 	(ctx)->jit_index++;					\
+ } while (0)
++#define emit(...) __emit(__VA_ARGS__)
++
++/* Workaround for R10000 ll/sc errata */
++#ifdef CONFIG_WAR_R10000
++#define LLSC_beqz	beqzl
++#else
++#define LLSC_beqz	beqz
++#endif
++
++/* Workaround for Loongson-3 ll/sc errata */
++#ifdef CONFIG_CPU_LOONGSON3_WORKAROUNDS
++#define LLSC_sync(ctx)	emit(ctx, sync, 0)
++#define LLSC_offset	4
++#else
++#define LLSC_sync(ctx)
++#define LLSC_offset	0
++#endif
++
++/* Workaround for Loongson-2F jump errata */
++#ifdef CONFIG_CPU_JUMP_WORKAROUNDS
++#define JALR_MASK	0xffffffffcfffffffULL
++#else
++#define JALR_MASK	(~0ULL)
++#endif
+ 
+ /*
+  * Mark a BPF register as accessed, it needs to be
+--- a/arch/mips/net/bpf_jit_comp64.c
++++ b/arch/mips/net/bpf_jit_comp64.c
+@@ -375,6 +375,7 @@ static void emit_atomic_r64(struct jit_c
+ 	u8 t1 = MIPS_R_T6;
+ 	u8 t2 = MIPS_R_T7;
+ 
++	LLSC_sync(ctx);
+ 	emit(ctx, lld, t1, off, dst);
+ 	switch (code) {
+ 	case BPF_ADD:
+@@ -391,7 +392,7 @@ static void emit_atomic_r64(struct jit_c
+ 		break;
+ 	}
+ 	emit(ctx, scd, t2, off, dst);
+-	emit(ctx, beqz, t2, -16);
++	emit(ctx, LLSC_beqz, t2, -16 - LLSC_offset);
+ 	emit(ctx, nop); /* Delay slot */
+ }
+ 
+@@ -414,7 +415,7 @@ static int emit_call(struct jit_context
+ 	push_regs(ctx, ctx->clobbered & JIT_CALLER_REGS, 0, 0);
+ 
+ 	/* Emit function call */
+-	emit_mov_i64(ctx, tmp, addr);
++	emit_mov_i64(ctx, tmp, addr & JALR_MASK);
+ 	emit(ctx, jalr, MIPS_R_RA, tmp);
+ 	emit(ctx, nop); /* Delay slot */
+ 
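
The subtle part of the ll/sc changes is the branch displacement: the retry
branch in emit_atomic_r()/emit_atomic_r64() and emit_cmpxchg_r() must jump
back past one extra instruction when LLSC_sync emits a leading sync, hence
the "-16 - LLSC_offset" and "-20 - LLSC_offset" adjustments. A throwaway
sketch of that arithmetic (the helper below is invented for illustration;
only the 4-byte instruction size and the resulting offsets mirror the code
above):

	#include <stdio.h>

	#define INSN_SIZE 4	/* every MIPS instruction is 4 bytes */

	/*
	 * insns_back: instructions from the branch's delay slot back to the
	 * ll/lld. have_sync: whether a Loongson-3 sync precedes the ll.
	 */
	static int retry_branch_offset(int insns_back, int have_sync)
	{
		int off = -(insns_back * INSN_SIZE);

		if (have_sync)
			off -= INSN_SIZE;	/* retarget to the sync in front of ll */
		return off;
	}

	int main(void)
	{
		printf("atomic rmw, plain      : %d\n", retry_branch_offset(4, 0));
		printf("atomic rmw, Loongson-3 : %d\n", retry_branch_offset(4, 1));
		printf("cmpxchg,    plain      : %d\n", retry_branch_offset(5, 0));
		printf("cmpxchg,    Loongson-3 : %d\n", retry_branch_offset(5, 1));
		return 0;
	}

The beqzl substitution for R10000 and the JALR_MASK address masking for
Loongson-2F need no offset changes, so they stay as simple macro swaps.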

+ 61 - 0
target/linux/generic/backport-5.15/050-v5.16-05-mips-bpf-Enable-eBPF-JITs.patch

@@ -0,0 +1,61 @@
+From: Johan Almbladh <[email protected]>
+Date: Tue, 5 Oct 2021 18:54:07 +0200
+Subject: [PATCH] mips: bpf: Enable eBPF JITs
+
+This patch enables the new eBPF JITs for 32-bit and 64-bit MIPS. It also
+disables the old cBPF JIT so that cBPF programs are converted to use the
+new JIT.
+
+Workarounds for R4000 CPU errata are not implemented by the JIT, so the
+JIT is disabled if any of those workarounds are configured.
+
+Signed-off-by: Johan Almbladh <[email protected]>
+---
+
+--- a/MAINTAINERS
++++ b/MAINTAINERS
+@@ -3294,6 +3294,7 @@ S:	Supported
+ F:	arch/arm64/net/
+ 
+ BPF JIT for MIPS (32-BIT AND 64-BIT)
++M:	Johan Almbladh <[email protected]>
+ M:	Paul Burton <[email protected]>
+ L:	[email protected]
+ L:	[email protected]
+--- a/arch/mips/Kconfig
++++ b/arch/mips/Kconfig
+@@ -49,7 +49,6 @@ config MIPS
+ 	select HAVE_ARCH_TRACEHOOK
+ 	select HAVE_ARCH_TRANSPARENT_HUGEPAGE if CPU_SUPPORTS_HUGEPAGES
+ 	select HAVE_ASM_MODVERSIONS
+-	select HAVE_CBPF_JIT if !64BIT && !CPU_MICROMIPS
+ 	select HAVE_CONTEXT_TRACKING
+ 	select HAVE_TIF_NOHZ
+ 	select HAVE_C_RECORDMCOUNT
+@@ -57,7 +56,10 @@ config MIPS
+ 	select HAVE_DEBUG_STACKOVERFLOW
+ 	select HAVE_DMA_CONTIGUOUS
+ 	select HAVE_DYNAMIC_FTRACE
+-	select HAVE_EBPF_JIT if 64BIT && !CPU_MICROMIPS && TARGET_ISA_REV >= 2
++	select HAVE_EBPF_JIT if !CPU_MICROMIPS && \
++				!CPU_DADDI_WORKAROUNDS && \
++				!CPU_R4000_WORKAROUNDS && \
++				!CPU_R4400_WORKAROUNDS
+ 	select HAVE_EXIT_THREAD
+ 	select HAVE_FAST_GUP
+ 	select HAVE_FTRACE_MCOUNT_RECORD
+--- a/arch/mips/net/Makefile
++++ b/arch/mips/net/Makefile
+@@ -2,9 +2,10 @@
+ # MIPS networking code
+ 
+ obj-$(CONFIG_MIPS_CBPF_JIT) += bpf_jit.o bpf_jit_asm.o
++obj-$(CONFIG_MIPS_EBPF_JIT) += bpf_jit_comp.o
+ 
+ ifeq ($(CONFIG_32BIT),y)
+-        obj-$(CONFIG_MIPS_EBPF_JIT) += bpf_jit_comp.o bpf_jit_comp32.o
++        obj-$(CONFIG_MIPS_EBPF_JIT) += bpf_jit_comp32.o
+ else
+-        obj-$(CONFIG_MIPS_EBPF_JIT) += ebpf_jit.o
++        obj-$(CONFIG_MIPS_EBPF_JIT) += bpf_jit_comp64.o
+ endif

+ 387 - 0
target/linux/generic/backport-5.15/050-v5.16-06-mips-bpf-Remove-old-BPF-JIT-implementations.patch

@@ -0,0 +1,387 @@
+From: Johan Almbladh <[email protected]>
+Date: Tue, 5 Oct 2021 18:54:08 +0200
+Subject: [PATCH] mips: bpf: Remove old BPF JIT implementations
+
+This patch removes the old 32-bit cBPF and 64-bit eBPF JIT implementations.
+They are replaced by a new eBPF implementation that supports both 32-bit
+and 64-bit MIPS CPUs.
+
+Signed-off-by: Johan Almbladh <[email protected]>
+---
+ delete mode 100644 arch/mips/net/bpf_jit.c
+ delete mode 100644 arch/mips/net/bpf_jit.h
+ delete mode 100644 arch/mips/net/bpf_jit_asm.S
+ delete mode 100644 arch/mips/net/ebpf_jit.c
+
+--- a/arch/mips/net/bpf_jit.h
++++ /dev/null
+@@ -1,81 +0,0 @@
+-/* SPDX-License-Identifier: GPL-2.0-only */
+-/*
+- * Just-In-Time compiler for BPF filters on MIPS
+- *
+- * Copyright (c) 2014 Imagination Technologies Ltd.
+- * Author: Markos Chandras <[email protected]>
+- */
+-
+-#ifndef BPF_JIT_MIPS_OP_H
+-#define BPF_JIT_MIPS_OP_H
+-
+-/* Registers used by JIT */
+-#define MIPS_R_ZERO	0
+-#define MIPS_R_V0	2
+-#define MIPS_R_A0	4
+-#define MIPS_R_A1	5
+-#define MIPS_R_T4	12
+-#define MIPS_R_T5	13
+-#define MIPS_R_T6	14
+-#define MIPS_R_T7	15
+-#define MIPS_R_S0	16
+-#define MIPS_R_S1	17
+-#define MIPS_R_S2	18
+-#define MIPS_R_S3	19
+-#define MIPS_R_S4	20
+-#define MIPS_R_S5	21
+-#define MIPS_R_S6	22
+-#define MIPS_R_S7	23
+-#define MIPS_R_SP	29
+-#define MIPS_R_RA	31
+-
+-/* Conditional codes */
+-#define MIPS_COND_EQ	0x1
+-#define MIPS_COND_GE	(0x1 << 1)
+-#define MIPS_COND_GT	(0x1 << 2)
+-#define MIPS_COND_NE	(0x1 << 3)
+-#define MIPS_COND_ALL	(0x1 << 4)
+-/* Conditionals on X register or K immediate */
+-#define MIPS_COND_X	(0x1 << 5)
+-#define MIPS_COND_K	(0x1 << 6)
+-
+-#define r_ret	MIPS_R_V0
+-
+-/*
+- * Use 2 scratch registers to avoid pipeline interlocks.
+- * There is no overhead during epilogue and prologue since
+- * any of the $s0-$s6 registers will only be preserved if
+- * they are going to actually be used.
+- */
+-#define r_skb_hl	MIPS_R_S0 /* skb header length */
+-#define r_skb_data	MIPS_R_S1 /* skb actual data */
+-#define r_off		MIPS_R_S2
+-#define r_A		MIPS_R_S3
+-#define r_X		MIPS_R_S4
+-#define r_skb		MIPS_R_S5
+-#define r_M		MIPS_R_S6
+-#define r_skb_len	MIPS_R_S7
+-#define r_s0		MIPS_R_T4 /* scratch reg 1 */
+-#define r_s1		MIPS_R_T5 /* scratch reg 2 */
+-#define r_tmp_imm	MIPS_R_T6 /* No need to preserve this */
+-#define r_tmp		MIPS_R_T7 /* No need to preserve this */
+-#define r_zero		MIPS_R_ZERO
+-#define r_sp		MIPS_R_SP
+-#define r_ra		MIPS_R_RA
+-
+-#ifndef __ASSEMBLY__
+-
+-/* Declare ASM helpers */
+-
+-#define DECLARE_LOAD_FUNC(func) \
+-	extern u8 func(unsigned long *skb, int offset); \
+-	extern u8 func##_negative(unsigned long *skb, int offset); \
+-	extern u8 func##_positive(unsigned long *skb, int offset)
+-
+-DECLARE_LOAD_FUNC(sk_load_word);
+-DECLARE_LOAD_FUNC(sk_load_half);
+-DECLARE_LOAD_FUNC(sk_load_byte);
+-
+-#endif
+-
+-#endif /* BPF_JIT_MIPS_OP_H */
+--- a/arch/mips/net/bpf_jit_asm.S
++++ /dev/null
+@@ -1,285 +0,0 @@
+-/*
+- * bpf_jib_asm.S: Packet/header access helper functions for MIPS/MIPS64 BPF
+- * compiler.
+- *
+- * Copyright (C) 2015 Imagination Technologies Ltd.
+- * Author: Markos Chandras <[email protected]>
+- *
+- * This program is free software; you can redistribute it and/or modify it
+- * under the terms of the GNU General Public License as published by the
+- * Free Software Foundation; version 2 of the License.
+- */
+-
+-#include <asm/asm.h>
+-#include <asm/isa-rev.h>
+-#include <asm/regdef.h>
+-#include "bpf_jit.h"
+-
+-/* ABI
+- *
+- * r_skb_hl	skb header length
+- * r_skb_data	skb data
+- * r_off(a1)	offset register
+- * r_A		BPF register A
+- * r_X		PF register X
+- * r_skb(a0)	*skb
+- * r_M		*scratch memory
+- * r_skb_le	skb length
+- * r_s0		Scratch register 0
+- * r_s1		Scratch register 1
+- *
+- * On entry:
+- * a0: *skb
+- * a1: offset (imm or imm + X)
+- *
+- * All non-BPF-ABI registers are free for use. On return, we only
+- * care about r_ret. The BPF-ABI registers are assumed to remain
+- * unmodified during the entire filter operation.
+- */
+-
+-#define skb	a0
+-#define offset	a1
+-#define SKF_LL_OFF  (-0x200000) /* Can't include linux/filter.h in assembly */
+-
+-	/* We know better :) so prevent assembler reordering etc */
+-	.set 	noreorder
+-
+-#define is_offset_negative(TYPE)				\
+-	/* If offset is negative we have more work to do */	\
+-	slti	t0, offset, 0;					\
+-	bgtz	t0, bpf_slow_path_##TYPE##_neg;			\
+-	/* Be careful what follows in DS. */
+-
+-#define is_offset_in_header(SIZE, TYPE)				\
+-	/* Reading from header? */				\
+-	addiu	$r_s0, $r_skb_hl, -SIZE;			\
+-	slt	t0, $r_s0, offset;				\
+-	bgtz	t0, bpf_slow_path_##TYPE;			\
+-
+-LEAF(sk_load_word)
+-	is_offset_negative(word)
+-FEXPORT(sk_load_word_positive)
+-	is_offset_in_header(4, word)
+-	/* Offset within header boundaries */
+-	PTR_ADDU t1, $r_skb_data, offset
+-	.set	reorder
+-	lw	$r_A, 0(t1)
+-	.set	noreorder
+-#ifdef CONFIG_CPU_LITTLE_ENDIAN
+-# if MIPS_ISA_REV >= 2
+-	wsbh	t0, $r_A
+-	rotr	$r_A, t0, 16
+-# else
+-	sll	t0, $r_A, 24
+-	srl	t1, $r_A, 24
+-	srl	t2, $r_A, 8
+-	or	t0, t0, t1
+-	andi	t2, t2, 0xff00
+-	andi	t1, $r_A, 0xff00
+-	or	t0, t0, t2
+-	sll	t1, t1, 8
+-	or	$r_A, t0, t1
+-# endif
+-#endif
+-	jr	$r_ra
+-	 move	$r_ret, zero
+-	END(sk_load_word)
+-
+-LEAF(sk_load_half)
+-	is_offset_negative(half)
+-FEXPORT(sk_load_half_positive)
+-	is_offset_in_header(2, half)
+-	/* Offset within header boundaries */
+-	PTR_ADDU t1, $r_skb_data, offset
+-	lhu	$r_A, 0(t1)
+-#ifdef CONFIG_CPU_LITTLE_ENDIAN
+-# if MIPS_ISA_REV >= 2
+-	wsbh	$r_A, $r_A
+-# else
+-	sll	t0, $r_A, 8
+-	srl	t1, $r_A, 8
+-	andi	t0, t0, 0xff00
+-	or	$r_A, t0, t1
+-# endif
+-#endif
+-	jr	$r_ra
+-	 move	$r_ret, zero
+-	END(sk_load_half)
+-
+-LEAF(sk_load_byte)
+-	is_offset_negative(byte)
+-FEXPORT(sk_load_byte_positive)
+-	is_offset_in_header(1, byte)
+-	/* Offset within header boundaries */
+-	PTR_ADDU t1, $r_skb_data, offset
+-	lbu	$r_A, 0(t1)
+-	jr	$r_ra
+-	 move	$r_ret, zero
+-	END(sk_load_byte)
+-
+-/*
+- * call skb_copy_bits:
+- * (prototype in linux/skbuff.h)
+- *
+- * int skb_copy_bits(sk_buff *skb, int offset, void *to, int len)
+- *
+- * o32 mandates we leave 4 spaces for argument registers in case
+- * the callee needs to use them. Even though we don't care about
+- * the argument registers ourselves, we need to allocate that space
+- * to remain ABI compliant since the callee may want to use that space.
+- * We also allocate 2 more spaces for $r_ra and our return register (*to).
+- *
+- * n64 is a bit different. The *caller* will allocate the space to preserve
+- * the arguments. So in 64-bit kernels, we allocate the 4-arg space for no
+- * good reason but it does not matter that much really.
+- *
+- * (void *to) is returned in r_s0
+- *
+- */
+-#ifdef CONFIG_CPU_LITTLE_ENDIAN
+-#define DS_OFFSET(SIZE) (4 * SZREG)
+-#else
+-#define DS_OFFSET(SIZE) ((4 * SZREG) + (4 - SIZE))
+-#endif
+-#define bpf_slow_path_common(SIZE)				\
+-	/* Quick check. Are we within reasonable boundaries? */ \
+-	LONG_ADDIU	$r_s1, $r_skb_len, -SIZE;		\
+-	sltu		$r_s0, offset, $r_s1;			\
+-	beqz		$r_s0, fault;				\
+-	/* Load 4th argument in DS */				\
+-	 LONG_ADDIU	a3, zero, SIZE;				\
+-	PTR_ADDIU	$r_sp, $r_sp, -(6 * SZREG);		\
+-	PTR_LA		t0, skb_copy_bits;			\
+-	PTR_S		$r_ra, (5 * SZREG)($r_sp);		\
+-	/* Assign low slot to a2 */				\
+-	PTR_ADDIU	a2, $r_sp, DS_OFFSET(SIZE);		\
+-	jalr		t0;					\
+-	/* Reset our destination slot (DS but it's ok) */	\
+-	 INT_S		zero, (4 * SZREG)($r_sp);		\
+-	/*							\
+-	 * skb_copy_bits returns 0 on success and -EFAULT	\
+-	 * on error. Our data live in a2. Do not bother with	\
+-	 * our data if an error has been returned.		\
+-	 */							\
+-	/* Restore our frame */					\
+-	PTR_L		$r_ra, (5 * SZREG)($r_sp);		\
+-	INT_L		$r_s0, (4 * SZREG)($r_sp);		\
+-	bltz		v0, fault;				\
+-	 PTR_ADDIU	$r_sp, $r_sp, 6 * SZREG;		\
+-	move		$r_ret, zero;				\
+-
+-NESTED(bpf_slow_path_word, (6 * SZREG), $r_sp)
+-	bpf_slow_path_common(4)
+-#ifdef CONFIG_CPU_LITTLE_ENDIAN
+-# if MIPS_ISA_REV >= 2
+-	wsbh	t0, $r_s0
+-	jr	$r_ra
+-	 rotr	$r_A, t0, 16
+-# else
+-	sll	t0, $r_s0, 24
+-	srl	t1, $r_s0, 24
+-	srl	t2, $r_s0, 8
+-	or	t0, t0, t1
+-	andi	t2, t2, 0xff00
+-	andi	t1, $r_s0, 0xff00
+-	or	t0, t0, t2
+-	sll	t1, t1, 8
+-	jr	$r_ra
+-	 or	$r_A, t0, t1
+-# endif
+-#else
+-	jr	$r_ra
+-	 move	$r_A, $r_s0
+-#endif
+-
+-	END(bpf_slow_path_word)
+-
+-NESTED(bpf_slow_path_half, (6 * SZREG), $r_sp)
+-	bpf_slow_path_common(2)
+-#ifdef CONFIG_CPU_LITTLE_ENDIAN
+-# if MIPS_ISA_REV >= 2
+-	jr	$r_ra
+-	 wsbh	$r_A, $r_s0
+-# else
+-	sll	t0, $r_s0, 8
+-	andi	t1, $r_s0, 0xff00
+-	andi	t0, t0, 0xff00
+-	srl	t1, t1, 8
+-	jr	$r_ra
+-	 or	$r_A, t0, t1
+-# endif
+-#else
+-	jr	$r_ra
+-	 move	$r_A, $r_s0
+-#endif
+-
+-	END(bpf_slow_path_half)
+-
+-NESTED(bpf_slow_path_byte, (6 * SZREG), $r_sp)
+-	bpf_slow_path_common(1)
+-	jr	$r_ra
+-	 move	$r_A, $r_s0
+-
+-	END(bpf_slow_path_byte)
+-
+-/*
+- * Negative entry points
+- */
+-	.macro bpf_is_end_of_data
+-	li	t0, SKF_LL_OFF
+-	/* Reading link layer data? */
+-	slt	t1, offset, t0
+-	bgtz	t1, fault
+-	/* Be careful what follows in DS. */
+-	.endm
+-/*
+- * call skb_copy_bits:
+- * (prototype in linux/filter.h)
+- *
+- * void *bpf_internal_load_pointer_neg_helper(const struct sk_buff *skb,
+- *                                            int k, unsigned int size)
+- *
+- * see above (bpf_slow_path_common) for ABI restrictions
+- */
+-#define bpf_negative_common(SIZE)					\
+-	PTR_ADDIU	$r_sp, $r_sp, -(6 * SZREG);			\
+-	PTR_LA		t0, bpf_internal_load_pointer_neg_helper;	\
+-	PTR_S		$r_ra, (5 * SZREG)($r_sp);			\
+-	jalr		t0;						\
+-	 li		a2, SIZE;					\
+-	PTR_L		$r_ra, (5 * SZREG)($r_sp);			\
+-	/* Check return pointer */					\
+-	beqz		v0, fault;					\
+-	 PTR_ADDIU	$r_sp, $r_sp, 6 * SZREG;			\
+-	/* Preserve our pointer */					\
+-	move		$r_s0, v0;					\
+-	/* Set return value */						\
+-	move		$r_ret, zero;					\
+-
+-bpf_slow_path_word_neg:
+-	bpf_is_end_of_data
+-NESTED(sk_load_word_negative, (6 * SZREG), $r_sp)
+-	bpf_negative_common(4)
+-	jr	$r_ra
+-	 lw	$r_A, 0($r_s0)
+-	END(sk_load_word_negative)
+-
+-bpf_slow_path_half_neg:
+-	bpf_is_end_of_data
+-NESTED(sk_load_half_negative, (6 * SZREG), $r_sp)
+-	bpf_negative_common(2)
+-	jr	$r_ra
+-	 lhu	$r_A, 0($r_s0)
+-	END(sk_load_half_negative)
+-
+-bpf_slow_path_byte_neg:
+-	bpf_is_end_of_data
+-NESTED(sk_load_byte_negative, (6 * SZREG), $r_sp)
+-	bpf_negative_common(1)
+-	jr	$r_ra
+-	 lbu	$r_A, 0($r_s0)
+-	END(sk_load_byte_negative)
+-
+-fault:
+-	jr	$r_ra
+-	 addiu $r_ret, zero, 1

+ 272 - 0
target/linux/generic/backport-5.15/071-crypto-arm-chacha-neon-optimize-for-non-block-size-m.patch

@@ -0,0 +1,272 @@
+From 03662fcd41f4b764857f17b95f9a2a63c24bddd4 Mon Sep 17 00:00:00 2001
+From: Ard Biesheuvel <[email protected]>
+Date: Tue, 3 Nov 2020 17:28:09 +0100
+Subject: [PATCH 1/2] crypto: arm/chacha-neon - optimize for non-block size
+ multiples
+
+commit 86cd97ec4b943af35562a74688bc4e909b32c3d1 upstream.
+
+The current NEON based ChaCha implementation for ARM is optimized for
+multiples of 4x the ChaCha block size (64 bytes). This makes sense for
+block encryption, but given that ChaCha is also often used in the
+context of networking, it makes sense to consider arbitrary length
+inputs as well.
+
+For example, WireGuard typically uses 1420 byte packets, and performing
+ChaCha encryption involves 5 invocations of chacha_4block_xor_neon()
+and 3 invocations of chacha_block_xor_neon(), where the last one also
+involves a memcpy() using a buffer on the stack to process the final
+chunk of 1420 % 64 == 12 bytes.
+
+Let's optimize for this case as well, by letting chacha_4block_xor_neon()
+deal with any input size between 64 and 256 bytes, using NEON permutation
+instructions and overlapping loads and stores. This way, the 140 byte
+tail of a 1420 byte input buffer can simply be processed in one go.
+
+This results in the following performance improvements for 1420 byte
+blocks, without significant impact on power-of-2 input sizes. (Note
+that Raspberry Pi is widely used in combination with a 32-bit kernel,
+even though the core is 64-bit capable)
+
+   Cortex-A8  (BeagleBone)       :   7%
+   Cortex-A15 (Calxeda Midway)   :  21%
+   Cortex-A53 (Raspberry Pi 3)   :   3%
+   Cortex-A72 (Raspberry Pi 4)   :  19%
+
+Cc: Eric Biggers <[email protected]>
+Cc: "Jason A . Donenfeld" <[email protected]>
+Signed-off-by: Ard Biesheuvel <[email protected]>
+Signed-off-by: Herbert Xu <[email protected]>
+Signed-off-by: Jason A. Donenfeld <[email protected]>
+---
+ arch/arm/crypto/chacha-glue.c      | 34 +++++------
+ arch/arm/crypto/chacha-neon-core.S | 97 +++++++++++++++++++++++++++---
+ 2 files changed, 107 insertions(+), 24 deletions(-)
+
+--- a/arch/arm/crypto/chacha-glue.c
++++ b/arch/arm/crypto/chacha-glue.c
+@@ -23,7 +23,7 @@
+ asmlinkage void chacha_block_xor_neon(const u32 *state, u8 *dst, const u8 *src,
+ 				      int nrounds);
+ asmlinkage void chacha_4block_xor_neon(const u32 *state, u8 *dst, const u8 *src,
+-				       int nrounds);
++				       int nrounds, unsigned int nbytes);
+ asmlinkage void hchacha_block_arm(const u32 *state, u32 *out, int nrounds);
+ asmlinkage void hchacha_block_neon(const u32 *state, u32 *out, int nrounds);
+ 
+@@ -42,24 +42,24 @@ static void chacha_doneon(u32 *state, u8
+ {
+ 	u8 buf[CHACHA_BLOCK_SIZE];
+ 
+-	while (bytes >= CHACHA_BLOCK_SIZE * 4) {
+-		chacha_4block_xor_neon(state, dst, src, nrounds);
+-		bytes -= CHACHA_BLOCK_SIZE * 4;
+-		src += CHACHA_BLOCK_SIZE * 4;
+-		dst += CHACHA_BLOCK_SIZE * 4;
+-		state[12] += 4;
+-	}
+-	while (bytes >= CHACHA_BLOCK_SIZE) {
+-		chacha_block_xor_neon(state, dst, src, nrounds);
+-		bytes -= CHACHA_BLOCK_SIZE;
+-		src += CHACHA_BLOCK_SIZE;
+-		dst += CHACHA_BLOCK_SIZE;
+-		state[12]++;
++	while (bytes > CHACHA_BLOCK_SIZE) {
++		unsigned int l = min(bytes, CHACHA_BLOCK_SIZE * 4U);
++
++		chacha_4block_xor_neon(state, dst, src, nrounds, l);
++		bytes -= l;
++		src += l;
++		dst += l;
++		state[12] += DIV_ROUND_UP(l, CHACHA_BLOCK_SIZE);
+ 	}
+ 	if (bytes) {
+-		memcpy(buf, src, bytes);
+-		chacha_block_xor_neon(state, buf, buf, nrounds);
+-		memcpy(dst, buf, bytes);
++		const u8 *s = src;
++		u8 *d = dst;
++
++		if (bytes != CHACHA_BLOCK_SIZE)
++			s = d = memcpy(buf, src, bytes);
++		chacha_block_xor_neon(state, d, s, nrounds);
++		if (d != dst)
++			memcpy(dst, buf, bytes);
+ 	}
+ }
+ 
+--- a/arch/arm/crypto/chacha-neon-core.S
++++ b/arch/arm/crypto/chacha-neon-core.S
+@@ -47,6 +47,7 @@
+   */
+ 
+ #include <linux/linkage.h>
++#include <asm/cache.h>
+ 
+ 	.text
+ 	.fpu		neon
+@@ -205,7 +206,7 @@ ENDPROC(hchacha_block_neon)
+ 
+ 	.align		5
+ ENTRY(chacha_4block_xor_neon)
+-	push		{r4-r5}
++	push		{r4, lr}
+ 	mov		r4, sp			// preserve the stack pointer
+ 	sub		ip, sp, #0x20		// allocate a 32 byte buffer
+ 	bic		ip, ip, #0x1f		// aligned to 32 bytes
+@@ -229,10 +230,10 @@ ENTRY(chacha_4block_xor_neon)
+ 	vld1.32		{q0-q1}, [r0]
+ 	vld1.32		{q2-q3}, [ip]
+ 
+-	adr		r5, .Lctrinc
++	adr		lr, .Lctrinc
+ 	vdup.32		q15, d7[1]
+ 	vdup.32		q14, d7[0]
+-	vld1.32		{q4}, [r5, :128]
++	vld1.32		{q4}, [lr, :128]
+ 	vdup.32		q13, d6[1]
+ 	vdup.32		q12, d6[0]
+ 	vdup.32		q11, d5[1]
+@@ -455,7 +456,7 @@ ENTRY(chacha_4block_xor_neon)
+ 
+ 	// Re-interleave the words in the first two rows of each block (x0..7).
+ 	// Also add the counter values 0-3 to x12[0-3].
+-	  vld1.32	{q8}, [r5, :128]	// load counter values 0-3
++	  vld1.32	{q8}, [lr, :128]	// load counter values 0-3
+ 	vzip.32		q0, q1			// => (0 1 0 1) (0 1 0 1)
+ 	vzip.32		q2, q3			// => (2 3 2 3) (2 3 2 3)
+ 	vzip.32		q4, q5			// => (4 5 4 5) (4 5 4 5)
+@@ -493,6 +494,8 @@ ENTRY(chacha_4block_xor_neon)
+ 
+ 	// Re-interleave the words in the last two rows of each block (x8..15).
+ 	vld1.32		{q8-q9}, [sp, :256]
++	  mov		sp, r4		// restore original stack pointer
++	  ldr		r4, [r4, #8]	// load number of bytes
+ 	vzip.32		q12, q13	// => (12 13 12 13) (12 13 12 13)
+ 	vzip.32		q14, q15	// => (14 15 14 15) (14 15 14 15)
+ 	vzip.32		q8, q9		// => (8 9 8 9) (8 9 8 9)
+@@ -520,41 +523,121 @@ ENTRY(chacha_4block_xor_neon)
+ 	// XOR the rest of the data with the keystream
+ 
+ 	vld1.8		{q0-q1}, [r2]!
++	subs		r4, r4, #96
+ 	veor		q0, q0, q8
+ 	veor		q1, q1, q12
++	ble		.Lle96
+ 	vst1.8		{q0-q1}, [r1]!
+ 
+ 	vld1.8		{q0-q1}, [r2]!
++	subs		r4, r4, #32
+ 	veor		q0, q0, q2
+ 	veor		q1, q1, q6
++	ble		.Lle128
+ 	vst1.8		{q0-q1}, [r1]!
+ 
+ 	vld1.8		{q0-q1}, [r2]!
++	subs		r4, r4, #32
+ 	veor		q0, q0, q10
+ 	veor		q1, q1, q14
++	ble		.Lle160
+ 	vst1.8		{q0-q1}, [r1]!
+ 
+ 	vld1.8		{q0-q1}, [r2]!
++	subs		r4, r4, #32
+ 	veor		q0, q0, q4
+ 	veor		q1, q1, q5
++	ble		.Lle192
+ 	vst1.8		{q0-q1}, [r1]!
+ 
+ 	vld1.8		{q0-q1}, [r2]!
++	subs		r4, r4, #32
+ 	veor		q0, q0, q9
+ 	veor		q1, q1, q13
++	ble		.Lle224
+ 	vst1.8		{q0-q1}, [r1]!
+ 
+ 	vld1.8		{q0-q1}, [r2]!
++	subs		r4, r4, #32
+ 	veor		q0, q0, q3
+ 	veor		q1, q1, q7
++	blt		.Llt256
++.Lout:
+ 	vst1.8		{q0-q1}, [r1]!
+ 
+ 	vld1.8		{q0-q1}, [r2]
+-	  mov		sp, r4		// restore original stack pointer
+ 	veor		q0, q0, q11
+ 	veor		q1, q1, q15
+ 	vst1.8		{q0-q1}, [r1]
+ 
+-	pop		{r4-r5}
+-	bx		lr
++	pop		{r4, pc}
++
++.Lle192:
++	vmov		q4, q9
++	vmov		q5, q13
++
++.Lle160:
++	// nothing to do
++
++.Lfinalblock:
++	// Process the final block if processing less than 4 full blocks.
++	// Entered with 32 bytes of ChaCha cipher stream in q4-q5, and the
++	// previous 32 byte output block that still needs to be written at
++	// [r1] in q0-q1.
++	beq		.Lfullblock
++
++.Lpartialblock:
++	adr		lr, .Lpermute + 32
++	add		r2, r2, r4
++	add		lr, lr, r4
++	add		r4, r4, r1
++
++	vld1.8		{q2-q3}, [lr]
++	vld1.8		{q6-q7}, [r2]
++
++	add		r4, r4, #32
++
++	vtbl.8		d4, {q4-q5}, d4
++	vtbl.8		d5, {q4-q5}, d5
++	vtbl.8		d6, {q4-q5}, d6
++	vtbl.8		d7, {q4-q5}, d7
++
++	veor		q6, q6, q2
++	veor		q7, q7, q3
++
++	vst1.8		{q6-q7}, [r4]	// overlapping stores
++	vst1.8		{q0-q1}, [r1]
++	pop		{r4, pc}
++
++.Lfullblock:
++	vmov		q11, q4
++	vmov		q15, q5
++	b		.Lout
++.Lle96:
++	vmov		q4, q2
++	vmov		q5, q6
++	b		.Lfinalblock
++.Lle128:
++	vmov		q4, q10
++	vmov		q5, q14
++	b		.Lfinalblock
++.Lle224:
++	vmov		q4, q3
++	vmov		q5, q7
++	b		.Lfinalblock
++.Llt256:
++	vmov		q4, q11
++	vmov		q5, q15
++	b		.Lpartialblock
+ ENDPROC(chacha_4block_xor_neon)
++
++	.align		L1_CACHE_SHIFT
++.Lpermute:
++	.byte		0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07
++	.byte		0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f
++	.byte		0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17
++	.byte		0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f
++	.byte		0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07
++	.byte		0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f
++	.byte		0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17
++	.byte		0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f
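
The call-count arithmetic in the commit message is easy to verify outside the
kernel. The sketch below (plain C, invented helper, not kernel code) redoes
the splitting of a 1420-byte buffer the way the old and the new glue logic
would, counting 4-block NEON calls, full single-block calls and the memcpy'd
stack-buffer tail:

	#include <stdio.h>

	#define CHACHA_BLOCK_SIZE 64

	static void split(unsigned int bytes, int wide_tail)
	{
		unsigned int four = 0, one = 0, tail = 0;

		if (wide_tail) {
			/* New logic: 4-block call takes any length in (64, 256] */
			while (bytes > CHACHA_BLOCK_SIZE) {
				unsigned int l = bytes < 4 * CHACHA_BLOCK_SIZE ?
						 bytes : 4 * CHACHA_BLOCK_SIZE;
				four++;
				bytes -= l;
			}
			if (bytes)
				one++;	/* <= 64 bytes left: one single-block call */
		} else {
			/* Old logic: 4-block call only for full 256-byte chunks */
			four = bytes / (4 * CHACHA_BLOCK_SIZE);
			bytes %= 4 * CHACHA_BLOCK_SIZE;
			one = bytes / CHACHA_BLOCK_SIZE;
			bytes %= CHACHA_BLOCK_SIZE;
			tail = bytes ? 1 : 0;
		}
		printf("4-block: %u  1-block: %u  memcpy tail: %u\n",
		       four, one, tail);
	}

	int main(void)
	{
		printf("old: "); split(1420, 0);
		printf("new: "); split(1420, 1);
		return 0;
	}

For 1420 bytes this prints 5/2/1 for the old code (the three single-block
invocations mentioned above, the last via memcpy) and 6/0/0 for the new code,
where the 140-byte tail is absorbed by one wide 4-block call.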

+ 38 - 0
target/linux/generic/backport-5.15/072-crypto-arm-chacha-neon-add-missing-counter-increment.patch

@@ -0,0 +1,38 @@
+From 7f63462faf9eab69132bea9abd48c2c05a93145b Mon Sep 17 00:00:00 2001
+From: Ard Biesheuvel <[email protected]>
+Date: Sun, 13 Dec 2020 15:39:29 +0100
+Subject: [PATCH 2/2] crypto: arm/chacha-neon - add missing counter increment
+
+commit fd16931a2f518a32753920ff20895e5cf04c8ff1 upstream.
+
+Commit 86cd97ec4b943af3 ("crypto: arm/chacha-neon - optimize for non-block
+size multiples") refactored the chacha block handling in the glue code in
+a way that may result in the counter increment to be omitted when calling
+chacha_block_xor_neon() to process a full block. This violates the skcipher
+API, which requires that the output IV is suitable for handling more input
+as long as the preceding input has been presented in round multiples of the
+block size. Also, the same code is exposed via the chacha library interface
+whose callers may actually rely on this increment to occur even for final
+blocks that are smaller than the chacha block size.
+
+So increment the counter after calling chacha_block_xor_neon().
+
+Fixes: 86cd97ec4b943af3 ("crypto: arm/chacha-neon - optimize for non-block size multiples")
+Reported-by: Eric Biggers <[email protected]>
+Signed-off-by: Ard Biesheuvel <[email protected]>
+Signed-off-by: Herbert Xu <[email protected]>
+Signed-off-by: Jason A. Donenfeld <[email protected]>
+---
+ arch/arm/crypto/chacha-glue.c | 1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/arch/arm/crypto/chacha-glue.c
++++ b/arch/arm/crypto/chacha-glue.c
+@@ -60,6 +60,7 @@ static void chacha_doneon(u32 *state, u8
+ 		chacha_block_xor_neon(state, d, s, nrounds);
+ 		if (d != dst)
+ 			memcpy(dst, buf, bytes);
++		state[12]++;
+ 	}
+ }
+ 
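
The API violation described above is just bookkeeping: the block counter in
state[12] has to advance once for every 64-byte block of keystream produced,
including the final one handled in the tail path. A minimal model of the glue
code's accounting (plain C, helper names invented for this sketch) shows the
stale counter for an input that is exactly one block long:

	#include <stdio.h>

	#define CHACHA_BLOCK_SIZE 64

	static unsigned int counter_after(unsigned int bytes, int bump_final)
	{
		unsigned int ctr = 0;

		while (bytes > CHACHA_BLOCK_SIZE) {
			unsigned int l = bytes < 4 * CHACHA_BLOCK_SIZE ?
					 bytes : 4 * CHACHA_BLOCK_SIZE;
			/* DIV_ROUND_UP(l, CHACHA_BLOCK_SIZE) in the real code */
			ctr += (l + CHACHA_BLOCK_SIZE - 1) / CHACHA_BLOCK_SIZE;
			bytes -= l;
		}
		if (bytes && bump_final)
			ctr++;	/* the state[12]++ this patch adds */
		return ctr;
	}

	int main(void)
	{
		printf("64 bytes, without fix: counter %u (want 1)\n",
		       counter_after(64, 0));
		printf("64 bytes, with fix   : counter %u (want 1)\n",
		       counter_after(64, 1));
		return 0;
	}

Without the increment, a follow-up call starting from the returned state
would regenerate the same keystream block, which is exactly the reuse the
skcipher contract is meant to rule out.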

+ 42 - 0
target/linux/generic/backport-5.15/080-wireguard-peer-put-frequently-used-members-above-cac.patch

@@ -0,0 +1,42 @@
+From a13827e9091c07e25cdeec9a402d74a27e2a1111 Mon Sep 17 00:00:00 2001
+From: "Jason A. Donenfeld" <[email protected]>
+Date: Mon, 22 Feb 2021 17:25:46 +0100
+Subject: [PATCH] wireguard: peer: put frequently used members above cache
+ lines
+
+commit 5a0598695634a6bb4126818902dd9140cd9df8b6 upstream.
+
+The is_dead boolean is checked for every single packet, while the
+internal_id member is used basically only for pr_debug messages. So it
+makes sense to hoist up is_dead into some space formerly unused by a
+struct hole, while demoting internal_id to below the lowest struct
+cache line.
+
+Signed-off-by: Jason A. Donenfeld <[email protected]>
+Signed-off-by: Jakub Kicinski <[email protected]>
+Signed-off-by: Jason A. Donenfeld <[email protected]>
+---
+ drivers/net/wireguard/peer.h | 4 ++--
+ 1 file changed, 2 insertions(+), 2 deletions(-)
+
+--- a/drivers/net/wireguard/peer.h
++++ b/drivers/net/wireguard/peer.h
+@@ -39,6 +39,7 @@ struct wg_peer {
+ 	struct prev_queue tx_queue, rx_queue;
+ 	struct sk_buff_head staged_packet_queue;
+ 	int serial_work_cpu;
++	bool is_dead;
+ 	struct noise_keypairs keypairs;
+ 	struct endpoint endpoint;
+ 	struct dst_cache endpoint_cache;
+@@ -61,9 +62,8 @@ struct wg_peer {
+ 	struct rcu_head rcu;
+ 	struct list_head peer_list;
+ 	struct list_head allowedips_list;
+-	u64 internal_id;
+ 	struct napi_struct napi;
+-	bool is_dead;
++	u64 internal_id;
+ };
+ 
+ struct wg_peer *wg_peer_create(struct wg_device *wg,
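
Struct holes and cache-line boundaries of the kind this commit exploits can be inspected on the compiled object with pahole, for example (illustrative invocation; any wireguard build with debug info works):

	pahole -C wg_peer drivers/net/wireguard/peer.o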

+ 52 - 0
target/linux/generic/backport-5.15/081-net-next-regmap-allow-to-define-reg_update_bits-for-no-bus.patch

@@ -0,0 +1,52 @@
+From 02d6fdecb9c38de19065f6bed8d5214556fd061d Mon Sep 17 00:00:00 2001
+From: Ansuel Smith <[email protected]>
+Date: Thu, 4 Nov 2021 16:00:40 +0100
+Subject: regmap: allow to define reg_update_bits for no bus configuration
+
+Some devices require special handling for reg_update_bits and can't use
+the normal regmap read/write logic. An example is when locking is
+handled by the device and rmw operations have to be atomic.
+Allow declaring a dedicated function in regmap_config for
+reg_update_bits in the no-bus configuration.
+
+Signed-off-by: Ansuel Smith <[email protected]>
+Link: https://lore.kernel.org/r/[email protected]
+Signed-off-by: Mark Brown <[email protected]>
+---
+ drivers/base/regmap/regmap.c | 1 +
+ include/linux/regmap.h       | 7 +++++++
+ 2 files changed, 8 insertions(+)
+
+--- a/drivers/base/regmap/regmap.c
++++ b/drivers/base/regmap/regmap.c
+@@ -842,6 +842,7 @@ struct regmap *__regmap_init(struct devi
+ 	if (!bus) {
+ 		map->reg_read  = config->reg_read;
+ 		map->reg_write = config->reg_write;
++		map->reg_update_bits = config->reg_update_bits;
+ 
+ 		map->defer_caching = false;
+ 		goto skip_format_initialization;
+--- a/include/linux/regmap.h
++++ b/include/linux/regmap.h
+@@ -289,6 +289,11 @@ typedef void (*regmap_unlock)(void *);
+  *		  read operation on a bus such as SPI, I2C, etc. Most of the
+  *		  devices do not need this.
+  * @reg_write:	  Same as above for writing.
++ * @reg_update_bits: Optional callback that if filled will be used to perform
++ *		     all the update_bits(rmw) operation. Should only be provided
++ *		     if the function require special handling with lock and reg
++ *		     handling and the operation cannot be represented as a simple
++ *		     update_bits operation on a bus such as SPI, I2C, etc.
+  * @fast_io:	  Register IO is fast. Use a spinlock instead of a mutex
+  *	     	  to perform locking. This field is ignored if custom lock/unlock
+  *	     	  functions are used (see fields lock/unlock of struct regmap_config).
+@@ -366,6 +371,8 @@ struct regmap_config {
+ 
+ 	int (*reg_read)(void *context, unsigned int reg, unsigned int *val);
+ 	int (*reg_write)(void *context, unsigned int reg, unsigned int val);
++	int (*reg_update_bits)(void *context, unsigned int reg,
++			       unsigned int mask, unsigned int val);
+ 
+ 	bool fast_io;
+ 
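
To make the new hook concrete, a no-bus user would wire it up roughly as below. This is a hedged sketch: the foo_* names, the MMIO backing and the probe fragment are illustrative; only the regmap_config fields and the devm_regmap_init() call with a NULL bus reflect the real API.

#include <linux/io.h>
#include <linux/regmap.h>

struct foo_priv {
	void __iomem *base;
};

static int foo_reg_read(void *context, unsigned int reg, unsigned int *val)
{
	struct foo_priv *priv = context;

	*val = readl(priv->base + reg);
	return 0;
}

static int foo_reg_write(void *context, unsigned int reg, unsigned int val)
{
	struct foo_priv *priv = context;

	writel(val, priv->base + reg);
	return 0;
}

/*
 * Stand-in for a device that performs its own locked read-modify-write;
 * with this callback set, the regmap core no longer emulates the RMW with
 * a separate read and write.
 */
static int foo_reg_update_bits(void *context, unsigned int reg,
			       unsigned int mask, unsigned int val)
{
	struct foo_priv *priv = context;
	unsigned int tmp;

	tmp = readl(priv->base + reg);
	writel((tmp & ~mask) | (val & mask), priv->base + reg);
	return 0;
}

static const struct regmap_config foo_regmap_config = {
	.reg_bits	 = 32,
	.val_bits	 = 32,
	.reg_read	 = foo_reg_read,
	.reg_write	 = foo_reg_write,
	.reg_update_bits = foo_reg_update_bits,
};

/* in probe: a NULL bus selects the no-bus path patched above */
/* map = devm_regmap_init(dev, NULL, priv, &foo_regmap_config); */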

+ 36 - 0
target/linux/generic/backport-5.15/103-v5.13-MIPS-select-CPU_MIPS64-for-remaining-MIPS64-CPUs.patch

@@ -0,0 +1,36 @@
+From 6523061868212473f63812a0c477a161742bed42 Mon Sep 17 00:00:00 2001
+From: "Jason A. Donenfeld" <[email protected]>
+Date: Sat, 27 Feb 2021 13:20:24 +0100
+Subject: [PATCH] MIPS: select CPU_MIPS64 for remaining MIPS64 CPUs
+
+The CPU_MIPS64 and CPU_MIPS32 variables are supposed to be able to
+distinguish broadly between 64-bit and 32-bit MIPS CPUs. However, they
+weren't selected by the specialty CPUs, Octeon and Loongson, which meant
+it was possible to hit a weird state of:
+
+    MIPS=y, CONFIG_64BIT=y, CPU_MIPS64=n
+
+This commit rectifies the issue by having CPU_MIPS64 be selected when
+the missing Octeon or Loongson models are selected.
+
+Cc: Thomas Bogendoerfer <[email protected]>
+Cc: Ralf Baechle <[email protected]>
+Cc: George Cherian <[email protected]>
+Cc: Huacai Chen <[email protected]>
+Cc: Jiaxun Yang <[email protected]>
+Signed-off-by: Jason A. Donenfeld <[email protected]>
+---
+ arch/mips/Kconfig | 2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/arch/mips/Kconfig
++++ b/arch/mips/Kconfig
+@@ -2088,7 +2088,7 @@ config CPU_MIPS32
+ config CPU_MIPS64
+ 	bool
+ 	default y if CPU_MIPS64_R1 || CPU_MIPS64_R2 || CPU_MIPS64_R5 || \
+-		     CPU_MIPS64_R6
++		     CPU_MIPS64_R6 || CPU_LOONGSON64 || CPU_CAVIUM_OCTEON
+ 
+ #
+ # These indicate the revision of the architecture

+ 36 - 0
target/linux/generic/backport-5.15/311-v5.11-MIPS-zboot-put-appended-dtb-into-a-section.patch

@@ -0,0 +1,36 @@
+From 7d1531c81c0fb4c93bea8dc316043ad0e4d0c270 Mon Sep 17 00:00:00 2001
+From: Chuanhong Guo <[email protected]>
+Date: Sun, 25 Oct 2020 23:19:40 +0800
+Subject: [PATCH] MIPS: zboot: put appended dtb into a section
+
+This will make a separate section for the dtb appear in the ELF, and we
+can then use objcopy to patch a dtb into vmlinuz when RAW_APPENDED_DTB
+is set in the kernel config.
+
+command to patch a dtb:
+objcopy --set-section-flags=.appended_dtb=alloc,contents \
+        --update-section=.appended_dtb=<target>.dtb vmlinuz vmlinuz-dtb
+
+Signed-off-by: Chuanhong Guo <[email protected]>
+---
+ arch/mips/boot/compressed/ld.script | 9 ++++++---
+ 1 file changed, 6 insertions(+), 3 deletions(-)
+
+--- a/arch/mips/boot/compressed/ld.script
++++ b/arch/mips/boot/compressed/ld.script
+@@ -31,9 +31,12 @@ SECTIONS
+ 		CONSTRUCTORS
+ 		. = ALIGN(16);
+ 	}
+-	__appended_dtb = .;
+-	/* leave space for appended DTB */
+-	. += 0x100000;
++
++	.appended_dtb : {
++		__appended_dtb = .;
++		/* leave space for appended DTB */
++		. += 0x100000;
++	}
+ 
+ 	_edata = .;
+ 	/* End of data section */

+ 106 - 0
target/linux/generic/backport-5.15/343-netfilter-nft_flow_offload-handle-netdevice-events-f.patch

@@ -0,0 +1,106 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Thu, 25 Jan 2018 12:58:55 +0100
+Subject: [PATCH] netfilter: nft_flow_offload: handle netdevice events from
+ nf_flow_table
+
+Move the code that deals with device events to the core.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -576,13 +576,41 @@ void nf_flow_table_free(struct nf_flowta
+ }
+ EXPORT_SYMBOL_GPL(nf_flow_table_free);
+ 
++static int nf_flow_table_netdev_event(struct notifier_block *this,
++				      unsigned long event, void *ptr)
++{
++	struct net_device *dev = netdev_notifier_info_to_dev(ptr);
++
++	if (event != NETDEV_DOWN)
++		return NOTIFY_DONE;
++
++	nf_flow_table_cleanup(dev);
++
++	return NOTIFY_DONE;
++}
++
++static struct notifier_block flow_offload_netdev_notifier = {
++	.notifier_call	= nf_flow_table_netdev_event,
++};
++
+ static int __init nf_flow_table_module_init(void)
+ {
+-	return nf_flow_table_offload_init();
++	int ret;
++
++	ret = nf_flow_table_offload_init();
++	if (ret)
++		return ret;
++
++	ret = register_netdevice_notifier(&flow_offload_netdev_notifier);
++	if (ret)
++		nf_flow_table_offload_exit();
++
++	return ret;
+ }
+ 
+ static void __exit nf_flow_table_module_exit(void)
+ {
++	unregister_netdevice_notifier(&flow_offload_netdev_notifier);
+ 	nf_flow_table_offload_exit();
+ }
+ 
+--- a/net/netfilter/nft_flow_offload.c
++++ b/net/netfilter/nft_flow_offload.c
+@@ -237,47 +237,14 @@ static struct nft_expr_type nft_flow_off
+ 	.owner		= THIS_MODULE,
+ };
+ 
+-static int flow_offload_netdev_event(struct notifier_block *this,
+-				     unsigned long event, void *ptr)
+-{
+-	struct net_device *dev = netdev_notifier_info_to_dev(ptr);
+-
+-	if (event != NETDEV_DOWN)
+-		return NOTIFY_DONE;
+-
+-	nf_flow_table_cleanup(dev);
+-
+-	return NOTIFY_DONE;
+-}
+-
+-static struct notifier_block flow_offload_netdev_notifier = {
+-	.notifier_call	= flow_offload_netdev_event,
+-};
+-
+ static int __init nft_flow_offload_module_init(void)
+ {
+-	int err;
+-
+-	err = register_netdevice_notifier(&flow_offload_netdev_notifier);
+-	if (err)
+-		goto err;
+-
+-	err = nft_register_expr(&nft_flow_offload_type);
+-	if (err < 0)
+-		goto register_expr;
+-
+-	return 0;
+-
+-register_expr:
+-	unregister_netdevice_notifier(&flow_offload_netdev_notifier);
+-err:
+-	return err;
++	return nft_register_expr(&nft_flow_offload_type);
+ }
+ 
+ static void __exit nft_flow_offload_module_exit(void)
+ {
+ 	nft_unregister_expr(&nft_flow_offload_type);
+-	unregister_netdevice_notifier(&flow_offload_netdev_notifier);
+ }
+ 
+ module_init(nft_flow_offload_module_init);

+ 324 - 0
target/linux/generic/backport-5.15/401-v5.11-dt-bindings-mtd-convert-fixed-partitions-to-the-json.patch

@@ -0,0 +1,324 @@
+From 04e9ab75267489224364fa510a88ada83e11c325 Mon Sep 17 00:00:00 2001
+From: =?UTF-8?q?Rafa=C5=82=20Mi=C5=82ecki?= <[email protected]>
+Date: Thu, 10 Dec 2020 18:23:52 +0100
+Subject: [PATCH] dt-bindings: mtd: convert "fixed-partitions" to the
+ json-schema
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+This standardizes its documentation, allows validating with Makefile
+checks and helps writing DTS files.
+
+Noticeable changes:
+1. Dropped "Partitions can be represented by sub-nodes of a flash
+   device." as we also support subpartitions (don't have to be part of
+   flash device node)
+2. Dropped "to Linux" as bindings are meant to be os agnostic.
+
+Signed-off-by: Rafał Miłecki <[email protected]>
+Link: https://lore.kernel.org/r/[email protected]
+Signed-off-by: Rob Herring <[email protected]>
+---
+ .../devicetree/bindings/mtd/partition.txt     | 131 +--------------
+ .../mtd/partitions/fixed-partitions.yaml      | 152 ++++++++++++++++++
+ 2 files changed, 154 insertions(+), 129 deletions(-)
+ create mode 100644 Documentation/devicetree/bindings/mtd/partitions/fixed-partitions.yaml
+
+--- a/Documentation/devicetree/bindings/mtd/partition.txt
++++ b/Documentation/devicetree/bindings/mtd/partition.txt
+@@ -24,137 +24,10 @@ another partitioning method.
+ Available bindings are listed in the "partitions" subdirectory.
+ 
+ 
+-Fixed Partitions
+-================
+-
+-Partitions can be represented by sub-nodes of a flash device. This can be used
+-on platforms which have strong conventions about which portions of a flash are
+-used for what purposes, but which don't use an on-flash partition table such
+-as RedBoot.
+-
+-The partition table should be a subnode of the flash node and should be named
+-'partitions'. This node should have the following property:
+-- compatible : (required) must be "fixed-partitions"
+-Partitions are then defined in subnodes of the partitions node.
++Deprecated: partitions defined in flash node
++============================================
+ 
+ For backwards compatibility partitions as direct subnodes of the flash device are
+ supported. This use is discouraged.
+ NOTE: also for backwards compatibility, direct subnodes that have a compatible
+ string are not considered partitions, as they may be used for other bindings.
+-
+-#address-cells & #size-cells must both be present in the partitions subnode of the
+-flash device. There are two valid values for both:
+-<1>: for partitions that require a single 32-bit cell to represent their
+-     size/address (aka the value is below 4 GiB)
+-<2>: for partitions that require two 32-bit cells to represent their
+-     size/address (aka the value is 4 GiB or greater).
+-
+-Required properties:
+-- reg : The partition's offset and size within the flash
+-
+-Optional properties:
+-- label : The label / name for this partition.  If omitted, the label is taken
+-  from the node name (excluding the unit address).
+-- read-only : This parameter, if present, is a hint to Linux that this
+-  partition should only be mounted read-only. This is usually used for flash
+-  partitions containing early-boot firmware images or data which should not be
+-  clobbered.
+-- lock : Do not unlock the partition at initialization time (not supported on
+-  all devices)
+-- slc-mode: This parameter, if present, allows one to emulate SLC mode on a
+-  partition attached to an MLC NAND thus making this partition immune to
+-  paired-pages corruptions
+-
+-Examples:
+-
+-
+-flash@0 {
+-	partitions {
+-		compatible = "fixed-partitions";
+-		#address-cells = <1>;
+-		#size-cells = <1>;
+-
+-		partition@0 {
+-			label = "u-boot";
+-			reg = <0x0000000 0x100000>;
+-			read-only;
+-		};
+-
+-		uimage@100000 {
+-			reg = <0x0100000 0x200000>;
+-		};
+-	};
+-};
+-
+-flash@1 {
+-	partitions {
+-		compatible = "fixed-partitions";
+-		#address-cells = <1>;
+-		#size-cells = <2>;
+-
+-		/* a 4 GiB partition */
+-		partition@0 {
+-			label = "filesystem";
+-			reg = <0x00000000 0x1 0x00000000>;
+-		};
+-	};
+-};
+-
+-flash@2 {
+-	partitions {
+-		compatible = "fixed-partitions";
+-		#address-cells = <2>;
+-		#size-cells = <2>;
+-
+-		/* an 8 GiB partition */
+-		partition@0 {
+-			label = "filesystem #1";
+-			reg = <0x0 0x00000000 0x2 0x00000000>;
+-		};
+-
+-		/* a 4 GiB partition */
+-		partition@200000000 {
+-			label = "filesystem #2";
+-			reg = <0x2 0x00000000 0x1 0x00000000>;
+-		};
+-	};
+-};
+-
+-flash@3 {
+-	partitions {
+-		compatible = "fixed-partitions";
+-		#address-cells = <1>;
+-		#size-cells = <1>;
+-
+-		partition@0 {
+-			label = "bootloader";
+-			reg = <0x000000 0x100000>;
+-			read-only;
+-		};
+-
+-		firmware@100000 {
+-			label = "firmware";
+-			reg = <0x100000 0xe00000>;
+-			compatible = "brcm,trx";
+-		};
+-
+-		calibration@f00000 {
+-			label = "calibration";
+-			reg = <0xf00000 0x100000>;
+-			compatible = "fixed-partitions";
+-			ranges = <0 0xf00000 0x100000>;
+-			#address-cells = <1>;
+-			#size-cells = <1>;
+-
+-			partition@0 {
+-				label = "wifi0";
+-				reg = <0x000000 0x080000>;
+-			};
+-
+-			partition@80000 {
+-				label = "wifi1";
+-				reg = <0x080000 0x080000>;
+-			};
+-		};
+-	};
+-};
+--- /dev/null
++++ b/Documentation/devicetree/bindings/mtd/partitions/fixed-partitions.yaml
+@@ -0,0 +1,152 @@
++# SPDX-License-Identifier: GPL-2.0-only OR BSD-2-Clause
++%YAML 1.2
++---
++$id: http://devicetree.org/schemas/mtd/partitions/fixed-partitions.yaml#
++$schema: http://devicetree.org/meta-schemas/core.yaml#
++
++title: Fixed partitions
++
++description: |
++  This binding can be used on platforms which have strong conventions about
++  which portions of a flash are used for what purposes, but which don't use an
++  on-flash partition table such as RedBoot.
++
++  The partition table should be a node named "partitions". Partitions are then
++  defined as subnodes.
++
++maintainers:
++  - Rafał Miłecki <[email protected]>
++
++properties:
++  compatible:
++    const: fixed-partitions
++
++  "#address-cells": true
++
++  "#size-cells": true
++
++patternProperties:
++  "@[0-9a-f]+$":
++    description: node describing a single flash partition
++    type: object
++
++    properties:
++      reg:
++        description: partition's offset and size within the flash
++        maxItems: 1
++
++      label:
++        description: The label / name for this partition. If omitted, the label
++          is taken from the node name (excluding the unit address).
++
++      read-only:
++        description: This parameter, if present, is a hint that this partition
++          should only be mounted read-only. This is usually used for flash
++          partitions containing early-boot firmware images or data which should
++          not be clobbered.
++        type: boolean
++
++      lock:
++        description: Do not unlock the partition at initialization time (not
++          supported on all devices)
++        type: boolean
++
++      slc-mode:
++        description: This parameter, if present, allows one to emulate SLC mode
++          on a partition attached to an MLC NAND thus making this partition
++          immune to paired-pages corruptions
++        type: boolean
++
++    required:
++      - reg
++
++required:
++  - "#address-cells"
++  - "#size-cells"
++
++additionalProperties: true
++
++examples:
++  - |
++    partitions {
++        compatible = "fixed-partitions";
++        #address-cells = <1>;
++        #size-cells = <1>;
++
++        partition@0 {
++            label = "u-boot";
++            reg = <0x0000000 0x100000>;
++            read-only;
++        };
++
++        uimage@100000 {
++            reg = <0x0100000 0x200000>;
++        };
++    };
++  - |
++    partitions {
++        compatible = "fixed-partitions";
++        #address-cells = <1>;
++        #size-cells = <2>;
++
++        /* a 4 GiB partition */
++        partition@0 {
++            label = "filesystem";
++            reg = <0x00000000 0x1 0x00000000>;
++        };
++    };
++  - |
++    partitions {
++        compatible = "fixed-partitions";
++        #address-cells = <2>;
++        #size-cells = <2>;
++
++        /* an 8 GiB partition */
++        partition@0 {
++            label = "filesystem #1";
++            reg = <0x0 0x00000000 0x2 0x00000000>;
++        };
++
++        /* a 4 GiB partition */
++        partition@200000000 {
++            label = "filesystem #2";
++            reg = <0x2 0x00000000 0x1 0x00000000>;
++        };
++    };
++  - |
++    partitions {
++        compatible = "fixed-partitions";
++        #address-cells = <1>;
++        #size-cells = <1>;
++
++        partition@0 {
++            label = "bootloader";
++            reg = <0x000000 0x100000>;
++            read-only;
++        };
++
++        firmware@100000 {
++            compatible = "brcm,trx";
++            label = "firmware";
++            reg = <0x100000 0xe00000>;
++        };
++
++        calibration@f00000 {
++            compatible = "fixed-partitions";
++            label = "calibration";
++            reg = <0xf00000 0x100000>;
++            ranges = <0 0xf00000 0x100000>;
++            #address-cells = <1>;
++            #size-cells = <1>;
++
++            partition@0 {
++                label = "wifi0";
++                reg = <0x000000 0x080000>;
++            };
++
++            partition@80000 {
++                label = "wifi1";
++                reg = <0x080000 0x080000>;
++            };
++        };
++    };

+ 115 - 0
target/linux/generic/backport-5.15/402-v5.12-0001-dt-bindings-mtd-move-partition-binding-to-its-own-fi.patch

@@ -0,0 +1,115 @@
+From 6418522022c706fd867b00b2571edba48b8fa8c7 Mon Sep 17 00:00:00 2001
+From: =?UTF-8?q?Rafa=C5=82=20Mi=C5=82ecki?= <[email protected]>
+Date: Thu, 11 Feb 2021 23:04:25 +0100
+Subject: [PATCH] dt-bindings: mtd: move partition binding to its own file
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+Single partition binding is quite common and may be:
+1. Used by multiple parsers
+2. Extended for more specific cases
+
+Move it to a separate file to avoid code duplication.
+
+Signed-off-by: Rafał Miłecki <[email protected]>
+Reviewed-by: Rob Herring <[email protected]>
+Signed-off-by: Richard Weinberger <[email protected]>
+---
+ .../mtd/partitions/fixed-partitions.yaml      | 33 +------------
+ .../bindings/mtd/partitions/partition.yaml    | 47 +++++++++++++++++++
+ 2 files changed, 48 insertions(+), 32 deletions(-)
+ create mode 100644 Documentation/devicetree/bindings/mtd/partitions/partition.yaml
+
+--- a/Documentation/devicetree/bindings/mtd/partitions/fixed-partitions.yaml
++++ b/Documentation/devicetree/bindings/mtd/partitions/fixed-partitions.yaml
+@@ -27,38 +27,7 @@ properties:
+ 
+ patternProperties:
+   "@[0-9a-f]+$":
+-    description: node describing a single flash partition
+-    type: object
+-
+-    properties:
+-      reg:
+-        description: partition's offset and size within the flash
+-        maxItems: 1
+-
+-      label:
+-        description: The label / name for this partition. If omitted, the label
+-          is taken from the node name (excluding the unit address).
+-
+-      read-only:
+-        description: This parameter, if present, is a hint that this partition
+-          should only be mounted read-only. This is usually used for flash
+-          partitions containing early-boot firmware images or data which should
+-          not be clobbered.
+-        type: boolean
+-
+-      lock:
+-        description: Do not unlock the partition at initialization time (not
+-          supported on all devices)
+-        type: boolean
+-
+-      slc-mode:
+-        description: This parameter, if present, allows one to emulate SLC mode
+-          on a partition attached to an MLC NAND thus making this partition
+-          immune to paired-pages corruptions
+-        type: boolean
+-
+-    required:
+-      - reg
++    $ref: "partition.yaml#"
+ 
+ required:
+   - "#address-cells"
+--- /dev/null
++++ b/Documentation/devicetree/bindings/mtd/partitions/partition.yaml
+@@ -0,0 +1,47 @@
++# SPDX-License-Identifier: GPL-2.0-only OR BSD-2-Clause
++%YAML 1.2
++---
++$id: http://devicetree.org/schemas/mtd/partitions/partition.yaml#
++$schema: http://devicetree.org/meta-schemas/core.yaml#
++
++title: Partition
++
++description: |
++  This binding describes a single flash partition. Each partition must have its
++  relative offset and size specified. Depending on partition function extra
++  properties can be used.
++
++maintainers:
++  - Rafał Miłecki <[email protected]>
++
++properties:
++  reg:
++    description: partition's offset and size within the flash
++    maxItems: 1
++
++  label:
++    description: The label / name for this partition. If omitted, the label
++      is taken from the node name (excluding the unit address).
++
++  read-only:
++    description: This parameter, if present, is a hint that this partition
++      should only be mounted read-only. This is usually used for flash
++      partitions containing early-boot firmware images or data which should
++      not be clobbered.
++    type: boolean
++
++  lock:
++    description: Do not unlock the partition at initialization time (not
++      supported on all devices)
++    type: boolean
++
++  slc-mode:
++    description: This parameter, if present, allows one to emulate SLC mode
++      on a partition attached to an MLC NAND thus making this partition
++      immune to paired-pages corruptions
++    type: boolean
++
++required:
++  - reg
++
++additionalProperties: true

+ 92 - 0
target/linux/generic/backport-5.15/402-v5.12-0002-dt-bindings-mtd-add-binding-for-BCM4908-partitions.patch

@@ -0,0 +1,92 @@
+From 6e9dff6fe3fbc452f16566e4a7e293b0decefdba Mon Sep 17 00:00:00 2001
+From: =?UTF-8?q?Rafa=C5=82=20Mi=C5=82ecki?= <[email protected]>
+Date: Thu, 11 Feb 2021 23:04:26 +0100
+Subject: [PATCH] dt-bindings: mtd: add binding for BCM4908 partitions
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+BCM4908 uses a fixed partition layout, but the function of some partitions
+may vary. Some devices use multiple firmware partitions, and those partitions
+should be marked to let the system discover their purpose.
+
+Signed-off-by: Rafał Miłecki <[email protected]>
+Signed-off-by: Richard Weinberger <[email protected]>
+---
+ .../partitions/brcm,bcm4908-partitions.yaml   | 70 +++++++++++++++++++
+ 1 file changed, 70 insertions(+)
+ create mode 100644 Documentation/devicetree/bindings/mtd/partitions/brcm,bcm4908-partitions.yaml
+
+--- /dev/null
++++ b/Documentation/devicetree/bindings/mtd/partitions/brcm,bcm4908-partitions.yaml
+@@ -0,0 +1,70 @@
++# SPDX-License-Identifier: GPL-2.0-only OR BSD-2-Clause
++%YAML 1.2
++---
++$id: http://devicetree.org/schemas/mtd/partitions/brcm,bcm4908-partitions.yaml#
++$schema: http://devicetree.org/meta-schemas/core.yaml#
++
++title: Broadcom BCM4908 partitioning
++
++description: |
++  Broadcom BCM4908 CFE bootloader supports two firmware partitions. One is used
++  for regular booting, the other is treated as fallback.
++
++  This binding allows defining all fixed partitions and marking those containing
++  firmware. System can use that information e.g. for booting or flashing
++  purposes.
++
++maintainers:
++  - Rafał Miłecki <[email protected]>
++
++properties:
++  compatible:
++    const: brcm,bcm4908-partitions
++
++  "#address-cells":
++    enum: [ 1, 2 ]
++
++  "#size-cells":
++    enum: [ 1, 2 ]
++
++patternProperties:
++  "^partition@[0-9a-f]+$":
++    $ref: "partition.yaml#"
++    properties:
++      compatible:
++        const: brcm,bcm4908-firmware
++    unevaluatedProperties: false
++
++required:
++  - "#address-cells"
++  - "#size-cells"
++
++additionalProperties: false
++
++examples:
++  - |
++    partitions {
++        compatible = "brcm,bcm4908-partitions";
++        #address-cells = <1>;
++        #size-cells = <1>;
++
++        partition@0 {
++            label = "cferom";
++            reg = <0x0 0x100000>;
++        };
++
++        partition@100000 {
++            compatible = "brcm,bcm4908-firmware";
++            reg = <0x100000 0xf00000>;
++        };
++
++        partition@1000000 {
++            compatible = "brcm,bcm4908-firmware";
++            reg = <0x1000000 0xf00000>;
++        };
++
++        partition@1f00000 {
++            label = "calibration";
++            reg = <0x1f00000 0x100000>;
++        };
++    };

+ 654 - 0
target/linux/generic/backport-5.15/403-v5.13-mtd-parsers-ofpart-support-BCM4908-fixed-partitions.patch

@@ -0,0 +1,654 @@
+From afbef8efb591792579c633a7c545f914c6165f82 Mon Sep 17 00:00:00 2001
+From: =?UTF-8?q?Rafa=C5=82=20Mi=C5=82ecki?= <[email protected]>
+Date: Thu, 11 Feb 2021 23:04:27 +0100
+Subject: [PATCH] mtd: parsers: ofpart: support BCM4908 fixed partitions
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+Some devices use fixed partitioning with some partitions requiring extra
+logic. E.g. BCM4908 may have multiple firmware partitions, but detecting
+the currently used one requires checking bootloader parameters.
+
+To support such cases without duplicating a lot of code (without copying
+most of the ofpart.c code), support for a post-parsing callback was added.
+
+BCM4908 support in ofpart can be enabled using a config option and results
+in compiling & executing a specific callback. It simply reads the offset of
+the currently used firmware partition from the DT. The bootloader specifies
+it using the "brcm_blparms" property.
+
+Signed-off-by: Rafał Miłecki <[email protected]>
+---
+ drivers/mtd/parsers/Kconfig                   |  9 +++
+ drivers/mtd/parsers/Makefile                  |  2 +
+ drivers/mtd/parsers/ofpart_bcm4908.c          | 64 +++++++++++++++++++
+ drivers/mtd/parsers/ofpart_bcm4908.h          | 15 +++++
+ .../mtd/parsers/{ofpart.c => ofpart_core.c}   | 28 +++++++-
+ 5 files changed, 116 insertions(+), 2 deletions(-)
+ create mode 100644 drivers/mtd/parsers/ofpart_bcm4908.c
+ create mode 100644 drivers/mtd/parsers/ofpart_bcm4908.h
+ rename drivers/mtd/parsers/{ofpart.c => ofpart_core.c} (88%)
+
+--- a/drivers/mtd/parsers/Kconfig
++++ b/drivers/mtd/parsers/Kconfig
+@@ -67,6 +67,15 @@ config MTD_OF_PARTS
+ 	  flash memory node, as described in
+ 	  Documentation/devicetree/bindings/mtd/partition.txt.
+ 
++config MTD_OF_PARTS_BCM4908
++	bool "BCM4908 partitioning support"
++	depends on MTD_OF_PARTS && (ARCH_BCM4908 || COMPILE_TEST)
++	default ARCH_BCM4908
++	help
++	  This provides partitions parser for BCM4908 family devices
++	  that can have multiple "firmware" partitions. It takes care of
++	  finding currently used one and backup ones.
++
+ config MTD_PARSER_IMAGETAG
+ 	tristate "Parser for BCM963XX Image Tag format partitions"
+ 	depends on BCM63XX || BMIPS_GENERIC || COMPILE_TEST
+--- a/drivers/mtd/parsers/Makefile
++++ b/drivers/mtd/parsers/Makefile
+@@ -4,6 +4,8 @@ obj-$(CONFIG_MTD_BCM47XX_PARTS)		+= bcm4
+ obj-$(CONFIG_MTD_BCM63XX_PARTS)		+= bcm63xxpart.o
+ obj-$(CONFIG_MTD_CMDLINE_PARTS)		+= cmdlinepart.o
+ obj-$(CONFIG_MTD_OF_PARTS)		+= ofpart.o
++ofpart-y				+= ofpart_core.o
++ofpart-$(CONFIG_MTD_OF_PARTS_BCM4908)	+= ofpart_bcm4908.o
+ obj-$(CONFIG_MTD_PARSER_IMAGETAG)	+= parser_imagetag.o
+ obj-$(CONFIG_MTD_AFS_PARTS)		+= afs.o
+ obj-$(CONFIG_MTD_PARSER_TRX)		+= parser_trx.o
+--- /dev/null
++++ b/drivers/mtd/parsers/ofpart_bcm4908.c
+@@ -0,0 +1,64 @@
++// SPDX-License-Identifier: GPL-2.0
++/*
++ * Copyright (C) 2021 Rafał Miłecki <[email protected]>
++ */
++
++#include <linux/module.h>
++#include <linux/init.h>
++#include <linux/of.h>
++#include <linux/mtd/mtd.h>
++#include <linux/slab.h>
++#include <linux/mtd/partitions.h>
++
++#include "ofpart_bcm4908.h"
++
++#define BLPARAMS_FW_OFFSET		"NAND_RFS_OFS"
++
++static long long bcm4908_partitions_fw_offset(void)
++{
++	struct device_node *root;
++	struct property *prop;
++	const char *s;
++
++	root = of_find_node_by_path("/");
++	if (!root)
++		return -ENOENT;
++
++	of_property_for_each_string(root, "brcm_blparms", prop, s) {
++		size_t len = strlen(BLPARAMS_FW_OFFSET);
++		unsigned long offset;
++		int err;
++
++		if (strncmp(s, BLPARAMS_FW_OFFSET, len) || s[len] != '=')
++			continue;
++
++		err = kstrtoul(s + len + 1, 0, &offset);
++		if (err) {
++			pr_err("failed to parse %s\n", s + len + 1);
++			return err;
++		}
++
++		return offset << 10;
++	}
++
++	return -ENOENT;
++}
++
++int bcm4908_partitions_post_parse(struct mtd_info *mtd, struct mtd_partition *parts, int nr_parts)
++{
++	long long fw_offset;
++	int i;
++
++	fw_offset = bcm4908_partitions_fw_offset();
++
++	for (i = 0; i < nr_parts; i++) {
++		if (of_device_is_compatible(parts[i].of_node, "brcm,bcm4908-firmware")) {
++			if (fw_offset < 0 || parts[i].offset == fw_offset)
++				parts[i].name = "firmware";
++			else
++				parts[i].name = "backup";
++		}
++	}
++
++	return 0;
++}
+--- /dev/null
++++ b/drivers/mtd/parsers/ofpart_bcm4908.h
+@@ -0,0 +1,15 @@
++/* SPDX-License-Identifier: GPL-2.0 */
++#ifndef __BCM4908_PARTITIONS_H
++#define __BCM4908_PARTITIONS_H
++
++#ifdef CONFIG_MTD_OF_PARTS_BCM4908
++int bcm4908_partitions_post_parse(struct mtd_info *mtd, struct mtd_partition *parts, int nr_parts);
++#else
++static inline int bcm4908_partitions_post_parse(struct mtd_info *mtd, struct mtd_partition *parts,
++						int nr_parts)
++{
++	return -EOPNOTSUPP;
++}
++#endif
++
++#endif
+--- a/drivers/mtd/parsers/ofpart.c
++++ /dev/null
+@@ -1,239 +0,0 @@
+-// SPDX-License-Identifier: GPL-2.0-or-later
+-/*
+- * Flash partitions described by the OF (or flattened) device tree
+- *
+- * Copyright © 2006 MontaVista Software Inc.
+- * Author: Vitaly Wool <[email protected]>
+- *
+- * Revised to handle newer style flash binding by:
+- *   Copyright © 2007 David Gibson, IBM Corporation.
+- */
+-
+-#include <linux/module.h>
+-#include <linux/init.h>
+-#include <linux/of.h>
+-#include <linux/mtd/mtd.h>
+-#include <linux/slab.h>
+-#include <linux/mtd/partitions.h>
+-
+-static bool node_has_compatible(struct device_node *pp)
+-{
+-	return of_get_property(pp, "compatible", NULL);
+-}
+-
+-static int parse_fixed_partitions(struct mtd_info *master,
+-				  const struct mtd_partition **pparts,
+-				  struct mtd_part_parser_data *data)
+-{
+-	struct mtd_partition *parts;
+-	struct device_node *mtd_node;
+-	struct device_node *ofpart_node;
+-	const char *partname;
+-	struct device_node *pp;
+-	int nr_parts, i, ret = 0;
+-	bool dedicated = true;
+-
+-
+-	/* Pull of_node from the master device node */
+-	mtd_node = mtd_get_of_node(master);
+-	if (!mtd_node)
+-		return 0;
+-
+-	ofpart_node = of_get_child_by_name(mtd_node, "partitions");
+-	if (!ofpart_node) {
+-		/*
+-		 * We might get here even when ofpart isn't used at all (e.g.,
+-		 * when using another parser), so don't be louder than
+-		 * KERN_DEBUG
+-		 */
+-		pr_debug("%s: 'partitions' subnode not found on %pOF. Trying to parse direct subnodes as partitions.\n",
+-			 master->name, mtd_node);
+-		ofpart_node = mtd_node;
+-		dedicated = false;
+-	} else if (!of_device_is_compatible(ofpart_node, "fixed-partitions")) {
+-		/* The 'partitions' subnode might be used by another parser */
+-		return 0;
+-	}
+-
+-	/* First count the subnodes */
+-	nr_parts = 0;
+-	for_each_child_of_node(ofpart_node,  pp) {
+-		if (!dedicated && node_has_compatible(pp))
+-			continue;
+-
+-		nr_parts++;
+-	}
+-
+-	if (nr_parts == 0)
+-		return 0;
+-
+-	parts = kcalloc(nr_parts, sizeof(*parts), GFP_KERNEL);
+-	if (!parts)
+-		return -ENOMEM;
+-
+-	i = 0;
+-	for_each_child_of_node(ofpart_node,  pp) {
+-		const __be32 *reg;
+-		int len;
+-		int a_cells, s_cells;
+-
+-		if (!dedicated && node_has_compatible(pp))
+-			continue;
+-
+-		reg = of_get_property(pp, "reg", &len);
+-		if (!reg) {
+-			if (dedicated) {
+-				pr_debug("%s: ofpart partition %pOF (%pOF) missing reg property.\n",
+-					 master->name, pp,
+-					 mtd_node);
+-				goto ofpart_fail;
+-			} else {
+-				nr_parts--;
+-				continue;
+-			}
+-		}
+-
+-		a_cells = of_n_addr_cells(pp);
+-		s_cells = of_n_size_cells(pp);
+-		if (len / 4 != a_cells + s_cells) {
+-			pr_debug("%s: ofpart partition %pOF (%pOF) error parsing reg property.\n",
+-				 master->name, pp,
+-				 mtd_node);
+-			goto ofpart_fail;
+-		}
+-
+-		parts[i].offset = of_read_number(reg, a_cells);
+-		parts[i].size = of_read_number(reg + a_cells, s_cells);
+-		parts[i].of_node = pp;
+-
+-		partname = of_get_property(pp, "label", &len);
+-		if (!partname)
+-			partname = of_get_property(pp, "name", &len);
+-		parts[i].name = partname;
+-
+-		if (of_get_property(pp, "read-only", &len))
+-			parts[i].mask_flags |= MTD_WRITEABLE;
+-
+-		if (of_get_property(pp, "lock", &len))
+-			parts[i].mask_flags |= MTD_POWERUP_LOCK;
+-
+-		if (of_property_read_bool(pp, "slc-mode"))
+-			parts[i].add_flags |= MTD_SLC_ON_MLC_EMULATION;
+-
+-		i++;
+-	}
+-
+-	if (!nr_parts)
+-		goto ofpart_none;
+-
+-	*pparts = parts;
+-	return nr_parts;
+-
+-ofpart_fail:
+-	pr_err("%s: error parsing ofpart partition %pOF (%pOF)\n",
+-	       master->name, pp, mtd_node);
+-	ret = -EINVAL;
+-ofpart_none:
+-	of_node_put(pp);
+-	kfree(parts);
+-	return ret;
+-}
+-
+-static const struct of_device_id parse_ofpart_match_table[] = {
+-	{ .compatible = "fixed-partitions" },
+-	{},
+-};
+-MODULE_DEVICE_TABLE(of, parse_ofpart_match_table);
+-
+-static struct mtd_part_parser ofpart_parser = {
+-	.parse_fn = parse_fixed_partitions,
+-	.name = "fixed-partitions",
+-	.of_match_table = parse_ofpart_match_table,
+-};
+-
+-static int parse_ofoldpart_partitions(struct mtd_info *master,
+-				      const struct mtd_partition **pparts,
+-				      struct mtd_part_parser_data *data)
+-{
+-	struct mtd_partition *parts;
+-	struct device_node *dp;
+-	int i, plen, nr_parts;
+-	const struct {
+-		__be32 offset, len;
+-	} *part;
+-	const char *names;
+-
+-	/* Pull of_node from the master device node */
+-	dp = mtd_get_of_node(master);
+-	if (!dp)
+-		return 0;
+-
+-	part = of_get_property(dp, "partitions", &plen);
+-	if (!part)
+-		return 0; /* No partitions found */
+-
+-	pr_warn("Device tree uses obsolete partition map binding: %pOF\n", dp);
+-
+-	nr_parts = plen / sizeof(part[0]);
+-
+-	parts = kcalloc(nr_parts, sizeof(*parts), GFP_KERNEL);
+-	if (!parts)
+-		return -ENOMEM;
+-
+-	names = of_get_property(dp, "partition-names", &plen);
+-
+-	for (i = 0; i < nr_parts; i++) {
+-		parts[i].offset = be32_to_cpu(part->offset);
+-		parts[i].size   = be32_to_cpu(part->len) & ~1;
+-		/* bit 0 set signifies read only partition */
+-		if (be32_to_cpu(part->len) & 1)
+-			parts[i].mask_flags = MTD_WRITEABLE;
+-
+-		if (names && (plen > 0)) {
+-			int len = strlen(names) + 1;
+-
+-			parts[i].name = names;
+-			plen -= len;
+-			names += len;
+-		} else {
+-			parts[i].name = "unnamed";
+-		}
+-
+-		part++;
+-	}
+-
+-	*pparts = parts;
+-	return nr_parts;
+-}
+-
+-static struct mtd_part_parser ofoldpart_parser = {
+-	.parse_fn = parse_ofoldpart_partitions,
+-	.name = "ofoldpart",
+-};
+-
+-static int __init ofpart_parser_init(void)
+-{
+-	register_mtd_parser(&ofpart_parser);
+-	register_mtd_parser(&ofoldpart_parser);
+-	return 0;
+-}
+-
+-static void __exit ofpart_parser_exit(void)
+-{
+-	deregister_mtd_parser(&ofpart_parser);
+-	deregister_mtd_parser(&ofoldpart_parser);
+-}
+-
+-module_init(ofpart_parser_init);
+-module_exit(ofpart_parser_exit);
+-
+-MODULE_LICENSE("GPL");
+-MODULE_DESCRIPTION("Parser for MTD partitioning information in device tree");
+-MODULE_AUTHOR("Vitaly Wool, David Gibson");
+-/*
+- * When MTD core cannot find the requested parser, it tries to load the module
+- * with the same name. Since we provide the ofoldpart parser, we should have
+- * the corresponding alias.
+- */
+-MODULE_ALIAS("fixed-partitions");
+-MODULE_ALIAS("ofoldpart");
+--- /dev/null
++++ b/drivers/mtd/parsers/ofpart_core.c
+@@ -0,0 +1,263 @@
++// SPDX-License-Identifier: GPL-2.0-or-later
++/*
++ * Flash partitions described by the OF (or flattened) device tree
++ *
++ * Copyright © 2006 MontaVista Software Inc.
++ * Author: Vitaly Wool <[email protected]>
++ *
++ * Revised to handle newer style flash binding by:
++ *   Copyright © 2007 David Gibson, IBM Corporation.
++ */
++
++#include <linux/module.h>
++#include <linux/init.h>
++#include <linux/of.h>
++#include <linux/mtd/mtd.h>
++#include <linux/slab.h>
++#include <linux/mtd/partitions.h>
++
++#include "ofpart_bcm4908.h"
++
++struct fixed_partitions_quirks {
++	int (*post_parse)(struct mtd_info *mtd, struct mtd_partition *parts, int nr_parts);
++};
++
++struct fixed_partitions_quirks bcm4908_partitions_quirks = {
++	.post_parse = bcm4908_partitions_post_parse,
++};
++
++static const struct of_device_id parse_ofpart_match_table[];
++
++static bool node_has_compatible(struct device_node *pp)
++{
++	return of_get_property(pp, "compatible", NULL);
++}
++
++static int parse_fixed_partitions(struct mtd_info *master,
++				  const struct mtd_partition **pparts,
++				  struct mtd_part_parser_data *data)
++{
++	const struct fixed_partitions_quirks *quirks;
++	const struct of_device_id *of_id;
++	struct mtd_partition *parts;
++	struct device_node *mtd_node;
++	struct device_node *ofpart_node;
++	const char *partname;
++	struct device_node *pp;
++	int nr_parts, i, ret = 0;
++	bool dedicated = true;
++
++	/* Pull of_node from the master device node */
++	mtd_node = mtd_get_of_node(master);
++	if (!mtd_node)
++		return 0;
++
++	ofpart_node = of_get_child_by_name(mtd_node, "partitions");
++	if (!ofpart_node) {
++		/*
++		 * We might get here even when ofpart isn't used at all (e.g.,
++		 * when using another parser), so don't be louder than
++		 * KERN_DEBUG
++		 */
++		pr_debug("%s: 'partitions' subnode not found on %pOF. Trying to parse direct subnodes as partitions.\n",
++			 master->name, mtd_node);
++		ofpart_node = mtd_node;
++		dedicated = false;
++	}
++
++	of_id = of_match_node(parse_ofpart_match_table, ofpart_node);
++	if (dedicated && !of_id) {
++		/* The 'partitions' subnode might be used by another parser */
++		return 0;
++	}
++
++	quirks = of_id ? of_id->data : NULL;
++
++	/* First count the subnodes */
++	nr_parts = 0;
++	for_each_child_of_node(ofpart_node,  pp) {
++		if (!dedicated && node_has_compatible(pp))
++			continue;
++
++		nr_parts++;
++	}
++
++	if (nr_parts == 0)
++		return 0;
++
++	parts = kcalloc(nr_parts, sizeof(*parts), GFP_KERNEL);
++	if (!parts)
++		return -ENOMEM;
++
++	i = 0;
++	for_each_child_of_node(ofpart_node,  pp) {
++		const __be32 *reg;
++		int len;
++		int a_cells, s_cells;
++
++		if (!dedicated && node_has_compatible(pp))
++			continue;
++
++		reg = of_get_property(pp, "reg", &len);
++		if (!reg) {
++			if (dedicated) {
++				pr_debug("%s: ofpart partition %pOF (%pOF) missing reg property.\n",
++					 master->name, pp,
++					 mtd_node);
++				goto ofpart_fail;
++			} else {
++				nr_parts--;
++				continue;
++			}
++		}
++
++		a_cells = of_n_addr_cells(pp);
++		s_cells = of_n_size_cells(pp);
++		if (len / 4 != a_cells + s_cells) {
++			pr_debug("%s: ofpart partition %pOF (%pOF) error parsing reg property.\n",
++				 master->name, pp,
++				 mtd_node);
++			goto ofpart_fail;
++		}
++
++		parts[i].offset = of_read_number(reg, a_cells);
++		parts[i].size = of_read_number(reg + a_cells, s_cells);
++		parts[i].of_node = pp;
++
++		partname = of_get_property(pp, "label", &len);
++		if (!partname)
++			partname = of_get_property(pp, "name", &len);
++		parts[i].name = partname;
++
++		if (of_get_property(pp, "read-only", &len))
++			parts[i].mask_flags |= MTD_WRITEABLE;
++
++		if (of_get_property(pp, "lock", &len))
++			parts[i].mask_flags |= MTD_POWERUP_LOCK;
++
++		if (of_property_read_bool(pp, "slc-mode"))
++			parts[i].add_flags |= MTD_SLC_ON_MLC_EMULATION;
++
++		i++;
++	}
++
++	if (!nr_parts)
++		goto ofpart_none;
++
++	if (quirks && quirks->post_parse)
++		quirks->post_parse(master, parts, nr_parts);
++
++	*pparts = parts;
++	return nr_parts;
++
++ofpart_fail:
++	pr_err("%s: error parsing ofpart partition %pOF (%pOF)\n",
++	       master->name, pp, mtd_node);
++	ret = -EINVAL;
++ofpart_none:
++	of_node_put(pp);
++	kfree(parts);
++	return ret;
++}
++
++static const struct of_device_id parse_ofpart_match_table[] = {
++	/* Generic */
++	{ .compatible = "fixed-partitions" },
++	/* Customized */
++	{ .compatible = "brcm,bcm4908-partitions", .data = &bcm4908_partitions_quirks, },
++	{},
++};
++MODULE_DEVICE_TABLE(of, parse_ofpart_match_table);
++
++static struct mtd_part_parser ofpart_parser = {
++	.parse_fn = parse_fixed_partitions,
++	.name = "fixed-partitions",
++	.of_match_table = parse_ofpart_match_table,
++};
++
++static int parse_ofoldpart_partitions(struct mtd_info *master,
++				      const struct mtd_partition **pparts,
++				      struct mtd_part_parser_data *data)
++{
++	struct mtd_partition *parts;
++	struct device_node *dp;
++	int i, plen, nr_parts;
++	const struct {
++		__be32 offset, len;
++	} *part;
++	const char *names;
++
++	/* Pull of_node from the master device node */
++	dp = mtd_get_of_node(master);
++	if (!dp)
++		return 0;
++
++	part = of_get_property(dp, "partitions", &plen);
++	if (!part)
++		return 0; /* No partitions found */
++
++	pr_warn("Device tree uses obsolete partition map binding: %pOF\n", dp);
++
++	nr_parts = plen / sizeof(part[0]);
++
++	parts = kcalloc(nr_parts, sizeof(*parts), GFP_KERNEL);
++	if (!parts)
++		return -ENOMEM;
++
++	names = of_get_property(dp, "partition-names", &plen);
++
++	for (i = 0; i < nr_parts; i++) {
++		parts[i].offset = be32_to_cpu(part->offset);
++		parts[i].size   = be32_to_cpu(part->len) & ~1;
++		/* bit 0 set signifies read only partition */
++		if (be32_to_cpu(part->len) & 1)
++			parts[i].mask_flags = MTD_WRITEABLE;
++
++		if (names && (plen > 0)) {
++			int len = strlen(names) + 1;
++
++			parts[i].name = names;
++			plen -= len;
++			names += len;
++		} else {
++			parts[i].name = "unnamed";
++		}
++
++		part++;
++	}
++
++	*pparts = parts;
++	return nr_parts;
++}
++
++static struct mtd_part_parser ofoldpart_parser = {
++	.parse_fn = parse_ofoldpart_partitions,
++	.name = "ofoldpart",
++};
++
++static int __init ofpart_parser_init(void)
++{
++	register_mtd_parser(&ofpart_parser);
++	register_mtd_parser(&ofoldpart_parser);
++	return 0;
++}
++
++static void __exit ofpart_parser_exit(void)
++{
++	deregister_mtd_parser(&ofpart_parser);
++	deregister_mtd_parser(&ofoldpart_parser);
++}
++
++module_init(ofpart_parser_init);
++module_exit(ofpart_parser_exit);
++
++MODULE_LICENSE("GPL");
++MODULE_DESCRIPTION("Parser for MTD partitioning information in device tree");
++MODULE_AUTHOR("Vitaly Wool, David Gibson");
++/*
++ * When MTD core cannot find the requested parser, it tries to load the module
++ * with the same name. Since we provide the ofoldpart parser, we should have
++ * the corresponding alias.
++ */
++MODULE_ALIAS("fixed-partitions");
++MODULE_ALIAS("ofoldpart");

+ 69 - 0
target/linux/generic/backport-5.15/404-v5.13-mtd-parsers-ofpart-limit-parsing-of-deprecated-DT-sy.patch

@@ -0,0 +1,69 @@
+From 2d751203aacf86a1b301a188d8551c7da91043ab Mon Sep 17 00:00:00 2001
+From: =?UTF-8?q?Rafa=C5=82=20Mi=C5=82ecki?= <[email protected]>
+Date: Tue, 2 Mar 2021 20:00:12 +0100
+Subject: [PATCH] mtd: parsers: ofpart: limit parsing of deprecated DT syntax
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+For backward compatibility ofpart still supports the old syntax like:
+spi-flash@0 {
+	compatible = "jedec,spi-nor";
+	reg = <0x0>;
+
+	partition@0 {
+		label = "bootloader";
+		reg = <0x0 0x100000>;
+	};
+};
+(without "partitions" subnode).
+
+There is no reason however to support nested partitions without a clear
+"compatible" string like:
+partitions {
+	compatible = "fixed-partitions";
+	#address-cells = <1>;
+	#size-cells = <1>;
+
+	partition@0 {
+		label = "bootloader";
+		reg = <0x0 0x100000>;
+
+		partition@0 {
+			label = "config";
+			reg = <0x80000 0x80000>;
+		};
+	};
+};
+(we never officially supported or documented that).
+
+Make sure ofpart doesn't attempt to parse above.
+
+Cc: Ansuel Smith <[email protected]>
+Signed-off-by: Rafał Miłecki <[email protected]>
+Signed-off-by: Miquel Raynal <[email protected]>
+Link: https://lore.kernel.org/linux-mtd/[email protected]
+---
+ drivers/mtd/parsers/ofpart_core.c | 4 +++-
+ 1 file changed, 3 insertions(+), 1 deletion(-)
+
+--- a/drivers/mtd/parsers/ofpart_core.c
++++ b/drivers/mtd/parsers/ofpart_core.c
+@@ -53,7 +53,7 @@ static int parse_fixed_partitions(struct
+ 		return 0;
+ 
+ 	ofpart_node = of_get_child_by_name(mtd_node, "partitions");
+-	if (!ofpart_node) {
++	if (!ofpart_node && !master->parent) {
+ 		/*
+ 		 * We might get here even when ofpart isn't used at all (e.g.,
+ 		 * when using another parser), so don't be louder than
+@@ -64,6 +64,8 @@ static int parse_fixed_partitions(struct
+ 		ofpart_node = mtd_node;
+ 		dedicated = false;
+ 	}
++	if (!ofpart_node)
++		return 0;
+ 
+ 	of_id = of_match_node(parse_ofpart_match_table, ofpart_node);
+ 	if (dedicated && !of_id) {

+ 34 - 0
target/linux/generic/backport-5.15/405-v5.13-mtd-parsers-ofpart-make-symbol-bcm4908_partitions_qu.patch

@@ -0,0 +1,34 @@
+From b87b6d2d6f540e29c3f98e1572d64e560d73d6c1 Mon Sep 17 00:00:00 2001
+From: Wei Yongjun <[email protected]>
+Date: Thu, 4 Mar 2021 06:46:00 +0000
+Subject: [PATCH] mtd: parsers: ofpart: make symbol 'bcm4908_partitions_quirks'
+ static
+
+The sparse tool complains as follows:
+
+drivers/mtd/parsers/ofpart_core.c:25:32: warning:
+ symbol 'bcm4908_partitions_quirks' was not declared. Should it be static?
+
+This symbol is not used outside of ofpart_core.c, so this
+commit marks it static.
+
+Fixes: 457da931b608 ("mtd: parsers: ofpart: support BCM4908 fixed partitions")
+Reported-by: Hulk Robot <[email protected]>
+Signed-off-by: Wei Yongjun <[email protected]>
+Signed-off-by: Miquel Raynal <[email protected]>
+Link: https://lore.kernel.org/linux-mtd/[email protected]
+---
+ drivers/mtd/parsers/ofpart_core.c | 2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/drivers/mtd/parsers/ofpart_core.c
++++ b/drivers/mtd/parsers/ofpart_core.c
+@@ -22,7 +22,7 @@ struct fixed_partitions_quirks {
+ 	int (*post_parse)(struct mtd_info *mtd, struct mtd_partition *parts, int nr_parts);
+ };
+ 
+-struct fixed_partitions_quirks bcm4908_partitions_quirks = {
++static struct fixed_partitions_quirks bcm4908_partitions_quirks = {
+ 	.post_parse = bcm4908_partitions_post_parse,
+ };
+ 

+ 38 - 0
target/linux/generic/backport-5.15/406-v5.13-0001-mtd-core-add-nvmem-cells-compatible-to-parse-mtd-as-.patch

@@ -0,0 +1,38 @@
+From a5d83d6e2bc747b13f347962d4b335d70b23559b Mon Sep 17 00:00:00 2001
+From: Ansuel Smith <[email protected]>
+Date: Fri, 12 Mar 2021 07:28:19 +0100
+Subject: [PATCH] mtd: core: add nvmem-cells compatible to parse mtd as nvmem
+ cells
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+Partitions that contain the nvmem-cells compatible will register
+their direct subnodes as nvmem cells, and the node will be treated as an
+nvmem provider.
+
+Signed-off-by: Ansuel Smith <[email protected]>
+Tested-by: Rafał Miłecki <[email protected]>
+---
+ drivers/mtd/mtdcore.c | 3 ++-
+ 1 file changed, 2 insertions(+), 1 deletion(-)
+
+--- a/drivers/mtd/mtdcore.c
++++ b/drivers/mtd/mtdcore.c
+@@ -531,6 +531,7 @@ static int mtd_nvmem_reg_read(void *priv
+ 
+ static int mtd_nvmem_add(struct mtd_info *mtd)
+ {
++	struct device_node *node = mtd_get_of_node(mtd);
+ 	struct nvmem_config config = {};
+ 
+ 	config.id = -1;
+@@ -543,7 +544,7 @@ static int mtd_nvmem_add(struct mtd_info
+ 	config.stride = 1;
+ 	config.read_only = true;
+ 	config.root_only = true;
+-	config.no_of_node = true;
++	config.no_of_node = !of_device_is_compatible(node, "nvmem-cells");
+ 	config.priv = mtd;
+ 
+ 	mtd->nvmem = nvmem_register(&config);

+ 25 - 0
target/linux/generic/backport-5.15/406-v5.13-0002-dt-bindings-nvmem-drop-nodename-restriction.patch

@@ -0,0 +1,25 @@
+From 42645976c3289b03a12f1bd2bc131fd98fc27170 Mon Sep 17 00:00:00 2001
+From: Ansuel Smith <[email protected]>
+Date: Fri, 12 Mar 2021 07:28:20 +0100
+Subject: [PATCH] devicetree: nvmem: nvmem: drop $nodename restriction
+
+Drop the $nodename restriction, as an mtd partition can now also be used
+as an nvmem provider.
+
+Signed-off-by: Ansuel Smith <[email protected]>
+---
+ Documentation/devicetree/bindings/nvmem/nvmem.yaml | 3 ---
+ 1 file changed, 3 deletions(-)
+
+--- a/Documentation/devicetree/bindings/nvmem/nvmem.yaml
++++ b/Documentation/devicetree/bindings/nvmem/nvmem.yaml
+@@ -20,9 +20,6 @@ description: |
+   storage device.
+ 
+ properties:
+-  $nodename:
+-    pattern: "^(eeprom|efuse|nvram)(@.*|-[0-9a-f])*$"
+-
+   "#address-cells":
+     const: 1
+ 

+ 117 - 0
target/linux/generic/backport-5.15/406-v5.13-0003-dt-bindings-mtd-Document-use-of-nvmem-cells-compatib.patch

@@ -0,0 +1,117 @@
+From 377aa0135dc8489312edd3184d143ce3a89ff7ee Mon Sep 17 00:00:00 2001
+From: Ansuel Smith <[email protected]>
+Date: Fri, 12 Mar 2021 07:28:21 +0100
+Subject: [PATCH] dt-bindings: mtd: Document use of nvmem-cells compatible
+
+Document the nvmem-cells compatible used to treat mtd partitions as an
+nvmem provider.
+
+Signed-off-by: Ansuel Smith <[email protected]>
+Reviewed-by: Rob Herring <[email protected]>
+---
+ .../bindings/mtd/partitions/nvmem-cells.yaml  | 99 +++++++++++++++++++
+ 1 file changed, 99 insertions(+)
+ create mode 100644 Documentation/devicetree/bindings/mtd/partitions/nvmem-cells.yaml
+
+--- /dev/null
++++ b/Documentation/devicetree/bindings/mtd/partitions/nvmem-cells.yaml
+@@ -0,0 +1,99 @@
++# SPDX-License-Identifier: GPL-2.0-only OR BSD-2-Clause
++%YAML 1.2
++---
++$id: http://devicetree.org/schemas/mtd/partitions/nvmem-cells.yaml#
++$schema: http://devicetree.org/meta-schemas/core.yaml#
++
++title: Nvmem cells
++
++description: |
++  Any partition containing the compatible "nvmem-cells" will register as a
++  nvmem provider.
++  Each direct subnodes represents a nvmem cell following the nvmem binding.
++  Nvmem binding to declare nvmem-cells can be found in:
++  Documentation/devicetree/bindings/nvmem/nvmem.yaml
++
++maintainers:
++  - Ansuel Smith <[email protected]>
++
++allOf:
++  - $ref: /schemas/nvmem/nvmem.yaml#
++
++properties:
++  compatible:
++    const: nvmem-cells
++
++required:
++  - compatible
++
++additionalProperties: true
++
++examples:
++  - |
++    partitions {
++      compatible = "fixed-partitions";
++      #address-cells = <1>;
++      #size-cells = <1>;
++
++      /* ... */
++
++      };
++      art: art@1200000 {
++        compatible = "nvmem-cells";
++        reg = <0x1200000 0x0140000>;
++        label = "art";
++        read-only;
++        #address-cells = <1>;
++        #size-cells = <1>;
++
++        macaddr_gmac1: macaddr_gmac1@0 {
++          reg = <0x0 0x6>;
++        };
++
++        macaddr_gmac2: macaddr_gmac2@6 {
++          reg = <0x6 0x6>;
++        };
++
++        pre_cal_24g: pre_cal_24g@1000 {
++          reg = <0x1000 0x2f20>;
++        };
++
++        pre_cal_5g: pre_cal_5g@5000{
++          reg = <0x5000 0x2f20>;
++        };
++      };
++  - |
++    partitions {
++        compatible = "fixed-partitions";
++        #address-cells = <1>;
++        #size-cells = <1>;
++
++        partition@0 {
++            label = "bootloader";
++            reg = <0x000000 0x100000>;
++            read-only;
++        };
++
++        firmware@100000 {
++            compatible = "brcm,trx";
++            label = "firmware";
++            reg = <0x100000 0xe00000>;
++        };
++
++        calibration@f00000 {
++            compatible = "nvmem-cells";
++            label = "calibration";
++            reg = <0xf00000 0x100000>;
++            ranges = <0 0xf00000 0x100000>;
++            #address-cells = <1>;
++            #size-cells = <1>;
++
++            wifi0@0 {
++                reg = <0x000000 0x080000>;
++            };
++
++            wifi1@80000 {
++                reg = <0x080000 0x080000>;
++            };
++        };
++    };

+ 98 - 0
target/linux/generic/backport-5.15/407-v5.13-0001-dt-bindings-mtd-add-binding-for-Linksys-Northstar-pa.patch

@@ -0,0 +1,98 @@
+From 2fa7294175c76e1ec568aa75c1891fd908728c8d Mon Sep 17 00:00:00 2001
+From: =?UTF-8?q?Rafa=C5=82=20Mi=C5=82ecki?= <[email protected]>
+Date: Fri, 12 Mar 2021 14:49:18 +0100
+Subject: [PATCH] dt-bindings: mtd: add binding for Linksys Northstar
+ partitions
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+Linksys on Broadcom Northstar devices uses fixed flash layout with
+multiple firmware partitions.
+
+Signed-off-by: Rafał Miłecki <[email protected]>
+Reviewed-by: Rob Herring <[email protected]>
+Signed-off-by: Miquel Raynal <[email protected]>
+Link: https://lore.kernel.org/linux-mtd/[email protected]
+---
+ .../mtd/partitions/linksys,ns-partitions.yaml | 74 +++++++++++++++++++
+ 1 file changed, 74 insertions(+)
+ create mode 100644 Documentation/devicetree/bindings/mtd/partitions/linksys,ns-partitions.yaml
+
+--- /dev/null
++++ b/Documentation/devicetree/bindings/mtd/partitions/linksys,ns-partitions.yaml
+@@ -0,0 +1,74 @@
++# SPDX-License-Identifier: GPL-2.0-only OR BSD-2-Clause
++%YAML 1.2
++---
++$id: http://devicetree.org/schemas/mtd/partitions/linksys,ns-partitions.yaml#
++$schema: http://devicetree.org/meta-schemas/core.yaml#
++
++title: Linksys Northstar partitioning
++
++description: |
++  Linksys devices based on Broadcom Northstar architecture often use two
++  firmware partitions. One is used for regular booting, the other is treated as
++  fallback.
++
++  This binding allows defining all fixed partitions and marking those containing
++  firmware. System can use that information e.g. for booting or flashing
++  purposes.
++
++maintainers:
++  - Rafał Miłecki <[email protected]>
++
++properties:
++  compatible:
++    const: linksys,ns-partitions
++
++  "#address-cells":
++    enum: [ 1, 2 ]
++
++  "#size-cells":
++    enum: [ 1, 2 ]
++
++patternProperties:
++  "^partition@[0-9a-f]+$":
++    $ref: "partition.yaml#"
++    properties:
++      compatible:
++        items:
++          - const: linksys,ns-firmware
++          - const: brcm,trx
++    unevaluatedProperties: false
++
++required:
++  - "#address-cells"
++  - "#size-cells"
++
++additionalProperties: false
++
++examples:
++  - |
++    partitions {
++        compatible = "linksys,ns-partitions";
++        #address-cells = <1>;
++        #size-cells = <1>;
++
++        partition@0 {
++            label = "boot";
++            reg = <0x0 0x100000>;
++            read-only;
++        };
++
++        partition@100000 {
++            label = "nvram";
++            reg = <0x100000 0x100000>;
++        };
++
++        partition@200000 {
++            compatible = "linksys,ns-firmware", "brcm,trx";
++            reg = <0x200000 0xf00000>;
++        };
++
++        partition@1100000 {
++            compatible = "linksys,ns-firmware", "brcm,trx";
++            reg = <0x1100000 0xf00000>;
++        };
++    };

+ 156 - 0
target/linux/generic/backport-5.15/407-v5.13-0002-mtd-parsers-ofpart-support-Linksys-Northstar-partiti.patch

@@ -0,0 +1,156 @@
+From 7134a2d026d942210b4d26d6059c9d979ca7866e Mon Sep 17 00:00:00 2001
+From: =?UTF-8?q?Rafa=C5=82=20Mi=C5=82ecki?= <[email protected]>
+Date: Fri, 12 Mar 2021 14:49:19 +0100
+Subject: [PATCH] mtd: parsers: ofpart: support Linksys Northstar partitions
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+This allows extending ofpart parser with support for Linksys Northstar
+devices. That support uses recently added quirks mechanism.
+
+Signed-off-by: Rafał Miłecki <[email protected]>
+Signed-off-by: Miquel Raynal <[email protected]>
+Link: https://lore.kernel.org/linux-mtd/[email protected]
+---
+ drivers/mtd/parsers/Kconfig             | 10 +++++
+ drivers/mtd/parsers/Makefile            |  1 +
+ drivers/mtd/parsers/ofpart_core.c       |  6 +++
+ drivers/mtd/parsers/ofpart_linksys_ns.c | 50 +++++++++++++++++++++++++
+ drivers/mtd/parsers/ofpart_linksys_ns.h | 18 +++++++++
+ 5 files changed, 85 insertions(+)
+ create mode 100644 drivers/mtd/parsers/ofpart_linksys_ns.c
+ create mode 100644 drivers/mtd/parsers/ofpart_linksys_ns.h
+
+--- a/drivers/mtd/parsers/Kconfig
++++ b/drivers/mtd/parsers/Kconfig
+@@ -76,6 +76,16 @@ config MTD_OF_PARTS_BCM4908
+ 	  that can have multiple "firmware" partitions. It takes care of
+ 	  finding currently used one and backup ones.
+ 
++config MTD_OF_PARTS_LINKSYS_NS
++	bool "Linksys Northstar partitioning support"
++	depends on MTD_OF_PARTS && (ARCH_BCM_5301X || ARCH_BCM4908 || COMPILE_TEST)
++	default ARCH_BCM_5301X
++	help
++	  This provides partitions parser for Linksys devices based on Broadcom
++	  Northstar architecture. Linksys commonly uses fixed flash layout with
++	  two "firmware" partitions. Currently used firmware has to be detected
++	  using CFE environment variable.
++
+ config MTD_PARSER_IMAGETAG
+ 	tristate "Parser for BCM963XX Image Tag format partitions"
+ 	depends on BCM63XX || BMIPS_GENERIC || COMPILE_TEST
+--- a/drivers/mtd/parsers/Makefile
++++ b/drivers/mtd/parsers/Makefile
+@@ -6,6 +6,7 @@ obj-$(CONFIG_MTD_CMDLINE_PARTS)		+= cmdl
+ obj-$(CONFIG_MTD_OF_PARTS)		+= ofpart.o
+ ofpart-y				+= ofpart_core.o
+ ofpart-$(CONFIG_MTD_OF_PARTS_BCM4908)	+= ofpart_bcm4908.o
++ofpart-$(CONFIG_MTD_OF_PARTS_LINKSYS_NS)+= ofpart_linksys_ns.o
+ obj-$(CONFIG_MTD_PARSER_IMAGETAG)	+= parser_imagetag.o
+ obj-$(CONFIG_MTD_AFS_PARTS)		+= afs.o
+ obj-$(CONFIG_MTD_PARSER_TRX)		+= parser_trx.o
+--- a/drivers/mtd/parsers/ofpart_core.c
++++ b/drivers/mtd/parsers/ofpart_core.c
+@@ -17,6 +17,7 @@
+ #include <linux/mtd/partitions.h>
+ 
+ #include "ofpart_bcm4908.h"
++#include "ofpart_linksys_ns.h"
+ 
+ struct fixed_partitions_quirks {
+ 	int (*post_parse)(struct mtd_info *mtd, struct mtd_partition *parts, int nr_parts);
+@@ -26,6 +27,10 @@ static struct fixed_partitions_quirks bc
+ 	.post_parse = bcm4908_partitions_post_parse,
+ };
+ 
++static struct fixed_partitions_quirks linksys_ns_partitions_quirks = {
++	.post_parse = linksys_ns_partitions_post_parse,
++};
++
+ static const struct of_device_id parse_ofpart_match_table[];
+ 
+ static bool node_has_compatible(struct device_node *pp)
+@@ -167,6 +172,7 @@ static const struct of_device_id parse_o
+ 	{ .compatible = "fixed-partitions" },
+ 	/* Customized */
+ 	{ .compatible = "brcm,bcm4908-partitions", .data = &bcm4908_partitions_quirks, },
++	{ .compatible = "linksys,ns-partitions", .data = &linksys_ns_partitions_quirks, },
+ 	{},
+ };
+ MODULE_DEVICE_TABLE(of, parse_ofpart_match_table);
+--- /dev/null
++++ b/drivers/mtd/parsers/ofpart_linksys_ns.c
+@@ -0,0 +1,50 @@
++// SPDX-License-Identifier: GPL-2.0
++/*
++ * Copyright (C) 2021 Rafał Miłecki <[email protected]>
++ */
++
++#include <linux/bcm47xx_nvram.h>
++#include <linux/mtd/mtd.h>
++#include <linux/mtd/partitions.h>
++
++#include "ofpart_linksys_ns.h"
++
++#define NVRAM_BOOT_PART		"bootpartition"
++
++static int ofpart_linksys_ns_bootpartition(void)
++{
++	char buf[4];
++	int bootpartition;
++
++	/* Check CFE environment variable */
++	if (bcm47xx_nvram_getenv(NVRAM_BOOT_PART, buf, sizeof(buf)) > 0) {
++		if (!kstrtoint(buf, 0, &bootpartition))
++			return bootpartition;
++		pr_warn("Failed to parse %s value \"%s\"\n", NVRAM_BOOT_PART,
++			buf);
++	} else {
++		pr_warn("Failed to get NVRAM \"%s\"\n", NVRAM_BOOT_PART);
++	}
++
++	return 0;
++}
++
++int linksys_ns_partitions_post_parse(struct mtd_info *mtd,
++				     struct mtd_partition *parts,
++				     int nr_parts)
++{
++	int bootpartition = ofpart_linksys_ns_bootpartition();
++	int trx_idx = 0;
++	int i;
++
++	for (i = 0; i < nr_parts; i++) {
++		if (of_device_is_compatible(parts[i].of_node, "linksys,ns-firmware")) {
++			if (trx_idx++ == bootpartition)
++				parts[i].name = "firmware";
++			else
++				parts[i].name = "backup";
++		}
++	}
++
++	return 0;
++}
+--- /dev/null
++++ b/drivers/mtd/parsers/ofpart_linksys_ns.h
+@@ -0,0 +1,18 @@
++/* SPDX-License-Identifier: GPL-2.0 */
++#ifndef __OFPART_LINKSYS_NS_H
++#define __OFPART_LINKSYS_NS_H
++
++#ifdef CONFIG_MTD_OF_PARTS_LINKSYS_NS
++int linksys_ns_partitions_post_parse(struct mtd_info *mtd,
++				     struct mtd_partition *parts,
++				     int nr_parts);
++#else
++static inline int linksys_ns_partitions_post_parse(struct mtd_info *mtd,
++						   struct mtd_partition *parts,
++						   int nr_parts)
++{
++	return -EOPNOTSUPP;
++}
++#endif
++
++#endif

+ 54 - 0
target/linux/generic/backport-5.15/408-v5.13-mtd-cfi_cmdset_0002-Disable-buffered-writes-for-AMD.patch

@@ -0,0 +1,54 @@
+From 7e4404113686868858a34210c28ae122e967aa64 Mon Sep 17 00:00:00 2001
+From: Mauri Sandberg <[email protected]>
+Date: Tue, 9 Mar 2021 19:48:59 +0200
+Subject: [PATCH] mtd: cfi_cmdset_0002: Disable buffered writes for AMD chip
+ 0x2201
+
+Buffer writes do not work with AMD chip 0x2201. The chip in question
+is a AMD/Spansion/Cypress Semiconductor S29GL256N and datasheet [1]
+talks about writing buffers being possible. While waiting for a neater
+solution resort to writing word-sized chunks only.
+
+Without the patch kernel logs will be flooded with entries like below:
+
+jffs2_scan_eraseblock(): End of filesystem marker found at 0x0
+jffs2_build_filesystem(): unlocking the mtd device...
+done.
+jffs2_build_filesystem(): erasing all blocks after the end marker...
+MTD do_write_buffer_wait(): software timeout, address:0x01ec000a.
+jffs2: Write clean marker to block at 0x01920000 failed: -5
+MTD do_write_buffer_wait(): software timeout, address:0x01e2000a.
+jffs2: Write clean marker to block at 0x01880000 failed: -5
+MTD do_write_buffer_wait(): software timeout, address:0x01e0000a.
+jffs2: Write clean marker to block at 0x01860000 failed: -5
+MTD do_write_buffer_wait(): software timeout, address:0x01dc000a.
+jffs2: Write clean marker to block at 0x01820000 failed: -5
+MTD do_write_buffer_wait(): software timeout, address:0x01da000a.
+jffs2: Write clean marker to block at 0x01800000 failed: -5
+...
+
+Tested on a Buffalo wzr-hp-g300nh running kernel 5.10.16.
+
+[1] https://www.cypress.com/file/219941/download
+or  https://datasheetspdf.com/pdf-file/565708/SPANSION/S29GL256N/1
+
+Signed-off-by: Mauri Sandberg <[email protected]>
+Signed-off-by: Vignesh Raghavendra <[email protected]>
+Link: https://lore.kernel.org/r/[email protected]
+---
+ drivers/mtd/chips/cfi_cmdset_0002.c | 4 ++++
+ 1 file changed, 4 insertions(+)
+
+--- a/drivers/mtd/chips/cfi_cmdset_0002.c
++++ b/drivers/mtd/chips/cfi_cmdset_0002.c
+@@ -272,6 +272,10 @@ static void fixup_use_write_buffers(stru
+ {
+ 	struct map_info *map = mtd->priv;
+ 	struct cfi_private *cfi = map->fldrv_priv;
++
++	if (cfi->mfr == CFI_MFR_AMD && cfi->id == 0x2201)
++		return;
++
+ 	if (cfi->cfiq->BufWriteTimeoutTyp) {
+ 		pr_debug("Using buffer write method\n");
+ 		mtd->_write = cfi_amdstd_write_buffers;

+ 32 - 0
target/linux/generic/backport-5.15/409-v5.14-0001-dt-bindings-mtd-brcm-trx-Add-brcm-trx-magic.patch

@@ -0,0 +1,32 @@
+From a4d82940ff85a7e307953dfa715f65d5ab487e10 Mon Sep 17 00:00:00 2001
+From: Hauke Mehrtens <[email protected]>
+Date: Sun, 18 Apr 2021 23:46:14 +0200
+Subject: dt-bindings: mtd: brcm,trx: Add brcm,trx-magic
+
+This adds the description of an additional property which allows to
+specify a custom partition parser magic to detect a trx partition.
+Buffalo has multiple device which are using the trx format, but with
+different magic values.
+
+Signed-off-by: Hauke Mehrtens <[email protected]>
+Acked-by: Rob Herring <[email protected]>
+Signed-off-by: Miquel Raynal <[email protected]>
+Link: https://lore.kernel.org/linux-mtd/[email protected]
+---
+ .../devicetree/bindings/mtd/partitions/brcm,trx.txt          | 5 +++++
+ 1 file changed, 5 insertions(+)
+
+--- a/Documentation/devicetree/bindings/mtd/partitions/brcm,trx.txt
++++ b/Documentation/devicetree/bindings/mtd/partitions/brcm,trx.txt
+@@ -28,6 +28,11 @@ detected by a software parsing TRX heade
+ Required properties:
+ - compatible : (required) must be "brcm,trx"
+ 
++Optional properties:
++
++- brcm,trx-magic: TRX magic, if it is different from the default magic
++		  0x30524448 as a u32.
++
+ Example:
+ 
+ flash@0 {

+ 50 - 0
target/linux/generic/backport-5.15/409-v5.14-0002-mtd-parsers-trx-Allow-to-specify-brcm-trx-magic-in-D.patch

@@ -0,0 +1,50 @@
+From d7f7e04f8b67571a4bf5a0dcd4f9da4214f5262c Mon Sep 17 00:00:00 2001
+From: Hauke Mehrtens <[email protected]>
+Date: Sun, 18 Apr 2021 23:46:15 +0200
+Subject: mtd: parsers: trx: Allow to specify brcm, trx-magic in DT
+
+Buffalo uses a different TRX magic for every device, to be able to use
+this trx parser, make it possible to specify the TRX magic in device
+tree. If no TRX magic is specified in device tree, the standard value
+will be used. This value should only be specified if a vendor chooses to
+use a non standard TRX magic.
+
+Signed-off-by: Hauke Mehrtens <[email protected]>
+Signed-off-by: Miquel Raynal <[email protected]>
+Link: https://lore.kernel.org/linux-mtd/[email protected]
+---
+ drivers/mtd/parsers/parser_trx.c | 9 ++++++++-
+ 1 file changed, 8 insertions(+), 1 deletion(-)
+
+--- a/drivers/mtd/parsers/parser_trx.c
++++ b/drivers/mtd/parsers/parser_trx.c
+@@ -51,13 +51,20 @@ static int parser_trx_parse(struct mtd_i
+ 			    const struct mtd_partition **pparts,
+ 			    struct mtd_part_parser_data *data)
+ {
++	struct device_node *np = mtd_get_of_node(mtd);
+ 	struct mtd_partition *parts;
+ 	struct mtd_partition *part;
+ 	struct trx_header trx;
+ 	size_t bytes_read;
+ 	uint8_t curr_part = 0, i = 0;
++	uint32_t trx_magic = TRX_MAGIC;
+ 	int err;
+ 
++	/* Get different magic from device tree if specified */
++	err = of_property_read_u32(np, "brcm,trx-magic", &trx_magic);
++	if (err != 0 && err != -EINVAL)
++		pr_err("failed to parse \"brcm,trx-magic\" DT attribute, using default: %d\n", err);
++
+ 	parts = kcalloc(TRX_PARSER_MAX_PARTS, sizeof(struct mtd_partition),
+ 			GFP_KERNEL);
+ 	if (!parts)
+@@ -70,7 +77,7 @@ static int parser_trx_parse(struct mtd_i
+ 		return err;
+ 	}
+ 
+-	if (trx.magic != TRX_MAGIC) {
++	if (trx.magic != trx_magic) {
+ 		kfree(parts);
+ 		return -ENOENT;
+ 	}

+ 25 - 0
target/linux/generic/backport-5.15/409-v5.14-0003-mtd-parsers-trx-Allow-to-use-TRX-parser-on-Mediatek-.patch

@@ -0,0 +1,25 @@
+From 81bb218c829246962a6327c64eec18ddcc049936 Mon Sep 17 00:00:00 2001
+From: Hauke Mehrtens <[email protected]>
+Date: Sun, 18 Apr 2021 23:46:16 +0200
+Subject: mtd: parsers: trx: Allow to use TRX parser on Mediatek SoCs
+
+Buffalo uses the TRX partition format also on Mediatek MT7622 SoCs.
+
+Signed-off-by: Hauke Mehrtens <[email protected]>
+Signed-off-by: Miquel Raynal <[email protected]>
+Link: https://lore.kernel.org/linux-mtd/[email protected]
+---
+ drivers/mtd/parsers/Kconfig | 2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/drivers/mtd/parsers/Kconfig
++++ b/drivers/mtd/parsers/Kconfig
+@@ -115,7 +115,7 @@ config MTD_AFS_PARTS
+ 
+ config MTD_PARSER_TRX
+ 	tristate "Parser for TRX format partitions"
+-	depends on MTD && (BCM47XX || ARCH_BCM_5301X || COMPILE_TEST)
++	depends on MTD && (BCM47XX || ARCH_BCM_5301X || ARCH_MEDIATEK || COMPILE_TEST)
+ 	help
+ 	  TRX is a firmware format used by Broadcom on their devices. It
+ 	  may contain up to 3/4 partitions (depending on the version).

+ 33 - 0
target/linux/generic/backport-5.15/410-mtd-next-mtd-parsers-trx-allow-to-use-on-MediaTek-MIPS-SoCs.patch

@@ -0,0 +1,33 @@
+From 2365f91c861cbfeef7141c69842848c7b2d3c2db Mon Sep 17 00:00:00 2001
+From: INAGAKI Hiroshi <[email protected]>
+Date: Sun, 13 Feb 2022 15:40:44 +0900
+Subject: [PATCH] mtd: parsers: trx: allow to use on MediaTek MIPS SoCs
+
+Buffalo sells some router devices which have trx-formatted firmware,
+based on MediaTek MIPS SoCs. To use parser_trx on those devices, add
+"RALINK" to dependency and allow to compile for MediaTek MIPS SoCs.
+
+examples:
+
+- WCR-1166DS  (MT7628)
+- WSR-1166DHP (MT7621)
+- WSR-2533DHP (MT7621)
+
+Signed-off-by: INAGAKI Hiroshi <[email protected]>
+Signed-off-by: Miquel Raynal <[email protected]>
+Link: https://lore.kernel.org/linux-mtd/[email protected]
+---
+ drivers/mtd/parsers/Kconfig | 2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/drivers/mtd/parsers/Kconfig
++++ b/drivers/mtd/parsers/Kconfig
+@@ -115,7 +115,7 @@ config MTD_AFS_PARTS
+ 
+ config MTD_PARSER_TRX
+ 	tristate "Parser for TRX format partitions"
+-	depends on MTD && (BCM47XX || ARCH_BCM_5301X || ARCH_MEDIATEK || COMPILE_TEST)
++	depends on MTD && (BCM47XX || ARCH_BCM_5301X || ARCH_MEDIATEK || RALINK || COMPILE_TEST)
+ 	help
+ 	  TRX is a firmware format used by Broadcom on their devices. It
+ 	  may contain up to 3/4 partitions (depending on the version).

+ 25 - 0
target/linux/generic/backport-5.15/500-v5.13-ubifs-default-to-zstd-compression.patch

@@ -0,0 +1,25 @@
+From dcdf415b740923530dc71d89fecc8361078473f5 Mon Sep 17 00:00:00 2001
+From: Rui Salvaterra <[email protected]>
+Date: Mon, 5 Apr 2021 16:11:55 +0100
+Subject: [PATCH] ubifs: default to zstd compression
+
+Compared to lzo and zlib, zstd is the best all-around performer, both in terms
+of speed and compression ratio. Set it as the default, if available.
+
+Signed-off-by: Rui Salvaterra <[email protected]>
+---
+ fs/ubifs/sb.c | 3 +++
+ 1 file changed, 3 insertions(+)
+
+--- a/fs/ubifs/sb.c
++++ b/fs/ubifs/sb.c
+@@ -53,6 +53,9 @@
+ 
+ static int get_default_compressor(struct ubifs_info *c)
+ {
++	if (ubifs_compr_present(c, UBIFS_COMPR_ZSTD))
++		return UBIFS_COMPR_ZSTD;
++
+ 	if (ubifs_compr_present(c, UBIFS_COMPR_LZO))
+ 		return UBIFS_COMPR_LZO;
+ 

+ 88 - 0
target/linux/generic/backport-5.15/600-v5.12-net-extract-napi-poll-functionality-to-__napi_poll.patch

@@ -0,0 +1,88 @@
+From: Felix Fietkau <[email protected]>
+Date: Mon, 8 Feb 2021 11:34:08 -0800
+Subject: [PATCH] net: extract napi poll functionality to __napi_poll()
+
+This commit introduces a new function __napi_poll() which does the main
+logic of the existing napi_poll() function, and will be called by other
+functions in later commits.
+This idea and implementation is done by Felix Fietkau <[email protected]> and
+is proposed as part of the patch to move napi work to work_queue
+context.
+This commit by itself is a code restructure.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Wei Wang <[email protected]>
+Reviewed-by: Alexander Duyck <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+
+--- a/net/core/dev.c
++++ b/net/core/dev.c
+@@ -6805,15 +6805,10 @@ void __netif_napi_del(struct napi_struct
+ }
+ EXPORT_SYMBOL(__netif_napi_del);
+ 
+-static int napi_poll(struct napi_struct *n, struct list_head *repoll)
++static int __napi_poll(struct napi_struct *n, bool *repoll)
+ {
+-	void *have;
+ 	int work, weight;
+ 
+-	list_del_init(&n->poll_list);
+-
+-	have = netpoll_poll_lock(n);
+-
+ 	weight = n->weight;
+ 
+ 	/* This NAPI_STATE_SCHED test is for avoiding a race
+@@ -6833,7 +6828,7 @@ static int napi_poll(struct napi_struct
+ 			    n->poll, work, weight);
+ 
+ 	if (likely(work < weight))
+-		goto out_unlock;
++		return work;
+ 
+ 	/* Drivers must not modify the NAPI state if they
+ 	 * consume the entire weight.  In such cases this code
+@@ -6842,7 +6837,7 @@ static int napi_poll(struct napi_struct
+ 	 */
+ 	if (unlikely(napi_disable_pending(n))) {
+ 		napi_complete(n);
+-		goto out_unlock;
++		return work;
+ 	}
+ 
+ 	if (n->gro_bitmask) {
+@@ -6860,12 +6855,29 @@ static int napi_poll(struct napi_struct
+ 	if (unlikely(!list_empty(&n->poll_list))) {
+ 		pr_warn_once("%s: Budget exhausted after napi rescheduled\n",
+ 			     n->dev ? n->dev->name : "backlog");
+-		goto out_unlock;
++		return work;
+ 	}
+ 
+-	list_add_tail(&n->poll_list, repoll);
++	*repoll = true;
++
++	return work;
++}
++
++static int napi_poll(struct napi_struct *n, struct list_head *repoll)
++{
++	bool do_repoll = false;
++	void *have;
++	int work;
++
++	list_del_init(&n->poll_list);
++
++	have = netpoll_poll_lock(n);
++
++	work = __napi_poll(n, &do_repoll);
++
++	if (do_repoll)
++		list_add_tail(&n->poll_list, repoll);
+ 
+-out_unlock:
+ 	netpoll_poll_unlock(have);
+ 
+ 	return work;

+ 261 - 0
target/linux/generic/backport-5.15/601-v5.12-net-implement-threaded-able-napi-poll-loop-support.patch

@@ -0,0 +1,261 @@
+From: Wei Wang <[email protected]>
+Date: Mon, 8 Feb 2021 11:34:09 -0800
+Subject: [PATCH] net: implement threaded-able napi poll loop support
+
+This patch allows running each napi poll loop inside its own
+kernel thread.
+The kthread is created during netif_napi_add() if dev->threaded
+is set. And threaded mode is enabled in napi_enable(). We will
+provide a way to set dev->threaded and enable threaded mode
+without a device up/down in the following patch.
+
+Once that threaded mode is enabled and the kthread is
+started, napi_schedule() will wake-up such thread instead
+of scheduling the softirq.
+
+The threaded poll loop behaves quite likely the net_rx_action,
+but it does not have to manipulate local irqs and uses
+an explicit scheduling point based on netdev_budget.
+
+Co-developed-by: Paolo Abeni <[email protected]>
+Signed-off-by: Paolo Abeni <[email protected]>
+Co-developed-by: Hannes Frederic Sowa <[email protected]>
+Signed-off-by: Hannes Frederic Sowa <[email protected]>
+Co-developed-by: Jakub Kicinski <[email protected]>
+Signed-off-by: Jakub Kicinski <[email protected]>
+Signed-off-by: Wei Wang <[email protected]>
+Reviewed-by: Alexander Duyck <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -347,6 +347,7 @@ struct napi_struct {
+ 	struct list_head	dev_list;
+ 	struct hlist_node	napi_hash_node;
+ 	unsigned int		napi_id;
++	struct task_struct	*thread;
+ };
+ 
+ enum {
+@@ -357,6 +358,7 @@ enum {
+ 	NAPI_STATE_LISTED,	/* NAPI added to system lists */
+ 	NAPI_STATE_NO_BUSY_POLL,/* Do not add in napi_hash, no busy polling */
+ 	NAPI_STATE_IN_BUSY_POLL,/* sk_busy_loop() owns this NAPI */
++	NAPI_STATE_THREADED,		/* The poll is performed inside its own thread*/
+ };
+ 
+ enum {
+@@ -367,6 +369,7 @@ enum {
+ 	NAPIF_STATE_LISTED	 = BIT(NAPI_STATE_LISTED),
+ 	NAPIF_STATE_NO_BUSY_POLL = BIT(NAPI_STATE_NO_BUSY_POLL),
+ 	NAPIF_STATE_IN_BUSY_POLL = BIT(NAPI_STATE_IN_BUSY_POLL),
++	NAPIF_STATE_THREADED	 = BIT(NAPI_STATE_THREADED),
+ };
+ 
+ enum gro_result {
+@@ -497,20 +500,7 @@ static inline bool napi_complete(struct
+  */
+ void napi_disable(struct napi_struct *n);
+ 
+-/**
+- *	napi_enable - enable NAPI scheduling
+- *	@n: NAPI context
+- *
+- * Resume NAPI from being scheduled on this context.
+- * Must be paired with napi_disable.
+- */
+-static inline void napi_enable(struct napi_struct *n)
+-{
+-	BUG_ON(!test_bit(NAPI_STATE_SCHED, &n->state));
+-	smp_mb__before_atomic();
+-	clear_bit(NAPI_STATE_SCHED, &n->state);
+-	clear_bit(NAPI_STATE_NPSVC, &n->state);
+-}
++void napi_enable(struct napi_struct *n);
+ 
+ /**
+  *	napi_synchronize - wait until NAPI is not running
+@@ -1842,6 +1832,8 @@ enum netdev_ml_priv_type {
+  *
+  *	@wol_enabled:	Wake-on-LAN is enabled
+  *
++ *	@threaded:	napi threaded mode is enabled
++ *
+  *	@net_notifier_list:	List of per-net netdev notifier block
+  *				that follow this device when it is moved
+  *				to another network namespace.
+@@ -2161,6 +2153,7 @@ struct net_device {
+ 	struct lock_class_key	*qdisc_running_key;
+ 	bool			proto_down;
+ 	unsigned		wol_enabled:1;
++	unsigned		threaded:1;
+ 
+ 	struct list_head	net_notifier_list;
+ 
+--- a/net/core/dev.c
++++ b/net/core/dev.c
+@@ -91,6 +91,7 @@
+ #include <linux/etherdevice.h>
+ #include <linux/ethtool.h>
+ #include <linux/skbuff.h>
++#include <linux/kthread.h>
+ #include <linux/bpf.h>
+ #include <linux/bpf_trace.h>
+ #include <net/net_namespace.h>
+@@ -1500,6 +1501,27 @@ void netdev_notify_peers(struct net_devi
+ }
+ EXPORT_SYMBOL(netdev_notify_peers);
+ 
++static int napi_threaded_poll(void *data);
++
++static int napi_kthread_create(struct napi_struct *n)
++{
++	int err = 0;
++
++	/* Create and wake up the kthread once to put it in
++	 * TASK_INTERRUPTIBLE mode to avoid the blocked task
++	 * warning and work with loadavg.
++	 */
++	n->thread = kthread_run(napi_threaded_poll, n, "napi/%s-%d",
++				n->dev->name, n->napi_id);
++	if (IS_ERR(n->thread)) {
++		err = PTR_ERR(n->thread);
++		pr_err("kthread_run failed with err %d\n", err);
++		n->thread = NULL;
++	}
++
++	return err;
++}
++
+ static int __dev_open(struct net_device *dev, struct netlink_ext_ack *extack)
+ {
+ 	const struct net_device_ops *ops = dev->netdev_ops;
+@@ -4267,6 +4289,21 @@ int gro_normal_batch __read_mostly = 8;
+ static inline void ____napi_schedule(struct softnet_data *sd,
+ 				     struct napi_struct *napi)
+ {
++	struct task_struct *thread;
++
++	if (test_bit(NAPI_STATE_THREADED, &napi->state)) {
++		/* Paired with smp_mb__before_atomic() in
++		 * napi_enable(). Use READ_ONCE() to guarantee
++		 * a complete read on napi->thread. Only call
++		 * wake_up_process() when it's not NULL.
++		 */
++		thread = READ_ONCE(napi->thread);
++		if (thread) {
++			wake_up_process(thread);
++			return;
++		}
++	}
++
+ 	list_add_tail(&napi->poll_list, &sd->poll_list);
+ 	__raise_softirq_irqoff(NET_RX_SOFTIRQ);
+ }
+@@ -6758,6 +6795,12 @@ void netif_napi_add(struct net_device *d
+ 	set_bit(NAPI_STATE_NPSVC, &napi->state);
+ 	list_add_rcu(&napi->dev_list, &dev->napi_list);
+ 	napi_hash_add(napi);
++	/* Create kthread for this napi if dev->threaded is set.
++	 * Clear dev->threaded if kthread creation failed so that
++	 * threaded mode will not be enabled in napi_enable().
++	 */
++	if (dev->threaded && napi_kthread_create(napi))
++		dev->threaded = 0;
+ }
+ EXPORT_SYMBOL(netif_napi_add);
+ 
+@@ -6774,9 +6817,28 @@ void napi_disable(struct napi_struct *n)
+ 	hrtimer_cancel(&n->timer);
+ 
+ 	clear_bit(NAPI_STATE_DISABLE, &n->state);
++	clear_bit(NAPI_STATE_THREADED, &n->state);
+ }
+ EXPORT_SYMBOL(napi_disable);
+ 
++/**
++ *	napi_enable - enable NAPI scheduling
++ *	@n: NAPI context
++ *
++ * Resume NAPI from being scheduled on this context.
++ * Must be paired with napi_disable.
++ */
++void napi_enable(struct napi_struct *n)
++{
++	BUG_ON(!test_bit(NAPI_STATE_SCHED, &n->state));
++	smp_mb__before_atomic();
++	clear_bit(NAPI_STATE_SCHED, &n->state);
++	clear_bit(NAPI_STATE_NPSVC, &n->state);
++	if (n->dev->threaded && n->thread)
++		set_bit(NAPI_STATE_THREADED, &n->state);
++}
++EXPORT_SYMBOL(napi_enable);
++
+ static void flush_gro_hash(struct napi_struct *napi)
+ {
+ 	int i;
+@@ -6802,6 +6864,11 @@ void __netif_napi_del(struct napi_struct
+ 
+ 	flush_gro_hash(napi);
+ 	napi->gro_bitmask = 0;
++
++	if (napi->thread) {
++		kthread_stop(napi->thread);
++		napi->thread = NULL;
++	}
+ }
+ EXPORT_SYMBOL(__netif_napi_del);
+ 
+@@ -6883,6 +6950,51 @@ static int napi_poll(struct napi_struct
+ 	return work;
+ }
+ 
++static int napi_thread_wait(struct napi_struct *napi)
++{
++	set_current_state(TASK_INTERRUPTIBLE);
++
++	while (!kthread_should_stop() && !napi_disable_pending(napi)) {
++		if (test_bit(NAPI_STATE_SCHED, &napi->state)) {
++			WARN_ON(!list_empty(&napi->poll_list));
++			__set_current_state(TASK_RUNNING);
++			return 0;
++		}
++
++		schedule();
++		set_current_state(TASK_INTERRUPTIBLE);
++	}
++	__set_current_state(TASK_RUNNING);
++	return -1;
++}
++
++static int napi_threaded_poll(void *data)
++{
++	struct napi_struct *napi = data;
++	void *have;
++
++	while (!napi_thread_wait(napi)) {
++		for (;;) {
++			bool repoll = false;
++
++			local_bh_disable();
++
++			have = netpoll_poll_lock(napi);
++			__napi_poll(napi, &repoll);
++			netpoll_poll_unlock(have);
++
++			__kfree_skb_flush();
++			local_bh_enable();
++
++			if (!repoll)
++				break;
++
++			cond_resched();
++		}
++	}
++	return 0;
++}
++
+ static __latent_entropy void net_rx_action(struct softirq_action *h)
+ {
+ 	struct softnet_data *sd = this_cpu_ptr(&softnet_data);

+ 177 - 0
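Taken together, the driver-side flow this patch enables is short: set dev->threaded before netif_napi_add() so the per-NAPI kthread gets created, then napi_enable() switches the NAPI into threaded mode. The fragment below is only an illustrative sketch against this patch, not code from the series; the mydrv_* names and struct mydrv_priv are assumptions.

/* Illustrative sketch (not part of the series): a hypothetical driver
 * opting into threaded NAPI once this patch is applied.
 */
#include <linux/netdevice.h>

struct mydrv_priv {
	struct napi_struct napi;
};

static int mydrv_poll(struct napi_struct *napi, int budget)
{
	int work = 0;

	/* ... process up to budget packets, counting them in work ... */

	if (work < budget)
		napi_complete_done(napi, work);
	return work;
}

static int mydrv_open(struct net_device *dev)
{
	struct mydrv_priv *priv = netdev_priv(dev);

	/* Ask netif_napi_add() to spawn a "napi/<dev>-<id>" kthread; if
	 * kthread_run() fails it clears dev->threaded again, so the NAPI
	 * silently falls back to softirq mode.
	 */
	dev->threaded = 1;
	netif_napi_add(dev, &priv->napi, mydrv_poll, NAPI_POLL_WEIGHT);

	/* napi_enable() sets NAPI_STATE_THREADED only when both dev->threaded
	 * and napi->thread are set, so ____napi_schedule() will wake the
	 * kthread instead of raising NET_RX_SOFTIRQ.
	 */
	napi_enable(&priv->napi);

	return 0;
}
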
target/linux/generic/backport-5.15/602-v5.12-net-add-sysfs-attribute-to-control-napi-threaded-mod.patch

@@ -0,0 +1,177 @@
+From: Wei Wang <[email protected]>
+Date: Mon, 8 Feb 2021 11:34:10 -0800
+Subject: [PATCH] net: add sysfs attribute to control napi threaded mode
+
+This patch adds a new sysfs attribute to the network device class.
+Said attribute provides a per-device control to enable/disable the
+threaded mode for all the napi instances of the given network device,
+without the need for a device up/down.
+User sets it to 1 or 0 to enable or disable threaded mode.
+Note: when switching between threaded and the current softirq based mode
+for a napi instance, it will not immediately take effect if the napi is
+currently being polled. The mode switch will happen for the next time
+napi_schedule() is called.
+
+Co-developed-by: Paolo Abeni <[email protected]>
+Signed-off-by: Paolo Abeni <[email protected]>
+Co-developed-by: Hannes Frederic Sowa <[email protected]>
+Signed-off-by: Hannes Frederic Sowa <[email protected]>
+Co-developed-by: Felix Fietkau <[email protected]>
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Wei Wang <[email protected]>
+Reviewed-by: Alexander Duyck <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+
+--- a/Documentation/ABI/testing/sysfs-class-net
++++ b/Documentation/ABI/testing/sysfs-class-net
+@@ -337,3 +337,18 @@ Contact:	[email protected]
+ Description:
+ 		32-bit unsigned integer counting the number of times the link has
+ 		been down
++
++What:		/sys/class/net/<iface>/threaded
++Date:		Jan 2021
++KernelVersion:	5.12
++Contact:	[email protected]
++Description:
++		Boolean value to control the threaded mode per device. User could
++		set this value to enable/disable threaded mode for all napi
++		belonging to this device, without the need to do device up/down.
++
++		Possible values:
++		== ==================================
++		0  threaded mode disabled for this dev
++		1  threaded mode enabled for this dev
++		== ==================================
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -491,6 +491,8 @@ static inline bool napi_complete(struct
+ 	return napi_complete_done(n, 0);
+ }
+ 
++int dev_set_threaded(struct net_device *dev, bool threaded);
++
+ /**
+  *	napi_disable - prevent NAPI from scheduling
+  *	@n: NAPI context
+--- a/net/core/dev.c
++++ b/net/core/dev.c
+@@ -4293,8 +4293,9 @@ static inline void ____napi_schedule(str
+ 
+ 	if (test_bit(NAPI_STATE_THREADED, &napi->state)) {
+ 		/* Paired with smp_mb__before_atomic() in
+-		 * napi_enable(). Use READ_ONCE() to guarantee
+-		 * a complete read on napi->thread. Only call
++		 * napi_enable()/dev_set_threaded().
++		 * Use READ_ONCE() to guarantee a complete
++		 * read on napi->thread. Only call
+ 		 * wake_up_process() when it's not NULL.
+ 		 */
+ 		thread = READ_ONCE(napi->thread);
+@@ -6768,6 +6769,49 @@ static void init_gro_hash(struct napi_st
+ 	napi->gro_bitmask = 0;
+ }
+ 
++int dev_set_threaded(struct net_device *dev, bool threaded)
++{
++	struct napi_struct *napi;
++	int err = 0;
++
++	if (dev->threaded == threaded)
++		return 0;
++
++	if (threaded) {
++		list_for_each_entry(napi, &dev->napi_list, dev_list) {
++			if (!napi->thread) {
++				err = napi_kthread_create(napi);
++				if (err) {
++					threaded = false;
++					break;
++				}
++			}
++		}
++	}
++
++	dev->threaded = threaded;
++
++	/* Make sure kthread is created before THREADED bit
++	 * is set.
++	 */
++	smp_mb__before_atomic();
++
++	/* Setting/unsetting threaded mode on a napi might not immediately
++	 * take effect, if the current napi instance is actively being
++	 * polled. In this case, the switch between threaded mode and
++	 * softirq mode will happen in the next round of napi_schedule().
++	 * This should not cause hiccups/stalls to the live traffic.
++	 */
++	list_for_each_entry(napi, &dev->napi_list, dev_list) {
++		if (threaded)
++			set_bit(NAPI_STATE_THREADED, &napi->state);
++		else
++			clear_bit(NAPI_STATE_THREADED, &napi->state);
++	}
++
++	return err;
++}
++
+ void netif_napi_add(struct net_device *dev, struct napi_struct *napi,
+ 		    int (*poll)(struct napi_struct *, int), int weight)
+ {
+--- a/net/core/net-sysfs.c
++++ b/net/core/net-sysfs.c
+@@ -587,6 +587,45 @@ static ssize_t phys_switch_id_show(struc
+ }
+ static DEVICE_ATTR_RO(phys_switch_id);
+ 
++static ssize_t threaded_show(struct device *dev,
++			     struct device_attribute *attr, char *buf)
++{
++	struct net_device *netdev = to_net_dev(dev);
++	ssize_t ret = -EINVAL;
++
++	if (!rtnl_trylock())
++		return restart_syscall();
++
++	if (dev_isalive(netdev))
++		ret = sprintf(buf, fmt_dec, netdev->threaded);
++
++	rtnl_unlock();
++	return ret;
++}
++
++static int modify_napi_threaded(struct net_device *dev, unsigned long val)
++{
++	int ret;
++
++	if (list_empty(&dev->napi_list))
++		return -EOPNOTSUPP;
++
++	if (val != 0 && val != 1)
++		return -EOPNOTSUPP;
++
++	ret = dev_set_threaded(dev, val);
++
++	return ret;
++}
++
++static ssize_t threaded_store(struct device *dev,
++			      struct device_attribute *attr,
++			      const char *buf, size_t len)
++{
++	return netdev_store(dev, attr, buf, len, modify_napi_threaded);
++}
++static DEVICE_ATTR_RW(threaded);
++
+ static struct attribute *net_class_attrs[] __ro_after_init = {
+ 	&dev_attr_netdev_group.attr,
+ 	&dev_attr_type.attr,
+@@ -619,6 +658,7 @@ static struct attribute *net_class_attrs
+ 	&dev_attr_proto_down.attr,
+ 	&dev_attr_carrier_up_count.attr,
+ 	&dev_attr_carrier_down_count.attr,
++	&dev_attr_threaded.attr,
+ 	NULL,
+ };
+ ATTRIBUTE_GROUPS(net_class);
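
With this patch the mode can also be flipped from userspace, without touching the driver. A minimal sketch follows; the interface name "eth0" is an assumption and error handling is kept to the essentials.

/* Minimal userspace sketch (not part of the series): enable threaded NAPI
 * for one interface by writing "1" to the sysfs attribute added above.
 * The interface name "eth0" is an assumption.
 */
#include <fcntl.h>
#include <stdio.h>
#include <unistd.h>

int main(void)
{
	const char *path = "/sys/class/net/eth0/threaded";
	int fd = open(path, O_WRONLY);

	if (fd < 0) {
		perror("open");
		return 1;
	}
	if (write(fd, "1", 1) != 1) {
		perror("write");
		close(fd);
		return 1;
	}
	close(fd);
	return 0;
}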

+ 93 - 0
target/linux/generic/backport-5.15/603-v5.12-net-fix-race-between-napi-kthread-mode-and-busy-poll.patch

@@ -0,0 +1,93 @@
+From: Wei Wang <[email protected]>
+Date: Mon, 1 Mar 2021 17:21:13 -0800
+Subject: [PATCH] net: fix race between napi kthread mode and busy poll
+
+Currently, napi_thread_wait() checks for NAPI_STATE_SCHED bit to
+determine if the kthread owns this napi and could call napi->poll() on
+it. However, if socket busy poll is enabled, it is possible that the
+busy poll thread grabs this SCHED bit (after the previous napi->poll()
+invokes napi_complete_done() and clears SCHED bit) and tries to poll
+on the same napi. napi_disable() could grab the SCHED bit as well.
+This patch tries to fix this race by adding a new bit
+NAPI_STATE_SCHED_THREADED in napi->state. This bit gets set in
+____napi_schedule() if the threaded mode is enabled, and gets cleared
+in napi_complete_done(), and we only poll the napi in kthread if this
+bit is set. This helps distinguish the ownership of the napi between
+kthread and other scenarios and fixes the race issue.
+
+Fixes: 29863d41bb6e ("net: implement threaded-able napi poll loop support")
+Reported-by: Martin Zaharinov <[email protected]>
+Suggested-by: Jakub Kicinski <[email protected]>
+Signed-off-by: Wei Wang <[email protected]>
+Cc: Alexander Duyck <[email protected]>
+Cc: Eric Dumazet <[email protected]>
+Cc: Paolo Abeni <[email protected]>
+Cc: Hannes Frederic Sowa <[email protected]>
+---
+
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -359,6 +359,7 @@ enum {
+ 	NAPI_STATE_NO_BUSY_POLL,/* Do not add in napi_hash, no busy polling */
+ 	NAPI_STATE_IN_BUSY_POLL,/* sk_busy_loop() owns this NAPI */
+ 	NAPI_STATE_THREADED,		/* The poll is performed inside its own thread*/
++	NAPI_STATE_SCHED_THREADED,	/* Napi is currently scheduled in threaded mode */
+ };
+ 
+ enum {
+@@ -370,6 +371,7 @@ enum {
+ 	NAPIF_STATE_NO_BUSY_POLL = BIT(NAPI_STATE_NO_BUSY_POLL),
+ 	NAPIF_STATE_IN_BUSY_POLL = BIT(NAPI_STATE_IN_BUSY_POLL),
+ 	NAPIF_STATE_THREADED	 = BIT(NAPI_STATE_THREADED),
++	NAPIF_STATE_SCHED_THREADED	= BIT(NAPI_STATE_SCHED_THREADED),
+ };
+ 
+ enum gro_result {
+--- a/net/core/dev.c
++++ b/net/core/dev.c
+@@ -4300,6 +4300,8 @@ static inline void ____napi_schedule(str
+ 		 */
+ 		thread = READ_ONCE(napi->thread);
+ 		if (thread) {
++			if (thread->state != TASK_INTERRUPTIBLE)
++				set_bit(NAPI_STATE_SCHED_THREADED, &napi->state);
+ 			wake_up_process(thread);
+ 			return;
+ 		}
+@@ -6560,7 +6562,8 @@ bool napi_complete_done(struct napi_stru
+ 
+ 		WARN_ON_ONCE(!(val & NAPIF_STATE_SCHED));
+ 
+-		new = val & ~(NAPIF_STATE_MISSED | NAPIF_STATE_SCHED);
++		new = val & ~(NAPIF_STATE_MISSED | NAPIF_STATE_SCHED |
++			      NAPIF_STATE_SCHED_THREADED);
+ 
+ 		/* If STATE_MISSED was set, leave STATE_SCHED set,
+ 		 * because we will call napi->poll() one more time.
+@@ -6996,16 +6999,25 @@ static int napi_poll(struct napi_struct
+ 
+ static int napi_thread_wait(struct napi_struct *napi)
+ {
++	bool woken = false;
++
+ 	set_current_state(TASK_INTERRUPTIBLE);
+ 
+ 	while (!kthread_should_stop() && !napi_disable_pending(napi)) {
+-		if (test_bit(NAPI_STATE_SCHED, &napi->state)) {
++		/* Testing SCHED_THREADED bit here to make sure the current
++		 * kthread owns this napi and could poll on this napi.
++		 * Testing SCHED bit is not enough because SCHED bit might be
++		 * set by some other busy poll thread or by napi_disable().
++		 */
++		if (test_bit(NAPI_STATE_SCHED_THREADED, &napi->state) || woken) {
+ 			WARN_ON(!list_empty(&napi->poll_list));
+ 			__set_current_state(TASK_RUNNING);
+ 			return 0;
+ 		}
+ 
+ 		schedule();
++		/* woken being true indicates this thread owns this napi. */
++		woken = true;
+ 		set_current_state(TASK_INTERRUPTIBLE);
+ 	}
+ 	__set_current_state(TASK_RUNNING);

+ 53 - 0
target/linux/generic/backport-5.15/604-v5.12-net-fix-hangup-on-napi_disable-for-threaded-napi.patch

@@ -0,0 +1,53 @@
+From: Paolo Abeni <[email protected]>
+Date: Fri, 9 Apr 2021 17:24:17 +0200
+Subject: [PATCH] net: fix hangup on napi_disable for threaded napi
+
+napi_disable() is subject to an hangup, when the threaded
+mode is enabled and the napi is under heavy traffic.
+
+If the relevant napi has been scheduled and the napi_disable()
+kicks in before the next napi_threaded_wait() completes - so
+that the latter quits due to the napi_disable_pending() condition,
+the existing code leaves the NAPI_STATE_SCHED bit set and the
+napi_disable() loop waiting for such bit will hang.
+
+This patch addresses the issue by dropping the NAPI_STATE_DISABLE
+bit test in napi_thread_wait(). The later napi_threaded_poll()
+iteration will take care of clearing the NAPI_STATE_SCHED.
+
+This also addresses a related problem reported by Jakub:
+before this patch a napi_disable()/napi_enable() pair killed
+the napi thread, effectively disabling the threaded mode.
+On the patched kernel napi_disable() simply stops scheduling
+the relevant thread.
+
+v1 -> v2:
+  - let the main napi_thread_poll() loop clear the SCHED bit
+
+Reported-by: Jakub Kicinski <[email protected]>
+Fixes: 29863d41bb6e ("net: implement threaded-able napi poll loop support")
+Signed-off-by: Paolo Abeni <[email protected]>
+Reviewed-by: Eric Dumazet <[email protected]>
+Link: https://lore.kernel.org/r/883923fa22745a9589e8610962b7dc59df09fb1f.1617981844.git.pabeni@redhat.com
+Signed-off-by: Jakub Kicinski <[email protected]>
+---
+
+--- a/net/core/dev.c
++++ b/net/core/dev.c
+@@ -7003,7 +7003,7 @@ static int napi_thread_wait(struct napi_
+ 
+ 	set_current_state(TASK_INTERRUPTIBLE);
+ 
+-	while (!kthread_should_stop() && !napi_disable_pending(napi)) {
++	while (!kthread_should_stop()) {
+ 		/* Testing SCHED_THREADED bit here to make sure the current
+ 		 * kthread owns this napi and could poll on this napi.
+ 		 * Testing SCHED bit is not enough because SCHED bit might be
+@@ -7021,6 +7021,7 @@ static int napi_thread_wait(struct napi_
+ 		set_current_state(TASK_INTERRUPTIBLE);
+ 	}
+ 	__set_current_state(TASK_RUNNING);
++
+ 	return -1;
+ }
+ 

+ 52 - 0
target/linux/generic/backport-5.15/610-v5.13-00-netfilter-flowtable-add-hash-offset-field-to-tuple.patch

@@ -0,0 +1,52 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Fri, 20 Nov 2020 13:49:13 +0100
+Subject: [PATCH] netfilter: flowtable: add hash offset field to tuple
+
+Add a placeholder field to calculate hash tuple offset. Similar to
+2c407aca6497 ("netfilter: conntrack: avoid gcc-10 zero-length-bounds
+warning").
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -107,6 +107,10 @@ struct flow_offload_tuple {
+ 
+ 	u8				l3proto;
+ 	u8				l4proto;
++
++	/* All members above are keys for lookups, see flow_offload_hash(). */
++	struct { }			__hash;
++
+ 	u8				dir;
+ 
+ 	u16				mtu;
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -191,14 +191,14 @@ static u32 flow_offload_hash(const void
+ {
+ 	const struct flow_offload_tuple *tuple = data;
+ 
+-	return jhash(tuple, offsetof(struct flow_offload_tuple, dir), seed);
++	return jhash(tuple, offsetof(struct flow_offload_tuple, __hash), seed);
+ }
+ 
+ static u32 flow_offload_hash_obj(const void *data, u32 len, u32 seed)
+ {
+ 	const struct flow_offload_tuple_rhash *tuplehash = data;
+ 
+-	return jhash(&tuplehash->tuple, offsetof(struct flow_offload_tuple, dir), seed);
++	return jhash(&tuplehash->tuple, offsetof(struct flow_offload_tuple, __hash), seed);
+ }
+ 
+ static int flow_offload_hash_cmp(struct rhashtable_compare_arg *arg,
+@@ -207,7 +207,7 @@ static int flow_offload_hash_cmp(struct
+ 	const struct flow_offload_tuple *tuple = arg->key;
+ 	const struct flow_offload_tuple_rhash *x = ptr;
+ 
+-	if (memcmp(&x->tuple, tuple, offsetof(struct flow_offload_tuple, dir)))
++	if (memcmp(&x->tuple, tuple, offsetof(struct flow_offload_tuple, __hash)))
+ 		return 1;
+ 
+ 	return 0;

+ 98 - 0
target/linux/generic/backport-5.15/610-v5.13-01-netfilter-flowtable-separate-replace-destroy-and-sta.patch

@@ -0,0 +1,98 @@
+From: Oz Shlomo <[email protected]>
+Date: Tue, 23 Mar 2021 00:56:19 +0100
+Subject: [PATCH] netfilter: flowtable: separate replace, destroy and
+ stats to different workqueues
+
+Currently the flow table offload replace, destroy and stats work items are
+executed on a single workqueue. As such, DESTROY and STATS commands may
+be backloged after a burst of REPLACE work items. This scenario can bloat
+up memory and may cause active connections to age.
+
+Instatiate add, del and stats workqueues to avoid backlogs of non-dependent
+actions. Provide sysfs control over the workqueue attributes, allowing
+userspace applications to control the workqueue cpumask.
+
+Signed-off-by: Oz Shlomo <[email protected]>
+Reviewed-by: Paul Blakey <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nf_flow_table_offload.c
++++ b/net/netfilter/nf_flow_table_offload.c
+@@ -13,7 +13,9 @@
+ #include <net/netfilter/nf_conntrack_core.h>
+ #include <net/netfilter/nf_conntrack_tuple.h>
+ 
+-static struct workqueue_struct *nf_flow_offload_wq;
++static struct workqueue_struct *nf_flow_offload_add_wq;
++static struct workqueue_struct *nf_flow_offload_del_wq;
++static struct workqueue_struct *nf_flow_offload_stats_wq;
+ 
+ struct flow_offload_work {
+ 	struct list_head	list;
+@@ -827,7 +829,12 @@ static void flow_offload_work_handler(st
+ 
+ static void flow_offload_queue_work(struct flow_offload_work *offload)
+ {
+-	queue_work(nf_flow_offload_wq, &offload->work);
++	if (offload->cmd == FLOW_CLS_REPLACE)
++		queue_work(nf_flow_offload_add_wq, &offload->work);
++	else if (offload->cmd == FLOW_CLS_DESTROY)
++		queue_work(nf_flow_offload_del_wq, &offload->work);
++	else
++		queue_work(nf_flow_offload_stats_wq, &offload->work);
+ }
+ 
+ static struct flow_offload_work *
+@@ -899,8 +906,11 @@ void nf_flow_offload_stats(struct nf_flo
+ 
+ void nf_flow_table_offload_flush(struct nf_flowtable *flowtable)
+ {
+-	if (nf_flowtable_hw_offload(flowtable))
+-		flush_workqueue(nf_flow_offload_wq);
++	if (nf_flowtable_hw_offload(flowtable)) {
++		flush_workqueue(nf_flow_offload_add_wq);
++		flush_workqueue(nf_flow_offload_del_wq);
++		flush_workqueue(nf_flow_offload_stats_wq);
++	}
+ }
+ 
+ static int nf_flow_table_block_setup(struct nf_flowtable *flowtable,
+@@ -1013,15 +1023,33 @@ EXPORT_SYMBOL_GPL(nf_flow_table_offload_
+ 
+ int nf_flow_table_offload_init(void)
+ {
+-	nf_flow_offload_wq  = alloc_workqueue("nf_flow_table_offload",
+-					      WQ_UNBOUND, 0);
+-	if (!nf_flow_offload_wq)
++	nf_flow_offload_add_wq  = alloc_workqueue("nf_ft_offload_add",
++						  WQ_UNBOUND | WQ_SYSFS, 0);
++	if (!nf_flow_offload_add_wq)
+ 		return -ENOMEM;
+ 
++	nf_flow_offload_del_wq  = alloc_workqueue("nf_ft_offload_del",
++						  WQ_UNBOUND | WQ_SYSFS, 0);
++	if (!nf_flow_offload_del_wq)
++		goto err_del_wq;
++
++	nf_flow_offload_stats_wq  = alloc_workqueue("nf_ft_offload_stats",
++						    WQ_UNBOUND | WQ_SYSFS, 0);
++	if (!nf_flow_offload_stats_wq)
++		goto err_stats_wq;
++
+ 	return 0;
++
++err_stats_wq:
++	destroy_workqueue(nf_flow_offload_del_wq);
++err_del_wq:
++	destroy_workqueue(nf_flow_offload_add_wq);
++	return -ENOMEM;
+ }
+ 
+ void nf_flow_table_offload_exit(void)
+ {
+-	destroy_workqueue(nf_flow_offload_wq);
++	destroy_workqueue(nf_flow_offload_add_wq);
++	destroy_workqueue(nf_flow_offload_del_wq);
++	destroy_workqueue(nf_flow_offload_stats_wq);
+ }

+ 22 - 0
target/linux/generic/backport-5.15/610-v5.13-03-netfilter-conntrack-Remove-unused-variable-declarati.patch

@@ -0,0 +1,22 @@
+From: YueHaibing <[email protected]>
+Date: Tue, 23 Mar 2021 00:56:21 +0100
+Subject: [PATCH] netfilter: conntrack: Remove unused variable
+ declaration
+
+commit e97c3e278e95 ("tproxy: split off ipv6 defragmentation to a separate
+module") left behind this.
+
+Signed-off-by: YueHaibing <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/ipv6/nf_conntrack_ipv6.h
++++ b/include/net/netfilter/ipv6/nf_conntrack_ipv6.h
+@@ -4,7 +4,4 @@
+ 
+ extern const struct nf_conntrack_l4proto nf_conntrack_l4proto_icmpv6;
+ 
+-#include <linux/sysctl.h>
+-extern struct ctl_table nf_ct_ipv6_sysctl_table[];
+-
+ #endif /* _NF_CONNTRACK_IPV6_H*/

+ 291 - 0
target/linux/generic/backport-5.15/610-v5.13-04-netfilter-flowtable-consolidate-skb_try_make_writabl.patch

@@ -0,0 +1,291 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Tue, 23 Mar 2021 00:56:22 +0100
+Subject: [PATCH] netfilter: flowtable: consolidate
+ skb_try_make_writable() call
+
+Fetch the layer 4 header size to be mangled by NAT when building the
+tuple, then use it to make writable the network and the transport
+headers. After this update, the NAT routines now assumes that the skbuff
+area is writable. Do the pointer refetch only after the single
+skb_try_make_writable() call.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -394,9 +394,6 @@ static int nf_flow_nat_port_tcp(struct s
+ {
+ 	struct tcphdr *tcph;
+ 
+-	if (skb_try_make_writable(skb, thoff + sizeof(*tcph)))
+-		return -1;
+-
+ 	tcph = (void *)(skb_network_header(skb) + thoff);
+ 	inet_proto_csum_replace2(&tcph->check, skb, port, new_port, false);
+ 
+@@ -408,9 +405,6 @@ static int nf_flow_nat_port_udp(struct s
+ {
+ 	struct udphdr *udph;
+ 
+-	if (skb_try_make_writable(skb, thoff + sizeof(*udph)))
+-		return -1;
+-
+ 	udph = (void *)(skb_network_header(skb) + thoff);
+ 	if (udph->check || skb->ip_summed == CHECKSUM_PARTIAL) {
+ 		inet_proto_csum_replace2(&udph->check, skb, port,
+@@ -446,9 +440,6 @@ int nf_flow_snat_port(const struct flow_
+ 	struct flow_ports *hdr;
+ 	__be16 port, new_port;
+ 
+-	if (skb_try_make_writable(skb, thoff + sizeof(*hdr)))
+-		return -1;
+-
+ 	hdr = (void *)(skb_network_header(skb) + thoff);
+ 
+ 	switch (dir) {
+@@ -477,9 +468,6 @@ int nf_flow_dnat_port(const struct flow_
+ 	struct flow_ports *hdr;
+ 	__be16 port, new_port;
+ 
+-	if (skb_try_make_writable(skb, thoff + sizeof(*hdr)))
+-		return -1;
+-
+ 	hdr = (void *)(skb_network_header(skb) + thoff);
+ 
+ 	switch (dir) {
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -39,9 +39,6 @@ static int nf_flow_nat_ip_tcp(struct sk_
+ {
+ 	struct tcphdr *tcph;
+ 
+-	if (skb_try_make_writable(skb, thoff + sizeof(*tcph)))
+-		return -1;
+-
+ 	tcph = (void *)(skb_network_header(skb) + thoff);
+ 	inet_proto_csum_replace4(&tcph->check, skb, addr, new_addr, true);
+ 
+@@ -53,9 +50,6 @@ static int nf_flow_nat_ip_udp(struct sk_
+ {
+ 	struct udphdr *udph;
+ 
+-	if (skb_try_make_writable(skb, thoff + sizeof(*udph)))
+-		return -1;
+-
+ 	udph = (void *)(skb_network_header(skb) + thoff);
+ 	if (udph->check || skb->ip_summed == CHECKSUM_PARTIAL) {
+ 		inet_proto_csum_replace4(&udph->check, skb, addr,
+@@ -136,19 +130,17 @@ static int nf_flow_dnat_ip(const struct
+ }
+ 
+ static int nf_flow_nat_ip(const struct flow_offload *flow, struct sk_buff *skb,
+-			  unsigned int thoff, enum flow_offload_tuple_dir dir)
++			  unsigned int thoff, enum flow_offload_tuple_dir dir,
++			  struct iphdr *iph)
+ {
+-	struct iphdr *iph = ip_hdr(skb);
+-
+ 	if (test_bit(NF_FLOW_SNAT, &flow->flags) &&
+ 	    (nf_flow_snat_port(flow, skb, thoff, iph->protocol, dir) < 0 ||
+-	     nf_flow_snat_ip(flow, skb, ip_hdr(skb), thoff, dir) < 0))
++	     nf_flow_snat_ip(flow, skb, iph, thoff, dir) < 0))
+ 		return -1;
+ 
+-	iph = ip_hdr(skb);
+ 	if (test_bit(NF_FLOW_DNAT, &flow->flags) &&
+ 	    (nf_flow_dnat_port(flow, skb, thoff, iph->protocol, dir) < 0 ||
+-	     nf_flow_dnat_ip(flow, skb, ip_hdr(skb), thoff, dir) < 0))
++	     nf_flow_dnat_ip(flow, skb, iph, thoff, dir) < 0))
+ 		return -1;
+ 
+ 	return 0;
+@@ -160,10 +152,10 @@ static bool ip_has_options(unsigned int
+ }
+ 
+ static int nf_flow_tuple_ip(struct sk_buff *skb, const struct net_device *dev,
+-			    struct flow_offload_tuple *tuple)
++			    struct flow_offload_tuple *tuple, u32 *hdrsize)
+ {
+-	unsigned int thoff, hdrsize;
+ 	struct flow_ports *ports;
++	unsigned int thoff;
+ 	struct iphdr *iph;
+ 
+ 	if (!pskb_may_pull(skb, sizeof(*iph)))
+@@ -178,10 +170,10 @@ static int nf_flow_tuple_ip(struct sk_bu
+ 
+ 	switch (iph->protocol) {
+ 	case IPPROTO_TCP:
+-		hdrsize = sizeof(struct tcphdr);
++		*hdrsize = sizeof(struct tcphdr);
+ 		break;
+ 	case IPPROTO_UDP:
+-		hdrsize = sizeof(struct udphdr);
++		*hdrsize = sizeof(struct udphdr);
+ 		break;
+ 	default:
+ 		return -1;
+@@ -191,7 +183,7 @@ static int nf_flow_tuple_ip(struct sk_bu
+ 		return -1;
+ 
+ 	thoff = iph->ihl * 4;
+-	if (!pskb_may_pull(skb, thoff + hdrsize))
++	if (!pskb_may_pull(skb, thoff + *hdrsize))
+ 		return -1;
+ 
+ 	iph = ip_hdr(skb);
+@@ -252,11 +244,12 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	unsigned int thoff;
+ 	struct iphdr *iph;
+ 	__be32 nexthop;
++	u32 hdrsize;
+ 
+ 	if (skb->protocol != htons(ETH_P_IP))
+ 		return NF_ACCEPT;
+ 
+-	if (nf_flow_tuple_ip(skb, state->in, &tuple) < 0)
++	if (nf_flow_tuple_ip(skb, state->in, &tuple, &hdrsize) < 0)
+ 		return NF_ACCEPT;
+ 
+ 	tuplehash = flow_offload_lookup(flow_table, &tuple);
+@@ -271,11 +264,13 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	if (unlikely(nf_flow_exceeds_mtu(skb, flow->tuplehash[dir].tuple.mtu)))
+ 		return NF_ACCEPT;
+ 
+-	if (skb_try_make_writable(skb, sizeof(*iph)))
++	iph = ip_hdr(skb);
++	thoff = iph->ihl * 4;
++	if (skb_try_make_writable(skb, thoff + hdrsize))
+ 		return NF_DROP;
+ 
+-	thoff = ip_hdr(skb)->ihl * 4;
+-	if (nf_flow_state_check(flow, ip_hdr(skb)->protocol, skb, thoff))
++	iph = ip_hdr(skb);
++	if (nf_flow_state_check(flow, iph->protocol, skb, thoff))
+ 		return NF_ACCEPT;
+ 
+ 	flow_offload_refresh(flow_table, flow);
+@@ -285,10 +280,9 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 		return NF_ACCEPT;
+ 	}
+ 
+-	if (nf_flow_nat_ip(flow, skb, thoff, dir) < 0)
++	if (nf_flow_nat_ip(flow, skb, thoff, dir, iph) < 0)
+ 		return NF_DROP;
+ 
+-	iph = ip_hdr(skb);
+ 	ip_decrease_ttl(iph);
+ 	skb->tstamp = 0;
+ 
+@@ -317,9 +311,6 @@ static int nf_flow_nat_ipv6_tcp(struct s
+ {
+ 	struct tcphdr *tcph;
+ 
+-	if (skb_try_make_writable(skb, thoff + sizeof(*tcph)))
+-		return -1;
+-
+ 	tcph = (void *)(skb_network_header(skb) + thoff);
+ 	inet_proto_csum_replace16(&tcph->check, skb, addr->s6_addr32,
+ 				  new_addr->s6_addr32, true);
+@@ -333,9 +324,6 @@ static int nf_flow_nat_ipv6_udp(struct s
+ {
+ 	struct udphdr *udph;
+ 
+-	if (skb_try_make_writable(skb, thoff + sizeof(*udph)))
+-		return -1;
+-
+ 	udph = (void *)(skb_network_header(skb) + thoff);
+ 	if (udph->check || skb->ip_summed == CHECKSUM_PARTIAL) {
+ 		inet_proto_csum_replace16(&udph->check, skb, addr->s6_addr32,
+@@ -417,31 +405,30 @@ static int nf_flow_dnat_ipv6(const struc
+ 
+ static int nf_flow_nat_ipv6(const struct flow_offload *flow,
+ 			    struct sk_buff *skb,
+-			    enum flow_offload_tuple_dir dir)
++			    enum flow_offload_tuple_dir dir,
++			    struct ipv6hdr *ip6h)
+ {
+-	struct ipv6hdr *ip6h = ipv6_hdr(skb);
+ 	unsigned int thoff = sizeof(*ip6h);
+ 
+ 	if (test_bit(NF_FLOW_SNAT, &flow->flags) &&
+ 	    (nf_flow_snat_port(flow, skb, thoff, ip6h->nexthdr, dir) < 0 ||
+-	     nf_flow_snat_ipv6(flow, skb, ipv6_hdr(skb), thoff, dir) < 0))
++	     nf_flow_snat_ipv6(flow, skb, ip6h, thoff, dir) < 0))
+ 		return -1;
+ 
+-	ip6h = ipv6_hdr(skb);
+ 	if (test_bit(NF_FLOW_DNAT, &flow->flags) &&
+ 	    (nf_flow_dnat_port(flow, skb, thoff, ip6h->nexthdr, dir) < 0 ||
+-	     nf_flow_dnat_ipv6(flow, skb, ipv6_hdr(skb), thoff, dir) < 0))
++	     nf_flow_dnat_ipv6(flow, skb, ip6h, thoff, dir) < 0))
+ 		return -1;
+ 
+ 	return 0;
+ }
+ 
+ static int nf_flow_tuple_ipv6(struct sk_buff *skb, const struct net_device *dev,
+-			      struct flow_offload_tuple *tuple)
++			      struct flow_offload_tuple *tuple, u32 *hdrsize)
+ {
+-	unsigned int thoff, hdrsize;
+ 	struct flow_ports *ports;
+ 	struct ipv6hdr *ip6h;
++	unsigned int thoff;
+ 
+ 	if (!pskb_may_pull(skb, sizeof(*ip6h)))
+ 		return -1;
+@@ -450,10 +437,10 @@ static int nf_flow_tuple_ipv6(struct sk_
+ 
+ 	switch (ip6h->nexthdr) {
+ 	case IPPROTO_TCP:
+-		hdrsize = sizeof(struct tcphdr);
++		*hdrsize = sizeof(struct tcphdr);
+ 		break;
+ 	case IPPROTO_UDP:
+-		hdrsize = sizeof(struct udphdr);
++		*hdrsize = sizeof(struct udphdr);
+ 		break;
+ 	default:
+ 		return -1;
+@@ -463,7 +450,7 @@ static int nf_flow_tuple_ipv6(struct sk_
+ 		return -1;
+ 
+ 	thoff = sizeof(*ip6h);
+-	if (!pskb_may_pull(skb, thoff + hdrsize))
++	if (!pskb_may_pull(skb, thoff + *hdrsize))
+ 		return -1;
+ 
+ 	ip6h = ipv6_hdr(skb);
+@@ -493,11 +480,12 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 	struct net_device *outdev;
+ 	struct ipv6hdr *ip6h;
+ 	struct rt6_info *rt;
++	u32 hdrsize;
+ 
+ 	if (skb->protocol != htons(ETH_P_IPV6))
+ 		return NF_ACCEPT;
+ 
+-	if (nf_flow_tuple_ipv6(skb, state->in, &tuple) < 0)
++	if (nf_flow_tuple_ipv6(skb, state->in, &tuple, &hdrsize) < 0)
+ 		return NF_ACCEPT;
+ 
+ 	tuplehash = flow_offload_lookup(flow_table, &tuple);
+@@ -523,13 +511,13 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 		return NF_ACCEPT;
+ 	}
+ 
+-	if (skb_try_make_writable(skb, sizeof(*ip6h)))
++	if (skb_try_make_writable(skb, sizeof(*ip6h) + hdrsize))
+ 		return NF_DROP;
+ 
+-	if (nf_flow_nat_ipv6(flow, skb, dir) < 0)
++	ip6h = ipv6_hdr(skb);
++	if (nf_flow_nat_ipv6(flow, skb, dir, ip6h) < 0)
+ 		return NF_DROP;
+ 
+-	ip6h = ipv6_hdr(skb);
+ 	ip6h->hop_limit--;
+ 	skb->tstamp = 0;
+ 

+ 35 - 0
target/linux/generic/backport-5.15/610-v5.13-05-netfilter-flowtable-move-skb_try_make_writable-befor.patch

@@ -0,0 +1,35 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Tue, 23 Mar 2021 00:56:23 +0100
+Subject: [PATCH] netfilter: flowtable: move skb_try_make_writable()
+ before NAT in IPv4
+
+For consistency with the IPv6 flowtable datapath and to make sure the
+skbuff is writable right before the NAT header updates.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -266,10 +266,6 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 
+ 	iph = ip_hdr(skb);
+ 	thoff = iph->ihl * 4;
+-	if (skb_try_make_writable(skb, thoff + hdrsize))
+-		return NF_DROP;
+-
+-	iph = ip_hdr(skb);
+ 	if (nf_flow_state_check(flow, iph->protocol, skb, thoff))
+ 		return NF_ACCEPT;
+ 
+@@ -280,6 +276,10 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 		return NF_ACCEPT;
+ 	}
+ 
++	if (skb_try_make_writable(skb, thoff + hdrsize))
++		return NF_DROP;
++
++	iph = ip_hdr(skb);
+ 	if (nf_flow_nat_ip(flow, skb, thoff, dir, iph) < 0)
+ 		return NF_DROP;
+ 

+ 82 - 0
target/linux/generic/backport-5.15/610-v5.13-06-netfilter-flowtable-move-FLOW_OFFLOAD_DIR_MAX-away-f.patch

@@ -0,0 +1,82 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Tue, 23 Mar 2021 00:56:24 +0100
+Subject: [PATCH] netfilter: flowtable: move FLOW_OFFLOAD_DIR_MAX away
+ from enumeration
+
+This allows to remove the default case which should not ever happen and
+that was added to avoid gcc warnings on unhandled FLOW_OFFLOAD_DIR_MAX
+enumeration case.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -86,8 +86,8 @@ static inline bool nf_flowtable_hw_offlo
+ enum flow_offload_tuple_dir {
+ 	FLOW_OFFLOAD_DIR_ORIGINAL = IP_CT_DIR_ORIGINAL,
+ 	FLOW_OFFLOAD_DIR_REPLY = IP_CT_DIR_REPLY,
+-	FLOW_OFFLOAD_DIR_MAX = IP_CT_DIR_MAX
+ };
++#define FLOW_OFFLOAD_DIR_MAX	IP_CT_DIR_MAX
+ 
+ struct flow_offload_tuple {
+ 	union {
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -453,8 +453,6 @@ int nf_flow_snat_port(const struct flow_
+ 		new_port = flow->tuplehash[FLOW_OFFLOAD_DIR_ORIGINAL].tuple.src_port;
+ 		hdr->dest = new_port;
+ 		break;
+-	default:
+-		return -1;
+ 	}
+ 
+ 	return nf_flow_nat_port(skb, thoff, protocol, port, new_port);
+@@ -481,8 +479,6 @@ int nf_flow_dnat_port(const struct flow_
+ 		new_port = flow->tuplehash[FLOW_OFFLOAD_DIR_ORIGINAL].tuple.dst_port;
+ 		hdr->source = new_port;
+ 		break;
+-	default:
+-		return -1;
+ 	}
+ 
+ 	return nf_flow_nat_port(skb, thoff, protocol, port, new_port);
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -96,8 +96,6 @@ static int nf_flow_snat_ip(const struct
+ 		new_addr = flow->tuplehash[FLOW_OFFLOAD_DIR_ORIGINAL].tuple.src_v4.s_addr;
+ 		iph->daddr = new_addr;
+ 		break;
+-	default:
+-		return -1;
+ 	}
+ 	csum_replace4(&iph->check, addr, new_addr);
+ 
+@@ -121,8 +119,6 @@ static int nf_flow_dnat_ip(const struct
+ 		new_addr = flow->tuplehash[FLOW_OFFLOAD_DIR_ORIGINAL].tuple.dst_v4.s_addr;
+ 		iph->saddr = new_addr;
+ 		break;
+-	default:
+-		return -1;
+ 	}
+ 	csum_replace4(&iph->check, addr, new_addr);
+ 
+@@ -371,8 +367,6 @@ static int nf_flow_snat_ipv6(const struc
+ 		new_addr = flow->tuplehash[FLOW_OFFLOAD_DIR_ORIGINAL].tuple.src_v6;
+ 		ip6h->daddr = new_addr;
+ 		break;
+-	default:
+-		return -1;
+ 	}
+ 
+ 	return nf_flow_nat_ipv6_l4proto(skb, ip6h, thoff, &addr, &new_addr);
+@@ -396,8 +390,6 @@ static int nf_flow_dnat_ipv6(const struc
+ 		new_addr = flow->tuplehash[FLOW_OFFLOAD_DIR_ORIGINAL].tuple.dst_v6;
+ 		ip6h->saddr = new_addr;
+ 		break;
+-	default:
+-		return -1;
+ 	}
+ 
+ 	return nf_flow_nat_ipv6_l4proto(skb, ip6h, thoff, &addr, &new_addr);

+ 394 - 0
target/linux/generic/backport-5.15/610-v5.13-07-netfilter-flowtable-fast-NAT-functions-never-fail.patch

@@ -0,0 +1,394 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Tue, 23 Mar 2021 00:56:25 +0100
+Subject: [PATCH] netfilter: flowtable: fast NAT functions never fail
+
+Simplify existing fast NAT routines by returning void. After the
+skb_try_make_writable() call consolidation, these routines cannot ever
+fail.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -228,12 +228,12 @@ void nf_flow_table_free(struct nf_flowta
+ 
+ void flow_offload_teardown(struct flow_offload *flow);
+ 
+-int nf_flow_snat_port(const struct flow_offload *flow,
+-		      struct sk_buff *skb, unsigned int thoff,
+-		      u8 protocol, enum flow_offload_tuple_dir dir);
+-int nf_flow_dnat_port(const struct flow_offload *flow,
+-		      struct sk_buff *skb, unsigned int thoff,
+-		      u8 protocol, enum flow_offload_tuple_dir dir);
++void nf_flow_snat_port(const struct flow_offload *flow,
++		       struct sk_buff *skb, unsigned int thoff,
++		       u8 protocol, enum flow_offload_tuple_dir dir);
++void nf_flow_dnat_port(const struct flow_offload *flow,
++		       struct sk_buff *skb, unsigned int thoff,
++		       u8 protocol, enum flow_offload_tuple_dir dir);
+ 
+ struct flow_ports {
+ 	__be16 source, dest;
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -388,20 +388,17 @@ static void nf_flow_offload_work_gc(stru
+ 	queue_delayed_work(system_power_efficient_wq, &flow_table->gc_work, HZ);
+ }
+ 
+-
+-static int nf_flow_nat_port_tcp(struct sk_buff *skb, unsigned int thoff,
+-				__be16 port, __be16 new_port)
++static void nf_flow_nat_port_tcp(struct sk_buff *skb, unsigned int thoff,
++				 __be16 port, __be16 new_port)
+ {
+ 	struct tcphdr *tcph;
+ 
+ 	tcph = (void *)(skb_network_header(skb) + thoff);
+ 	inet_proto_csum_replace2(&tcph->check, skb, port, new_port, false);
+-
+-	return 0;
+ }
+ 
+-static int nf_flow_nat_port_udp(struct sk_buff *skb, unsigned int thoff,
+-				__be16 port, __be16 new_port)
++static void nf_flow_nat_port_udp(struct sk_buff *skb, unsigned int thoff,
++				 __be16 port, __be16 new_port)
+ {
+ 	struct udphdr *udph;
+ 
+@@ -412,30 +409,24 @@ static int nf_flow_nat_port_udp(struct s
+ 		if (!udph->check)
+ 			udph->check = CSUM_MANGLED_0;
+ 	}
+-
+-	return 0;
+ }
+ 
+-static int nf_flow_nat_port(struct sk_buff *skb, unsigned int thoff,
+-			    u8 protocol, __be16 port, __be16 new_port)
++static void nf_flow_nat_port(struct sk_buff *skb, unsigned int thoff,
++			     u8 protocol, __be16 port, __be16 new_port)
+ {
+ 	switch (protocol) {
+ 	case IPPROTO_TCP:
+-		if (nf_flow_nat_port_tcp(skb, thoff, port, new_port) < 0)
+-			return NF_DROP;
++		nf_flow_nat_port_tcp(skb, thoff, port, new_port);
+ 		break;
+ 	case IPPROTO_UDP:
+-		if (nf_flow_nat_port_udp(skb, thoff, port, new_port) < 0)
+-			return NF_DROP;
++		nf_flow_nat_port_udp(skb, thoff, port, new_port);
+ 		break;
+ 	}
+-
+-	return 0;
+ }
+ 
+-int nf_flow_snat_port(const struct flow_offload *flow,
+-		      struct sk_buff *skb, unsigned int thoff,
+-		      u8 protocol, enum flow_offload_tuple_dir dir)
++void nf_flow_snat_port(const struct flow_offload *flow,
++		       struct sk_buff *skb, unsigned int thoff,
++		       u8 protocol, enum flow_offload_tuple_dir dir)
+ {
+ 	struct flow_ports *hdr;
+ 	__be16 port, new_port;
+@@ -455,13 +446,13 @@ int nf_flow_snat_port(const struct flow_
+ 		break;
+ 	}
+ 
+-	return nf_flow_nat_port(skb, thoff, protocol, port, new_port);
++	nf_flow_nat_port(skb, thoff, protocol, port, new_port);
+ }
+ EXPORT_SYMBOL_GPL(nf_flow_snat_port);
+ 
+-int nf_flow_dnat_port(const struct flow_offload *flow,
+-		      struct sk_buff *skb, unsigned int thoff,
+-		      u8 protocol, enum flow_offload_tuple_dir dir)
++void nf_flow_dnat_port(const struct flow_offload *flow, struct sk_buff *skb,
++		       unsigned int thoff, u8 protocol,
++		       enum flow_offload_tuple_dir dir)
+ {
+ 	struct flow_ports *hdr;
+ 	__be16 port, new_port;
+@@ -481,7 +472,7 @@ int nf_flow_dnat_port(const struct flow_
+ 		break;
+ 	}
+ 
+-	return nf_flow_nat_port(skb, thoff, protocol, port, new_port);
++	nf_flow_nat_port(skb, thoff, protocol, port, new_port);
+ }
+ EXPORT_SYMBOL_GPL(nf_flow_dnat_port);
+ 
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -34,19 +34,17 @@ static int nf_flow_state_check(struct fl
+ 	return 0;
+ }
+ 
+-static int nf_flow_nat_ip_tcp(struct sk_buff *skb, unsigned int thoff,
+-			      __be32 addr, __be32 new_addr)
++static void nf_flow_nat_ip_tcp(struct sk_buff *skb, unsigned int thoff,
++			       __be32 addr, __be32 new_addr)
+ {
+ 	struct tcphdr *tcph;
+ 
+ 	tcph = (void *)(skb_network_header(skb) + thoff);
+ 	inet_proto_csum_replace4(&tcph->check, skb, addr, new_addr, true);
+-
+-	return 0;
+ }
+ 
+-static int nf_flow_nat_ip_udp(struct sk_buff *skb, unsigned int thoff,
+-			      __be32 addr, __be32 new_addr)
++static void nf_flow_nat_ip_udp(struct sk_buff *skb, unsigned int thoff,
++			       __be32 addr, __be32 new_addr)
+ {
+ 	struct udphdr *udph;
+ 
+@@ -57,31 +55,25 @@ static int nf_flow_nat_ip_udp(struct sk_
+ 		if (!udph->check)
+ 			udph->check = CSUM_MANGLED_0;
+ 	}
+-
+-	return 0;
+ }
+ 
+-static int nf_flow_nat_ip_l4proto(struct sk_buff *skb, struct iphdr *iph,
+-				  unsigned int thoff, __be32 addr,
+-				  __be32 new_addr)
++static void nf_flow_nat_ip_l4proto(struct sk_buff *skb, struct iphdr *iph,
++				   unsigned int thoff, __be32 addr,
++				   __be32 new_addr)
+ {
+ 	switch (iph->protocol) {
+ 	case IPPROTO_TCP:
+-		if (nf_flow_nat_ip_tcp(skb, thoff, addr, new_addr) < 0)
+-			return NF_DROP;
++		nf_flow_nat_ip_tcp(skb, thoff, addr, new_addr);
+ 		break;
+ 	case IPPROTO_UDP:
+-		if (nf_flow_nat_ip_udp(skb, thoff, addr, new_addr) < 0)
+-			return NF_DROP;
++		nf_flow_nat_ip_udp(skb, thoff, addr, new_addr);
+ 		break;
+ 	}
+-
+-	return 0;
+ }
+ 
+-static int nf_flow_snat_ip(const struct flow_offload *flow, struct sk_buff *skb,
+-			   struct iphdr *iph, unsigned int thoff,
+-			   enum flow_offload_tuple_dir dir)
++static void nf_flow_snat_ip(const struct flow_offload *flow,
++			    struct sk_buff *skb, struct iphdr *iph,
++			    unsigned int thoff, enum flow_offload_tuple_dir dir)
+ {
+ 	__be32 addr, new_addr;
+ 
+@@ -99,12 +91,12 @@ static int nf_flow_snat_ip(const struct
+ 	}
+ 	csum_replace4(&iph->check, addr, new_addr);
+ 
+-	return nf_flow_nat_ip_l4proto(skb, iph, thoff, addr, new_addr);
++	nf_flow_nat_ip_l4proto(skb, iph, thoff, addr, new_addr);
+ }
+ 
+-static int nf_flow_dnat_ip(const struct flow_offload *flow, struct sk_buff *skb,
+-			   struct iphdr *iph, unsigned int thoff,
+-			   enum flow_offload_tuple_dir dir)
++static void nf_flow_dnat_ip(const struct flow_offload *flow,
++			    struct sk_buff *skb, struct iphdr *iph,
++			    unsigned int thoff, enum flow_offload_tuple_dir dir)
+ {
+ 	__be32 addr, new_addr;
+ 
+@@ -122,24 +114,21 @@ static int nf_flow_dnat_ip(const struct
+ 	}
+ 	csum_replace4(&iph->check, addr, new_addr);
+ 
+-	return nf_flow_nat_ip_l4proto(skb, iph, thoff, addr, new_addr);
++	nf_flow_nat_ip_l4proto(skb, iph, thoff, addr, new_addr);
+ }
+ 
+-static int nf_flow_nat_ip(const struct flow_offload *flow, struct sk_buff *skb,
++static void nf_flow_nat_ip(const struct flow_offload *flow, struct sk_buff *skb,
+ 			  unsigned int thoff, enum flow_offload_tuple_dir dir,
+ 			  struct iphdr *iph)
+ {
+-	if (test_bit(NF_FLOW_SNAT, &flow->flags) &&
+-	    (nf_flow_snat_port(flow, skb, thoff, iph->protocol, dir) < 0 ||
+-	     nf_flow_snat_ip(flow, skb, iph, thoff, dir) < 0))
+-		return -1;
+-
+-	if (test_bit(NF_FLOW_DNAT, &flow->flags) &&
+-	    (nf_flow_dnat_port(flow, skb, thoff, iph->protocol, dir) < 0 ||
+-	     nf_flow_dnat_ip(flow, skb, iph, thoff, dir) < 0))
+-		return -1;
+-
+-	return 0;
++	if (test_bit(NF_FLOW_SNAT, &flow->flags)) {
++		nf_flow_snat_port(flow, skb, thoff, iph->protocol, dir);
++		nf_flow_snat_ip(flow, skb, iph, thoff, dir);
++	}
++	if (test_bit(NF_FLOW_DNAT, &flow->flags)) {
++		nf_flow_dnat_port(flow, skb, thoff, iph->protocol, dir);
++		nf_flow_dnat_ip(flow, skb, iph, thoff, dir);
++	}
+ }
+ 
+ static bool ip_has_options(unsigned int thoff)
+@@ -276,8 +265,7 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 		return NF_DROP;
+ 
+ 	iph = ip_hdr(skb);
+-	if (nf_flow_nat_ip(flow, skb, thoff, dir, iph) < 0)
+-		return NF_DROP;
++	nf_flow_nat_ip(flow, skb, thoff, dir, iph);
+ 
+ 	ip_decrease_ttl(iph);
+ 	skb->tstamp = 0;
+@@ -301,22 +289,21 @@ nf_flow_offload_ip_hook(void *priv, stru
+ }
+ EXPORT_SYMBOL_GPL(nf_flow_offload_ip_hook);
+ 
+-static int nf_flow_nat_ipv6_tcp(struct sk_buff *skb, unsigned int thoff,
+-				struct in6_addr *addr,
+-				struct in6_addr *new_addr)
++static void nf_flow_nat_ipv6_tcp(struct sk_buff *skb, unsigned int thoff,
++				 struct in6_addr *addr,
++				 struct in6_addr *new_addr,
++				 struct ipv6hdr *ip6h)
+ {
+ 	struct tcphdr *tcph;
+ 
+ 	tcph = (void *)(skb_network_header(skb) + thoff);
+ 	inet_proto_csum_replace16(&tcph->check, skb, addr->s6_addr32,
+ 				  new_addr->s6_addr32, true);
+-
+-	return 0;
+ }
+ 
+-static int nf_flow_nat_ipv6_udp(struct sk_buff *skb, unsigned int thoff,
+-				struct in6_addr *addr,
+-				struct in6_addr *new_addr)
++static void nf_flow_nat_ipv6_udp(struct sk_buff *skb, unsigned int thoff,
++				 struct in6_addr *addr,
++				 struct in6_addr *new_addr)
+ {
+ 	struct udphdr *udph;
+ 
+@@ -327,32 +314,26 @@ static int nf_flow_nat_ipv6_udp(struct s
+ 		if (!udph->check)
+ 			udph->check = CSUM_MANGLED_0;
+ 	}
+-
+-	return 0;
+ }
+ 
+-static int nf_flow_nat_ipv6_l4proto(struct sk_buff *skb, struct ipv6hdr *ip6h,
+-				    unsigned int thoff, struct in6_addr *addr,
+-				    struct in6_addr *new_addr)
++static void nf_flow_nat_ipv6_l4proto(struct sk_buff *skb, struct ipv6hdr *ip6h,
++				     unsigned int thoff, struct in6_addr *addr,
++				     struct in6_addr *new_addr)
+ {
+ 	switch (ip6h->nexthdr) {
+ 	case IPPROTO_TCP:
+-		if (nf_flow_nat_ipv6_tcp(skb, thoff, addr, new_addr) < 0)
+-			return NF_DROP;
++		nf_flow_nat_ipv6_tcp(skb, thoff, addr, new_addr, ip6h);
+ 		break;
+ 	case IPPROTO_UDP:
+-		if (nf_flow_nat_ipv6_udp(skb, thoff, addr, new_addr) < 0)
+-			return NF_DROP;
++		nf_flow_nat_ipv6_udp(skb, thoff, addr, new_addr);
+ 		break;
+ 	}
+-
+-	return 0;
+ }
+ 
+-static int nf_flow_snat_ipv6(const struct flow_offload *flow,
+-			     struct sk_buff *skb, struct ipv6hdr *ip6h,
+-			     unsigned int thoff,
+-			     enum flow_offload_tuple_dir dir)
++static void nf_flow_snat_ipv6(const struct flow_offload *flow,
++			      struct sk_buff *skb, struct ipv6hdr *ip6h,
++			      unsigned int thoff,
++			      enum flow_offload_tuple_dir dir)
+ {
+ 	struct in6_addr addr, new_addr;
+ 
+@@ -369,13 +350,13 @@ static int nf_flow_snat_ipv6(const struc
+ 		break;
+ 	}
+ 
+-	return nf_flow_nat_ipv6_l4proto(skb, ip6h, thoff, &addr, &new_addr);
++	nf_flow_nat_ipv6_l4proto(skb, ip6h, thoff, &addr, &new_addr);
+ }
+ 
+-static int nf_flow_dnat_ipv6(const struct flow_offload *flow,
+-			     struct sk_buff *skb, struct ipv6hdr *ip6h,
+-			     unsigned int thoff,
+-			     enum flow_offload_tuple_dir dir)
++static void nf_flow_dnat_ipv6(const struct flow_offload *flow,
++			      struct sk_buff *skb, struct ipv6hdr *ip6h,
++			      unsigned int thoff,
++			      enum flow_offload_tuple_dir dir)
+ {
+ 	struct in6_addr addr, new_addr;
+ 
+@@ -392,27 +373,24 @@ static int nf_flow_dnat_ipv6(const struc
+ 		break;
+ 	}
+ 
+-	return nf_flow_nat_ipv6_l4proto(skb, ip6h, thoff, &addr, &new_addr);
++	nf_flow_nat_ipv6_l4proto(skb, ip6h, thoff, &addr, &new_addr);
+ }
+ 
+-static int nf_flow_nat_ipv6(const struct flow_offload *flow,
+-			    struct sk_buff *skb,
+-			    enum flow_offload_tuple_dir dir,
+-			    struct ipv6hdr *ip6h)
++static void nf_flow_nat_ipv6(const struct flow_offload *flow,
++			     struct sk_buff *skb,
++			     enum flow_offload_tuple_dir dir,
++			     struct ipv6hdr *ip6h)
+ {
+ 	unsigned int thoff = sizeof(*ip6h);
+ 
+-	if (test_bit(NF_FLOW_SNAT, &flow->flags) &&
+-	    (nf_flow_snat_port(flow, skb, thoff, ip6h->nexthdr, dir) < 0 ||
+-	     nf_flow_snat_ipv6(flow, skb, ip6h, thoff, dir) < 0))
+-		return -1;
+-
+-	if (test_bit(NF_FLOW_DNAT, &flow->flags) &&
+-	    (nf_flow_dnat_port(flow, skb, thoff, ip6h->nexthdr, dir) < 0 ||
+-	     nf_flow_dnat_ipv6(flow, skb, ip6h, thoff, dir) < 0))
+-		return -1;
+-
+-	return 0;
++	if (test_bit(NF_FLOW_SNAT, &flow->flags)) {
++		nf_flow_snat_port(flow, skb, thoff, ip6h->nexthdr, dir);
++		nf_flow_snat_ipv6(flow, skb, ip6h, thoff, dir);
++	}
++	if (test_bit(NF_FLOW_DNAT, &flow->flags)) {
++		nf_flow_dnat_port(flow, skb, thoff, ip6h->nexthdr, dir);
++		nf_flow_dnat_ipv6(flow, skb, ip6h, thoff, dir);
++	}
+ }
+ 
+ static int nf_flow_tuple_ipv6(struct sk_buff *skb, const struct net_device *dev,
+@@ -507,8 +485,7 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 		return NF_DROP;
+ 
+ 	ip6h = ipv6_hdr(skb);
+-	if (nf_flow_nat_ipv6(flow, skb, dir, ip6h) < 0)
+-		return NF_DROP;
++	nf_flow_nat_ipv6(flow, skb, dir, ip6h);
+ 
+ 	ip6h->hop_limit--;
+ 	skb->tstamp = 0;
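
As a plain-C illustration of why these helpers can now return void: once the caller has made the headers writable in a single place, the per-protocol rewrite is just an incremental checksum update plus a store, with nothing left that can fail. A hedged user-space sketch (plain buffers instead of skbs, illustrative names, no byte-order handling):

/* RFC 1624 incremental checksum update for one 16-bit field, then the
 * void-returning port rewrite built on top of it. */
#include <stdint.h>
#include <stdio.h>

static void csum_replace2(uint16_t *csum, uint16_t old, uint16_t new_val)
{
	uint32_t sum = (uint16_t)~*csum;

	sum += (uint16_t)~old;
	sum += new_val;
	sum = (sum & 0xffff) + (sum >> 16);
	sum = (sum & 0xffff) + (sum >> 16);
	*csum = (uint16_t)~sum;
}

struct l4_hdr {
	uint16_t source, dest, check;
};

/* void: nothing can fail here once the buffer is known to be writable. */
static void rewrite_src_port(struct l4_hdr *hdr, uint16_t new_src)
{
	csum_replace2(&hdr->check, hdr->source, new_src);
	hdr->source = new_src;
}

int main(void)
{
	struct l4_hdr hdr = { .source = 0x1234, .dest = 0x0050, .check = 0xabcd };

	rewrite_src_port(&hdr, 0x4321);	/* caller did the single writability check */
	printf("src=%04x check=%04x\n", hdr.source, hdr.check);
	return 0;
}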


+ 46 - 0
target/linux/generic/backport-5.15/610-v5.13-08-netfilter-flowtable-call-dst_check-to-fall-back-to-c.patch

@@ -0,0 +1,46 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Tue, 23 Mar 2021 00:56:26 +0100
+Subject: [PATCH] netfilter: flowtable: call dst_check() to fall back to
+ classic forwarding
+
+In case the route is stale, pass up the packet to the classic forwarding
+path for re-evaluation and schedule this flow entry for removal.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -197,14 +197,6 @@ static bool nf_flow_exceeds_mtu(const st
+ 	return true;
+ }
+ 
+-static int nf_flow_offload_dst_check(struct dst_entry *dst)
+-{
+-	if (unlikely(dst_xfrm(dst)))
+-		return dst_check(dst, 0) ? 0 : -1;
+-
+-	return 0;
+-}
+-
+ static unsigned int nf_flow_xmit_xfrm(struct sk_buff *skb,
+ 				      const struct nf_hook_state *state,
+ 				      struct dst_entry *dst)
+@@ -256,7 +248,7 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 
+ 	flow_offload_refresh(flow_table, flow);
+ 
+-	if (nf_flow_offload_dst_check(&rt->dst)) {
++	if (!dst_check(&rt->dst, 0)) {
+ 		flow_offload_teardown(flow);
+ 		return NF_ACCEPT;
+ 	}
+@@ -476,7 +468,7 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 
+ 	flow_offload_refresh(flow_table, flow);
+ 
+-	if (nf_flow_offload_dst_check(&rt->dst)) {
++	if (!dst_check(&rt->dst, 0)) {
+ 		flow_offload_teardown(flow);
+ 		return NF_ACCEPT;
+ 	}
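
The pattern introduced here is: if dst_check() reports the cached route as stale, schedule the flow entry for teardown and return NF_ACCEPT so the packet is re-evaluated by the classic forwarding path. A small user-space sketch of that control flow (all types and names are illustrative stand-ins, not the kernel API):

#include <stdbool.h>
#include <stdio.h>

enum verdict { VERDICT_ACCEPT, VERDICT_DROP, VERDICT_STOLEN };

struct flow { bool teardown; };
struct route { unsigned int cookie, current_cookie; };

/* Stand-in for dst_check(): a route is valid while its cookie still matches. */
static bool route_is_current(const struct route *rt)
{
	return rt->cookie == rt->current_cookie;
}

static enum verdict offload_hook(struct flow *flow, const struct route *rt)
{
	if (!route_is_current(rt)) {
		flow->teardown = true;	/* schedule entry removal */
		return VERDICT_ACCEPT;	/* let the classic path re-evaluate */
	}
	/* ... fast-path NAT and transmit would happen here ... */
	return VERDICT_STOLEN;
}

int main(void)
{
	struct flow f = { 0 };
	struct route stale = { .cookie = 1, .current_cookie = 2 };

	printf("verdict=%d teardown=%d\n", offload_hook(&f, &stale), f.teardown);
	return 0;
}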

+ 49 - 0
target/linux/generic/backport-5.15/610-v5.13-09-netfilter-flowtable-refresh-timeout-after-dst-and-wr.patch

@@ -0,0 +1,49 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Tue, 23 Mar 2021 00:56:27 +0100
+Subject: [PATCH] netfilter: flowtable: refresh timeout after dst and
+ writable checks
+
+Refresh the timeout (and retry hardware offload) once the skbuff dst
+is confirmed to be current and after the skbuff is made writable.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -246,8 +246,6 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	if (nf_flow_state_check(flow, iph->protocol, skb, thoff))
+ 		return NF_ACCEPT;
+ 
+-	flow_offload_refresh(flow_table, flow);
+-
+ 	if (!dst_check(&rt->dst, 0)) {
+ 		flow_offload_teardown(flow);
+ 		return NF_ACCEPT;
+@@ -256,6 +254,8 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	if (skb_try_make_writable(skb, thoff + hdrsize))
+ 		return NF_DROP;
+ 
++	flow_offload_refresh(flow_table, flow);
++
+ 	iph = ip_hdr(skb);
+ 	nf_flow_nat_ip(flow, skb, thoff, dir, iph);
+ 
+@@ -466,8 +466,6 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 				sizeof(*ip6h)))
+ 		return NF_ACCEPT;
+ 
+-	flow_offload_refresh(flow_table, flow);
+-
+ 	if (!dst_check(&rt->dst, 0)) {
+ 		flow_offload_teardown(flow);
+ 		return NF_ACCEPT;
+@@ -476,6 +474,8 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 	if (skb_try_make_writable(skb, sizeof(*ip6h) + hdrsize))
+ 		return NF_DROP;
+ 
++	flow_offload_refresh(flow_table, flow);
++
+ 	ip6h = ipv6_hdr(skb);
+ 	nf_flow_nat_ipv6(flow, skb, dir, ip6h);
+ 
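
The point of this reordering, sketched below with user-space stand-ins: a packet that is about to be handed back to the slow path (stale route) or dropped (headers not writable) should not refresh the flow timeout, so the refresh only happens once both checks have passed. These are not the kernel helpers, just a compact model of the new ordering:

#include <stdbool.h>
#include <stdio.h>

enum verdict { VERDICT_ACCEPT, VERDICT_DROP, VERDICT_STOLEN };

static int refresh_count;	/* stand-in for flow_offload_refresh() */

static enum verdict hook_body(bool dst_is_current, bool writable)
{
	if (!dst_is_current)
		return VERDICT_ACCEPT;	/* stale route: no refresh, slow path */
	if (!writable)
		return VERDICT_DROP;	/* cannot rewrite headers: no refresh */

	refresh_count++;		/* refresh only after both checks pass */
	/* ... NAT, TTL decrement and transmit would follow ... */
	return VERDICT_STOLEN;
}

int main(void)
{
	printf("stale route: verdict=%d\n", hook_body(false, true));
	printf("normal case: verdict=%d\n", hook_body(true, true));
	printf("refreshed %d time(s)\n", refresh_count);
	return 0;
}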

+ 103 - 0
target/linux/generic/backport-5.15/610-v5.13-10-netfilter-nftables-update-table-flags-from-the-commi.patch

@@ -0,0 +1,103 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Tue, 23 Mar 2021 00:56:28 +0100
+Subject: [PATCH] netfilter: nftables: update table flags from the commit
+ phase
+
+Do not update table flags from the preparation phase. Store the flags
+update into the transaction, then update the flags from the commit
+phase.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_tables.h
++++ b/include/net/netfilter/nf_tables.h
+@@ -1470,13 +1470,16 @@ struct nft_trans_chain {
+ 
+ struct nft_trans_table {
+ 	bool				update;
+-	bool				enable;
++	u8				state;
++	u32				flags;
+ };
+ 
+ #define nft_trans_table_update(trans)	\
+ 	(((struct nft_trans_table *)trans->data)->update)
+-#define nft_trans_table_enable(trans)	\
+-	(((struct nft_trans_table *)trans->data)->enable)
++#define nft_trans_table_state(trans)	\
++	(((struct nft_trans_table *)trans->data)->state)
++#define nft_trans_table_flags(trans)	\
++	(((struct nft_trans_table *)trans->data)->flags)
+ 
+ struct nft_trans_elem {
+ 	struct nft_set			*set;
+--- a/net/netfilter/nf_tables_api.c
++++ b/net/netfilter/nf_tables_api.c
+@@ -891,6 +891,12 @@ static void nf_tables_table_disable(stru
+ 	nft_table_disable(net, table, 0);
+ }
+ 
++enum {
++	NFT_TABLE_STATE_UNCHANGED	= 0,
++	NFT_TABLE_STATE_DORMANT,
++	NFT_TABLE_STATE_WAKEUP
++};
++
+ static int nf_tables_updtable(struct nft_ctx *ctx)
+ {
+ 	struct nft_trans *trans;
+@@ -914,19 +920,17 @@ static int nf_tables_updtable(struct nft
+ 
+ 	if ((flags & NFT_TABLE_F_DORMANT) &&
+ 	    !(ctx->table->flags & NFT_TABLE_F_DORMANT)) {
+-		nft_trans_table_enable(trans) = false;
++		nft_trans_table_state(trans) = NFT_TABLE_STATE_DORMANT;
+ 	} else if (!(flags & NFT_TABLE_F_DORMANT) &&
+ 		   ctx->table->flags & NFT_TABLE_F_DORMANT) {
+-		ctx->table->flags &= ~NFT_TABLE_F_DORMANT;
+ 		ret = nf_tables_table_enable(ctx->net, ctx->table);
+ 		if (ret >= 0)
+-			nft_trans_table_enable(trans) = true;
+-		else
+-			ctx->table->flags |= NFT_TABLE_F_DORMANT;
++			nft_trans_table_state(trans) = NFT_TABLE_STATE_WAKEUP;
+ 	}
+ 	if (ret < 0)
+ 		goto err;
+ 
++	nft_trans_table_flags(trans) = flags;
+ 	nft_trans_table_update(trans) = true;
+ 	list_add_tail(&trans->list, &ctx->net->nft.commit_list);
+ 	return 0;
+@@ -7908,11 +7912,10 @@ static int nf_tables_commit(struct net *
+ 		switch (trans->msg_type) {
+ 		case NFT_MSG_NEWTABLE:
+ 			if (nft_trans_table_update(trans)) {
+-				if (!nft_trans_table_enable(trans)) {
+-					nf_tables_table_disable(net,
+-								trans->ctx.table);
+-					trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
+-				}
++				if (nft_trans_table_state(trans) == NFT_TABLE_STATE_DORMANT)
++					nf_tables_table_disable(net, trans->ctx.table);
++
++				trans->ctx.table->flags = nft_trans_table_flags(trans);
+ 			} else {
+ 				nft_clear(net, trans->ctx.table);
+ 			}
+@@ -8125,11 +8128,9 @@ static int __nf_tables_abort(struct net
+ 		switch (trans->msg_type) {
+ 		case NFT_MSG_NEWTABLE:
+ 			if (nft_trans_table_update(trans)) {
+-				if (nft_trans_table_enable(trans)) {
+-					nf_tables_table_disable(net,
+-								trans->ctx.table);
+-					trans->ctx.table->flags |= NFT_TABLE_F_DORMANT;
+-				}
++				if (nft_trans_table_state(trans) == NFT_TABLE_STATE_WAKEUP)
++					nf_tables_table_disable(net, trans->ctx.table);
++
+ 				nft_trans_destroy(trans);
+ 			} else {
+ 				list_del_rcu(&trans->ctx.table->list);
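
The shape of this change is a classic two-phase update: the prepare step only records the requested flags and the dormant/wakeup decision in the transaction, and the table's flags are written from the commit path. A compact user-space sketch of that split (illustrative structs and names, not the nftables API):

#include <stdio.h>

enum table_state { STATE_UNCHANGED, STATE_DORMANT, STATE_WAKEUP };

struct table { unsigned int flags; };
struct transaction { enum table_state state; unsigned int flags; };

#define TABLE_F_DORMANT 0x1

static void prepare(const struct table *t, struct transaction *tr,
		    unsigned int new_flags)
{
	if ((new_flags & TABLE_F_DORMANT) && !(t->flags & TABLE_F_DORMANT))
		tr->state = STATE_DORMANT;
	else if (!(new_flags & TABLE_F_DORMANT) && (t->flags & TABLE_F_DORMANT))
		tr->state = STATE_WAKEUP;	/* hooks would be registered here */
	tr->flags = new_flags;			/* table itself is left untouched */
}

static void commit(struct table *t, const struct transaction *tr)
{
	if (tr->state == STATE_DORMANT) {
		/* hooks would be unregistered here */
	}
	t->flags = tr->flags;	/* flags only change at commit time */
}

int main(void)
{
	struct table t = { .flags = 0 };
	struct transaction tr = { .state = STATE_UNCHANGED };

	prepare(&t, &tr, TABLE_F_DORMANT);
	printf("before commit: flags=%u\n", t.flags);
	commit(&t, &tr);
	printf("after commit:  flags=%u\n", t.flags);
	return 0;
}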

+ 170 - 0
target/linux/generic/backport-5.15/610-v5.13-11-net-resolve-forwarding-path-from-virtual-netdevice-a.patch

@@ -0,0 +1,170 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:32 +0100
+Subject: [PATCH] net: resolve forwarding path from virtual netdevice and
+ HW destination address
+
+This patch adds dev_fill_forward_path() which resolves the path to reach
+the real netdevice from the IP forwarding side. This function takes as
+input the netdevice and the destination hardware address, and it walks
+down the device stack calling .ndo_fill_forward_path() for each device
+until the real device is found.
+
+For instance, assuming the following topology:
+
+               IP forwarding
+              /             \
+           br0              eth0
+           / \
+       eth1  eth2
+        .
+        .
+        .
+       ethX
+ ab:cd:ef:ab:cd:ef
+
+where eth1 and eth2 are bridge ports and eth0 provides WAN connectivity.
+ethX is the interface in another box which is connected to the eth1
+bridge port.
+
+For packets going through IP forwarding to br0 whose destination MAC
+address is ab:cd:ef:ab:cd:ef, dev_fill_forward_path() provides the
+following path:
+
+	br0 -> eth1
+
+.ndo_fill_forward_path for br0 looks up the destination MAC address in
+the FDB to get the bridge port eth1.
+
+This information makes it possible to create a fast path that bypasses
+the classic bridge and IP forwarding paths, so packets go directly from
+the bridge port eth1 to eth0 (wan interface) and vice versa.
+
+             fast path
+      .------------------------.
+     /                          \
+    |           IP forwarding   |
+    |          /             \  \/
+    |       br0               eth0
+    .       / \
+     -> eth1  eth2
+        .
+        .
+        .
+       ethX
+ ab:cd:ef:ab:cd:ef
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -827,6 +827,27 @@ typedef u16 (*select_queue_fallback_t)(s
+ 				       struct sk_buff *skb,
+ 				       struct net_device *sb_dev);
+ 
++enum net_device_path_type {
++	DEV_PATH_ETHERNET = 0,
++};
++
++struct net_device_path {
++	enum net_device_path_type	type;
++	const struct net_device		*dev;
++};
++
++#define NET_DEVICE_PATH_STACK_MAX	5
++
++struct net_device_path_stack {
++	int			num_paths;
++	struct net_device_path	path[NET_DEVICE_PATH_STACK_MAX];
++};
++
++struct net_device_path_ctx {
++	const struct net_device *dev;
++	const u8		*daddr;
++};
++
+ enum tc_setup_type {
+ 	TC_SETUP_QDISC_MQPRIO,
+ 	TC_SETUP_CLSU32,
+@@ -1273,6 +1294,8 @@ struct netdev_net_notifier {
+  * struct net_device *(*ndo_get_peer_dev)(struct net_device *dev);
+  *	If a device is paired with a peer device, return the peer instance.
+  *	The caller must be under RCU read context.
++ * int (*ndo_fill_forward_path)(struct net_device_path_ctx *ctx, struct net_device_path *path);
++ *     Get the forwarding path to reach the real device from the HW destination address
+  */
+ struct net_device_ops {
+ 	int			(*ndo_init)(struct net_device *dev);
+@@ -1481,6 +1504,8 @@ struct net_device_ops {
+ 	int			(*ndo_tunnel_ctl)(struct net_device *dev,
+ 						  struct ip_tunnel_parm *p, int cmd);
+ 	struct net_device *	(*ndo_get_peer_dev)(struct net_device *dev);
++	int                     (*ndo_fill_forward_path)(struct net_device_path_ctx *ctx,
++                                                         struct net_device_path *path);
+ };
+ 
+ /**
+@@ -2828,6 +2853,8 @@ void dev_remove_offload(struct packet_of
+ 
+ int dev_get_iflink(const struct net_device *dev);
+ int dev_fill_metadata_dst(struct net_device *dev, struct sk_buff *skb);
++int dev_fill_forward_path(const struct net_device *dev, const u8 *daddr,
++			  struct net_device_path_stack *stack);
+ struct net_device *__dev_get_by_flags(struct net *net, unsigned short flags,
+ 				      unsigned short mask);
+ struct net_device *dev_get_by_name(struct net *net, const char *name);
+--- a/net/core/dev.c
++++ b/net/core/dev.c
+@@ -847,6 +847,52 @@ int dev_fill_metadata_dst(struct net_dev
+ }
+ EXPORT_SYMBOL_GPL(dev_fill_metadata_dst);
+ 
++static struct net_device_path *dev_fwd_path(struct net_device_path_stack *stack)
++{
++	int k = stack->num_paths++;
++
++	if (WARN_ON_ONCE(k >= NET_DEVICE_PATH_STACK_MAX))
++		return NULL;
++
++	return &stack->path[k];
++}
++
++int dev_fill_forward_path(const struct net_device *dev, const u8 *daddr,
++			  struct net_device_path_stack *stack)
++{
++	const struct net_device *last_dev;
++	struct net_device_path_ctx ctx = {
++		.dev	= dev,
++		.daddr	= daddr,
++	};
++	struct net_device_path *path;
++	int ret = 0;
++
++	stack->num_paths = 0;
++	while (ctx.dev && ctx.dev->netdev_ops->ndo_fill_forward_path) {
++		last_dev = ctx.dev;
++		path = dev_fwd_path(stack);
++		if (!path)
++			return -1;
++
++		memset(path, 0, sizeof(struct net_device_path));
++		ret = ctx.dev->netdev_ops->ndo_fill_forward_path(&ctx, path);
++		if (ret < 0)
++			return -1;
++
++		if (WARN_ON_ONCE(last_dev == ctx.dev))
++			return -1;
++	}
++	path = dev_fwd_path(stack);
++	if (!path)
++		return -1;
++	path->type = DEV_PATH_ETHERNET;
++	path->dev = ctx.dev;
++
++	return ret;
++}
++EXPORT_SYMBOL_GPL(dev_fill_forward_path);
++
+ /**
+  *	__dev_get_by_name	- find a device by its name
+  *	@net: the applicable net namespace
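
To make the walk easier to picture, here is a self-contained user-space model of the same idea: each virtual device appends one path entry and redirects the lookup context to its lower device, and the loop ends at the first device without a fill callback, which becomes the final Ethernet entry. The names loosely mirror the patch, but nothing below is kernel code:

#include <stdio.h>

#define PATH_STACK_MAX 5

struct device;

struct path_ctx {
	const struct device *dev;
	const unsigned char *daddr;
};

struct path_entry {
	const struct device *dev;
};

struct device {
	const char *name;
	const struct device *lower;	/* e.g. br0 -> eth1, eth0.100 -> eth0 */
	int (*fill)(struct path_ctx *ctx, struct path_entry *entry);
};

static int generic_fill(struct path_ctx *ctx, struct path_entry *entry)
{
	entry->dev = ctx->dev;
	ctx->dev = ctx->dev->lower;	/* descend one layer */
	return 0;
}

static int fill_forward_path(const struct device *dev, const unsigned char *daddr,
			     struct path_entry *stack, int *num)
{
	struct path_ctx ctx = { .dev = dev, .daddr = daddr };

	*num = 0;
	while (ctx.dev && ctx.dev->fill) {
		if (*num >= PATH_STACK_MAX)
			return -1;
		if (ctx.dev->fill(&ctx, &stack[(*num)++]) < 0)
			return -1;
	}
	if (*num >= PATH_STACK_MAX)
		return -1;
	stack[(*num)++].dev = ctx.dev;	/* the real, lowest device */
	return 0;
}

int main(void)
{
	struct device eth1 = { .name = "eth1" };
	struct device br0  = { .name = "br0", .lower = &eth1, .fill = generic_fill };
	struct path_entry stack[PATH_STACK_MAX];
	unsigned char daddr[6] = { 0xab, 0xcd, 0xef, 0xab, 0xcd, 0xef };
	int i, num;

	if (fill_forward_path(&br0, daddr, stack, &num) == 0)
		for (i = 0; i < num; i++)
			printf("path[%d] = %s\n", i, stack[i].dev->name);
	return 0;
}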

+ 80 - 0
target/linux/generic/backport-5.15/610-v5.13-12-net-8021q-resolve-forwarding-path-for-vlan-devices.patch

@@ -0,0 +1,80 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:33 +0100
+Subject: [PATCH] net: 8021q: resolve forwarding path for vlan devices
+
+Add .ndo_fill_forward_path for vlan devices.
+
+For instance, assuming the following topology:
+
+                   IP forwarding
+                  /             \
+            eth0.100             eth0
+            |
+            eth0
+            .
+            .
+            .
+           ethX
+     ab:cd:ef:ab:cd:ef
+
+For packets going through IP forwarding to eth0.100 whose destination
+MAC address is ab:cd:ef:ab:cd:ef, dev_fill_forward_path() provides the
+following path:
+
+        eth0.100 -> eth0
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -829,11 +829,18 @@ typedef u16 (*select_queue_fallback_t)(s
+ 
+ enum net_device_path_type {
+ 	DEV_PATH_ETHERNET = 0,
++	DEV_PATH_VLAN,
+ };
+ 
+ struct net_device_path {
+ 	enum net_device_path_type	type;
+ 	const struct net_device		*dev;
++	union {
++		struct {
++			u16		id;
++			__be16		proto;
++		} encap;
++	};
+ };
+ 
+ #define NET_DEVICE_PATH_STACK_MAX	5
+--- a/net/8021q/vlan_dev.c
++++ b/net/8021q/vlan_dev.c
+@@ -770,6 +770,20 @@ static int vlan_dev_get_iflink(const str
+ 	return real_dev->ifindex;
+ }
+ 
++static int vlan_dev_fill_forward_path(struct net_device_path_ctx *ctx,
++				      struct net_device_path *path)
++{
++	struct vlan_dev_priv *vlan = vlan_dev_priv(ctx->dev);
++
++	path->type = DEV_PATH_VLAN;
++	path->encap.id = vlan->vlan_id;
++	path->encap.proto = vlan->vlan_proto;
++	path->dev = ctx->dev;
++	ctx->dev = vlan->real_dev;
++
++	return 0;
++}
++
+ static const struct ethtool_ops vlan_ethtool_ops = {
+ 	.get_link_ksettings	= vlan_ethtool_get_link_ksettings,
+ 	.get_drvinfo	        = vlan_ethtool_get_drvinfo,
+@@ -808,6 +822,7 @@ static const struct net_device_ops vlan_
+ #endif
+ 	.ndo_fix_features	= vlan_dev_fix_features,
+ 	.ndo_get_iflink		= vlan_dev_get_iflink,
++	.ndo_fill_forward_path	= vlan_dev_fill_forward_path,
+ };
+ 
+ static void vlan_dev_free(struct net_device *dev)

+ 62 - 0
target/linux/generic/backport-5.15/610-v5.13-13-net-bridge-resolve-forwarding-path-for-bridge-device.patch

@@ -0,0 +1,62 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:34 +0100
+Subject: [PATCH] net: bridge: resolve forwarding path for bridge devices
+
+Add .ndo_fill_forward_path for bridge devices.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -830,6 +830,7 @@ typedef u16 (*select_queue_fallback_t)(s
+ enum net_device_path_type {
+ 	DEV_PATH_ETHERNET = 0,
+ 	DEV_PATH_VLAN,
++	DEV_PATH_BRIDGE,
+ };
+ 
+ struct net_device_path {
+--- a/net/bridge/br_device.c
++++ b/net/bridge/br_device.c
+@@ -398,6 +398,32 @@ static int br_del_slave(struct net_devic
+ 	return br_del_if(br, slave_dev);
+ }
+ 
++static int br_fill_forward_path(struct net_device_path_ctx *ctx,
++				struct net_device_path *path)
++{
++	struct net_bridge_fdb_entry *f;
++	struct net_bridge_port *dst;
++	struct net_bridge *br;
++
++	if (netif_is_bridge_port(ctx->dev))
++		return -1;
++
++	br = netdev_priv(ctx->dev);
++	f = br_fdb_find_rcu(br, ctx->daddr, 0);
++	if (!f || !f->dst)
++		return -1;
++
++	dst = READ_ONCE(f->dst);
++	if (!dst)
++		return -1;
++
++	path->type = DEV_PATH_BRIDGE;
++	path->dev = dst->br->dev;
++	ctx->dev = dst->dev;
++
++	return 0;
++}
++
+ static const struct ethtool_ops br_ethtool_ops = {
+ 	.get_drvinfo		 = br_getinfo,
+ 	.get_link		 = ethtool_op_get_link,
+@@ -432,6 +458,7 @@ static const struct net_device_ops br_ne
+ 	.ndo_bridge_setlink	 = br_setlink,
+ 	.ndo_bridge_dellink	 = br_dellink,
+ 	.ndo_features_check	 = passthru_features_check,
++	.ndo_fill_forward_path	 = br_fill_forward_path,
+ };
+ 
+ static struct device_type br_type = {
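
The bridge step boils down to: look the destination MAC up in the FDB and continue the walk on the port device it points at, bailing out to the slow path when the address is unknown. A tiny standalone sketch of that lookup (linear search over a plain array; the kernel uses br_fdb_find_rcu() under RCU):

#include <stdio.h>
#include <string.h>

struct device { const char *name; };

struct fdb_entry {
	unsigned char addr[6];
	const struct device *port_dev;
};

static const struct device *fdb_lookup(const struct fdb_entry *fdb, int n,
				       const unsigned char *daddr)
{
	for (int i = 0; i < n; i++)
		if (!memcmp(fdb[i].addr, daddr, 6))
			return fdb[i].port_dev;
	return NULL;	/* unknown MAC: give up, use the slow path */
}

int main(void)
{
	struct device eth1 = { "eth1" };
	struct fdb_entry fdb[] = {
		{ { 0xab, 0xcd, 0xef, 0xab, 0xcd, 0xef }, &eth1 },
	};
	unsigned char daddr[6] = { 0xab, 0xcd, 0xef, 0xab, 0xcd, 0xef };
	const struct device *dst = fdb_lookup(fdb, 1, daddr);

	printf("bridge port: %s\n", dst ? dst->name : "(none)");
	return 0;
}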

+ 207 - 0
target/linux/generic/backport-5.15/610-v5.13-14-net-bridge-resolve-forwarding-path-for-VLAN-tag-acti.patch

@@ -0,0 +1,207 @@
+From: Felix Fietkau <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:35 +0100
+Subject: [PATCH] net: bridge: resolve forwarding path for VLAN tag
+ actions in bridge devices
+
+Depending on the VLAN settings of the bridge and the port, the bridge can
+either add or remove a tag. When vlan filtering is enabled, the fdb lookup
+also needs to know the VLAN tag/proto for the destination address.
+To provide this, keep track of the stack of VLAN tags for the path in the
+lookup context.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -841,10 +841,20 @@ struct net_device_path {
+ 			u16		id;
+ 			__be16		proto;
+ 		} encap;
++		struct {
++			enum {
++				DEV_PATH_BR_VLAN_KEEP,
++				DEV_PATH_BR_VLAN_TAG,
++				DEV_PATH_BR_VLAN_UNTAG,
++			}		vlan_mode;
++			u16		vlan_id;
++			__be16		vlan_proto;
++		} bridge;
+ 	};
+ };
+ 
+ #define NET_DEVICE_PATH_STACK_MAX	5
++#define NET_DEVICE_PATH_VLAN_MAX	2
+ 
+ struct net_device_path_stack {
+ 	int			num_paths;
+@@ -854,6 +864,12 @@ struct net_device_path_stack {
+ struct net_device_path_ctx {
+ 	const struct net_device *dev;
+ 	const u8		*daddr;
++
++	int			num_vlans;
++	struct {
++		u16		id;
++		__be16		proto;
++	} vlan[NET_DEVICE_PATH_VLAN_MAX];
+ };
+ 
+ enum tc_setup_type {
+--- a/net/8021q/vlan_dev.c
++++ b/net/8021q/vlan_dev.c
+@@ -780,6 +780,12 @@ static int vlan_dev_fill_forward_path(st
+ 	path->encap.proto = vlan->vlan_proto;
+ 	path->dev = ctx->dev;
+ 	ctx->dev = vlan->real_dev;
++	if (ctx->num_vlans >= ARRAY_SIZE(ctx->vlan))
++		return -ENOSPC;
++
++	ctx->vlan[ctx->num_vlans].id = vlan->vlan_id;
++	ctx->vlan[ctx->num_vlans].proto = vlan->vlan_proto;
++	ctx->num_vlans++;
+ 
+ 	return 0;
+ }
+--- a/net/bridge/br_device.c
++++ b/net/bridge/br_device.c
+@@ -409,7 +409,10 @@ static int br_fill_forward_path(struct n
+ 		return -1;
+ 
+ 	br = netdev_priv(ctx->dev);
+-	f = br_fdb_find_rcu(br, ctx->daddr, 0);
++
++	br_vlan_fill_forward_path_pvid(br, ctx, path);
++
++	f = br_fdb_find_rcu(br, ctx->daddr, path->bridge.vlan_id);
+ 	if (!f || !f->dst)
+ 		return -1;
+ 
+@@ -417,10 +420,28 @@ static int br_fill_forward_path(struct n
+ 	if (!dst)
+ 		return -1;
+ 
++	if (br_vlan_fill_forward_path_mode(br, dst, path))
++		return -1;
++
+ 	path->type = DEV_PATH_BRIDGE;
+ 	path->dev = dst->br->dev;
+ 	ctx->dev = dst->dev;
+ 
++	switch (path->bridge.vlan_mode) {
++	case DEV_PATH_BR_VLAN_TAG:
++		if (ctx->num_vlans >= ARRAY_SIZE(ctx->vlan))
++			return -ENOSPC;
++		ctx->vlan[ctx->num_vlans].id = path->bridge.vlan_id;
++		ctx->vlan[ctx->num_vlans].proto = path->bridge.vlan_proto;
++		ctx->num_vlans++;
++		break;
++	case DEV_PATH_BR_VLAN_UNTAG:
++		ctx->num_vlans--;
++		break;
++	case DEV_PATH_BR_VLAN_KEEP:
++		break;
++	}
++
+ 	return 0;
+ }
+ 
+--- a/net/bridge/br_private.h
++++ b/net/bridge/br_private.h
+@@ -1093,6 +1093,13 @@ void br_vlan_notify(const struct net_bri
+ bool br_vlan_can_enter_range(const struct net_bridge_vlan *v_curr,
+ 			     const struct net_bridge_vlan *range_end);
+ 
++void br_vlan_fill_forward_path_pvid(struct net_bridge *br,
++				    struct net_device_path_ctx *ctx,
++				    struct net_device_path *path);
++int br_vlan_fill_forward_path_mode(struct net_bridge *br,
++				   struct net_bridge_port *dst,
++				   struct net_device_path *path);
++
+ static inline struct net_bridge_vlan_group *br_vlan_group(
+ 					const struct net_bridge *br)
+ {
+@@ -1250,6 +1257,19 @@ static inline int nbp_get_num_vlan_infos
+ {
+ 	return 0;
+ }
++
++static inline void br_vlan_fill_forward_path_pvid(struct net_bridge *br,
++						  struct net_device_path_ctx *ctx,
++						  struct net_device_path *path)
++{
++}
++
++static inline int br_vlan_fill_forward_path_mode(struct net_bridge *br,
++						 struct net_bridge_port *dst,
++						 struct net_device_path *path)
++{
++	return 0;
++}
+ 
+ static inline struct net_bridge_vlan_group *br_vlan_group(
+ 					const struct net_bridge *br)
+--- a/net/bridge/br_vlan.c
++++ b/net/bridge/br_vlan.c
+@@ -1327,6 +1327,59 @@ int br_vlan_get_pvid_rcu(const struct ne
+ }
+ EXPORT_SYMBOL_GPL(br_vlan_get_pvid_rcu);
+ 
++void br_vlan_fill_forward_path_pvid(struct net_bridge *br,
++				    struct net_device_path_ctx *ctx,
++				    struct net_device_path *path)
++{
++	struct net_bridge_vlan_group *vg;
++	int idx = ctx->num_vlans - 1;
++	u16 vid;
++
++	path->bridge.vlan_mode = DEV_PATH_BR_VLAN_KEEP;
++
++	if (!br_opt_get(br, BROPT_VLAN_ENABLED))
++		return;
++
++	vg = br_vlan_group(br);
++
++	if (idx >= 0 &&
++	    ctx->vlan[idx].proto == br->vlan_proto) {
++		vid = ctx->vlan[idx].id;
++	} else {
++		path->bridge.vlan_mode = DEV_PATH_BR_VLAN_TAG;
++		vid = br_get_pvid(vg);
++	}
++
++	path->bridge.vlan_id = vid;
++	path->bridge.vlan_proto = br->vlan_proto;
++}
++
++int br_vlan_fill_forward_path_mode(struct net_bridge *br,
++				   struct net_bridge_port *dst,
++				   struct net_device_path *path)
++{
++	struct net_bridge_vlan_group *vg;
++	struct net_bridge_vlan *v;
++
++	if (!br_opt_get(br, BROPT_VLAN_ENABLED))
++		return 0;
++
++	vg = nbp_vlan_group_rcu(dst);
++	v = br_vlan_find(vg, path->bridge.vlan_id);
++	if (!v || !br_vlan_should_use(v))
++		return -EINVAL;
++
++	if (!(v->flags & BRIDGE_VLAN_INFO_UNTAGGED))
++		return 0;
++
++	if (path->bridge.vlan_mode == DEV_PATH_BR_VLAN_TAG)
++		path->bridge.vlan_mode = DEV_PATH_BR_VLAN_KEEP;
++	else
++		path->bridge.vlan_mode = DEV_PATH_BR_VLAN_UNTAG;
++
++	return 0;
++}
++
+ int br_vlan_get_info(const struct net_device *dev, u16 vid,
+ 		     struct bridge_vlan_info *p_vinfo)
+ {
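
The per-hop VLAN bookkeeping added here can be summarised as a small stack in the lookup context: tagging pushes an id/proto pair (bounded by NET_DEVICE_PATH_VLAN_MAX), untagging pops the pair a previous hop pushed, and "keep" leaves the stack alone. A standalone sketch with illustrative constants, not the kernel structures:

#include <stdio.h>

#define VLAN_MAX 2

enum vlan_mode { VLAN_KEEP, VLAN_TAG, VLAN_UNTAG };

struct vlan_ctx {
	int num_vlans;
	struct { unsigned short id, proto; } vlan[VLAN_MAX];
};

static int apply_vlan_mode(struct vlan_ctx *ctx, enum vlan_mode mode,
			   unsigned short id, unsigned short proto)
{
	switch (mode) {
	case VLAN_TAG:
		if (ctx->num_vlans >= VLAN_MAX)
			return -1;	/* -ENOSPC in the kernel version */
		ctx->vlan[ctx->num_vlans].id = id;
		ctx->vlan[ctx->num_vlans].proto = proto;
		ctx->num_vlans++;
		break;
	case VLAN_UNTAG:
		/* caller guarantees a matching tag was pushed earlier */
		ctx->num_vlans--;
		break;
	case VLAN_KEEP:
		break;
	}
	return 0;
}

int main(void)
{
	struct vlan_ctx ctx = { 0 };

	apply_vlan_mode(&ctx, VLAN_TAG, 100, 0x8100);	/* bridge adds a tag */
	apply_vlan_mode(&ctx, VLAN_UNTAG, 0, 0);	/* egress port untags */
	printf("vlans on stack: %d\n", ctx.num_vlans);
	return 0;
}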

+ 113 - 0
target/linux/generic/backport-5.15/610-v5.13-15-net-ppp-resolve-forwarding-path-for-bridge-pppoe-dev.patch

@@ -0,0 +1,113 @@
+From: Felix Fietkau <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:36 +0100
+Subject: [PATCH] net: ppp: resolve forwarding path for bridge pppoe
+ devices
+
+Pass on the PPPoE session ID, destination hardware address and the real
+device.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/drivers/net/ppp/ppp_generic.c
++++ b/drivers/net/ppp/ppp_generic.c
+@@ -1466,12 +1466,34 @@ static void ppp_dev_priv_destructor(stru
+ 		ppp_destroy_interface(ppp);
+ }
+ 
++static int ppp_fill_forward_path(struct net_device_path_ctx *ctx,
++				 struct net_device_path *path)
++{
++	struct ppp *ppp = netdev_priv(ctx->dev);
++	struct ppp_channel *chan;
++	struct channel *pch;
++
++	if (ppp->flags & SC_MULTILINK)
++		return -EOPNOTSUPP;
++
++	if (list_empty(&ppp->channels))
++		return -ENODEV;
++
++	pch = list_first_entry(&ppp->channels, struct channel, clist);
++	chan = pch->chan;
++	if (!chan->ops->fill_forward_path)
++		return -EOPNOTSUPP;
++
++	return chan->ops->fill_forward_path(ctx, path, chan);
++}
++
+ static const struct net_device_ops ppp_netdev_ops = {
+ 	.ndo_init	 = ppp_dev_init,
+ 	.ndo_uninit      = ppp_dev_uninit,
+ 	.ndo_start_xmit  = ppp_start_xmit,
+ 	.ndo_do_ioctl    = ppp_net_ioctl,
+ 	.ndo_get_stats64 = ppp_get_stats64,
++	.ndo_fill_forward_path = ppp_fill_forward_path,
+ };
+ 
+ static struct device_type ppp_type = {
+--- a/drivers/net/ppp/pppoe.c
++++ b/drivers/net/ppp/pppoe.c
+@@ -972,8 +972,31 @@ static int pppoe_xmit(struct ppp_channel
+ 	return __pppoe_xmit(sk, skb);
+ }
+ 
++static int pppoe_fill_forward_path(struct net_device_path_ctx *ctx,
++				   struct net_device_path *path,
++				   const struct ppp_channel *chan)
++{
++	struct sock *sk = (struct sock *)chan->private;
++	struct pppox_sock *po = pppox_sk(sk);
++	struct net_device *dev = po->pppoe_dev;
++
++	if (sock_flag(sk, SOCK_DEAD) ||
++	    !(sk->sk_state & PPPOX_CONNECTED) || !dev)
++		return -1;
++
++	path->type = DEV_PATH_PPPOE;
++	path->encap.proto = htons(ETH_P_PPP_SES);
++	path->encap.id = be16_to_cpu(po->num);
++	memcpy(path->encap.h_dest, po->pppoe_pa.remote, ETH_ALEN);
++	path->dev = ctx->dev;
++	ctx->dev = dev;
++
++	return 0;
++}
++
+ static const struct ppp_channel_ops pppoe_chan_ops = {
+ 	.start_xmit = pppoe_xmit,
++	.fill_forward_path = pppoe_fill_forward_path,
+ };
+ 
+ static int pppoe_recvmsg(struct socket *sock, struct msghdr *m,
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -831,6 +831,7 @@ enum net_device_path_type {
+ 	DEV_PATH_ETHERNET = 0,
+ 	DEV_PATH_VLAN,
+ 	DEV_PATH_BRIDGE,
++	DEV_PATH_PPPOE,
+ };
+ 
+ struct net_device_path {
+@@ -840,6 +841,7 @@ struct net_device_path {
+ 		struct {
+ 			u16		id;
+ 			__be16		proto;
++			u8		h_dest[ETH_ALEN];
+ 		} encap;
+ 		struct {
+ 			enum {
+--- a/include/linux/ppp_channel.h
++++ b/include/linux/ppp_channel.h
+@@ -28,6 +28,9 @@ struct ppp_channel_ops {
+ 	int	(*start_xmit)(struct ppp_channel *, struct sk_buff *);
+ 	/* Handle an ioctl call that has come in via /dev/ppp. */
+ 	int	(*ioctl)(struct ppp_channel *, unsigned int, unsigned long);
++	int	(*fill_forward_path)(struct net_device_path_ctx *,
++				     struct net_device_path *,
++				     const struct ppp_channel *);
+ };
+ 
+ struct ppp_channel {

+ 63 - 0
target/linux/generic/backport-5.15/610-v5.13-16-net-dsa-resolve-forwarding-path-for-dsa-slave-ports.patch

@@ -0,0 +1,63 @@
+From: Felix Fietkau <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:37 +0100
+Subject: [PATCH] net: dsa: resolve forwarding path for dsa slave ports
+
+Add .ndo_fill_forward_path for dsa slave port devices.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -832,6 +832,7 @@ enum net_device_path_type {
+ 	DEV_PATH_VLAN,
+ 	DEV_PATH_BRIDGE,
+ 	DEV_PATH_PPPOE,
++	DEV_PATH_DSA,
+ };
+ 
+ struct net_device_path {
+@@ -852,6 +853,10 @@ struct net_device_path {
+ 			u16		vlan_id;
+ 			__be16		vlan_proto;
+ 		} bridge;
++		struct {
++			int port;
++			u16 proto;
++		} dsa;
+ 	};
+ };
+ 
+--- a/net/dsa/slave.c
++++ b/net/dsa/slave.c
+@@ -1619,6 +1619,21 @@ static struct devlink_port *dsa_slave_ge
+ 	return dp->ds->devlink ? &dp->devlink_port : NULL;
+ }
+ 
++static int dsa_slave_fill_forward_path(struct net_device_path_ctx *ctx,
++				       struct net_device_path *path)
++{
++	struct dsa_port *dp = dsa_slave_to_port(ctx->dev);
++	struct dsa_port *cpu_dp = dp->cpu_dp;
++
++	path->dev = ctx->dev;
++	path->type = DEV_PATH_DSA;
++	path->dsa.proto = cpu_dp->tag_ops->proto;
++	path->dsa.port = dp->index;
++	ctx->dev = cpu_dp->master;
++
++	return 0;
++}
++
+ static const struct net_device_ops dsa_slave_netdev_ops = {
+ 	.ndo_open	 	= dsa_slave_open,
+ 	.ndo_stop		= dsa_slave_close,
+@@ -1644,6 +1659,7 @@ static const struct net_device_ops dsa_s
+ 	.ndo_vlan_rx_kill_vid	= dsa_slave_vlan_rx_kill_vid,
+ 	.ndo_get_devlink_port	= dsa_slave_get_devlink_port,
+ 	.ndo_change_mtu		= dsa_slave_change_mtu,
++	.ndo_fill_forward_path	= dsa_slave_fill_forward_path,
+ };
+ 
+ static struct device_type dsa_type = {

+ 147 - 0
target/linux/generic/backport-5.15/610-v5.13-17-netfilter-flowtable-add-xmit-path-types.patch

@@ -0,0 +1,147 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:38 +0100
+Subject: [PATCH] netfilter: flowtable: add xmit path types
+
+Add the xmit_type field that defines the two supported xmit paths in the
+flowtable data plane, which are the neighbour and the xfrm xmit paths.
+This patch prepares for new flowtable xmit path types to come.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -89,6 +89,11 @@ enum flow_offload_tuple_dir {
+ };
+ #define FLOW_OFFLOAD_DIR_MAX	IP_CT_DIR_MAX
+ 
++enum flow_offload_xmit_type {
++	FLOW_OFFLOAD_XMIT_NEIGH		= 0,
++	FLOW_OFFLOAD_XMIT_XFRM,
++};
++
+ struct flow_offload_tuple {
+ 	union {
+ 		struct in_addr		src_v4;
+@@ -111,7 +116,8 @@ struct flow_offload_tuple {
+ 	/* All members above are keys for lookups, see flow_offload_hash(). */
+ 	struct { }			__hash;
+ 
+-	u8				dir;
++	u8				dir:6,
++					xmit_type:2;
+ 
+ 	u16				mtu;
+ 
+@@ -157,7 +163,8 @@ static inline __s32 nf_flow_timeout_delt
+ 
+ struct nf_flow_route {
+ 	struct {
+-		struct dst_entry	*dst;
++		struct dst_entry		*dst;
++		enum flow_offload_xmit_type	xmit_type;
+ 	} tuple[FLOW_OFFLOAD_DIR_MAX];
+ };
+ 
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -95,6 +95,7 @@ static int flow_offload_fill_route(struc
+ 	}
+ 
+ 	flow_tuple->iifidx = other_dst->dev->ifindex;
++	flow_tuple->xmit_type = route->tuple[dir].xmit_type;
+ 	flow_tuple->dst_cache = dst;
+ 
+ 	return 0;
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -235,8 +235,6 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 
+ 	dir = tuplehash->tuple.dir;
+ 	flow = container_of(tuplehash, struct flow_offload, tuplehash[dir]);
+-	rt = (struct rtable *)flow->tuplehash[dir].tuple.dst_cache;
+-	outdev = rt->dst.dev;
+ 
+ 	if (unlikely(nf_flow_exceeds_mtu(skb, flow->tuplehash[dir].tuple.mtu)))
+ 		return NF_ACCEPT;
+@@ -265,13 +263,16 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	if (flow_table->flags & NF_FLOWTABLE_COUNTER)
+ 		nf_ct_acct_update(flow->ct, tuplehash->tuple.dir, skb->len);
+ 
+-	if (unlikely(dst_xfrm(&rt->dst))) {
++	rt = (struct rtable *)tuplehash->tuple.dst_cache;
++
++	if (unlikely(tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM)) {
+ 		memset(skb->cb, 0, sizeof(struct inet_skb_parm));
+ 		IPCB(skb)->iif = skb->dev->ifindex;
+ 		IPCB(skb)->flags = IPSKB_FORWARDED;
+ 		return nf_flow_xmit_xfrm(skb, state, &rt->dst);
+ 	}
+ 
++	outdev = rt->dst.dev;
+ 	skb->dev = outdev;
+ 	nexthop = rt_nexthop(rt, flow->tuplehash[!dir].tuple.src_v4.s_addr);
+ 	skb_dst_set_noref(skb, &rt->dst);
+@@ -456,8 +457,6 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 
+ 	dir = tuplehash->tuple.dir;
+ 	flow = container_of(tuplehash, struct flow_offload, tuplehash[dir]);
+-	rt = (struct rt6_info *)flow->tuplehash[dir].tuple.dst_cache;
+-	outdev = rt->dst.dev;
+ 
+ 	if (unlikely(nf_flow_exceeds_mtu(skb, flow->tuplehash[dir].tuple.mtu)))
+ 		return NF_ACCEPT;
+@@ -485,13 +484,16 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 	if (flow_table->flags & NF_FLOWTABLE_COUNTER)
+ 		nf_ct_acct_update(flow->ct, tuplehash->tuple.dir, skb->len);
+ 
+-	if (unlikely(dst_xfrm(&rt->dst))) {
++	rt = (struct rt6_info *)tuplehash->tuple.dst_cache;
++
++	if (unlikely(tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM)) {
+ 		memset(skb->cb, 0, sizeof(struct inet6_skb_parm));
+ 		IP6CB(skb)->iif = skb->dev->ifindex;
+ 		IP6CB(skb)->flags = IP6SKB_FORWARDED;
+ 		return nf_flow_xmit_xfrm(skb, state, &rt->dst);
+ 	}
+ 
++	outdev = rt->dst.dev;
+ 	skb->dev = outdev;
+ 	nexthop = rt6_nexthop(rt, &flow->tuplehash[!dir].tuple.src_v6);
+ 	skb_dst_set_noref(skb, &rt->dst);
+--- a/net/netfilter/nft_flow_offload.c
++++ b/net/netfilter/nft_flow_offload.c
+@@ -19,6 +19,22 @@ struct nft_flow_offload {
+ 	struct nft_flowtable	*flowtable;
+ };
+ 
++static enum flow_offload_xmit_type nft_xmit_type(struct dst_entry *dst)
++{
++	if (dst_xfrm(dst))
++		return FLOW_OFFLOAD_XMIT_XFRM;
++
++	return FLOW_OFFLOAD_XMIT_NEIGH;
++}
++
++static void nft_default_forward_path(struct nf_flow_route *route,
++				     struct dst_entry *dst_cache,
++				     enum ip_conntrack_dir dir)
++{
++	route->tuple[dir].dst		= dst_cache;
++	route->tuple[dir].xmit_type	= nft_xmit_type(dst_cache);
++}
++
+ static int nft_flow_route(const struct nft_pktinfo *pkt,
+ 			  const struct nf_conn *ct,
+ 			  struct nf_flow_route *route,
+@@ -44,8 +60,8 @@ static int nft_flow_route(const struct n
+ 	if (!other_dst)
+ 		return -ENOENT;
+ 
+-	route->tuple[dir].dst		= this_dst;
+-	route->tuple[!dir].dst		= other_dst;
++	nft_default_forward_path(route, this_dst, dir);
++	nft_default_forward_path(route, other_dst, !dir);
+ 
+ 	return 0;
+ }
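
The selection logic that feeds the new field is small: at flow-creation time each direction's route is classified as either the xfrm or the neighbour transmit path and stored next to the cached dst. A user-space sketch of that classification (dst_has_xfrm() is an illustrative stand-in for dst_xfrm(); nothing here is the kernel API):

#include <stdbool.h>
#include <stdio.h>

enum xmit_type { XMIT_NEIGH, XMIT_XFRM };

struct dst { bool has_xfrm; };
struct route_tuple { const struct dst *dst; enum xmit_type xmit_type; };

static enum xmit_type pick_xmit_type(const struct dst *dst)
{
	return dst->has_xfrm ? XMIT_XFRM : XMIT_NEIGH;
}

static void fill_default_forward_path(struct route_tuple *tuple,
				      const struct dst *dst)
{
	tuple->dst = dst;
	tuple->xmit_type = pick_xmit_type(dst);
}

int main(void)
{
	struct dst plain = { .has_xfrm = false }, ipsec = { .has_xfrm = true };
	struct route_tuple dir[2];

	fill_default_forward_path(&dir[0], &plain);	/* original direction */
	fill_default_forward_path(&dir[1], &ipsec);	/* reply direction */
	printf("orig=%d reply=%d\n", dir[0].xmit_type, dir[1].xmit_type);
	return 0;
}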

+ 191 - 0
target/linux/generic/backport-5.15/610-v5.13-18-netfilter-flowtable-use-dev_fill_forward_path-to-obt.patch

@@ -0,0 +1,191 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:39 +0100
+Subject: [PATCH] netfilter: flowtable: use dev_fill_forward_path() to
+ obtain ingress device
+
+The ingress device in the tuple is obtained from the route in the reply
+direction. Use dev_fill_forward_path() instead to get the real ingress
+device for this flow.
+
+Fall back to using the ingress device that the IP forwarding route
+provides if:
+
+- dev_fill_forward_path() finds no real ingress device.
+- the ingress device that is obtained is not part of the flowtable
+  devices.
+- this route has an xfrm policy.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -164,6 +164,9 @@ static inline __s32 nf_flow_timeout_delt
+ struct nf_flow_route {
+ 	struct {
+ 		struct dst_entry		*dst;
++		struct {
++			u32			ifindex;
++		} in;
+ 		enum flow_offload_xmit_type	xmit_type;
+ 	} tuple[FLOW_OFFLOAD_DIR_MAX];
+ };
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -79,7 +79,6 @@ static int flow_offload_fill_route(struc
+ 				   enum flow_offload_tuple_dir dir)
+ {
+ 	struct flow_offload_tuple *flow_tuple = &flow->tuplehash[dir].tuple;
+-	struct dst_entry *other_dst = route->tuple[!dir].dst;
+ 	struct dst_entry *dst = route->tuple[dir].dst;
+ 
+ 	if (!dst_hold_safe(route->tuple[dir].dst))
+@@ -94,7 +93,7 @@ static int flow_offload_fill_route(struc
+ 		break;
+ 	}
+ 
+-	flow_tuple->iifidx = other_dst->dev->ifindex;
++	flow_tuple->iifidx = route->tuple[dir].in.ifindex;
+ 	flow_tuple->xmit_type = route->tuple[dir].xmit_type;
+ 	flow_tuple->dst_cache = dst;
+ 
+--- a/net/netfilter/nft_flow_offload.c
++++ b/net/netfilter/nft_flow_offload.c
+@@ -31,14 +31,104 @@ static void nft_default_forward_path(str
+ 				     struct dst_entry *dst_cache,
+ 				     enum ip_conntrack_dir dir)
+ {
++	route->tuple[!dir].in.ifindex	= dst_cache->dev->ifindex;
+ 	route->tuple[dir].dst		= dst_cache;
+ 	route->tuple[dir].xmit_type	= nft_xmit_type(dst_cache);
+ }
+ 
++static int nft_dev_fill_forward_path(const struct nf_flow_route *route,
++				     const struct dst_entry *dst_cache,
++				     const struct nf_conn *ct,
++				     enum ip_conntrack_dir dir,
++				     struct net_device_path_stack *stack)
++{
++	const void *daddr = &ct->tuplehash[!dir].tuple.src.u3;
++	struct net_device *dev = dst_cache->dev;
++	unsigned char ha[ETH_ALEN];
++	struct neighbour *n;
++	u8 nud_state;
++
++	n = dst_neigh_lookup(dst_cache, daddr);
++	if (!n)
++		return -1;
++
++	read_lock_bh(&n->lock);
++	nud_state = n->nud_state;
++	ether_addr_copy(ha, n->ha);
++	read_unlock_bh(&n->lock);
++	neigh_release(n);
++
++	if (!(nud_state & NUD_VALID))
++		return -1;
++
++	return dev_fill_forward_path(dev, ha, stack);
++}
++
++struct nft_forward_info {
++	const struct net_device *indev;
++};
++
++static void nft_dev_path_info(const struct net_device_path_stack *stack,
++			      struct nft_forward_info *info)
++{
++	const struct net_device_path *path;
++	int i;
++
++	for (i = 0; i < stack->num_paths; i++) {
++		path = &stack->path[i];
++		switch (path->type) {
++		case DEV_PATH_ETHERNET:
++			info->indev = path->dev;
++			break;
++		case DEV_PATH_VLAN:
++		case DEV_PATH_BRIDGE:
++		default:
++			info->indev = NULL;
++			break;
++		}
++	}
++}
++
++static bool nft_flowtable_find_dev(const struct net_device *dev,
++				   struct nft_flowtable *ft)
++{
++	struct nft_hook *hook;
++	bool found = false;
++
++	list_for_each_entry_rcu(hook, &ft->hook_list, list) {
++		if (hook->ops.dev != dev)
++			continue;
++
++		found = true;
++		break;
++	}
++
++	return found;
++}
++
++static void nft_dev_forward_path(struct nf_flow_route *route,
++				 const struct nf_conn *ct,
++				 enum ip_conntrack_dir dir,
++				 struct nft_flowtable *ft)
++{
++	const struct dst_entry *dst = route->tuple[dir].dst;
++	struct net_device_path_stack stack;
++	struct nft_forward_info info = {};
++
++	if (nft_dev_fill_forward_path(route, dst, ct, dir, &stack) >= 0)
++		nft_dev_path_info(&stack, &info);
++
++	if (!info.indev || !nft_flowtable_find_dev(info.indev, ft))
++		return;
++
++	route->tuple[!dir].in.ifindex = info.indev->ifindex;
++}
++
+ static int nft_flow_route(const struct nft_pktinfo *pkt,
+ 			  const struct nf_conn *ct,
+ 			  struct nf_flow_route *route,
+-			  enum ip_conntrack_dir dir)
++			  enum ip_conntrack_dir dir,
++			  struct nft_flowtable *ft)
+ {
+ 	struct dst_entry *this_dst = skb_dst(pkt->skb);
+ 	struct dst_entry *other_dst = NULL;
+@@ -63,6 +153,12 @@ static int nft_flow_route(const struct n
+ 	nft_default_forward_path(route, this_dst, dir);
+ 	nft_default_forward_path(route, other_dst, !dir);
+ 
++	if (route->tuple[dir].xmit_type	== FLOW_OFFLOAD_XMIT_NEIGH &&
++	    route->tuple[!dir].xmit_type == FLOW_OFFLOAD_XMIT_NEIGH) {
++		nft_dev_forward_path(route, ct, dir, ft);
++		nft_dev_forward_path(route, ct, !dir, ft);
++	}
++
+ 	return 0;
+ }
+ 
+@@ -90,8 +186,8 @@ static void nft_flow_offload_eval(const
+ 	struct nft_flow_offload *priv = nft_expr_priv(expr);
+ 	struct nf_flowtable *flowtable = &priv->flowtable->data;
+ 	struct tcphdr _tcph, *tcph = NULL;
++	struct nf_flow_route route = {};
+ 	enum ip_conntrack_info ctinfo;
+-	struct nf_flow_route route;
+ 	struct flow_offload *flow;
+ 	enum ip_conntrack_dir dir;
+ 	struct nf_conn *ct;
+@@ -128,7 +224,7 @@ static void nft_flow_offload_eval(const
+ 		goto out;
+ 
+ 	dir = CTINFO2DIR(ctinfo);
+-	if (nft_flow_route(pkt, ct, &route, dir) < 0)
++	if (nft_flow_route(pkt, ct, &route, dir, priv->flowtable) < 0)
+ 		goto err_flow_route;
+ 
+ 	flow = flow_offload_alloc(ct);
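
Put together, the ingress-device choice reads as: try the forward-path walk first, and keep the route's own device whenever the walk fails or yields a device that is not attached to the flowtable. A rough user-space sketch of that decision (flowtable membership is modelled as a plain array lookup, and resolve_real_ingress() is a stand-in for the dev_fill_forward_path() call):

#include <stdbool.h>
#include <stdio.h>

struct device { const char *name; };

static bool flowtable_has_dev(const struct device *dev,
			      const struct device *const *hooks, int n)
{
	for (int i = 0; i < n; i++)
		if (hooks[i] == dev)
			return true;
	return false;
}

/* Stand-in for the forward-path walk: may fail and return NULL. */
static const struct device *resolve_real_ingress(const struct device *route_dev)
{
	(void)route_dev;
	return NULL;	/* pretend path resolution found nothing */
}

static const struct device *pick_ingress(const struct device *route_dev,
					 const struct device *const *hooks, int n)
{
	const struct device *real = resolve_real_ingress(route_dev);

	if (!real || !flowtable_has_dev(real, hooks, n))
		return route_dev;	/* fall back to the forwarding route */
	return real;
}

int main(void)
{
	struct device eth0 = { "eth0" }, br0 = { "br0" };
	const struct device *hooks[] = { &eth0 };

	printf("ingress = %s\n", pick_ingress(&br0, hooks, 1)->name);
	return 0;
}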

+ 374 - 0
target/linux/generic/backport-5.15/610-v5.13-19-netfilter-flowtable-use-dev_fill_forward_path-to-obt.patch

@@ -0,0 +1,374 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:40 +0100
+Subject: [PATCH] netfilter: flowtable: use dev_fill_forward_path() to
+ obtain egress device
+
+The egress device in the tuple is obtained from the route. Use
+dev_fill_forward_path() instead to provide the real egress device for
+this flow whenever it is available.
+
+The new FLOW_OFFLOAD_XMIT_DIRECT type uses dev_queue_xmit() to transmit
+ethernet frames. Cache the source and destination hardware addresses so
+that dev_queue_xmit() can be used to transfer packets.
+
+The FLOW_OFFLOAD_XMIT_DIRECT type replaces FLOW_OFFLOAD_XMIT_NEIGH if
+dev_fill_forward_path() finds a direct transmit path.
+
+In case of topology updates, if the peer is moved to a different bridge
+port, the connection will time out and the reconnect will result in a
+new entry with the correct path. Snooping fdb updates would allow stale
+flowtable entries to be cleaned up.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -92,6 +92,7 @@ enum flow_offload_tuple_dir {
+ enum flow_offload_xmit_type {
+ 	FLOW_OFFLOAD_XMIT_NEIGH		= 0,
+ 	FLOW_OFFLOAD_XMIT_XFRM,
++	FLOW_OFFLOAD_XMIT_DIRECT,
+ };
+ 
+ struct flow_offload_tuple {
+@@ -120,8 +121,14 @@ struct flow_offload_tuple {
+ 					xmit_type:2;
+ 
+ 	u16				mtu;
+-
+-	struct dst_entry		*dst_cache;
++	union {
++		struct dst_entry	*dst_cache;
++		struct {
++			u32		ifidx;
++			u8		h_source[ETH_ALEN];
++			u8		h_dest[ETH_ALEN];
++		} out;
++	};
+ };
+ 
+ struct flow_offload_tuple_rhash {
+@@ -167,6 +174,11 @@ struct nf_flow_route {
+ 		struct {
+ 			u32			ifindex;
+ 		} in;
++		struct {
++			u32			ifindex;
++			u8			h_source[ETH_ALEN];
++			u8			h_dest[ETH_ALEN];
++		} out;
+ 		enum flow_offload_xmit_type	xmit_type;
+ 	} tuple[FLOW_OFFLOAD_DIR_MAX];
+ };
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -81,9 +81,6 @@ static int flow_offload_fill_route(struc
+ 	struct flow_offload_tuple *flow_tuple = &flow->tuplehash[dir].tuple;
+ 	struct dst_entry *dst = route->tuple[dir].dst;
+ 
+-	if (!dst_hold_safe(route->tuple[dir].dst))
+-		return -1;
+-
+ 	switch (flow_tuple->l3proto) {
+ 	case NFPROTO_IPV4:
+ 		flow_tuple->mtu = ip_dst_mtu_maybe_forward(dst, true);
+@@ -94,12 +91,36 @@ static int flow_offload_fill_route(struc
+ 	}
+ 
+ 	flow_tuple->iifidx = route->tuple[dir].in.ifindex;
++
++	switch (route->tuple[dir].xmit_type) {
++	case FLOW_OFFLOAD_XMIT_DIRECT:
++		memcpy(flow_tuple->out.h_dest, route->tuple[dir].out.h_dest,
++		       ETH_ALEN);
++		memcpy(flow_tuple->out.h_source, route->tuple[dir].out.h_source,
++		       ETH_ALEN);
++		flow_tuple->out.ifidx = route->tuple[dir].out.ifindex;
++		break;
++	case FLOW_OFFLOAD_XMIT_XFRM:
++	case FLOW_OFFLOAD_XMIT_NEIGH:
++		if (!dst_hold_safe(route->tuple[dir].dst))
++			return -1;
++
++		flow_tuple->dst_cache = dst;
++		break;
++	}
+ 	flow_tuple->xmit_type = route->tuple[dir].xmit_type;
+-	flow_tuple->dst_cache = dst;
+ 
+ 	return 0;
+ }
+ 
++static void nft_flow_dst_release(struct flow_offload *flow,
++				 enum flow_offload_tuple_dir dir)
++{
++	if (flow->tuplehash[dir].tuple.xmit_type == FLOW_OFFLOAD_XMIT_NEIGH ||
++	    flow->tuplehash[dir].tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM)
++		dst_release(flow->tuplehash[dir].tuple.dst_cache);
++}
++
+ int flow_offload_route_init(struct flow_offload *flow,
+ 			    const struct nf_flow_route *route)
+ {
+@@ -118,7 +139,7 @@ int flow_offload_route_init(struct flow_
+ 	return 0;
+ 
+ err_route_reply:
+-	dst_release(route->tuple[FLOW_OFFLOAD_DIR_ORIGINAL].dst);
++	nft_flow_dst_release(flow, FLOW_OFFLOAD_DIR_ORIGINAL);
+ 
+ 	return err;
+ }
+@@ -169,8 +190,8 @@ static void flow_offload_fixup_ct(struct
+ 
+ static void flow_offload_route_release(struct flow_offload *flow)
+ {
+-	dst_release(flow->tuplehash[FLOW_OFFLOAD_DIR_ORIGINAL].tuple.dst_cache);
+-	dst_release(flow->tuplehash[FLOW_OFFLOAD_DIR_REPLY].tuple.dst_cache);
++	nft_flow_dst_release(flow, FLOW_OFFLOAD_DIR_ORIGINAL);
++	nft_flow_dst_release(flow, FLOW_OFFLOAD_DIR_REPLY);
+ }
+ 
+ void flow_offload_free(struct flow_offload *flow)
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -207,6 +207,24 @@ static unsigned int nf_flow_xmit_xfrm(st
+ 	return NF_STOLEN;
+ }
+ 
++static unsigned int nf_flow_queue_xmit(struct net *net, struct sk_buff *skb,
++				       const struct flow_offload_tuple_rhash *tuplehash,
++				       unsigned short type)
++{
++	struct net_device *outdev;
++
++	outdev = dev_get_by_index_rcu(net, tuplehash->tuple.out.ifidx);
++	if (!outdev)
++		return NF_DROP;
++
++	skb->dev = outdev;
++	dev_hard_header(skb, skb->dev, type, tuplehash->tuple.out.h_dest,
++			tuplehash->tuple.out.h_source, skb->len);
++	dev_queue_xmit(skb);
++
++	return NF_STOLEN;
++}
++
+ unsigned int
+ nf_flow_offload_ip_hook(void *priv, struct sk_buff *skb,
+ 			const struct nf_hook_state *state)
+@@ -222,6 +240,7 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	struct iphdr *iph;
+ 	__be32 nexthop;
+ 	u32 hdrsize;
++	int ret;
+ 
+ 	if (skb->protocol != htons(ETH_P_IP))
+ 		return NF_ACCEPT;
+@@ -244,9 +263,13 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	if (nf_flow_state_check(flow, iph->protocol, skb, thoff))
+ 		return NF_ACCEPT;
+ 
+-	if (!dst_check(&rt->dst, 0)) {
+-		flow_offload_teardown(flow);
+-		return NF_ACCEPT;
++	if (tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_NEIGH ||
++	    tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM) {
++		rt = (struct rtable *)tuplehash->tuple.dst_cache;
++		if (!dst_check(&rt->dst, 0)) {
++			flow_offload_teardown(flow);
++			return NF_ACCEPT;
++		}
+ 	}
+ 
+ 	if (skb_try_make_writable(skb, thoff + hdrsize))
+@@ -263,8 +286,6 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	if (flow_table->flags & NF_FLOWTABLE_COUNTER)
+ 		nf_ct_acct_update(flow->ct, tuplehash->tuple.dir, skb->len);
+ 
+-	rt = (struct rtable *)tuplehash->tuple.dst_cache;
+-
+ 	if (unlikely(tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM)) {
+ 		memset(skb->cb, 0, sizeof(struct inet_skb_parm));
+ 		IPCB(skb)->iif = skb->dev->ifindex;
+@@ -272,13 +293,23 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 		return nf_flow_xmit_xfrm(skb, state, &rt->dst);
+ 	}
+ 
+-	outdev = rt->dst.dev;
+-	skb->dev = outdev;
+-	nexthop = rt_nexthop(rt, flow->tuplehash[!dir].tuple.src_v4.s_addr);
+-	skb_dst_set_noref(skb, &rt->dst);
+-	neigh_xmit(NEIGH_ARP_TABLE, outdev, &nexthop, skb);
++	switch (tuplehash->tuple.xmit_type) {
++	case FLOW_OFFLOAD_XMIT_NEIGH:
++		outdev = rt->dst.dev;
++		skb->dev = outdev;
++		nexthop = rt_nexthop(rt, flow->tuplehash[!dir].tuple.src_v4.s_addr);
++		skb_dst_set_noref(skb, &rt->dst);
++		neigh_xmit(NEIGH_ARP_TABLE, outdev, &nexthop, skb);
++		ret = NF_STOLEN;
++		break;
++	case FLOW_OFFLOAD_XMIT_DIRECT:
++		ret = nf_flow_queue_xmit(state->net, skb, tuplehash, ETH_P_IP);
++		if (ret == NF_DROP)
++			flow_offload_teardown(flow);
++		break;
++	}
+ 
+-	return NF_STOLEN;
++	return ret;
+ }
+ EXPORT_SYMBOL_GPL(nf_flow_offload_ip_hook);
+ 
+@@ -444,6 +475,7 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 	struct ipv6hdr *ip6h;
+ 	struct rt6_info *rt;
+ 	u32 hdrsize;
++	int ret;
+ 
+ 	if (skb->protocol != htons(ETH_P_IPV6))
+ 		return NF_ACCEPT;
+@@ -465,9 +497,13 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 				sizeof(*ip6h)))
+ 		return NF_ACCEPT;
+ 
+-	if (!dst_check(&rt->dst, 0)) {
+-		flow_offload_teardown(flow);
+-		return NF_ACCEPT;
++	if (tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_NEIGH ||
++	    tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM) {
++		rt = (struct rt6_info *)tuplehash->tuple.dst_cache;
++		if (!dst_check(&rt->dst, 0)) {
++			flow_offload_teardown(flow);
++			return NF_ACCEPT;
++		}
+ 	}
+ 
+ 	if (skb_try_make_writable(skb, sizeof(*ip6h) + hdrsize))
+@@ -484,8 +520,6 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 	if (flow_table->flags & NF_FLOWTABLE_COUNTER)
+ 		nf_ct_acct_update(flow->ct, tuplehash->tuple.dir, skb->len);
+ 
+-	rt = (struct rt6_info *)tuplehash->tuple.dst_cache;
+-
+ 	if (unlikely(tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM)) {
+ 		memset(skb->cb, 0, sizeof(struct inet6_skb_parm));
+ 		IP6CB(skb)->iif = skb->dev->ifindex;
+@@ -493,12 +527,22 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 		return nf_flow_xmit_xfrm(skb, state, &rt->dst);
+ 	}
+ 
+-	outdev = rt->dst.dev;
+-	skb->dev = outdev;
+-	nexthop = rt6_nexthop(rt, &flow->tuplehash[!dir].tuple.src_v6);
+-	skb_dst_set_noref(skb, &rt->dst);
+-	neigh_xmit(NEIGH_ND_TABLE, outdev, nexthop, skb);
++	switch (tuplehash->tuple.xmit_type) {
++	case FLOW_OFFLOAD_XMIT_NEIGH:
++		outdev = rt->dst.dev;
++		skb->dev = outdev;
++		nexthop = rt6_nexthop(rt, &flow->tuplehash[!dir].tuple.src_v6);
++		skb_dst_set_noref(skb, &rt->dst);
++		neigh_xmit(NEIGH_ND_TABLE, outdev, nexthop, skb);
++		ret = NF_STOLEN;
++		break;
++	case FLOW_OFFLOAD_XMIT_DIRECT:
++		ret = nf_flow_queue_xmit(state->net, skb, tuplehash, ETH_P_IPV6);
++		if (ret == NF_DROP)
++			flow_offload_teardown(flow);
++		break;
++	}
+ 
+-	return NF_STOLEN;
++	return ret;
+ }
+ EXPORT_SYMBOL_GPL(nf_flow_offload_ipv6_hook);
+--- a/net/netfilter/nft_flow_offload.c
++++ b/net/netfilter/nft_flow_offload.c
+@@ -39,12 +39,11 @@ static void nft_default_forward_path(str
+ static int nft_dev_fill_forward_path(const struct nf_flow_route *route,
+ 				     const struct dst_entry *dst_cache,
+ 				     const struct nf_conn *ct,
+-				     enum ip_conntrack_dir dir,
++				     enum ip_conntrack_dir dir, u8 *ha,
+ 				     struct net_device_path_stack *stack)
+ {
+ 	const void *daddr = &ct->tuplehash[!dir].tuple.src.u3;
+ 	struct net_device *dev = dst_cache->dev;
+-	unsigned char ha[ETH_ALEN];
+ 	struct neighbour *n;
+ 	u8 nud_state;
+ 
+@@ -66,27 +65,43 @@ static int nft_dev_fill_forward_path(con
+ 
+ struct nft_forward_info {
+ 	const struct net_device *indev;
++	const struct net_device *outdev;
++	u8 h_source[ETH_ALEN];
++	u8 h_dest[ETH_ALEN];
++	enum flow_offload_xmit_type xmit_type;
+ };
+ 
+ static void nft_dev_path_info(const struct net_device_path_stack *stack,
+-			      struct nft_forward_info *info)
++			      struct nft_forward_info *info,
++			      unsigned char *ha)
+ {
+ 	const struct net_device_path *path;
+ 	int i;
+ 
++	memcpy(info->h_dest, ha, ETH_ALEN);
++
+ 	for (i = 0; i < stack->num_paths; i++) {
+ 		path = &stack->path[i];
+ 		switch (path->type) {
+ 		case DEV_PATH_ETHERNET:
+ 			info->indev = path->dev;
++			if (is_zero_ether_addr(info->h_source))
++				memcpy(info->h_source, path->dev->dev_addr, ETH_ALEN);
+ 			break;
+-		case DEV_PATH_VLAN:
+ 		case DEV_PATH_BRIDGE:
++			if (is_zero_ether_addr(info->h_source))
++				memcpy(info->h_source, path->dev->dev_addr, ETH_ALEN);
++
++			info->xmit_type = FLOW_OFFLOAD_XMIT_DIRECT;
++			break;
++		case DEV_PATH_VLAN:
+ 		default:
+ 			info->indev = NULL;
+ 			break;
+ 		}
+ 	}
++	if (!info->outdev)
++		info->outdev = info->indev;
+ }
+ 
+ static bool nft_flowtable_find_dev(const struct net_device *dev,
+@@ -114,14 +129,22 @@ static void nft_dev_forward_path(struct
+ 	const struct dst_entry *dst = route->tuple[dir].dst;
+ 	struct net_device_path_stack stack;
+ 	struct nft_forward_info info = {};
++	unsigned char ha[ETH_ALEN];
+ 
+-	if (nft_dev_fill_forward_path(route, dst, ct, dir, &stack) >= 0)
+-		nft_dev_path_info(&stack, &info);
++	if (nft_dev_fill_forward_path(route, dst, ct, dir, ha, &stack) >= 0)
++		nft_dev_path_info(&stack, &info, ha);
+ 
+ 	if (!info.indev || !nft_flowtable_find_dev(info.indev, ft))
+ 		return;
+ 
+ 	route->tuple[!dir].in.ifindex = info.indev->ifindex;
++
++	if (info.xmit_type == FLOW_OFFLOAD_XMIT_DIRECT) {
++		memcpy(route->tuple[dir].out.h_source, info.h_source, ETH_ALEN);
++		memcpy(route->tuple[dir].out.h_dest, info.h_dest, ETH_ALEN);
++		route->tuple[dir].out.ifindex = info.outdev->ifindex;
++		route->tuple[dir].xmit_type = info.xmit_type;
++	}
+ }
+ 
+ static int nft_flow_route(const struct nft_pktinfo *pkt,
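
A rough standalone model of the mechanism the patch above introduces (toy types and names, not the kernel API): while walking the forward path, the first ethernet-style hop supplies the source MAC, the already-resolved neighbour supplies the destination MAC, and reaching a bridge switches the flow to the direct xmit type so the fast path can later skip neighbour resolution.

#include <string.h>

#define ETH_ALEN 6

enum hop_type  { HOP_ETHERNET, HOP_BRIDGE, HOP_OTHER };
enum xmit_type { XMIT_NEIGH, XMIT_DIRECT };

struct hop {
	enum hop_type type;
	unsigned char dev_addr[ETH_ALEN];
};

struct forward_info {
	unsigned char h_source[ETH_ALEN];
	unsigned char h_dest[ETH_ALEN];
	enum xmit_type xmit_type;
	int have_source;
};

static void collect_forward_info(const struct hop *path, int num,
				 const unsigned char *neigh_ha,
				 struct forward_info *info)
{
	int i;

	memset(info, 0, sizeof(*info));
	memcpy(info->h_dest, neigh_ha, ETH_ALEN);	/* resolved next-hop MAC */
	info->xmit_type = XMIT_NEIGH;

	for (i = 0; i < num; i++) {
		if (!info->have_source &&
		    (path[i].type == HOP_ETHERNET || path[i].type == HOP_BRIDGE)) {
			memcpy(info->h_source, path[i].dev_addr, ETH_ALEN);
			info->have_source = 1;
		}
		if (path[i].type == HOP_BRIDGE)
			info->xmit_type = XMIT_DIRECT;	/* bridge hop: direct xmit */
	}
}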

+ 410 - 0
target/linux/generic/backport-5.15/610-v5.13-20-netfilter-flowtable-add-vlan-support.patch

@@ -0,0 +1,410 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:41 +0100
+Subject: [PATCH] netfilter: flowtable: add vlan support
+
+Add the vlan id and protocol to the flow tuple to uniquely identify
+flows from the receive path. For the transmit path, dev_hard_header() on
+the vlan device pushes the headers. This patch includes support for two
+vlan headers (QinQ) from the ingress path.
+
+Add a generic encap field to the flowtable entry which stores the
+protocol and the tag id. This allows these fields to be reused in the PPPoE
+support coming in a later patch.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -95,6 +95,8 @@ enum flow_offload_xmit_type {
+ 	FLOW_OFFLOAD_XMIT_DIRECT,
+ };
+ 
++#define NF_FLOW_TABLE_ENCAP_MAX		2
++
+ struct flow_offload_tuple {
+ 	union {
+ 		struct in_addr		src_v4;
+@@ -113,13 +115,17 @@ struct flow_offload_tuple {
+ 
+ 	u8				l3proto;
+ 	u8				l4proto;
++	struct {
++		u16			id;
++		__be16			proto;
++	} encap[NF_FLOW_TABLE_ENCAP_MAX];
+ 
+ 	/* All members above are keys for lookups, see flow_offload_hash(). */
+ 	struct { }			__hash;
+ 
+-	u8				dir:6,
+-					xmit_type:2;
+-
++	u8				dir:4,
++					xmit_type:2,
++					encap_num:2;
+ 	u16				mtu;
+ 	union {
+ 		struct dst_entry	*dst_cache;
+@@ -173,6 +179,11 @@ struct nf_flow_route {
+ 		struct dst_entry		*dst;
+ 		struct {
+ 			u32			ifindex;
++			struct {
++				u16		id;
++				__be16		proto;
++			} encap[NF_FLOW_TABLE_ENCAP_MAX];
++			u8			num_encaps;
+ 		} in;
+ 		struct {
+ 			u32			ifindex;
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -80,6 +80,7 @@ static int flow_offload_fill_route(struc
+ {
+ 	struct flow_offload_tuple *flow_tuple = &flow->tuplehash[dir].tuple;
+ 	struct dst_entry *dst = route->tuple[dir].dst;
++	int i, j = 0;
+ 
+ 	switch (flow_tuple->l3proto) {
+ 	case NFPROTO_IPV4:
+@@ -91,6 +92,12 @@ static int flow_offload_fill_route(struc
+ 	}
+ 
+ 	flow_tuple->iifidx = route->tuple[dir].in.ifindex;
++	for (i = route->tuple[dir].in.num_encaps - 1; i >= 0; i--) {
++		flow_tuple->encap[j].id = route->tuple[dir].in.encap[i].id;
++		flow_tuple->encap[j].proto = route->tuple[dir].in.encap[i].proto;
++		j++;
++	}
++	flow_tuple->encap_num = route->tuple[dir].in.num_encaps;
+ 
+ 	switch (route->tuple[dir].xmit_type) {
+ 	case FLOW_OFFLOAD_XMIT_DIRECT:
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -136,23 +136,44 @@ static bool ip_has_options(unsigned int
+ 	return thoff != sizeof(struct iphdr);
+ }
+ 
++static void nf_flow_tuple_encap(struct sk_buff *skb,
++				struct flow_offload_tuple *tuple)
++{
++	int i = 0;
++
++	if (skb_vlan_tag_present(skb)) {
++		tuple->encap[i].id = skb_vlan_tag_get(skb);
++		tuple->encap[i].proto = skb->vlan_proto;
++		i++;
++	}
++	if (skb->protocol == htons(ETH_P_8021Q)) {
++		struct vlan_ethhdr *veth = (struct vlan_ethhdr *)skb_mac_header(skb);
++
++		tuple->encap[i].id = ntohs(veth->h_vlan_TCI);
++		tuple->encap[i].proto = skb->protocol;
++	}
++}
++
+ static int nf_flow_tuple_ip(struct sk_buff *skb, const struct net_device *dev,
+-			    struct flow_offload_tuple *tuple, u32 *hdrsize)
++			    struct flow_offload_tuple *tuple, u32 *hdrsize,
++			    u32 offset)
+ {
+ 	struct flow_ports *ports;
+ 	unsigned int thoff;
+ 	struct iphdr *iph;
+ 
+-	if (!pskb_may_pull(skb, sizeof(*iph)))
++	if (!pskb_may_pull(skb, sizeof(*iph) + offset))
+ 		return -1;
+ 
+-	iph = ip_hdr(skb);
+-	thoff = iph->ihl * 4;
++	iph = (struct iphdr *)(skb_network_header(skb) + offset);
++	thoff = (iph->ihl * 4);
+ 
+ 	if (ip_is_fragment(iph) ||
+ 	    unlikely(ip_has_options(thoff)))
+ 		return -1;
+ 
++	thoff += offset;
++
+ 	switch (iph->protocol) {
+ 	case IPPROTO_TCP:
+ 		*hdrsize = sizeof(struct tcphdr);
+@@ -167,11 +188,10 @@ static int nf_flow_tuple_ip(struct sk_bu
+ 	if (iph->ttl <= 1)
+ 		return -1;
+ 
+-	thoff = iph->ihl * 4;
+ 	if (!pskb_may_pull(skb, thoff + *hdrsize))
+ 		return -1;
+ 
+-	iph = ip_hdr(skb);
++	iph = (struct iphdr *)(skb_network_header(skb) + offset);
+ 	ports = (struct flow_ports *)(skb_network_header(skb) + thoff);
+ 
+ 	tuple->src_v4.s_addr	= iph->saddr;
+@@ -181,6 +201,7 @@ static int nf_flow_tuple_ip(struct sk_bu
+ 	tuple->l3proto		= AF_INET;
+ 	tuple->l4proto		= iph->protocol;
+ 	tuple->iifidx		= dev->ifindex;
++	nf_flow_tuple_encap(skb, tuple);
+ 
+ 	return 0;
+ }
+@@ -207,6 +228,43 @@ static unsigned int nf_flow_xmit_xfrm(st
+ 	return NF_STOLEN;
+ }
+ 
++static bool nf_flow_skb_encap_protocol(const struct sk_buff *skb, __be16 proto,
++				       u32 *offset)
++{
++	if (skb->protocol == htons(ETH_P_8021Q)) {
++		struct vlan_ethhdr *veth;
++
++		veth = (struct vlan_ethhdr *)skb_mac_header(skb);
++		if (veth->h_vlan_encapsulated_proto == proto) {
++			*offset += VLAN_HLEN;
++			return true;
++		}
++	}
++
++	return false;
++}
++
++static void nf_flow_encap_pop(struct sk_buff *skb,
++			      struct flow_offload_tuple_rhash *tuplehash)
++{
++	struct vlan_hdr *vlan_hdr;
++	int i;
++
++	for (i = 0; i < tuplehash->tuple.encap_num; i++) {
++		if (skb_vlan_tag_present(skb)) {
++			__vlan_hwaccel_clear_tag(skb);
++			continue;
++		}
++		if (skb->protocol == htons(ETH_P_8021Q)) {
++			vlan_hdr = (struct vlan_hdr *)skb->data;
++			__skb_pull(skb, VLAN_HLEN);
++			vlan_set_encap_proto(skb, vlan_hdr);
++			skb_reset_network_header(skb);
++			break;
++		}
++	}
++}
++
+ static unsigned int nf_flow_queue_xmit(struct net *net, struct sk_buff *skb,
+ 				       const struct flow_offload_tuple_rhash *tuplehash,
+ 				       unsigned short type)
+@@ -235,17 +293,18 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	enum flow_offload_tuple_dir dir;
+ 	struct flow_offload *flow;
+ 	struct net_device *outdev;
++	u32 hdrsize, offset = 0;
++	unsigned int thoff, mtu;
+ 	struct rtable *rt;
+-	unsigned int thoff;
+ 	struct iphdr *iph;
+ 	__be32 nexthop;
+-	u32 hdrsize;
+ 	int ret;
+ 
+-	if (skb->protocol != htons(ETH_P_IP))
++	if (skb->protocol != htons(ETH_P_IP) &&
++	    !nf_flow_skb_encap_protocol(skb, htons(ETH_P_IP), &offset))
+ 		return NF_ACCEPT;
+ 
+-	if (nf_flow_tuple_ip(skb, state->in, &tuple, &hdrsize) < 0)
++	if (nf_flow_tuple_ip(skb, state->in, &tuple, &hdrsize, offset) < 0)
+ 		return NF_ACCEPT;
+ 
+ 	tuplehash = flow_offload_lookup(flow_table, &tuple);
+@@ -255,11 +314,12 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	dir = tuplehash->tuple.dir;
+ 	flow = container_of(tuplehash, struct flow_offload, tuplehash[dir]);
+ 
+-	if (unlikely(nf_flow_exceeds_mtu(skb, flow->tuplehash[dir].tuple.mtu)))
++	mtu = flow->tuplehash[dir].tuple.mtu + offset;
++	if (unlikely(nf_flow_exceeds_mtu(skb, mtu)))
+ 		return NF_ACCEPT;
+ 
+-	iph = ip_hdr(skb);
+-	thoff = iph->ihl * 4;
++	iph = (struct iphdr *)(skb_network_header(skb) + offset);
++	thoff = (iph->ihl * 4) + offset;
+ 	if (nf_flow_state_check(flow, iph->protocol, skb, thoff))
+ 		return NF_ACCEPT;
+ 
+@@ -277,6 +337,9 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 
+ 	flow_offload_refresh(flow_table, flow);
+ 
++	nf_flow_encap_pop(skb, tuplehash);
++	thoff -= offset;
++
+ 	iph = ip_hdr(skb);
+ 	nf_flow_nat_ip(flow, skb, thoff, dir, iph);
+ 
+@@ -418,16 +481,18 @@ static void nf_flow_nat_ipv6(const struc
+ }
+ 
+ static int nf_flow_tuple_ipv6(struct sk_buff *skb, const struct net_device *dev,
+-			      struct flow_offload_tuple *tuple, u32 *hdrsize)
++			      struct flow_offload_tuple *tuple, u32 *hdrsize,
++			      u32 offset)
+ {
+ 	struct flow_ports *ports;
+ 	struct ipv6hdr *ip6h;
+ 	unsigned int thoff;
+ 
+-	if (!pskb_may_pull(skb, sizeof(*ip6h)))
++	thoff = sizeof(*ip6h) + offset;
++	if (!pskb_may_pull(skb, thoff))
+ 		return -1;
+ 
+-	ip6h = ipv6_hdr(skb);
++	ip6h = (struct ipv6hdr *)(skb_network_header(skb) + offset);
+ 
+ 	switch (ip6h->nexthdr) {
+ 	case IPPROTO_TCP:
+@@ -443,11 +508,10 @@ static int nf_flow_tuple_ipv6(struct sk_
+ 	if (ip6h->hop_limit <= 1)
+ 		return -1;
+ 
+-	thoff = sizeof(*ip6h);
+ 	if (!pskb_may_pull(skb, thoff + *hdrsize))
+ 		return -1;
+ 
+-	ip6h = ipv6_hdr(skb);
++	ip6h = (struct ipv6hdr *)(skb_network_header(skb) + offset);
+ 	ports = (struct flow_ports *)(skb_network_header(skb) + thoff);
+ 
+ 	tuple->src_v6		= ip6h->saddr;
+@@ -457,6 +521,7 @@ static int nf_flow_tuple_ipv6(struct sk_
+ 	tuple->l3proto		= AF_INET6;
+ 	tuple->l4proto		= ip6h->nexthdr;
+ 	tuple->iifidx		= dev->ifindex;
++	nf_flow_tuple_encap(skb, tuple);
+ 
+ 	return 0;
+ }
+@@ -472,15 +537,17 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 	const struct in6_addr *nexthop;
+ 	struct flow_offload *flow;
+ 	struct net_device *outdev;
++	unsigned int thoff, mtu;
++	u32 hdrsize, offset = 0;
+ 	struct ipv6hdr *ip6h;
+ 	struct rt6_info *rt;
+-	u32 hdrsize;
+ 	int ret;
+ 
+-	if (skb->protocol != htons(ETH_P_IPV6))
++	if (skb->protocol != htons(ETH_P_IPV6) &&
++	    !nf_flow_skb_encap_protocol(skb, htons(ETH_P_IPV6), &offset))
+ 		return NF_ACCEPT;
+ 
+-	if (nf_flow_tuple_ipv6(skb, state->in, &tuple, &hdrsize) < 0)
++	if (nf_flow_tuple_ipv6(skb, state->in, &tuple, &hdrsize, offset) < 0)
+ 		return NF_ACCEPT;
+ 
+ 	tuplehash = flow_offload_lookup(flow_table, &tuple);
+@@ -490,11 +557,13 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 	dir = tuplehash->tuple.dir;
+ 	flow = container_of(tuplehash, struct flow_offload, tuplehash[dir]);
+ 
+-	if (unlikely(nf_flow_exceeds_mtu(skb, flow->tuplehash[dir].tuple.mtu)))
++	mtu = flow->tuplehash[dir].tuple.mtu + offset;
++	if (unlikely(nf_flow_exceeds_mtu(skb, mtu)))
+ 		return NF_ACCEPT;
+ 
+-	if (nf_flow_state_check(flow, ipv6_hdr(skb)->nexthdr, skb,
+-				sizeof(*ip6h)))
++	ip6h = (struct ipv6hdr *)(skb_network_header(skb) + offset);
++	thoff = sizeof(*ip6h) + offset;
++	if (nf_flow_state_check(flow, ip6h->nexthdr, skb, thoff))
+ 		return NF_ACCEPT;
+ 
+ 	if (tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_NEIGH ||
+@@ -506,11 +575,13 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 		}
+ 	}
+ 
+-	if (skb_try_make_writable(skb, sizeof(*ip6h) + hdrsize))
++	if (skb_try_make_writable(skb, thoff + hdrsize))
+ 		return NF_DROP;
+ 
+ 	flow_offload_refresh(flow_table, flow);
+ 
++	nf_flow_encap_pop(skb, tuplehash);
++
+ 	ip6h = ipv6_hdr(skb);
+ 	nf_flow_nat_ipv6(flow, skb, dir, ip6h);
+ 
+--- a/net/netfilter/nft_flow_offload.c
++++ b/net/netfilter/nft_flow_offload.c
+@@ -66,6 +66,11 @@ static int nft_dev_fill_forward_path(con
+ struct nft_forward_info {
+ 	const struct net_device *indev;
+ 	const struct net_device *outdev;
++	struct id {
++		__u16	id;
++		__be16	proto;
++	} encap[NF_FLOW_TABLE_ENCAP_MAX];
++	u8 num_encaps;
+ 	u8 h_source[ETH_ALEN];
+ 	u8 h_dest[ETH_ALEN];
+ 	enum flow_offload_xmit_type xmit_type;
+@@ -84,9 +89,23 @@ static void nft_dev_path_info(const stru
+ 		path = &stack->path[i];
+ 		switch (path->type) {
+ 		case DEV_PATH_ETHERNET:
++		case DEV_PATH_VLAN:
+ 			info->indev = path->dev;
+ 			if (is_zero_ether_addr(info->h_source))
+ 				memcpy(info->h_source, path->dev->dev_addr, ETH_ALEN);
++
++			if (path->type == DEV_PATH_ETHERNET)
++				break;
++
++			/* DEV_PATH_VLAN */
++			if (info->num_encaps >= NF_FLOW_TABLE_ENCAP_MAX) {
++				info->indev = NULL;
++				break;
++			}
++			info->outdev = path->dev;
++			info->encap[info->num_encaps].id = path->encap.id;
++			info->encap[info->num_encaps].proto = path->encap.proto;
++			info->num_encaps++;
+ 			break;
+ 		case DEV_PATH_BRIDGE:
+ 			if (is_zero_ether_addr(info->h_source))
+@@ -94,7 +113,6 @@ static void nft_dev_path_info(const stru
+ 
+ 			info->xmit_type = FLOW_OFFLOAD_XMIT_DIRECT;
+ 			break;
+-		case DEV_PATH_VLAN:
+ 		default:
+ 			info->indev = NULL;
+ 			break;
+@@ -130,6 +148,7 @@ static void nft_dev_forward_path(struct
+ 	struct net_device_path_stack stack;
+ 	struct nft_forward_info info = {};
+ 	unsigned char ha[ETH_ALEN];
++	int i;
+ 
+ 	if (nft_dev_fill_forward_path(route, dst, ct, dir, ha, &stack) >= 0)
+ 		nft_dev_path_info(&stack, &info, ha);
+@@ -138,6 +157,11 @@ static void nft_dev_forward_path(struct
+ 		return;
+ 
+ 	route->tuple[!dir].in.ifindex = info.indev->ifindex;
++	for (i = 0; i < info.num_encaps; i++) {
++		route->tuple[!dir].in.encap[i].id = info.encap[i].id;
++		route->tuple[!dir].in.encap[i].proto = info.encap[i].proto;
++	}
++	route->tuple[!dir].in.num_encaps = info.num_encaps;
+ 
+ 	if (info.xmit_type == FLOW_OFFLOAD_XMIT_DIRECT) {
+ 		memcpy(route->tuple[dir].out.h_source, info.h_source, ETH_ALEN);
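
The key change in the tuple layout above is easiest to see with a toy reproduction (illustrative names only, not the kernel structures): the lookup key now carries up to two (id, proto) encap slots, so the same 5-tuple arriving with different VLAN tags, or with a QinQ pair, yields distinct flow entries.

#include <stdint.h>
#include <string.h>
#include <stdbool.h>

#define ENCAP_MAX 2	/* mirrors NF_FLOW_TABLE_ENCAP_MAX */

struct toy_tuple {
	uint32_t src_ip, dst_ip;
	uint16_t src_port, dst_port;
	struct {
		uint16_t id;		/* vlan id (later also pppoe session id) */
		uint16_t proto;		/* e.g. 0x8100 for 802.1Q */
	} encap[ENCAP_MAX];
	uint8_t  encap_num;
};

/* tuples are assumed to be zero-initialised before filling, so padding
 * bytes compare equal and the whole struct can serve as the lookup key */
static bool toy_tuple_equal(const struct toy_tuple *a, const struct toy_tuple *b)
{
	return memcmp(a, b, sizeof(*a)) == 0;
}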

+ 30 - 0
target/linux/generic/backport-5.15/610-v5.13-21-netfilter-flowtable-add-bridge-vlan-filtering-suppor.patch

@@ -0,0 +1,30 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:42 +0100
+Subject: [PATCH] netfilter: flowtable: add bridge vlan filtering support
+
+Add the vlan tag to the flow tuple when the bridge port PVID is set.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nft_flow_offload.c
++++ b/net/netfilter/nft_flow_offload.c
+@@ -111,6 +111,18 @@ static void nft_dev_path_info(const stru
+ 			if (is_zero_ether_addr(info->h_source))
+ 				memcpy(info->h_source, path->dev->dev_addr, ETH_ALEN);
+ 
++			switch (path->bridge.vlan_mode) {
++			case DEV_PATH_BR_VLAN_TAG:
++				info->encap[info->num_encaps].id = path->bridge.vlan_id;
++				info->encap[info->num_encaps].proto = path->bridge.vlan_proto;
++				info->num_encaps++;
++				break;
++			case DEV_PATH_BR_VLAN_UNTAG:
++				info->num_encaps--;
++				break;
++			case DEV_PATH_BR_VLAN_KEEP:
++				break;
++			}
+ 			info->xmit_type = FLOW_OFFLOAD_XMIT_DIRECT;
+ 			break;
+ 		default:
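
A minimal sketch of the vlan_mode handling added here, under toy names: a bridge hop that tags on ingress (PVID) pushes one more encap entry onto the recorded stack, an untagging hop pops one, and the keep mode leaves it untouched. Illustrative only, not the kernel code.

enum br_vlan_mode { BR_VLAN_KEEP, BR_VLAN_TAG, BR_VLAN_UNTAG };

struct encap_stack {
	struct { unsigned short id, proto; } e[2];
	unsigned char num;
};

static void apply_bridge_vlan(struct encap_stack *s, enum br_vlan_mode mode,
			      unsigned short vid, unsigned short proto)
{
	switch (mode) {
	case BR_VLAN_TAG:		/* PVID tags the packet on this hop */
		if (s->num < 2) {
			s->e[s->num].id = vid;
			s->e[s->num].proto = proto;
			s->num++;
		}
		break;
	case BR_VLAN_UNTAG:		/* this hop strips one vlan header */
		if (s->num)
			s->num--;
		break;
	case BR_VLAN_KEEP:
		break;
	}
}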

+ 145 - 0
target/linux/generic/backport-5.15/610-v5.13-22-netfilter-flowtable-add-pppoe-support.patch

@@ -0,0 +1,145 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:43 +0100
+Subject: [PATCH] netfilter: flowtable: add pppoe support
+
+Add the PPPoE protocol and session id to the flow tuple using the encap
+fields to uniquely identify flows from the receive path. For the
+transmit path, dev_hard_header() on the PPPoE device pushes the headers.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -7,6 +7,9 @@
+ #include <linux/ip.h>
+ #include <linux/ipv6.h>
+ #include <linux/netdevice.h>
++#include <linux/if_ether.h>
++#include <linux/if_pppox.h>
++#include <linux/ppp_defs.h>
+ #include <net/ip.h>
+ #include <net/ipv6.h>
+ #include <net/ip6_route.h>
+@@ -139,6 +142,8 @@ static bool ip_has_options(unsigned int
+ static void nf_flow_tuple_encap(struct sk_buff *skb,
+ 				struct flow_offload_tuple *tuple)
+ {
++	struct vlan_ethhdr *veth;
++	struct pppoe_hdr *phdr;
+ 	int i = 0;
+ 
+ 	if (skb_vlan_tag_present(skb)) {
+@@ -146,11 +151,17 @@ static void nf_flow_tuple_encap(struct s
+ 		tuple->encap[i].proto = skb->vlan_proto;
+ 		i++;
+ 	}
+-	if (skb->protocol == htons(ETH_P_8021Q)) {
+-		struct vlan_ethhdr *veth = (struct vlan_ethhdr *)skb_mac_header(skb);
+-
++	switch (skb->protocol) {
++	case htons(ETH_P_8021Q):
++		veth = (struct vlan_ethhdr *)skb_mac_header(skb);
+ 		tuple->encap[i].id = ntohs(veth->h_vlan_TCI);
+ 		tuple->encap[i].proto = skb->protocol;
++		break;
++	case htons(ETH_P_PPP_SES):
++		phdr = (struct pppoe_hdr *)skb_mac_header(skb);
++		tuple->encap[i].id = ntohs(phdr->sid);
++		tuple->encap[i].proto = skb->protocol;
++		break;
+ 	}
+ }
+ 
+@@ -228,17 +239,41 @@ static unsigned int nf_flow_xmit_xfrm(st
+ 	return NF_STOLEN;
+ }
+ 
++static inline __be16 nf_flow_pppoe_proto(const struct sk_buff *skb)
++{
++	__be16 proto;
++
++	proto = *((__be16 *)(skb_mac_header(skb) + ETH_HLEN +
++			     sizeof(struct pppoe_hdr)));
++	switch (proto) {
++	case htons(PPP_IP):
++		return htons(ETH_P_IP);
++	case htons(PPP_IPV6):
++		return htons(ETH_P_IPV6);
++	}
++
++	return 0;
++}
++
+ static bool nf_flow_skb_encap_protocol(const struct sk_buff *skb, __be16 proto,
+ 				       u32 *offset)
+ {
+-	if (skb->protocol == htons(ETH_P_8021Q)) {
+-		struct vlan_ethhdr *veth;
++	struct vlan_ethhdr *veth;
+ 
++	switch (skb->protocol) {
++	case htons(ETH_P_8021Q):
+ 		veth = (struct vlan_ethhdr *)skb_mac_header(skb);
+ 		if (veth->h_vlan_encapsulated_proto == proto) {
+ 			*offset += VLAN_HLEN;
+ 			return true;
+ 		}
++		break;
++	case htons(ETH_P_PPP_SES):
++		if (nf_flow_pppoe_proto(skb) == proto) {
++			*offset += PPPOE_SES_HLEN;
++			return true;
++		}
++		break;
+ 	}
+ 
+ 	return false;
+@@ -255,12 +290,18 @@ static void nf_flow_encap_pop(struct sk_
+ 			__vlan_hwaccel_clear_tag(skb);
+ 			continue;
+ 		}
+-		if (skb->protocol == htons(ETH_P_8021Q)) {
++		switch (skb->protocol) {
++		case htons(ETH_P_8021Q):
+ 			vlan_hdr = (struct vlan_hdr *)skb->data;
+ 			__skb_pull(skb, VLAN_HLEN);
+ 			vlan_set_encap_proto(skb, vlan_hdr);
+ 			skb_reset_network_header(skb);
+ 			break;
++		case htons(ETH_P_PPP_SES):
++			skb->protocol = nf_flow_pppoe_proto(skb);
++			skb_pull(skb, PPPOE_SES_HLEN);
++			skb_reset_network_header(skb);
++			break;
+ 		}
+ 	}
+ }
+--- a/net/netfilter/nft_flow_offload.c
++++ b/net/netfilter/nft_flow_offload.c
+@@ -90,6 +90,7 @@ static void nft_dev_path_info(const stru
+ 		switch (path->type) {
+ 		case DEV_PATH_ETHERNET:
+ 		case DEV_PATH_VLAN:
++		case DEV_PATH_PPPOE:
+ 			info->indev = path->dev;
+ 			if (is_zero_ether_addr(info->h_source))
+ 				memcpy(info->h_source, path->dev->dev_addr, ETH_ALEN);
+@@ -97,7 +98,7 @@ static void nft_dev_path_info(const stru
+ 			if (path->type == DEV_PATH_ETHERNET)
+ 				break;
+ 
+-			/* DEV_PATH_VLAN */
++			/* DEV_PATH_VLAN and DEV_PATH_PPPOE */
+ 			if (info->num_encaps >= NF_FLOW_TABLE_ENCAP_MAX) {
+ 				info->indev = NULL;
+ 				break;
+@@ -106,6 +107,8 @@ static void nft_dev_path_info(const stru
+ 			info->encap[info->num_encaps].id = path->encap.id;
+ 			info->encap[info->num_encaps].proto = path->encap.proto;
+ 			info->num_encaps++;
++			if (path->type == DEV_PATH_PPPOE)
++				memcpy(info->h_dest, path->encap.h_dest, ETH_ALEN);
+ 			break;
+ 		case DEV_PATH_BRIDGE:
+ 			if (is_zero_ether_addr(info->h_source))
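
As a hedged illustration of the demux this patch relies on: the two bytes immediately after the 6-byte PPPoE session header hold the PPP protocol number, which maps to the inner EtherType. The helper below is a self-contained sketch over a raw byte buffer, not the kernel implementation; the constant values are the standard PPP and EtherType numbers.

#include <stdint.h>

#define PPP_PROTO_IP    0x0021
#define PPP_PROTO_IPV6  0x0057
#define ETHERTYPE_IP    0x0800
#define ETHERTYPE_IPV6  0x86DD

/* 'pppoe' points at the start of the PPPoE session header; the PPP
 * protocol field sits at offset 6, giving the 8-byte PPPOE_SES_HLEN */
static uint16_t pppoe_inner_ethertype(const uint8_t *pppoe)
{
	uint16_t ppp_proto = (uint16_t)((pppoe[6] << 8) | pppoe[7]);

	switch (ppp_proto) {
	case PPP_PROTO_IP:
		return ETHERTYPE_IP;
	case PPP_PROTO_IPV6:
		return ETHERTYPE_IPV6;
	default:
		return 0;	/* anything else stays on the slow path */
	}
}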

+ 32 - 0
target/linux/generic/backport-5.15/610-v5.13-23-netfilter-flowtable-add-dsa-support.patch

@@ -0,0 +1,32 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:44 +0100
+Subject: [PATCH] netfilter: flowtable: add dsa support
+
+Replace the master ethernet device with the dsa slave port. Packets coming
+in from the software ingress path use the dsa slave port as the input
+device.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nft_flow_offload.c
++++ b/net/netfilter/nft_flow_offload.c
+@@ -89,6 +89,7 @@ static void nft_dev_path_info(const stru
+ 		path = &stack->path[i];
+ 		switch (path->type) {
+ 		case DEV_PATH_ETHERNET:
++		case DEV_PATH_DSA:
+ 		case DEV_PATH_VLAN:
+ 		case DEV_PATH_PPPOE:
+ 			info->indev = path->dev;
+@@ -97,6 +98,10 @@ static void nft_dev_path_info(const stru
+ 
+ 			if (path->type == DEV_PATH_ETHERNET)
+ 				break;
++			if (path->type == DEV_PATH_DSA) {
++				i = stack->num_paths;
++				break;
++			}
+ 
+ 			/* DEV_PATH_VLAN and DEV_PATH_PPPOE */
+ 			if (info->num_encaps >= NF_FLOW_TABLE_ENCAP_MAX) {

+ 107 - 0
target/linux/generic/backport-5.15/610-v5.13-24-selftests-netfilter-flowtable-bridge-and-vlan-suppor.patch

@@ -0,0 +1,107 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:45 +0100
+Subject: [PATCH] selftests: netfilter: flowtable bridge and vlan support
+
+This patch adds two new tests to cover bridge and vlan support:
+
+- Add a bridge device to the Router1 (nsr1) container and attach the
+  veth0 device to the bridge. Set the IP address on the bridge device
+  to exercise the bridge forwarding path.
+
+- Add vlan encapsulation between the bridge device in Router1 and
+  one of the sender containers (ns1).
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/tools/testing/selftests/netfilter/nft_flowtable.sh
++++ b/tools/testing/selftests/netfilter/nft_flowtable.sh
+@@ -370,6 +370,88 @@ else
+ 	ip netns exec nsr1 nft list ruleset
+ fi
+ 
++# Another test:
++# Add bridge interface br0 to Router1, with NAT enabled.
++ip -net nsr1 link add name br0 type bridge
++ip -net nsr1 addr flush dev veth0
++ip -net nsr1 link set up dev veth0
++ip -net nsr1 link set veth0 master br0
++ip -net nsr1 addr add 10.0.1.1/24 dev br0
++ip -net nsr1 addr add dead:1::1/64 dev br0
++ip -net nsr1 link set up dev br0
++
++ip netns exec nsr1 sysctl net.ipv4.conf.br0.forwarding=1 > /dev/null
++
++# br0 with NAT enabled.
++ip netns exec nsr1 nft -f - <<EOF
++flush table ip nat
++table ip nat {
++   chain prerouting {
++      type nat hook prerouting priority 0; policy accept;
++      meta iif "br0" ip daddr 10.6.6.6 tcp dport 1666 counter dnat ip to 10.0.2.99:12345
++   }
++
++   chain postrouting {
++      type nat hook postrouting priority 0; policy accept;
++      meta oifname "veth1" counter masquerade
++   }
++}
++EOF
++
++if test_tcp_forwarding_nat ns1 ns2; then
++	echo "PASS: flow offloaded for ns1/ns2 with bridge NAT"
++else
++	echo "FAIL: flow offload for ns1/ns2 with bridge NAT" 1>&2
++	ip netns exec nsr1 nft list ruleset
++	ret=1
++fi
++
++# Another test:
++# Add bridge interface br0 to Router1, with NAT and VLAN.
++ip -net nsr1 link set veth0 nomaster
++ip -net nsr1 link set down dev veth0
++ip -net nsr1 link add link veth0 name veth0.10 type vlan id 10
++ip -net nsr1 link set up dev veth0
++ip -net nsr1 link set up dev veth0.10
++ip -net nsr1 link set veth0.10 master br0
++
++ip -net ns1 addr flush dev eth0
++ip -net ns1 link add link eth0 name eth0.10 type vlan id 10
++ip -net ns1 link set eth0 up
++ip -net ns1 link set eth0.10 up
++ip -net ns1 addr add 10.0.1.99/24 dev eth0.10
++ip -net ns1 route add default via 10.0.1.1
++ip -net ns1 addr add dead:1::99/64 dev eth0.10
++
++if test_tcp_forwarding_nat ns1 ns2; then
++	echo "PASS: flow offloaded for ns1/ns2 with bridge NAT and VLAN"
++else
++	echo "FAIL: flow offload for ns1/ns2 with bridge NAT and VLAN" 1>&2
++	ip netns exec nsr1 nft list ruleset
++	ret=1
++fi
++
++# restore test topology (remove bridge and VLAN)
++ip -net nsr1 link set veth0 nomaster
++ip -net nsr1 link set veth0 down
++ip -net nsr1 link set veth0.10 down
++ip -net nsr1 link delete veth0.10 type vlan
++ip -net nsr1 link delete br0 type bridge
++ip -net ns1 addr flush dev eth0.10
++ip -net ns1 link set eth0.10 down
++ip -net ns1 link set eth0 down
++ip -net ns1 link delete eth0.10 type vlan
++
++# restore address in ns1 and nsr1
++ip -net ns1 link set eth0 up
++ip -net ns1 addr add 10.0.1.99/24 dev eth0
++ip -net ns1 route add default via 10.0.1.1
++ip -net ns1 addr add dead:1::99/64 dev eth0
++ip -net ns1 route add default via dead:1::1
++ip -net nsr1 addr add 10.0.1.1/24 dev veth0
++ip -net nsr1 addr add dead:1::1/64 dev veth0
++ip -net nsr1 link set up dev veth0
++
+ KEY_SHA="0x"$(ps -xaf | sha1sum | cut -d " " -f 1)
+ KEY_AES="0x"$(ps -xaf | md5sum | cut -d " " -f 1)
+ SPI1=$RANDOM

+ 310 - 0
target/linux/generic/backport-5.15/610-v5.13-25-netfilter-flowtable-add-offload-support-for-xmit-pat.patch

@@ -0,0 +1,310 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:46 +0100
+Subject: [PATCH] netfilter: flowtable: add offload support for xmit path
+ types
+
+When the flow tuple xmit_type is set to FLOW_OFFLOAD_XMIT_DIRECT, the
+dst_cache pointer is not valid, and the h_source/h_dest/ifidx out fields
+need to be used.
+
+This patch also adds the FLOW_ACTION_VLAN_PUSH action to pass the VLAN
+tag to the driver.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nf_flow_table_offload.c
++++ b/net/netfilter/nf_flow_table_offload.c
+@@ -177,28 +177,45 @@ static int flow_offload_eth_src(struct n
+ 				enum flow_offload_tuple_dir dir,
+ 				struct nf_flow_rule *flow_rule)
+ {
+-	const struct flow_offload_tuple *tuple = &flow->tuplehash[!dir].tuple;
+ 	struct flow_action_entry *entry0 = flow_action_entry_next(flow_rule);
+ 	struct flow_action_entry *entry1 = flow_action_entry_next(flow_rule);
+-	struct net_device *dev;
++	const struct flow_offload_tuple *other_tuple, *this_tuple;
++	struct net_device *dev = NULL;
++	const unsigned char *addr;
+ 	u32 mask, val;
+ 	u16 val16;
+ 
+-	dev = dev_get_by_index(net, tuple->iifidx);
+-	if (!dev)
+-		return -ENOENT;
++	this_tuple = &flow->tuplehash[dir].tuple;
++
++	switch (this_tuple->xmit_type) {
++	case FLOW_OFFLOAD_XMIT_DIRECT:
++		addr = this_tuple->out.h_source;
++		break;
++	case FLOW_OFFLOAD_XMIT_NEIGH:
++		other_tuple = &flow->tuplehash[!dir].tuple;
++		dev = dev_get_by_index(net, other_tuple->iifidx);
++		if (!dev)
++			return -ENOENT;
++
++		addr = dev->dev_addr;
++		break;
++	default:
++		return -EOPNOTSUPP;
++	}
+ 
+ 	mask = ~0xffff0000;
+-	memcpy(&val16, dev->dev_addr, 2);
++	memcpy(&val16, addr, 2);
+ 	val = val16 << 16;
+ 	flow_offload_mangle(entry0, FLOW_ACT_MANGLE_HDR_TYPE_ETH, 4,
+ 			    &val, &mask);
+ 
+ 	mask = ~0xffffffff;
+-	memcpy(&val, dev->dev_addr + 2, 4);
++	memcpy(&val, addr + 2, 4);
+ 	flow_offload_mangle(entry1, FLOW_ACT_MANGLE_HDR_TYPE_ETH, 8,
+ 			    &val, &mask);
+-	dev_put(dev);
++
++	if (dev)
++		dev_put(dev);
+ 
+ 	return 0;
+ }
+@@ -210,27 +227,40 @@ static int flow_offload_eth_dst(struct n
+ {
+ 	struct flow_action_entry *entry0 = flow_action_entry_next(flow_rule);
+ 	struct flow_action_entry *entry1 = flow_action_entry_next(flow_rule);
+-	const void *daddr = &flow->tuplehash[!dir].tuple.src_v4;
++	const struct flow_offload_tuple *other_tuple, *this_tuple;
+ 	const struct dst_entry *dst_cache;
+ 	unsigned char ha[ETH_ALEN];
+ 	struct neighbour *n;
++	const void *daddr;
+ 	u32 mask, val;
+ 	u8 nud_state;
+ 	u16 val16;
+ 
+-	dst_cache = flow->tuplehash[dir].tuple.dst_cache;
+-	n = dst_neigh_lookup(dst_cache, daddr);
+-	if (!n)
+-		return -ENOENT;
+-
+-	read_lock_bh(&n->lock);
+-	nud_state = n->nud_state;
+-	ether_addr_copy(ha, n->ha);
+-	read_unlock_bh(&n->lock);
++	this_tuple = &flow->tuplehash[dir].tuple;
+ 
+-	if (!(nud_state & NUD_VALID)) {
++	switch (this_tuple->xmit_type) {
++	case FLOW_OFFLOAD_XMIT_DIRECT:
++		ether_addr_copy(ha, this_tuple->out.h_dest);
++		break;
++	case FLOW_OFFLOAD_XMIT_NEIGH:
++		other_tuple = &flow->tuplehash[!dir].tuple;
++		daddr = &other_tuple->src_v4;
++		dst_cache = this_tuple->dst_cache;
++		n = dst_neigh_lookup(dst_cache, daddr);
++		if (!n)
++			return -ENOENT;
++
++		read_lock_bh(&n->lock);
++		nud_state = n->nud_state;
++		ether_addr_copy(ha, n->ha);
++		read_unlock_bh(&n->lock);
+ 		neigh_release(n);
+-		return -ENOENT;
++
++		if (!(nud_state & NUD_VALID))
++			return -ENOENT;
++		break;
++	default:
++		return -EOPNOTSUPP;
+ 	}
+ 
+ 	mask = ~0xffffffff;
+@@ -243,7 +273,6 @@ static int flow_offload_eth_dst(struct n
+ 	val = val16;
+ 	flow_offload_mangle(entry1, FLOW_ACT_MANGLE_HDR_TYPE_ETH, 4,
+ 			    &val, &mask);
+-	neigh_release(n);
+ 
+ 	return 0;
+ }
+@@ -465,27 +494,52 @@ static void flow_offload_ipv4_checksum(s
+ 	}
+ }
+ 
+-static void flow_offload_redirect(const struct flow_offload *flow,
++static void flow_offload_redirect(struct net *net,
++				  const struct flow_offload *flow,
+ 				  enum flow_offload_tuple_dir dir,
+ 				  struct nf_flow_rule *flow_rule)
+ {
+-	struct flow_action_entry *entry = flow_action_entry_next(flow_rule);
+-	struct rtable *rt;
++	const struct flow_offload_tuple *this_tuple, *other_tuple;
++	struct flow_action_entry *entry;
++	struct net_device *dev;
++	int ifindex;
++
++	this_tuple = &flow->tuplehash[dir].tuple;
++	switch (this_tuple->xmit_type) {
++	case FLOW_OFFLOAD_XMIT_DIRECT:
++		this_tuple = &flow->tuplehash[dir].tuple;
++		ifindex = this_tuple->out.ifidx;
++		break;
++	case FLOW_OFFLOAD_XMIT_NEIGH:
++		other_tuple = &flow->tuplehash[!dir].tuple;
++		ifindex = other_tuple->iifidx;
++		break;
++	default:
++		return;
++	}
+ 
+-	rt = (struct rtable *)flow->tuplehash[dir].tuple.dst_cache;
++	dev = dev_get_by_index(net, ifindex);
++	if (!dev)
++		return;
++
++	entry = flow_action_entry_next(flow_rule);
+ 	entry->id = FLOW_ACTION_REDIRECT;
+-	entry->dev = rt->dst.dev;
+-	dev_hold(rt->dst.dev);
++	entry->dev = dev;
+ }
+ 
+ static void flow_offload_encap_tunnel(const struct flow_offload *flow,
+ 				      enum flow_offload_tuple_dir dir,
+ 				      struct nf_flow_rule *flow_rule)
+ {
++	const struct flow_offload_tuple *this_tuple;
+ 	struct flow_action_entry *entry;
+ 	struct dst_entry *dst;
+ 
+-	dst = flow->tuplehash[dir].tuple.dst_cache;
++	this_tuple = &flow->tuplehash[dir].tuple;
++	if (this_tuple->xmit_type == FLOW_OFFLOAD_XMIT_DIRECT)
++		return;
++
++	dst = this_tuple->dst_cache;
+ 	if (dst && dst->lwtstate) {
+ 		struct ip_tunnel_info *tun_info;
+ 
+@@ -502,10 +556,15 @@ static void flow_offload_decap_tunnel(co
+ 				      enum flow_offload_tuple_dir dir,
+ 				      struct nf_flow_rule *flow_rule)
+ {
++	const struct flow_offload_tuple *other_tuple;
+ 	struct flow_action_entry *entry;
+ 	struct dst_entry *dst;
+ 
+-	dst = flow->tuplehash[!dir].tuple.dst_cache;
++	other_tuple = &flow->tuplehash[!dir].tuple;
++	if (other_tuple->xmit_type == FLOW_OFFLOAD_XMIT_DIRECT)
++		return;
++
++	dst = other_tuple->dst_cache;
+ 	if (dst && dst->lwtstate) {
+ 		struct ip_tunnel_info *tun_info;
+ 
+@@ -517,10 +576,14 @@ static void flow_offload_decap_tunnel(co
+ 	}
+ }
+ 
+-int nf_flow_rule_route_ipv4(struct net *net, const struct flow_offload *flow,
+-			    enum flow_offload_tuple_dir dir,
+-			    struct nf_flow_rule *flow_rule)
++static int
++nf_flow_rule_route_common(struct net *net, const struct flow_offload *flow,
++			  enum flow_offload_tuple_dir dir,
++			  struct nf_flow_rule *flow_rule)
+ {
++	const struct flow_offload_tuple *other_tuple;
++	int i;
++
+ 	flow_offload_decap_tunnel(flow, dir, flow_rule);
+ 	flow_offload_encap_tunnel(flow, dir, flow_rule);
+ 
+@@ -528,6 +591,26 @@ int nf_flow_rule_route_ipv4(struct net *
+ 	    flow_offload_eth_dst(net, flow, dir, flow_rule) < 0)
+ 		return -1;
+ 
++	other_tuple = &flow->tuplehash[!dir].tuple;
++
++	for (i = 0; i < other_tuple->encap_num; i++) {
++		struct flow_action_entry *entry = flow_action_entry_next(flow_rule);
++
++		entry->id = FLOW_ACTION_VLAN_PUSH;
++		entry->vlan.vid = other_tuple->encap[i].id;
++		entry->vlan.proto = other_tuple->encap[i].proto;
++	}
++
++	return 0;
++}
++
++int nf_flow_rule_route_ipv4(struct net *net, const struct flow_offload *flow,
++			    enum flow_offload_tuple_dir dir,
++			    struct nf_flow_rule *flow_rule)
++{
++	if (nf_flow_rule_route_common(net, flow, dir, flow_rule) < 0)
++		return -1;
++
+ 	if (test_bit(NF_FLOW_SNAT, &flow->flags)) {
+ 		flow_offload_ipv4_snat(net, flow, dir, flow_rule);
+ 		flow_offload_port_snat(net, flow, dir, flow_rule);
+@@ -540,7 +623,7 @@ int nf_flow_rule_route_ipv4(struct net *
+ 	    test_bit(NF_FLOW_DNAT, &flow->flags))
+ 		flow_offload_ipv4_checksum(net, flow, flow_rule);
+ 
+-	flow_offload_redirect(flow, dir, flow_rule);
++	flow_offload_redirect(net, flow, dir, flow_rule);
+ 
+ 	return 0;
+ }
+@@ -550,11 +633,7 @@ int nf_flow_rule_route_ipv6(struct net *
+ 			    enum flow_offload_tuple_dir dir,
+ 			    struct nf_flow_rule *flow_rule)
+ {
+-	flow_offload_decap_tunnel(flow, dir, flow_rule);
+-	flow_offload_encap_tunnel(flow, dir, flow_rule);
+-
+-	if (flow_offload_eth_src(net, flow, dir, flow_rule) < 0 ||
+-	    flow_offload_eth_dst(net, flow, dir, flow_rule) < 0)
++	if (nf_flow_rule_route_common(net, flow, dir, flow_rule) < 0)
+ 		return -1;
+ 
+ 	if (test_bit(NF_FLOW_SNAT, &flow->flags)) {
+@@ -566,7 +645,7 @@ int nf_flow_rule_route_ipv6(struct net *
+ 		flow_offload_port_dnat(net, flow, dir, flow_rule);
+ 	}
+ 
+-	flow_offload_redirect(flow, dir, flow_rule);
++	flow_offload_redirect(net, flow, dir, flow_rule);
+ 
+ 	return 0;
+ }
+@@ -580,10 +659,10 @@ nf_flow_offload_rule_alloc(struct net *n
+ 			   enum flow_offload_tuple_dir dir)
+ {
+ 	const struct nf_flowtable *flowtable = offload->flowtable;
++	const struct flow_offload_tuple *tuple, *other_tuple;
+ 	const struct flow_offload *flow = offload->flow;
+-	const struct flow_offload_tuple *tuple;
++	struct dst_entry *other_dst = NULL;
+ 	struct nf_flow_rule *flow_rule;
+-	struct dst_entry *other_dst;
+ 	int err = -ENOMEM;
+ 
+ 	flow_rule = kzalloc(sizeof(*flow_rule), GFP_KERNEL);
+@@ -599,7 +678,10 @@ nf_flow_offload_rule_alloc(struct net *n
+ 	flow_rule->rule->match.key = &flow_rule->match.key;
+ 
+ 	tuple = &flow->tuplehash[dir].tuple;
+-	other_dst = flow->tuplehash[!dir].tuple.dst_cache;
++	other_tuple = &flow->tuplehash[!dir].tuple;
++	if (other_tuple->xmit_type == FLOW_OFFLOAD_XMIT_NEIGH)
++		other_dst = other_tuple->dst_cache;
++
+ 	err = nf_flow_rule_match(&flow_rule->match, tuple, other_dst);
+ 	if (err < 0)
+ 		goto err_flow_match;
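
A standalone sketch of what the offload rule ends up containing after this patch (toy structs, not the flow_action API): every encap entry recorded for the reverse direction becomes a vlan push, and the redirect target is the direct-xmit egress ifindex when available, otherwise the reverse direction's ingress ifindex.

#include <stdint.h>

enum xmit_type { XMIT_NEIGH, XMIT_DIRECT };
enum act_id { ACT_VLAN_PUSH, ACT_REDIRECT };

struct act { enum act_id id; uint16_t vid, proto; int ifindex; };

struct toy_tuple {
	enum xmit_type xmit_type;
	int iifidx;			/* ingress ifindex */
	int out_ifidx;			/* egress ifindex (direct xmit only) */
	struct { uint16_t id, proto; } encap[2];
	uint8_t encap_num;
};

/* this_t: tuple for the direction being offloaded, other_t: reverse dir */
static int build_actions(const struct toy_tuple *this_t,
			 const struct toy_tuple *other_t,
			 struct act *acts, int max)
{
	int n = 0, i;

	for (i = 0; i < other_t->encap_num && n < max; i++) {
		acts[n].id = ACT_VLAN_PUSH;
		acts[n].vid = other_t->encap[i].id;
		acts[n].proto = other_t->encap[i].proto;
		n++;
	}

	if (n < max) {
		acts[n].id = ACT_REDIRECT;
		acts[n].ifindex = (this_t->xmit_type == XMIT_DIRECT) ?
				  this_t->out_ifidx : other_t->iifidx;
		n++;
	}
	return n;
}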

+ 114 - 0
target/linux/generic/backport-5.15/610-v5.13-26-netfilter-nft_flow_offload-use-direct-xmit-if-hardwa.patch

@@ -0,0 +1,114 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:47 +0100
+Subject: [PATCH] netfilter: nft_flow_offload: use direct xmit if
+ hardware offload is enabled
+
+If there is a forward path to reach an ethernet device and hardware
+offload is enabled, then use the direct xmit path.
+
+Moreover, store the real device in the direct xmit path info since
+software datapath uses dev_hard_header() to push the layer encapsulation
+headers while hardware offload refers to the real device.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -131,6 +131,7 @@ struct flow_offload_tuple {
+ 		struct dst_entry	*dst_cache;
+ 		struct {
+ 			u32		ifidx;
++			u32		hw_ifidx;
+ 			u8		h_source[ETH_ALEN];
+ 			u8		h_dest[ETH_ALEN];
+ 		} out;
+@@ -187,6 +188,7 @@ struct nf_flow_route {
+ 		} in;
+ 		struct {
+ 			u32			ifindex;
++			u32			hw_ifindex;
+ 			u8			h_source[ETH_ALEN];
+ 			u8			h_dest[ETH_ALEN];
+ 		} out;
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -106,6 +106,7 @@ static int flow_offload_fill_route(struc
+ 		memcpy(flow_tuple->out.h_source, route->tuple[dir].out.h_source,
+ 		       ETH_ALEN);
+ 		flow_tuple->out.ifidx = route->tuple[dir].out.ifindex;
++		flow_tuple->out.hw_ifidx = route->tuple[dir].out.hw_ifindex;
+ 		break;
+ 	case FLOW_OFFLOAD_XMIT_XFRM:
+ 	case FLOW_OFFLOAD_XMIT_NEIGH:
+--- a/net/netfilter/nf_flow_table_offload.c
++++ b/net/netfilter/nf_flow_table_offload.c
+@@ -508,7 +508,7 @@ static void flow_offload_redirect(struct
+ 	switch (this_tuple->xmit_type) {
+ 	case FLOW_OFFLOAD_XMIT_DIRECT:
+ 		this_tuple = &flow->tuplehash[dir].tuple;
+-		ifindex = this_tuple->out.ifidx;
++		ifindex = this_tuple->out.hw_ifidx;
+ 		break;
+ 	case FLOW_OFFLOAD_XMIT_NEIGH:
+ 		other_tuple = &flow->tuplehash[!dir].tuple;
+--- a/net/netfilter/nft_flow_offload.c
++++ b/net/netfilter/nft_flow_offload.c
+@@ -66,6 +66,7 @@ static int nft_dev_fill_forward_path(con
+ struct nft_forward_info {
+ 	const struct net_device *indev;
+ 	const struct net_device *outdev;
++	const struct net_device *hw_outdev;
+ 	struct id {
+ 		__u16	id;
+ 		__be16	proto;
+@@ -76,9 +77,18 @@ struct nft_forward_info {
+ 	enum flow_offload_xmit_type xmit_type;
+ };
+ 
++static bool nft_is_valid_ether_device(const struct net_device *dev)
++{
++	if (!dev || (dev->flags & IFF_LOOPBACK) || dev->type != ARPHRD_ETHER ||
++	    dev->addr_len != ETH_ALEN || !is_valid_ether_addr(dev->dev_addr))
++		return false;
++
++	return true;
++}
++
+ static void nft_dev_path_info(const struct net_device_path_stack *stack,
+ 			      struct nft_forward_info *info,
+-			      unsigned char *ha)
++			      unsigned char *ha, struct nf_flowtable *flowtable)
+ {
+ 	const struct net_device_path *path;
+ 	int i;
+@@ -140,6 +150,12 @@ static void nft_dev_path_info(const stru
+ 	}
+ 	if (!info->outdev)
+ 		info->outdev = info->indev;
++
++	info->hw_outdev = info->indev;
++
++	if (nf_flowtable_hw_offload(flowtable) &&
++	    nft_is_valid_ether_device(info->indev))
++		info->xmit_type = FLOW_OFFLOAD_XMIT_DIRECT;
+ }
+ 
+ static bool nft_flowtable_find_dev(const struct net_device *dev,
+@@ -171,7 +187,7 @@ static void nft_dev_forward_path(struct
+ 	int i;
+ 
+ 	if (nft_dev_fill_forward_path(route, dst, ct, dir, ha, &stack) >= 0)
+-		nft_dev_path_info(&stack, &info, ha);
++		nft_dev_path_info(&stack, &info, ha, &ft->data);
+ 
+ 	if (!info.indev || !nft_flowtable_find_dev(info.indev, ft))
+ 		return;
+@@ -187,6 +203,7 @@ static void nft_dev_forward_path(struct
+ 		memcpy(route->tuple[dir].out.h_source, info.h_source, ETH_ALEN);
+ 		memcpy(route->tuple[dir].out.h_dest, info.h_dest, ETH_ALEN);
+ 		route->tuple[dir].out.ifindex = info.outdev->ifindex;
++		route->tuple[dir].out.hw_ifindex = info.hw_outdev->ifindex;
+ 		route->tuple[dir].xmit_type = info.xmit_type;
+ 	}
+ }
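
Why the patch above keeps two egress indexes can be shown with a toy reduction (assumed names, not the kernel structures): the software direct-xmit path wants the topmost vlan/pppoe device, since dev_hard_header() rebuilds the encapsulation headers there, while hardware offload is programmed on the underlying real ethernet device.

struct toy_path_result {
	int indev_ifindex;	/* real ethernet device at the bottom */
	int outdev_ifindex;	/* topmost encap device, e.g. a vlan interface */
};

struct toy_out {
	int ifindex;		/* used by the software direct xmit path */
	int hw_ifindex;		/* used when programming hardware offload */
};

static void fill_out(const struct toy_path_result *p, struct toy_out *out)
{
	out->ifindex = p->outdev_ifindex ? p->outdev_ifindex
					 : p->indev_ifindex;
	out->hw_ifindex = p->indev_ifindex;
}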

+ 123 - 0
target/linux/generic/backport-5.15/610-v5.13-27-netfilter-flowtable-bridge-vlan-hardware-offload-and.patch

@@ -0,0 +1,123 @@
+From: Felix Fietkau <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:48 +0100
+Subject: [PATCH] netfilter: flowtable: bridge vlan hardware offload and
+ switchdev
+
+The switch might have already added the VLAN tag through PVID hardware
+offload. Keep this extra VLAN in the flowtable but skip it on egress.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -849,6 +849,7 @@ struct net_device_path {
+ 				DEV_PATH_BR_VLAN_KEEP,
+ 				DEV_PATH_BR_VLAN_TAG,
+ 				DEV_PATH_BR_VLAN_UNTAG,
++				DEV_PATH_BR_VLAN_UNTAG_HW,
+ 			}		vlan_mode;
+ 			u16		vlan_id;
+ 			__be16		vlan_proto;
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -123,9 +123,10 @@ struct flow_offload_tuple {
+ 	/* All members above are keys for lookups, see flow_offload_hash(). */
+ 	struct { }			__hash;
+ 
+-	u8				dir:4,
++	u8				dir:2,
+ 					xmit_type:2,
+-					encap_num:2;
++					encap_num:2,
++					in_vlan_ingress:2;
+ 	u16				mtu;
+ 	union {
+ 		struct dst_entry	*dst_cache;
+@@ -184,7 +185,8 @@ struct nf_flow_route {
+ 				u16		id;
+ 				__be16		proto;
+ 			} encap[NF_FLOW_TABLE_ENCAP_MAX];
+-			u8			num_encaps;
++			u8			num_encaps:2,
++						ingress_vlans:2;
+ 		} in;
+ 		struct {
+ 			u32			ifindex;
+--- a/net/bridge/br_device.c
++++ b/net/bridge/br_device.c
+@@ -435,6 +435,7 @@ static int br_fill_forward_path(struct n
+ 		ctx->vlan[ctx->num_vlans].proto = path->bridge.vlan_proto;
+ 		ctx->num_vlans++;
+ 		break;
++	case DEV_PATH_BR_VLAN_UNTAG_HW:
+ 	case DEV_PATH_BR_VLAN_UNTAG:
+ 		ctx->num_vlans--;
+ 		break;
+--- a/net/bridge/br_vlan.c
++++ b/net/bridge/br_vlan.c
+@@ -1374,6 +1374,8 @@ int br_vlan_fill_forward_path_mode(struc
+ 
+ 	if (path->bridge.vlan_mode == DEV_PATH_BR_VLAN_TAG)
+ 		path->bridge.vlan_mode = DEV_PATH_BR_VLAN_KEEP;
++	else if (v->priv_flags & BR_VLFLAG_ADDED_BY_SWITCHDEV)
++		path->bridge.vlan_mode = DEV_PATH_BR_VLAN_UNTAG_HW;
+ 	else
+ 		path->bridge.vlan_mode = DEV_PATH_BR_VLAN_UNTAG;
+ 
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -95,6 +95,8 @@ static int flow_offload_fill_route(struc
+ 	for (i = route->tuple[dir].in.num_encaps - 1; i >= 0; i--) {
+ 		flow_tuple->encap[j].id = route->tuple[dir].in.encap[i].id;
+ 		flow_tuple->encap[j].proto = route->tuple[dir].in.encap[i].proto;
++		if (route->tuple[dir].in.ingress_vlans & BIT(i))
++			flow_tuple->in_vlan_ingress |= BIT(j);
+ 		j++;
+ 	}
+ 	flow_tuple->encap_num = route->tuple[dir].in.num_encaps;
+--- a/net/netfilter/nf_flow_table_offload.c
++++ b/net/netfilter/nf_flow_table_offload.c
+@@ -594,8 +594,12 @@ nf_flow_rule_route_common(struct net *ne
+ 	other_tuple = &flow->tuplehash[!dir].tuple;
+ 
+ 	for (i = 0; i < other_tuple->encap_num; i++) {
+-		struct flow_action_entry *entry = flow_action_entry_next(flow_rule);
++		struct flow_action_entry *entry;
+ 
++		if (other_tuple->in_vlan_ingress & BIT(i))
++			continue;
++
++		entry = flow_action_entry_next(flow_rule);
+ 		entry->id = FLOW_ACTION_VLAN_PUSH;
+ 		entry->vlan.vid = other_tuple->encap[i].id;
+ 		entry->vlan.proto = other_tuple->encap[i].proto;
+--- a/net/netfilter/nft_flow_offload.c
++++ b/net/netfilter/nft_flow_offload.c
+@@ -72,6 +72,7 @@ struct nft_forward_info {
+ 		__be16	proto;
+ 	} encap[NF_FLOW_TABLE_ENCAP_MAX];
+ 	u8 num_encaps;
++	u8 ingress_vlans;
+ 	u8 h_source[ETH_ALEN];
+ 	u8 h_dest[ETH_ALEN];
+ 	enum flow_offload_xmit_type xmit_type;
+@@ -130,6 +131,9 @@ static void nft_dev_path_info(const stru
+ 				memcpy(info->h_source, path->dev->dev_addr, ETH_ALEN);
+ 
+ 			switch (path->bridge.vlan_mode) {
++			case DEV_PATH_BR_VLAN_UNTAG_HW:
++				info->ingress_vlans |= BIT(info->num_encaps - 1);
++				break;
+ 			case DEV_PATH_BR_VLAN_TAG:
+ 				info->encap[info->num_encaps].id = path->bridge.vlan_id;
+ 				info->encap[info->num_encaps].proto = path->bridge.vlan_proto;
+@@ -198,6 +202,7 @@ static void nft_dev_forward_path(struct
+ 		route->tuple[!dir].in.encap[i].proto = info.encap[i].proto;
+ 	}
+ 	route->tuple[!dir].in.num_encaps = info.num_encaps;
++	route->tuple[!dir].in.ingress_vlans = info.ingress_vlans;
+ 
+ 	if (info.xmit_type == FLOW_OFFLOAD_XMIT_DIRECT) {
+ 		memcpy(route->tuple[dir].out.h_source, info.h_source, ETH_ALEN);
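
A small self-contained sketch of the egress-side effect (illustrative only): encap slots whose bit is set in the ingress-vlan mask were re-added by the switch via PVID hardware offload, so the rule builder emits no vlan push action for them.

#include <stdint.h>

struct toy_encap { uint16_t id, proto; };

static int count_vlan_push_actions(const struct toy_encap *encap,
				   uint8_t encap_num, uint8_t in_vlan_ingress)
{
	int i, pushes = 0;

	for (i = 0; i < encap_num; i++) {
		if (in_vlan_ingress & (1u << i))
			continue;	/* tag handled by switchdev, skip */
		pushes++;		/* would emit FLOW_ACTION_VLAN_PUSH */
	}
	return pushes;
}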

+ 30 - 0
target/linux/generic/backport-5.15/610-v5.13-28-net-flow_offload-add-FLOW_ACTION_PPPOE_PUSH.patch

@@ -0,0 +1,30 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:49 +0100
+Subject: [PATCH] net: flow_offload: add FLOW_ACTION_PPPOE_PUSH
+
+Add an action to represent the PPPoE hardware offload support that
+includes the session ID.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/flow_offload.h
++++ b/include/net/flow_offload.h
+@@ -147,6 +147,7 @@ enum flow_action_id {
+ 	FLOW_ACTION_MPLS_POP,
+ 	FLOW_ACTION_MPLS_MANGLE,
+ 	FLOW_ACTION_GATE,
++	FLOW_ACTION_PPPOE_PUSH,
+ 	NUM_FLOW_ACTIONS,
+ };
+ 
+@@ -271,6 +272,9 @@ struct flow_action_entry {
+ 			u32		num_entries;
+ 			struct action_gate_entry *entries;
+ 		} gate;
++		struct {				/* FLOW_ACTION_PPPOE_PUSH */
++			u16		sid;
++		} pppoe;
+ 	};
+ 	struct flow_action_cookie *cookie; /* user defined action cookie */
+ };

+ 35 - 0
target/linux/generic/backport-5.15/610-v5.13-29-netfilter-flowtable-support-for-FLOW_ACTION_PPPOE_PU.patch

@@ -0,0 +1,35 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:50 +0100
+Subject: [PATCH] netfilter: flowtable: support for
+ FLOW_ACTION_PPPOE_PUSH
+
+Add a PPPoE push action if the layer 2 protocol is ETH_P_PPP_SES to add
+PPPoE flowtable hardware offload support.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/netfilter/nf_flow_table_offload.c
++++ b/net/netfilter/nf_flow_table_offload.c
+@@ -600,9 +600,18 @@ nf_flow_rule_route_common(struct net *ne
+ 			continue;
+ 
+ 		entry = flow_action_entry_next(flow_rule);
+-		entry->id = FLOW_ACTION_VLAN_PUSH;
+-		entry->vlan.vid = other_tuple->encap[i].id;
+-		entry->vlan.proto = other_tuple->encap[i].proto;
++
++		switch (other_tuple->encap[i].proto) {
++		case htons(ETH_P_PPP_SES):
++			entry->id = FLOW_ACTION_PPPOE_PUSH;
++			entry->pppoe.sid = other_tuple->encap[i].id;
++			break;
++		case htons(ETH_P_8021Q):
++			entry->id = FLOW_ACTION_VLAN_PUSH;
++			entry->vlan.vid = other_tuple->encap[i].id;
++			entry->vlan.proto = other_tuple->encap[i].proto;
++			break;
++		}
+ 	}
+ 
+ 	return 0;
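
Sketched below with toy types (not the kernel flow_action structures), the dispatch this patch adds: the encap protocol selects between a vlan push and a pppoe push action, the latter carrying the PPPoE session id instead of a vlan id.

#include <stdint.h>

#define TOY_ETH_P_8021Q   0x8100
#define TOY_ETH_P_PPP_SES 0x8864

enum toy_act_id { TOY_ACT_NONE, TOY_ACT_VLAN_PUSH, TOY_ACT_PPPOE_PUSH };

struct toy_action {
	enum toy_act_id id;
	uint16_t vid_or_sid;
	uint16_t proto;
};

static struct toy_action encap_to_action(uint16_t proto, uint16_t id)
{
	struct toy_action a = { .id = TOY_ACT_NONE };

	switch (proto) {
	case TOY_ETH_P_PPP_SES:
		a.id = TOY_ACT_PPPOE_PUSH;
		a.vid_or_sid = id;		/* PPPoE session id */
		break;
	case TOY_ETH_P_8021Q:
		a.id = TOY_ACT_VLAN_PUSH;
		a.vid_or_sid = id;		/* vlan id */
		a.proto = proto;
		break;
	}
	return a;
}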

+ 53 - 0
target/linux/generic/backport-5.15/610-v5.13-30-dsa-slave-add-support-for-TC_SETUP_FT.patch

@@ -0,0 +1,53 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:51 +0100
+Subject: [PATCH] dsa: slave: add support for TC_SETUP_FT
+
+The dsa infrastructure provides a well-defined hierarchy of devices;
+pass the call to set up the flow block up to the master device. From the
+software dataplane, the netfilter infrastructure uses the dsa slave
+devices to refer to the input and output device for the given skbuff.
+Similarly, the flowtable definition in the ruleset refers to the dsa
+slave port devices.
+
+This patch adds the glue code to call ndo_setup_tc with TC_SETUP_FT
+on the master device via the dsa slave devices.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/net/dsa/slave.c
++++ b/net/dsa/slave.c
+@@ -1239,14 +1239,32 @@ static int dsa_slave_setup_tc_block(stru
+ 	}
+ }
+ 
++static int dsa_slave_setup_ft_block(struct dsa_switch *ds, int port,
++				    void *type_data)
++{
++	struct dsa_port *cpu_dp = dsa_to_port(ds, port)->cpu_dp;
++	struct net_device *master = cpu_dp->master;
++
++	if (!master->netdev_ops->ndo_setup_tc)
++		return -EOPNOTSUPP;
++
++	return master->netdev_ops->ndo_setup_tc(master, TC_SETUP_FT, type_data);
++}
++
+ static int dsa_slave_setup_tc(struct net_device *dev, enum tc_setup_type type,
+ 			      void *type_data)
+ {
+ 	struct dsa_port *dp = dsa_slave_to_port(dev);
+ 	struct dsa_switch *ds = dp->ds;
+ 
+-	if (type == TC_SETUP_BLOCK)
++	switch (type) {
++	case TC_SETUP_BLOCK:
+ 		return dsa_slave_setup_tc_block(dev, type_data);
++	case TC_SETUP_FT:
++		return dsa_slave_setup_ft_block(ds, dp->index, type_data);
++	default:
++		break;
++	}
+ 
+ 	if (!ds->ops->port_setup_tc)
+ 		return -EOPNOTSUPP;

+ 68 - 0
target/linux/generic/backport-5.15/610-v5.13-31-net-ethernet-mtk_eth_soc-fix-parsing-packets-in-GDM.patch

@@ -0,0 +1,68 @@
+From: Felix Fietkau <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:52 +0100
+Subject: [PATCH] net: ethernet: mtk_eth_soc: fix parsing packets in GDM
+
+When using DSA, set the special tag in GDM ingress control to allow the MAC
+to parse packets properly earlier. This affects rx DMA source port reporting.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -19,6 +19,7 @@
+ #include <linux/interrupt.h>
+ #include <linux/pinctrl/devinfo.h>
+ #include <linux/phylink.h>
++#include <net/dsa.h>
+ 
+ #include "mtk_eth_soc.h"
+ 
+@@ -1285,13 +1286,12 @@ static int mtk_poll_rx(struct napi_struc
+ 			break;
+ 
+ 		/* find out which mac the packet come from. values start at 1 */
+-		if (MTK_HAS_CAPS(eth->soc->caps, MTK_SOC_MT7628)) {
++		if (MTK_HAS_CAPS(eth->soc->caps, MTK_SOC_MT7628) ||
++		    (trxd.rxd4 & RX_DMA_SPECIAL_TAG))
+ 			mac = 0;
+-		} else {
+-			mac = (trxd.rxd4 >> RX_DMA_FPORT_SHIFT) &
+-				RX_DMA_FPORT_MASK;
+-			mac--;
+-		}
++		else
++			mac = ((trxd.rxd4 >> RX_DMA_FPORT_SHIFT) &
++			       RX_DMA_FPORT_MASK) - 1;
+ 
+ 		if (unlikely(mac < 0 || mac >= MTK_MAC_COUNT ||
+ 			     !eth->netdev[mac]))
+@@ -2254,6 +2254,9 @@ static void mtk_gdm_config(struct mtk_et
+ 
+ 		val |= config;
+ 
++		if (!i && eth->netdev[0] && netdev_uses_dsa(eth->netdev[0]))
++			val |= MTK_GDMA_SPECIAL_TAG;
++
+ 		mtk_w32(eth, val, MTK_GDMA_FWD_CFG(i));
+ 	}
+ 	/* Reset and enable PSE */
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.h
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.h
+@@ -81,6 +81,7 @@
+ 
+ /* GDM Exgress Control Register */
+ #define MTK_GDMA_FWD_CFG(x)	(0x500 + (x * 0x1000))
++#define MTK_GDMA_SPECIAL_TAG	BIT(24)
+ #define MTK_GDMA_ICS_EN		BIT(22)
+ #define MTK_GDMA_TCS_EN		BIT(21)
+ #define MTK_GDMA_UCS_EN		BIT(20)
+@@ -318,6 +319,7 @@
+ #define RX_DMA_L4_VALID_PDMA	BIT(30)		/* when PDMA is used */
+ #define RX_DMA_FPORT_SHIFT	19
+ #define RX_DMA_FPORT_MASK	0x7
++#define RX_DMA_SPECIAL_TAG	BIT(22)
+ 
+ /* PHY Indirect Access Control registers */
+ #define MTK_PHY_IAC		0x10004
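
The rxd4 handling above reduces to a couple of mask-and-shift operations; a self-contained sketch, reusing the field definitions added to mtk_eth_soc.h, might look like this (helper name assumed):

#include <stdint.h>
#include <stdbool.h>

#define RX_DMA_FPORT_SHIFT	19
#define RX_DMA_FPORT_MASK	0x7
#define RX_DMA_SPECIAL_TAG	(1u << 22)

/* bits 19..21 carry the 1-based source port; the special-tag bit forces
 * mac 0 when DSA tagging is enabled in GDM ingress control */
static int rxd4_to_mac(uint32_t rxd4, bool soc_is_mt7628)
{
	if (soc_is_mt7628 || (rxd4 & RX_DMA_SPECIAL_TAG))
		return 0;

	return (int)((rxd4 >> RX_DMA_FPORT_SHIFT) & RX_DMA_FPORT_MASK) - 1;
}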

+ 1308 - 0
target/linux/generic/backport-5.15/610-v5.13-32-net-ethernet-mtk_eth_soc-add-support-for-initializin.patch

@@ -0,0 +1,1308 @@
+From: Felix Fietkau <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:53 +0100
+Subject: [PATCH] net: ethernet: mtk_eth_soc: add support for
+ initializing the PPE
+
+The PPE (packet processing engine) is used to offload NAT/routed or even
+bridged flows. This patch brings up the PPE and uses it to get a packet
+hash. It also contains some functionality that will be used to bring up
+flow offloading.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+ create mode 100644 drivers/net/ethernet/mediatek/mtk_ppe.c
+ create mode 100644 drivers/net/ethernet/mediatek/mtk_ppe.h
+ create mode 100644 drivers/net/ethernet/mediatek/mtk_ppe_debugfs.c
+ create mode 100644 drivers/net/ethernet/mediatek/mtk_ppe_regs.h
+
+--- a/drivers/net/ethernet/mediatek/Makefile
++++ b/drivers/net/ethernet/mediatek/Makefile
+@@ -4,5 +4,5 @@
+ #
+ 
+ obj-$(CONFIG_NET_MEDIATEK_SOC) += mtk_eth.o
+-mtk_eth-y := mtk_eth_soc.o mtk_sgmii.o mtk_eth_path.o
++mtk_eth-y := mtk_eth_soc.o mtk_sgmii.o mtk_eth_path.o mtk_ppe.o mtk_ppe_debugfs.o
+ obj-$(CONFIG_NET_MEDIATEK_STAR_EMAC) += mtk_star_emac.o
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -2279,12 +2279,17 @@ static int mtk_open(struct net_device *d
+ 
+ 	/* we run 2 netdevs on the same dma ring so we only bring it up once */
+ 	if (!refcount_read(&eth->dma_refcnt)) {
+-		int err = mtk_start_dma(eth);
++		u32 gdm_config = MTK_GDMA_TO_PDMA;
++		int err;
+ 
++		err = mtk_start_dma(eth);
+ 		if (err)
+ 			return err;
+ 
+-		mtk_gdm_config(eth, MTK_GDMA_TO_PDMA);
++		if (eth->soc->offload_version && mtk_ppe_start(&eth->ppe) == 0)
++			gdm_config = MTK_GDMA_TO_PPE;
++
++		mtk_gdm_config(eth, gdm_config);
+ 
+ 		napi_enable(&eth->tx_napi);
+ 		napi_enable(&eth->rx_napi);
+@@ -2351,6 +2356,9 @@ static int mtk_stop(struct net_device *d
+ 
+ 	mtk_dma_free(eth);
+ 
++	if (eth->soc->offload_version)
++		mtk_ppe_stop(&eth->ppe);
++
+ 	return 0;
+ }
+ 
+@@ -3079,6 +3087,13 @@ static int mtk_probe(struct platform_dev
+ 			goto err_free_dev;
+ 	}
+ 
++	if (eth->soc->offload_version) {
++		err = mtk_ppe_init(&eth->ppe, eth->dev,
++				   eth->base + MTK_ETH_PPE_BASE, 2);
++		if (err)
++			goto err_free_dev;
++	}
++
+ 	for (i = 0; i < MTK_MAX_DEVS; i++) {
+ 		if (!eth->netdev[i])
+ 			continue;
+@@ -3153,6 +3168,7 @@ static const struct mtk_soc_data mt7621_
+ 	.hw_features = MTK_HW_FEATURES,
+ 	.required_clks = MT7621_CLKS_BITMAP,
+ 	.required_pctl = false,
++	.offload_version = 2,
+ };
+ 
+ static const struct mtk_soc_data mt7622_data = {
+@@ -3161,6 +3177,7 @@ static const struct mtk_soc_data mt7622_
+ 	.hw_features = MTK_HW_FEATURES,
+ 	.required_clks = MT7622_CLKS_BITMAP,
+ 	.required_pctl = false,
++	.offload_version = 2,
+ };
+ 
+ static const struct mtk_soc_data mt7623_data = {
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.h
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.h
+@@ -15,6 +15,7 @@
+ #include <linux/u64_stats_sync.h>
+ #include <linux/refcount.h>
+ #include <linux/phylink.h>
++#include "mtk_ppe.h"
+ 
+ #define MTK_QDMA_PAGE_SIZE	2048
+ #define	MTK_MAX_RX_LENGTH	1536
+@@ -86,6 +87,7 @@
+ #define MTK_GDMA_TCS_EN		BIT(21)
+ #define MTK_GDMA_UCS_EN		BIT(20)
+ #define MTK_GDMA_TO_PDMA	0x0
++#define MTK_GDMA_TO_PPE		0x4444
+ #define MTK_GDMA_DROP_ALL       0x7777
+ 
+ /* Unicast Filter MAC Address Register - Low */
+@@ -315,6 +317,12 @@
+ #define RX_DMA_VID(_x)		((_x) & 0xfff)
+ 
+ /* QDMA descriptor rxd4 */
++#define MTK_RXD4_FOE_ENTRY	GENMASK(13, 0)
++#define MTK_RXD4_PPE_CPU_REASON	GENMASK(18, 14)
++#define MTK_RXD4_SRC_PORT	GENMASK(21, 19)
++#define MTK_RXD4_ALG		GENMASK(31, 22)
++
++/* QDMA descriptor rxd4 */
+ #define RX_DMA_L4_VALID		BIT(24)
+ #define RX_DMA_L4_VALID_PDMA	BIT(30)		/* when PDMA is used */
+ #define RX_DMA_FPORT_SHIFT	19
+@@ -819,6 +827,7 @@ struct mtk_soc_data {
+ 	u32		caps;
+ 	u32		required_clks;
+ 	bool		required_pctl;
++	u8		offload_version;
+ 	netdev_features_t hw_features;
+ };
+ 
+@@ -918,6 +927,8 @@ struct mtk_eth {
+ 	u32				tx_int_status_reg;
+ 	u32				rx_dma_l4_valid;
+ 	int				ip_align;
++
++	struct mtk_ppe			ppe;
+ };
+ 
+ /* struct mtk_mac -	the structure that holds the info about the MACs of the
+--- /dev/null
++++ b/drivers/net/ethernet/mediatek/mtk_ppe.c
+@@ -0,0 +1,511 @@
++// SPDX-License-Identifier: GPL-2.0-only
++/* Copyright (C) 2020 Felix Fietkau <[email protected]> */
++
++#include <linux/kernel.h>
++#include <linux/jiffies.h>
++#include <linux/delay.h>
++#include <linux/io.h>
++#include <linux/etherdevice.h>
++#include <linux/platform_device.h>
++#include "mtk_ppe.h"
++#include "mtk_ppe_regs.h"
++
++static void ppe_w32(struct mtk_ppe *ppe, u32 reg, u32 val)
++{
++	writel(val, ppe->base + reg);
++}
++
++static u32 ppe_r32(struct mtk_ppe *ppe, u32 reg)
++{
++	return readl(ppe->base + reg);
++}
++
++static u32 ppe_m32(struct mtk_ppe *ppe, u32 reg, u32 mask, u32 set)
++{
++	u32 val;
++
++	val = ppe_r32(ppe, reg);
++	val &= ~mask;
++	val |= set;
++	ppe_w32(ppe, reg, val);
++
++	return val;
++}
++
++static u32 ppe_set(struct mtk_ppe *ppe, u32 reg, u32 val)
++{
++	return ppe_m32(ppe, reg, 0, val);
++}
++
++static u32 ppe_clear(struct mtk_ppe *ppe, u32 reg, u32 val)
++{
++	return ppe_m32(ppe, reg, val, 0);
++}
++
++static int mtk_ppe_wait_busy(struct mtk_ppe *ppe)
++{
++	unsigned long timeout = jiffies + HZ;
++
++	while (time_is_before_jiffies(timeout)) {
++		if (!(ppe_r32(ppe, MTK_PPE_GLO_CFG) & MTK_PPE_GLO_CFG_BUSY))
++			return 0;
++
++		usleep_range(10, 20);
++	}
++
++	dev_err(ppe->dev, "PPE table busy");
++
++	return -ETIMEDOUT;
++}
++
++static void mtk_ppe_cache_clear(struct mtk_ppe *ppe)
++{
++	ppe_set(ppe, MTK_PPE_CACHE_CTL, MTK_PPE_CACHE_CTL_CLEAR);
++	ppe_clear(ppe, MTK_PPE_CACHE_CTL, MTK_PPE_CACHE_CTL_CLEAR);
++}
++
++static void mtk_ppe_cache_enable(struct mtk_ppe *ppe, bool enable)
++{
++	mtk_ppe_cache_clear(ppe);
++
++	ppe_m32(ppe, MTK_PPE_CACHE_CTL, MTK_PPE_CACHE_CTL_EN,
++		enable * MTK_PPE_CACHE_CTL_EN);
++}
++
++static u32 mtk_ppe_hash_entry(struct mtk_foe_entry *e)
++{
++	u32 hv1, hv2, hv3;
++	u32 hash;
++
++	switch (FIELD_GET(MTK_FOE_IB1_PACKET_TYPE, e->ib1)) {
++		case MTK_PPE_PKT_TYPE_BRIDGE:
++			hv1 = e->bridge.src_mac_lo;
++			hv1 ^= ((e->bridge.src_mac_hi & 0xffff) << 16);
++			hv2 = e->bridge.src_mac_hi >> 16;
++			hv2 ^= e->bridge.dest_mac_lo;
++			hv3 = e->bridge.dest_mac_hi;
++			break;
++		case MTK_PPE_PKT_TYPE_IPV4_ROUTE:
++		case MTK_PPE_PKT_TYPE_IPV4_HNAPT:
++			hv1 = e->ipv4.orig.ports;
++			hv2 = e->ipv4.orig.dest_ip;
++			hv3 = e->ipv4.orig.src_ip;
++			break;
++		case MTK_PPE_PKT_TYPE_IPV6_ROUTE_3T:
++		case MTK_PPE_PKT_TYPE_IPV6_ROUTE_5T:
++			hv1 = e->ipv6.src_ip[3] ^ e->ipv6.dest_ip[3];
++			hv1 ^= e->ipv6.ports;
++
++			hv2 = e->ipv6.src_ip[2] ^ e->ipv6.dest_ip[2];
++			hv2 ^= e->ipv6.dest_ip[0];
++
++			hv3 = e->ipv6.src_ip[1] ^ e->ipv6.dest_ip[1];
++			hv3 ^= e->ipv6.src_ip[0];
++			break;
++		case MTK_PPE_PKT_TYPE_IPV4_DSLITE:
++		case MTK_PPE_PKT_TYPE_IPV6_6RD:
++		default:
++			WARN_ON_ONCE(1);
++			return MTK_PPE_HASH_MASK;
++	}
++
++	hash = (hv1 & hv2) | ((~hv1) & hv3);
++	hash = (hash >> 24) | ((hash & 0xffffff) << 8);
++	hash ^= hv1 ^ hv2 ^ hv3;
++	hash ^= hash >> 16;
++	hash <<= 1;
++	hash &= MTK_PPE_ENTRIES - 1;
++
++	return hash;
++}
++
++static inline struct mtk_foe_mac_info *
++mtk_foe_entry_l2(struct mtk_foe_entry *entry)
++{
++	int type = FIELD_GET(MTK_FOE_IB1_PACKET_TYPE, entry->ib1);
++
++	if (type >= MTK_PPE_PKT_TYPE_IPV4_DSLITE)
++		return &entry->ipv6.l2;
++
++	return &entry->ipv4.l2;
++}
++
++static inline u32 *
++mtk_foe_entry_ib2(struct mtk_foe_entry *entry)
++{
++	int type = FIELD_GET(MTK_FOE_IB1_PACKET_TYPE, entry->ib1);
++
++	if (type >= MTK_PPE_PKT_TYPE_IPV4_DSLITE)
++		return &entry->ipv6.ib2;
++
++	return &entry->ipv4.ib2;
++}
++
++int mtk_foe_entry_prepare(struct mtk_foe_entry *entry, int type, int l4proto,
++			  u8 pse_port, u8 *src_mac, u8 *dest_mac)
++{
++	struct mtk_foe_mac_info *l2;
++	u32 ports_pad, val;
++
++	memset(entry, 0, sizeof(*entry));
++
++	val = FIELD_PREP(MTK_FOE_IB1_STATE, MTK_FOE_STATE_BIND) |
++	      FIELD_PREP(MTK_FOE_IB1_PACKET_TYPE, type) |
++	      FIELD_PREP(MTK_FOE_IB1_UDP, l4proto == IPPROTO_UDP) |
++	      MTK_FOE_IB1_BIND_TTL |
++	      MTK_FOE_IB1_BIND_CACHE;
++	entry->ib1 = val;
++
++	val = FIELD_PREP(MTK_FOE_IB2_PORT_MG, 0x3f) |
++	      FIELD_PREP(MTK_FOE_IB2_PORT_AG, 0x1f) |
++	      FIELD_PREP(MTK_FOE_IB2_DEST_PORT, pse_port);
++
++	if (is_multicast_ether_addr(dest_mac))
++		val |= MTK_FOE_IB2_MULTICAST;
++
++	ports_pad = 0xa5a5a500 | (l4proto & 0xff);
++	if (type == MTK_PPE_PKT_TYPE_IPV4_ROUTE)
++		entry->ipv4.orig.ports = ports_pad;
++	if (type == MTK_PPE_PKT_TYPE_IPV6_ROUTE_3T)
++		entry->ipv6.ports = ports_pad;
++
++	if (type >= MTK_PPE_PKT_TYPE_IPV4_DSLITE) {
++		entry->ipv6.ib2 = val;
++		l2 = &entry->ipv6.l2;
++	} else {
++		entry->ipv4.ib2 = val;
++		l2 = &entry->ipv4.l2;
++	}
++
++	l2->dest_mac_hi = get_unaligned_be32(dest_mac);
++	l2->dest_mac_lo = get_unaligned_be16(dest_mac + 4);
++	l2->src_mac_hi = get_unaligned_be32(src_mac);
++	l2->src_mac_lo = get_unaligned_be16(src_mac + 4);
++
++	if (type >= MTK_PPE_PKT_TYPE_IPV6_ROUTE_3T)
++		l2->etype = ETH_P_IPV6;
++	else
++		l2->etype = ETH_P_IP;
++
++	return 0;
++}
++
++int mtk_foe_entry_set_pse_port(struct mtk_foe_entry *entry, u8 port)
++{
++	u32 *ib2 = mtk_foe_entry_ib2(entry);
++	u32 val;
++
++	val = *ib2;
++	val &= ~MTK_FOE_IB2_DEST_PORT;
++	val |= FIELD_PREP(MTK_FOE_IB2_DEST_PORT, port);
++	*ib2 = val;
++
++	return 0;
++}
++
++int mtk_foe_entry_set_ipv4_tuple(struct mtk_foe_entry *entry, bool egress,
++				 __be32 src_addr, __be16 src_port,
++				 __be32 dest_addr, __be16 dest_port)
++{
++	int type = FIELD_GET(MTK_FOE_IB1_PACKET_TYPE, entry->ib1);
++	struct mtk_ipv4_tuple *t;
++
++	switch (type) {
++	case MTK_PPE_PKT_TYPE_IPV4_HNAPT:
++		if (egress) {
++			t = &entry->ipv4.new;
++			break;
++		}
++		fallthrough;
++	case MTK_PPE_PKT_TYPE_IPV4_DSLITE:
++	case MTK_PPE_PKT_TYPE_IPV4_ROUTE:
++		t = &entry->ipv4.orig;
++		break;
++	case MTK_PPE_PKT_TYPE_IPV6_6RD:
++		entry->ipv6_6rd.tunnel_src_ip = be32_to_cpu(src_addr);
++		entry->ipv6_6rd.tunnel_dest_ip = be32_to_cpu(dest_addr);
++		return 0;
++	default:
++		WARN_ON_ONCE(1);
++		return -EINVAL;
++	}
++
++	t->src_ip = be32_to_cpu(src_addr);
++	t->dest_ip = be32_to_cpu(dest_addr);
++
++	if (type == MTK_PPE_PKT_TYPE_IPV4_ROUTE)
++		return 0;
++
++	t->src_port = be16_to_cpu(src_port);
++	t->dest_port = be16_to_cpu(dest_port);
++
++	return 0;
++}
++
++int mtk_foe_entry_set_ipv6_tuple(struct mtk_foe_entry *entry,
++				 __be32 *src_addr, __be16 src_port,
++				 __be32 *dest_addr, __be16 dest_port)
++{
++	int type = FIELD_GET(MTK_FOE_IB1_PACKET_TYPE, entry->ib1);
++	u32 *src, *dest;
++	int i;
++
++	switch (type) {
++	case MTK_PPE_PKT_TYPE_IPV4_DSLITE:
++		src = entry->dslite.tunnel_src_ip;
++		dest = entry->dslite.tunnel_dest_ip;
++		break;
++	case MTK_PPE_PKT_TYPE_IPV6_ROUTE_5T:
++	case MTK_PPE_PKT_TYPE_IPV6_6RD:
++		entry->ipv6.src_port = be16_to_cpu(src_port);
++		entry->ipv6.dest_port = be16_to_cpu(dest_port);
++		fallthrough;
++	case MTK_PPE_PKT_TYPE_IPV6_ROUTE_3T:
++		src = entry->ipv6.src_ip;
++		dest = entry->ipv6.dest_ip;
++		break;
++	default:
++		WARN_ON_ONCE(1);
++		return -EINVAL;
++	};
++
++	for (i = 0; i < 4; i++)
++		src[i] = be32_to_cpu(src_addr[i]);
++	for (i = 0; i < 4; i++)
++		dest[i] = be32_to_cpu(dest_addr[i]);
++
++	return 0;
++}
++
++int mtk_foe_entry_set_dsa(struct mtk_foe_entry *entry, int port)
++{
++	struct mtk_foe_mac_info *l2 = mtk_foe_entry_l2(entry);
++
++	l2->etype = BIT(port);
++
++	if (!(entry->ib1 & MTK_FOE_IB1_BIND_VLAN_LAYER))
++		entry->ib1 |= FIELD_PREP(MTK_FOE_IB1_BIND_VLAN_LAYER, 1);
++	else
++		l2->etype |= BIT(8);
++
++	entry->ib1 &= ~MTK_FOE_IB1_BIND_VLAN_TAG;
++
++	return 0;
++}
++
++int mtk_foe_entry_set_vlan(struct mtk_foe_entry *entry, int vid)
++{
++	struct mtk_foe_mac_info *l2 = mtk_foe_entry_l2(entry);
++
++	switch (FIELD_GET(MTK_FOE_IB1_BIND_VLAN_LAYER, entry->ib1)) {
++	case 0:
++		entry->ib1 |= MTK_FOE_IB1_BIND_VLAN_TAG |
++			      FIELD_PREP(MTK_FOE_IB1_BIND_VLAN_LAYER, 1);
++		l2->vlan1 = vid;
++		return 0;
++	case 1:
++		if (!(entry->ib1 & MTK_FOE_IB1_BIND_VLAN_TAG)) {
++			l2->vlan1 = vid;
++			l2->etype |= BIT(8);
++		} else {
++			l2->vlan2 = vid;
++			entry->ib1 += FIELD_PREP(MTK_FOE_IB1_BIND_VLAN_LAYER, 1);
++		}
++		return 0;
++	default:
++		return -ENOSPC;
++	}
++}
++
++int mtk_foe_entry_set_pppoe(struct mtk_foe_entry *entry, int sid)
++{
++	struct mtk_foe_mac_info *l2 = mtk_foe_entry_l2(entry);
++
++	if (!(entry->ib1 & MTK_FOE_IB1_BIND_VLAN_LAYER) ||
++	    (entry->ib1 & MTK_FOE_IB1_BIND_VLAN_TAG))
++		l2->etype = ETH_P_PPP_SES;
++
++	entry->ib1 |= MTK_FOE_IB1_BIND_PPPOE;
++	l2->pppoe_id = sid;
++
++	return 0;
++}
++
++static inline bool mtk_foe_entry_usable(struct mtk_foe_entry *entry)
++{
++	return !(entry->ib1 & MTK_FOE_IB1_STATIC) &&
++	       FIELD_GET(MTK_FOE_IB1_STATE, entry->ib1) != MTK_FOE_STATE_BIND;
++}
++
++int mtk_foe_entry_commit(struct mtk_ppe *ppe, struct mtk_foe_entry *entry,
++			 u16 timestamp)
++{
++	struct mtk_foe_entry *hwe;
++	u32 hash;
++
++	timestamp &= MTK_FOE_IB1_BIND_TIMESTAMP;
++	entry->ib1 &= ~MTK_FOE_IB1_BIND_TIMESTAMP;
++	entry->ib1 |= FIELD_PREP(MTK_FOE_IB1_BIND_TIMESTAMP, timestamp);
++
++	hash = mtk_ppe_hash_entry(entry);
++	hwe = &ppe->foe_table[hash];
++	if (!mtk_foe_entry_usable(hwe)) {
++		hwe++;
++		hash++;
++
++		if (!mtk_foe_entry_usable(hwe))
++			return -ENOSPC;
++	}
++
++	memcpy(&hwe->data, &entry->data, sizeof(hwe->data));
++	wmb();
++	hwe->ib1 = entry->ib1;
++
++	dma_wmb();
++
++	mtk_ppe_cache_clear(ppe);
++
++	return hash;
++}
++
++int mtk_ppe_init(struct mtk_ppe *ppe, struct device *dev, void __iomem *base,
++		 int version)
++{
++	struct mtk_foe_entry *foe;
++
++	/* need to allocate a separate device, since the PPE DMA access is
++	 * not coherent.
++	 */
++	ppe->base = base;
++	ppe->dev = dev;
++	ppe->version = version;
++
++	foe = dmam_alloc_coherent(ppe->dev, MTK_PPE_ENTRIES * sizeof(*foe),
++				  &ppe->foe_phys, GFP_KERNEL);
++	if (!foe)
++		return -ENOMEM;
++
++	ppe->foe_table = foe;
++
++	mtk_ppe_debugfs_init(ppe);
++
++	return 0;
++}
++
++static void mtk_ppe_init_foe_table(struct mtk_ppe *ppe)
++{
++	static const u8 skip[] = { 12, 25, 38, 51, 76, 89, 102 };
++	int i, k;
++
++	memset(ppe->foe_table, 0, MTK_PPE_ENTRIES * sizeof(*ppe->foe_table));
++
++	if (!IS_ENABLED(CONFIG_SOC_MT7621))
++		return;
++
++	/* skip all entries that cross the 1024 byte boundary */
++	for (i = 0; i < MTK_PPE_ENTRIES; i += 128)
++		for (k = 0; k < ARRAY_SIZE(skip); k++)
++			ppe->foe_table[i + skip[k]].ib1 |= MTK_FOE_IB1_STATIC;
++}
++
++int mtk_ppe_start(struct mtk_ppe *ppe)
++{
++	u32 val;
++
++	mtk_ppe_init_foe_table(ppe);
++	ppe_w32(ppe, MTK_PPE_TB_BASE, ppe->foe_phys);
++
++	val = MTK_PPE_TB_CFG_ENTRY_80B |
++	      MTK_PPE_TB_CFG_AGE_NON_L4 |
++	      MTK_PPE_TB_CFG_AGE_UNBIND |
++	      MTK_PPE_TB_CFG_AGE_TCP |
++	      MTK_PPE_TB_CFG_AGE_UDP |
++	      MTK_PPE_TB_CFG_AGE_TCP_FIN |
++	      FIELD_PREP(MTK_PPE_TB_CFG_SEARCH_MISS,
++			 MTK_PPE_SEARCH_MISS_ACTION_FORWARD_BUILD) |
++	      FIELD_PREP(MTK_PPE_TB_CFG_KEEPALIVE,
++			 MTK_PPE_KEEPALIVE_DISABLE) |
++	      FIELD_PREP(MTK_PPE_TB_CFG_HASH_MODE, 1) |
++	      FIELD_PREP(MTK_PPE_TB_CFG_SCAN_MODE,
++			 MTK_PPE_SCAN_MODE_KEEPALIVE_AGE) |
++	      FIELD_PREP(MTK_PPE_TB_CFG_ENTRY_NUM,
++			 MTK_PPE_ENTRIES_SHIFT);
++	ppe_w32(ppe, MTK_PPE_TB_CFG, val);
++
++	ppe_w32(ppe, MTK_PPE_IP_PROTO_CHK,
++		MTK_PPE_IP_PROTO_CHK_IPV4 | MTK_PPE_IP_PROTO_CHK_IPV6);
++
++	mtk_ppe_cache_enable(ppe, true);
++
++	val = MTK_PPE_FLOW_CFG_IP4_TCP_FRAG |
++	      MTK_PPE_FLOW_CFG_IP4_UDP_FRAG |
++	      MTK_PPE_FLOW_CFG_IP6_3T_ROUTE |
++	      MTK_PPE_FLOW_CFG_IP6_5T_ROUTE |
++	      MTK_PPE_FLOW_CFG_IP6_6RD |
++	      MTK_PPE_FLOW_CFG_IP4_NAT |
++	      MTK_PPE_FLOW_CFG_IP4_NAPT |
++	      MTK_PPE_FLOW_CFG_IP4_DSLITE |
++	      MTK_PPE_FLOW_CFG_L2_BRIDGE |
++	      MTK_PPE_FLOW_CFG_IP4_NAT_FRAG;
++	ppe_w32(ppe, MTK_PPE_FLOW_CFG, val);
++
++	val = FIELD_PREP(MTK_PPE_UNBIND_AGE_MIN_PACKETS, 1000) |
++	      FIELD_PREP(MTK_PPE_UNBIND_AGE_DELTA, 3);
++	ppe_w32(ppe, MTK_PPE_UNBIND_AGE, val);
++
++	val = FIELD_PREP(MTK_PPE_BIND_AGE0_DELTA_UDP, 12) |
++	      FIELD_PREP(MTK_PPE_BIND_AGE0_DELTA_NON_L4, 1);
++	ppe_w32(ppe, MTK_PPE_BIND_AGE0, val);
++
++	val = FIELD_PREP(MTK_PPE_BIND_AGE1_DELTA_TCP_FIN, 1) |
++	      FIELD_PREP(MTK_PPE_BIND_AGE1_DELTA_TCP, 7);
++	ppe_w32(ppe, MTK_PPE_BIND_AGE1, val);
++
++	val = MTK_PPE_BIND_LIMIT0_QUARTER | MTK_PPE_BIND_LIMIT0_HALF;
++	ppe_w32(ppe, MTK_PPE_BIND_LIMIT0, val);
++
++	val = MTK_PPE_BIND_LIMIT1_FULL |
++	      FIELD_PREP(MTK_PPE_BIND_LIMIT1_NON_L4, 1);
++	ppe_w32(ppe, MTK_PPE_BIND_LIMIT1, val);
++
++	val = FIELD_PREP(MTK_PPE_BIND_RATE_BIND, 30) |
++	      FIELD_PREP(MTK_PPE_BIND_RATE_PREBIND, 1);
++	ppe_w32(ppe, MTK_PPE_BIND_RATE, val);
++
++	/* enable PPE */
++	val = MTK_PPE_GLO_CFG_EN |
++	      MTK_PPE_GLO_CFG_IP4_L4_CS_DROP |
++	      MTK_PPE_GLO_CFG_IP4_CS_DROP |
++	      MTK_PPE_GLO_CFG_FLOW_DROP_UPDATE;
++	ppe_w32(ppe, MTK_PPE_GLO_CFG, val);
++
++	ppe_w32(ppe, MTK_PPE_DEFAULT_CPU_PORT, 0);
++
++	return 0;
++}
++
++int mtk_ppe_stop(struct mtk_ppe *ppe)
++{
++	u32 val;
++	int i;
++
++	for (i = 0; i < MTK_PPE_ENTRIES; i++)
++		ppe->foe_table[i].ib1 = FIELD_PREP(MTK_FOE_IB1_STATE,
++						   MTK_FOE_STATE_INVALID);
++
++	mtk_ppe_cache_enable(ppe, false);
++
++	/* disable offload engine */
++	ppe_clear(ppe, MTK_PPE_GLO_CFG, MTK_PPE_GLO_CFG_EN);
++	ppe_w32(ppe, MTK_PPE_FLOW_CFG, 0);
++
++	/* disable aging */
++	val = MTK_PPE_TB_CFG_AGE_NON_L4 |
++	      MTK_PPE_TB_CFG_AGE_UNBIND |
++	      MTK_PPE_TB_CFG_AGE_TCP |
++	      MTK_PPE_TB_CFG_AGE_UDP |
++	      MTK_PPE_TB_CFG_AGE_TCP_FIN;
++	ppe_clear(ppe, MTK_PPE_TB_CFG, val);
++
++	return mtk_ppe_wait_busy(ppe);
++}
+--- /dev/null
++++ b/drivers/net/ethernet/mediatek/mtk_ppe.h
+@@ -0,0 +1,287 @@
++// SPDX-License-Identifier: GPL-2.0-only
++/* Copyright (C) 2020 Felix Fietkau <[email protected]> */
++
++#ifndef __MTK_PPE_H
++#define __MTK_PPE_H
++
++#include <linux/kernel.h>
++#include <linux/bitfield.h>
++
++#define MTK_ETH_PPE_BASE		0xc00
++
++#define MTK_PPE_ENTRIES_SHIFT		3
++#define MTK_PPE_ENTRIES			(1024 << MTK_PPE_ENTRIES_SHIFT)
++#define MTK_PPE_HASH_MASK		(MTK_PPE_ENTRIES - 1)
++
++#define MTK_FOE_IB1_UNBIND_TIMESTAMP	GENMASK(7, 0)
++#define MTK_FOE_IB1_UNBIND_PACKETS	GENMASK(23, 8)
++#define MTK_FOE_IB1_UNBIND_PREBIND	BIT(24)
++
++#define MTK_FOE_IB1_BIND_TIMESTAMP	GENMASK(14, 0)
++#define MTK_FOE_IB1_BIND_KEEPALIVE	BIT(15)
++#define MTK_FOE_IB1_BIND_VLAN_LAYER	GENMASK(18, 16)
++#define MTK_FOE_IB1_BIND_PPPOE		BIT(19)
++#define MTK_FOE_IB1_BIND_VLAN_TAG	BIT(20)
++#define MTK_FOE_IB1_BIND_PKT_SAMPLE	BIT(21)
++#define MTK_FOE_IB1_BIND_CACHE		BIT(22)
++#define MTK_FOE_IB1_BIND_TUNNEL_DECAP	BIT(23)
++#define MTK_FOE_IB1_BIND_TTL		BIT(24)
++
++#define MTK_FOE_IB1_PACKET_TYPE		GENMASK(27, 25)
++#define MTK_FOE_IB1_STATE		GENMASK(29, 28)
++#define MTK_FOE_IB1_UDP			BIT(30)
++#define MTK_FOE_IB1_STATIC		BIT(31)
++
++enum {
++	MTK_PPE_PKT_TYPE_IPV4_HNAPT = 0,
++	MTK_PPE_PKT_TYPE_IPV4_ROUTE = 1,
++	MTK_PPE_PKT_TYPE_BRIDGE = 2,
++	MTK_PPE_PKT_TYPE_IPV4_DSLITE = 3,
++	MTK_PPE_PKT_TYPE_IPV6_ROUTE_3T = 4,
++	MTK_PPE_PKT_TYPE_IPV6_ROUTE_5T = 5,
++	MTK_PPE_PKT_TYPE_IPV6_6RD = 7,
++};
++
++#define MTK_FOE_IB2_QID			GENMASK(3, 0)
++#define MTK_FOE_IB2_PSE_QOS		BIT(4)
++#define MTK_FOE_IB2_DEST_PORT		GENMASK(7, 5)
++#define MTK_FOE_IB2_MULTICAST		BIT(8)
++
++#define MTK_FOE_IB2_WHNAT_QID2		GENMASK(13, 12)
++#define MTK_FOE_IB2_WHNAT_DEVIDX	BIT(16)
++#define MTK_FOE_IB2_WHNAT_NAT		BIT(17)
++
++#define MTK_FOE_IB2_PORT_MG		GENMASK(17, 12)
++
++#define MTK_FOE_IB2_PORT_AG		GENMASK(23, 18)
++
++#define MTK_FOE_IB2_DSCP		GENMASK(31, 24)
++
++#define MTK_FOE_VLAN2_WHNAT_BSS		GENMASK(5, 0)
++#define MTK_FOE_VLAN2_WHNAT_WCID	GENMASK(13, 6)
++#define MTK_FOE_VLAN2_WHNAT_RING	GENMASK(15, 14)
++
++enum {
++	MTK_FOE_STATE_INVALID,
++	MTK_FOE_STATE_UNBIND,
++	MTK_FOE_STATE_BIND,
++	MTK_FOE_STATE_FIN
++};
++
++struct mtk_foe_mac_info {
++	u16 vlan1;
++	u16 etype;
++
++	u32 dest_mac_hi;
++
++	u16 vlan2;
++	u16 dest_mac_lo;
++
++	u32 src_mac_hi;
++
++	u16 pppoe_id;
++	u16 src_mac_lo;
++};
++
++struct mtk_foe_bridge {
++	u32 dest_mac_hi;
++
++	u16 src_mac_lo;
++	u16 dest_mac_lo;
++
++	u32 src_mac_hi;
++
++	u32 ib2;
++
++	u32 _rsv[5];
++
++	u32 udf_tsid;
++	struct mtk_foe_mac_info l2;
++};
++
++struct mtk_ipv4_tuple {
++	u32 src_ip;
++	u32 dest_ip;
++	union {
++		struct {
++			u16 dest_port;
++			u16 src_port;
++		};
++		struct {
++			u8 protocol;
++			u8 _pad[3]; /* fill with 0xa5a5a5 */
++		};
++		u32 ports;
++	};
++};
++
++struct mtk_foe_ipv4 {
++	struct mtk_ipv4_tuple orig;
++
++	u32 ib2;
++
++	struct mtk_ipv4_tuple new;
++
++	u16 timestamp;
++	u16 _rsv0[3];
++
++	u32 udf_tsid;
++
++	struct mtk_foe_mac_info l2;
++};
++
++struct mtk_foe_ipv4_dslite {
++	struct mtk_ipv4_tuple ip4;
++
++	u32 tunnel_src_ip[4];
++	u32 tunnel_dest_ip[4];
++
++	u8 flow_label[3];
++	u8 priority;
++
++	u32 udf_tsid;
++
++	u32 ib2;
++
++	struct mtk_foe_mac_info l2;
++};
++
++struct mtk_foe_ipv6 {
++	u32 src_ip[4];
++	u32 dest_ip[4];
++
++	union {
++		struct {
++			u8 protocol;
++			u8 _pad[3]; /* fill with 0xa5a5a5 */
++		}; /* 3-tuple */
++		struct {
++			u16 dest_port;
++			u16 src_port;
++		}; /* 5-tuple */
++		u32 ports;
++	};
++
++	u32 _rsv[3];
++
++	u32 udf;
++
++	u32 ib2;
++	struct mtk_foe_mac_info l2;
++};
++
++struct mtk_foe_ipv6_6rd {
++	u32 src_ip[4];
++	u32 dest_ip[4];
++	u16 dest_port;
++	u16 src_port;
++
++	u32 tunnel_src_ip;
++	u32 tunnel_dest_ip;
++
++	u16 hdr_csum;
++	u8 dscp;
++	u8 ttl;
++
++	u8 flag;
++	u8 pad;
++	u8 per_flow_6rd_id;
++	u8 pad2;
++
++	u32 ib2;
++	struct mtk_foe_mac_info l2;
++};
++
++struct mtk_foe_entry {
++	u32 ib1;
++
++	union {
++		struct mtk_foe_bridge bridge;
++		struct mtk_foe_ipv4 ipv4;
++		struct mtk_foe_ipv4_dslite dslite;
++		struct mtk_foe_ipv6 ipv6;
++		struct mtk_foe_ipv6_6rd ipv6_6rd;
++		u32 data[19];
++	};
++};
++
++enum {
++	MTK_PPE_CPU_REASON_TTL_EXCEEDED			= 0x02,
++	MTK_PPE_CPU_REASON_OPTION_HEADER		= 0x03,
++	MTK_PPE_CPU_REASON_NO_FLOW			= 0x07,
++	MTK_PPE_CPU_REASON_IPV4_FRAG			= 0x08,
++	MTK_PPE_CPU_REASON_IPV4_DSLITE_FRAG		= 0x09,
++	MTK_PPE_CPU_REASON_IPV4_DSLITE_NO_TCP_UDP	= 0x0a,
++	MTK_PPE_CPU_REASON_IPV6_6RD_NO_TCP_UDP		= 0x0b,
++	MTK_PPE_CPU_REASON_TCP_FIN_SYN_RST		= 0x0c,
++	MTK_PPE_CPU_REASON_UN_HIT			= 0x0d,
++	MTK_PPE_CPU_REASON_HIT_UNBIND			= 0x0e,
++	MTK_PPE_CPU_REASON_HIT_UNBIND_RATE_REACHED	= 0x0f,
++	MTK_PPE_CPU_REASON_HIT_BIND_TCP_FIN		= 0x10,
++	MTK_PPE_CPU_REASON_HIT_TTL_1			= 0x11,
++	MTK_PPE_CPU_REASON_HIT_BIND_VLAN_VIOLATION	= 0x12,
++	MTK_PPE_CPU_REASON_KEEPALIVE_UC_OLD_HDR		= 0x13,
++	MTK_PPE_CPU_REASON_KEEPALIVE_MC_NEW_HDR		= 0x14,
++	MTK_PPE_CPU_REASON_KEEPALIVE_DUP_OLD_HDR	= 0x15,
++	MTK_PPE_CPU_REASON_HIT_BIND_FORCE_CPU		= 0x16,
++	MTK_PPE_CPU_REASON_TUNNEL_OPTION_HEADER		= 0x17,
++	MTK_PPE_CPU_REASON_MULTICAST_TO_CPU		= 0x18,
++	MTK_PPE_CPU_REASON_MULTICAST_TO_GMAC1_CPU	= 0x19,
++	MTK_PPE_CPU_REASON_HIT_PRE_BIND			= 0x1a,
++	MTK_PPE_CPU_REASON_PACKET_SAMPLING		= 0x1b,
++	MTK_PPE_CPU_REASON_EXCEED_MTU			= 0x1c,
++	MTK_PPE_CPU_REASON_PPE_BYPASS			= 0x1e,
++	MTK_PPE_CPU_REASON_INVALID			= 0x1f,
++};
++
++struct mtk_ppe {
++	struct device *dev;
++	void __iomem *base;
++	int version;
++
++	struct mtk_foe_entry *foe_table;
++	dma_addr_t foe_phys;
++
++	void *acct_table;
++};
++
++int mtk_ppe_init(struct mtk_ppe *ppe, struct device *dev, void __iomem *base,
++		 int version);
++int mtk_ppe_start(struct mtk_ppe *ppe);
++int mtk_ppe_stop(struct mtk_ppe *ppe);
++
++static inline void
++mtk_foe_entry_clear(struct mtk_ppe *ppe, u16 hash)
++{
++	ppe->foe_table[hash].ib1 = 0;
++	dma_wmb();
++}
++
++static inline int
++mtk_foe_entry_timestamp(struct mtk_ppe *ppe, u16 hash)
++{
++	u32 ib1 = READ_ONCE(ppe->foe_table[hash].ib1);
++
++	if (FIELD_GET(MTK_FOE_IB1_STATE, ib1) != MTK_FOE_STATE_BIND)
++		return -1;
++
++	return FIELD_GET(MTK_FOE_IB1_BIND_TIMESTAMP, ib1);
++}
++
++int mtk_foe_entry_prepare(struct mtk_foe_entry *entry, int type, int l4proto,
++			  u8 pse_port, u8 *src_mac, u8 *dest_mac);
++int mtk_foe_entry_set_pse_port(struct mtk_foe_entry *entry, u8 port);
++int mtk_foe_entry_set_ipv4_tuple(struct mtk_foe_entry *entry, bool orig,
++				 __be32 src_addr, __be16 src_port,
++				 __be32 dest_addr, __be16 dest_port);
++int mtk_foe_entry_set_ipv6_tuple(struct mtk_foe_entry *entry,
++				 __be32 *src_addr, __be16 src_port,
++				 __be32 *dest_addr, __be16 dest_port);
++int mtk_foe_entry_set_dsa(struct mtk_foe_entry *entry, int port);
++int mtk_foe_entry_set_vlan(struct mtk_foe_entry *entry, int vid);
++int mtk_foe_entry_set_pppoe(struct mtk_foe_entry *entry, int sid);
++int mtk_foe_entry_commit(struct mtk_ppe *ppe, struct mtk_foe_entry *entry,
++			 u16 timestamp);
++int mtk_ppe_debugfs_init(struct mtk_ppe *ppe);
++
++#endif
+--- /dev/null
++++ b/drivers/net/ethernet/mediatek/mtk_ppe_debugfs.c
+@@ -0,0 +1,217 @@
++// SPDX-License-Identifier: GPL-2.0-only
++/* Copyright (C) 2020 Felix Fietkau <[email protected]> */
++
++#include <linux/kernel.h>
++#include <linux/debugfs.h>
++#include "mtk_eth_soc.h"
++
++struct mtk_flow_addr_info
++{
++	void *src, *dest;
++	u16 *src_port, *dest_port;
++	bool ipv6;
++};
++
++static const char *mtk_foe_entry_state_str(int state)
++{
++	static const char * const state_str[] = {
++		[MTK_FOE_STATE_INVALID] = "INV",
++		[MTK_FOE_STATE_UNBIND] = "UNB",
++		[MTK_FOE_STATE_BIND] = "BND",
++		[MTK_FOE_STATE_FIN] = "FIN",
++	};
++
++	if (state >= ARRAY_SIZE(state_str) || !state_str[state])
++		return "UNK";
++
++	return state_str[state];
++}
++
++static const char *mtk_foe_pkt_type_str(int type)
++{
++	static const char * const type_str[] = {
++		[MTK_PPE_PKT_TYPE_IPV4_HNAPT] = "IPv4 5T",
++		[MTK_PPE_PKT_TYPE_IPV4_ROUTE] = "IPv4 3T",
++		[MTK_PPE_PKT_TYPE_BRIDGE] = "L2",
++		[MTK_PPE_PKT_TYPE_IPV4_DSLITE] = "DS-LITE",
++		[MTK_PPE_PKT_TYPE_IPV6_ROUTE_3T] = "IPv6 3T",
++		[MTK_PPE_PKT_TYPE_IPV6_ROUTE_5T] = "IPv6 5T",
++		[MTK_PPE_PKT_TYPE_IPV6_6RD] = "6RD",
++	};
++
++	if (type >= ARRAY_SIZE(type_str) || !type_str[type])
++		return "UNKNOWN";
++
++	return type_str[type];
++}
++
++static void
++mtk_print_addr(struct seq_file *m, u32 *addr, bool ipv6)
++{
++	u32 n_addr[4];
++	int i;
++
++	if (!ipv6) {
++		seq_printf(m, "%pI4h", addr);
++		return;
++	}
++
++	for (i = 0; i < ARRAY_SIZE(n_addr); i++)
++		n_addr[i] = htonl(addr[i]);
++	seq_printf(m, "%pI6", n_addr);
++}
++
++static void
++mtk_print_addr_info(struct seq_file *m, struct mtk_flow_addr_info *ai)
++{
++	mtk_print_addr(m, ai->src, ai->ipv6);
++	if (ai->src_port)
++		seq_printf(m, ":%d", *ai->src_port);
++	seq_printf(m, "->");
++	mtk_print_addr(m, ai->dest, ai->ipv6);
++	if (ai->dest_port)
++		seq_printf(m, ":%d", *ai->dest_port);
++}
++
++static int
++mtk_ppe_debugfs_foe_show(struct seq_file *m, void *private, bool bind)
++{
++	struct mtk_ppe *ppe = m->private;
++	int i, count;
++
++	for (i = 0, count = 0; i < MTK_PPE_ENTRIES; i++) {
++		struct mtk_foe_entry *entry = &ppe->foe_table[i];
++		struct mtk_foe_mac_info *l2;
++		struct mtk_flow_addr_info ai = {};
++		unsigned char h_source[ETH_ALEN];
++		unsigned char h_dest[ETH_ALEN];
++		int type, state;
++		u32 ib2;
++
++
++		state = FIELD_GET(MTK_FOE_IB1_STATE, entry->ib1);
++		if (!state)
++			continue;
++
++		if (bind && state != MTK_FOE_STATE_BIND)
++			continue;
++
++		type = FIELD_GET(MTK_FOE_IB1_PACKET_TYPE, entry->ib1);
++		seq_printf(m, "%05x %s %7s", i,
++			   mtk_foe_entry_state_str(state),
++			   mtk_foe_pkt_type_str(type));
++
++		switch (type) {
++		case MTK_PPE_PKT_TYPE_IPV4_HNAPT:
++		case MTK_PPE_PKT_TYPE_IPV4_DSLITE:
++			ai.src_port = &entry->ipv4.orig.src_port;
++			ai.dest_port = &entry->ipv4.orig.dest_port;
++			fallthrough;
++		case MTK_PPE_PKT_TYPE_IPV4_ROUTE:
++			ai.src = &entry->ipv4.orig.src_ip;
++			ai.dest = &entry->ipv4.orig.dest_ip;
++			break;
++		case MTK_PPE_PKT_TYPE_IPV6_ROUTE_5T:
++			ai.src_port = &entry->ipv6.src_port;
++			ai.dest_port = &entry->ipv6.dest_port;
++			fallthrough;
++		case MTK_PPE_PKT_TYPE_IPV6_ROUTE_3T:
++		case MTK_PPE_PKT_TYPE_IPV6_6RD:
++			ai.src = &entry->ipv6.src_ip;
++			ai.dest = &entry->ipv6.dest_ip;
++			ai.ipv6 = true;
++			break;
++		}
++
++		seq_printf(m, " orig=");
++		mtk_print_addr_info(m, &ai);
++
++		switch (type) {
++		case MTK_PPE_PKT_TYPE_IPV4_HNAPT:
++		case MTK_PPE_PKT_TYPE_IPV4_DSLITE:
++			ai.src_port = &entry->ipv4.new.src_port;
++			ai.dest_port = &entry->ipv4.new.dest_port;
++			fallthrough;
++		case MTK_PPE_PKT_TYPE_IPV4_ROUTE:
++			ai.src = &entry->ipv4.new.src_ip;
++			ai.dest = &entry->ipv4.new.dest_ip;
++			seq_printf(m, " new=");
++			mtk_print_addr_info(m, &ai);
++			break;
++		}
++
++		if (type >= MTK_PPE_PKT_TYPE_IPV4_DSLITE) {
++			l2 = &entry->ipv6.l2;
++			ib2 = entry->ipv6.ib2;
++		} else {
++			l2 = &entry->ipv4.l2;
++			ib2 = entry->ipv4.ib2;
++		}
++
++		*((__be32 *)h_source) = htonl(l2->src_mac_hi);
++		*((__be16 *)&h_source[4]) = htons(l2->src_mac_lo);
++		*((__be32 *)h_dest) = htonl(l2->dest_mac_hi);
++		*((__be16 *)&h_dest[4]) = htons(l2->dest_mac_lo);
++
++		seq_printf(m, " eth=%pM->%pM etype=%04x"
++			      " vlan=%d,%d ib1=%08x ib2=%08x\n",
++			   h_source, h_dest, ntohs(l2->etype),
++			   l2->vlan1, l2->vlan2, entry->ib1, ib2);
++	}
++
++	return 0;
++}
++
++static int
++mtk_ppe_debugfs_foe_show_all(struct seq_file *m, void *private)
++{
++	return mtk_ppe_debugfs_foe_show(m, private, false);
++}
++
++static int
++mtk_ppe_debugfs_foe_show_bind(struct seq_file *m, void *private)
++{
++	return mtk_ppe_debugfs_foe_show(m, private, true);
++}
++
++static int
++mtk_ppe_debugfs_foe_open_all(struct inode *inode, struct file *file)
++{
++	return single_open(file, mtk_ppe_debugfs_foe_show_all,
++			   inode->i_private);
++}
++
++static int
++mtk_ppe_debugfs_foe_open_bind(struct inode *inode, struct file *file)
++{
++	return single_open(file, mtk_ppe_debugfs_foe_show_bind,
++			   inode->i_private);
++}
++
++int mtk_ppe_debugfs_init(struct mtk_ppe *ppe)
++{
++	static const struct file_operations fops_all = {
++		.open = mtk_ppe_debugfs_foe_open_all,
++		.read = seq_read,
++		.llseek = seq_lseek,
++		.release = single_release,
++	};
++
++	static const struct file_operations fops_bind = {
++		.open = mtk_ppe_debugfs_foe_open_bind,
++		.read = seq_read,
++		.llseek = seq_lseek,
++		.release = single_release,
++	};
++
++	struct dentry *root;
++
++	root = debugfs_create_dir("mtk_ppe", NULL);
++	if (!root)
++		return -ENOMEM;
++
++	debugfs_create_file("entries", S_IRUGO, root, ppe, &fops_all);
++	debugfs_create_file("bind", S_IRUGO, root, ppe, &fops_bind);
++
++	return 0;
++}
+--- /dev/null
++++ b/drivers/net/ethernet/mediatek/mtk_ppe_regs.h
+@@ -0,0 +1,144 @@
++// SPDX-License-Identifier: GPL-2.0-only
++/* Copyright (C) 2020 Felix Fietkau <[email protected]> */
++
++#ifndef __MTK_PPE_REGS_H
++#define __MTK_PPE_REGS_H
++
++#define MTK_PPE_GLO_CFG				0x200
++#define MTK_PPE_GLO_CFG_EN			BIT(0)
++#define MTK_PPE_GLO_CFG_TSID_EN			BIT(1)
++#define MTK_PPE_GLO_CFG_IP4_L4_CS_DROP		BIT(2)
++#define MTK_PPE_GLO_CFG_IP4_CS_DROP		BIT(3)
++#define MTK_PPE_GLO_CFG_TTL0_DROP		BIT(4)
++#define MTK_PPE_GLO_CFG_PPE_BSWAP		BIT(5)
++#define MTK_PPE_GLO_CFG_PSE_HASH_OFS		BIT(6)
++#define MTK_PPE_GLO_CFG_MCAST_TB_EN		BIT(7)
++#define MTK_PPE_GLO_CFG_FLOW_DROP_KA		BIT(8)
++#define MTK_PPE_GLO_CFG_FLOW_DROP_UPDATE	BIT(9)
++#define MTK_PPE_GLO_CFG_UDP_LITE_EN		BIT(10)
++#define MTK_PPE_GLO_CFG_UDP_LEN_DROP		BIT(11)
++#define MTK_PPE_GLO_CFG_MCAST_ENTRIES		GENMASK(13, 12)
++#define MTK_PPE_GLO_CFG_BUSY			BIT(31)
++
++#define MTK_PPE_FLOW_CFG			0x204
++#define MTK_PPE_FLOW_CFG_IP4_TCP_FRAG		BIT(6)
++#define MTK_PPE_FLOW_CFG_IP4_UDP_FRAG		BIT(7)
++#define MTK_PPE_FLOW_CFG_IP6_3T_ROUTE		BIT(8)
++#define MTK_PPE_FLOW_CFG_IP6_5T_ROUTE		BIT(9)
++#define MTK_PPE_FLOW_CFG_IP6_6RD		BIT(10)
++#define MTK_PPE_FLOW_CFG_IP4_NAT		BIT(12)
++#define MTK_PPE_FLOW_CFG_IP4_NAPT		BIT(13)
++#define MTK_PPE_FLOW_CFG_IP4_DSLITE		BIT(14)
++#define MTK_PPE_FLOW_CFG_L2_BRIDGE		BIT(15)
++#define MTK_PPE_FLOW_CFG_IP_PROTO_BLACKLIST	BIT(16)
++#define MTK_PPE_FLOW_CFG_IP4_NAT_FRAG		BIT(17)
++#define MTK_PPE_FLOW_CFG_IP4_HASH_FLOW_LABEL	BIT(18)
++#define MTK_PPE_FLOW_CFG_IP4_HASH_GRE_KEY	BIT(19)
++#define MTK_PPE_FLOW_CFG_IP6_HASH_GRE_KEY	BIT(20)
++
++#define MTK_PPE_IP_PROTO_CHK			0x208
++#define MTK_PPE_IP_PROTO_CHK_IPV4		GENMASK(15, 0)
++#define MTK_PPE_IP_PROTO_CHK_IPV6		GENMASK(31, 16)
++
++#define MTK_PPE_TB_CFG				0x21c
++#define MTK_PPE_TB_CFG_ENTRY_NUM		GENMASK(2, 0)
++#define MTK_PPE_TB_CFG_ENTRY_80B		BIT(3)
++#define MTK_PPE_TB_CFG_SEARCH_MISS		GENMASK(5, 4)
++#define MTK_PPE_TB_CFG_AGE_PREBIND		BIT(6)
++#define MTK_PPE_TB_CFG_AGE_NON_L4		BIT(7)
++#define MTK_PPE_TB_CFG_AGE_UNBIND		BIT(8)
++#define MTK_PPE_TB_CFG_AGE_TCP			BIT(9)
++#define MTK_PPE_TB_CFG_AGE_UDP			BIT(10)
++#define MTK_PPE_TB_CFG_AGE_TCP_FIN		BIT(11)
++#define MTK_PPE_TB_CFG_KEEPALIVE		GENMASK(13, 12)
++#define MTK_PPE_TB_CFG_HASH_MODE		GENMASK(15, 14)
++#define MTK_PPE_TB_CFG_SCAN_MODE		GENMASK(17, 16)
++#define MTK_PPE_TB_CFG_HASH_DEBUG		GENMASK(19, 18)
++
++enum {
++	MTK_PPE_SCAN_MODE_DISABLED,
++	MTK_PPE_SCAN_MODE_CHECK_AGE,
++	MTK_PPE_SCAN_MODE_KEEPALIVE_AGE,
++};
++
++enum {
++	MTK_PPE_KEEPALIVE_DISABLE,
++	MTK_PPE_KEEPALIVE_UNICAST_CPU,
++	MTK_PPE_KEEPALIVE_DUP_CPU = 3,
++};
++
++enum {
++	MTK_PPE_SEARCH_MISS_ACTION_DROP,
++	MTK_PPE_SEARCH_MISS_ACTION_FORWARD = 2,
++	MTK_PPE_SEARCH_MISS_ACTION_FORWARD_BUILD = 3,
++};
++
++#define MTK_PPE_TB_BASE				0x220
++
++#define MTK_PPE_TB_USED				0x224
++#define MTK_PPE_TB_USED_NUM			GENMASK(13, 0)
++
++#define MTK_PPE_BIND_RATE			0x228
++#define MTK_PPE_BIND_RATE_BIND			GENMASK(15, 0)
++#define MTK_PPE_BIND_RATE_PREBIND		GENMASK(31, 16)
++
++#define MTK_PPE_BIND_LIMIT0			0x22c
++#define MTK_PPE_BIND_LIMIT0_QUARTER		GENMASK(13, 0)
++#define MTK_PPE_BIND_LIMIT0_HALF		GENMASK(29, 16)
++
++#define MTK_PPE_BIND_LIMIT1			0x230
++#define MTK_PPE_BIND_LIMIT1_FULL		GENMASK(13, 0)
++#define MTK_PPE_BIND_LIMIT1_NON_L4		GENMASK(23, 16)
++
++#define MTK_PPE_KEEPALIVE			0x234
++#define MTK_PPE_KEEPALIVE_TIME			GENMASK(15, 0)
++#define MTK_PPE_KEEPALIVE_TIME_TCP		GENMASK(23, 16)
++#define MTK_PPE_KEEPALIVE_TIME_UDP		GENMASK(31, 24)
++
++#define MTK_PPE_UNBIND_AGE			0x238
++#define MTK_PPE_UNBIND_AGE_MIN_PACKETS		GENMASK(31, 16)
++#define MTK_PPE_UNBIND_AGE_DELTA		GENMASK(7, 0)
++
++#define MTK_PPE_BIND_AGE0			0x23c
++#define MTK_PPE_BIND_AGE0_DELTA_NON_L4		GENMASK(30, 16)
++#define MTK_PPE_BIND_AGE0_DELTA_UDP		GENMASK(14, 0)
++
++#define MTK_PPE_BIND_AGE1			0x240
++#define MTK_PPE_BIND_AGE1_DELTA_TCP_FIN		GENMASK(30, 16)
++#define MTK_PPE_BIND_AGE1_DELTA_TCP		GENMASK(14, 0)
++
++#define MTK_PPE_HASH_SEED			0x244
++
++#define MTK_PPE_DEFAULT_CPU_PORT		0x248
++#define MTK_PPE_DEFAULT_CPU_PORT_MASK(_n)	(GENMASK(2, 0) << ((_n) * 4))
++
++#define MTK_PPE_MTU_DROP			0x308
++
++#define MTK_PPE_VLAN_MTU0			0x30c
++#define MTK_PPE_VLAN_MTU0_NONE			GENMASK(13, 0)
++#define MTK_PPE_VLAN_MTU0_1TAG			GENMASK(29, 16)
++
++#define MTK_PPE_VLAN_MTU1			0x310
++#define MTK_PPE_VLAN_MTU1_2TAG			GENMASK(13, 0)
++#define MTK_PPE_VLAN_MTU1_3TAG			GENMASK(29, 16)
++
++#define MTK_PPE_VPM_TPID			0x318
++
++#define MTK_PPE_CACHE_CTL			0x320
++#define MTK_PPE_CACHE_CTL_EN			BIT(0)
++#define MTK_PPE_CACHE_CTL_LOCK_CLR		BIT(4)
++#define MTK_PPE_CACHE_CTL_REQ			BIT(8)
++#define MTK_PPE_CACHE_CTL_CLEAR			BIT(9)
++#define MTK_PPE_CACHE_CTL_CMD			GENMASK(13, 12)
++
++#define MTK_PPE_MIB_CFG				0x334
++#define MTK_PPE_MIB_CFG_EN			BIT(0)
++#define MTK_PPE_MIB_CFG_RD_CLR			BIT(1)
++
++#define MTK_PPE_MIB_TB_BASE			0x338
++
++#define MTK_PPE_MIB_CACHE_CTL			0x350
++#define MTK_PPE_MIB_CACHE_CTL_EN		BIT(0)
++#define MTK_PPE_MIB_CACHE_CTL_FLUSH		BIT(2)
++
++#endif
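
Note (editorial aside, not part of the patch): the table-manipulation helpers introduced above — mtk_foe_entry_prepare(), the tuple/VLAN/PPPoE setters and mtk_foe_entry_commit() — only gain an in-tree caller with the flow-offloading patch that follows. A minimal hypothetical sketch of how one IPv4 HNAPT flow could be bound; the function name, addresses, ports and choice of PSE port are placeholders:

static int example_bind_ipv4_flow(struct mtk_ppe *ppe, u16 timestamp)
{
	u8 src_mac[ETH_ALEN]  = { 0x00, 0x11, 0x22, 0x33, 0x44, 0x55 };
	u8 dest_mac[ETH_ALEN] = { 0x00, 0xaa, 0xbb, 0xcc, 0xdd, 0xee };
	struct mtk_foe_entry foe;
	int hash;

	/* fill IB1/IB2 and the L2 (MAC + ethertype) part of the entry */
	mtk_foe_entry_prepare(&foe, MTK_PPE_PKT_TYPE_IPV4_HNAPT, IPPROTO_TCP,
			      0, src_mac, dest_mac);

	/* tuple as seen on ingress ... */
	mtk_foe_entry_set_ipv4_tuple(&foe, false,
				     htonl(0x0a000002), htons(40000),	/* 10.0.0.2 */
				     htonl(0x08080808), htons(443));	/* 8.8.8.8 */

	/* ... and the translated tuple used on egress (SNAT) */
	mtk_foe_entry_set_ipv4_tuple(&foe, true,
				     htonl(0xc0a80101), htons(40000),	/* 192.168.1.1 */
				     htonl(0x08080808), htons(443));

	/* transmit bound packets through PSE port 1 (first GMAC) */
	mtk_foe_entry_set_pse_port(&foe, 1);

	/* write the entry at its hashed slot; returns the slot index or -ENOSPC */
	hash = mtk_foe_entry_commit(ppe, &foe, timestamp);

	return hash < 0 ? hash : 0;
}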

+ 568 - 0
target/linux/generic/backport-5.15/610-v5.13-33-net-ethernet-mtk_eth_soc-add-flow-offloading-support.patch

@@ -0,0 +1,568 @@
+From: Felix Fietkau <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:54 +0100
+Subject: [PATCH] net: ethernet: mtk_eth_soc: add flow offloading support
+
+This adds support for offloading IPv4 routed flows, including SNAT/DNAT,
+one VLAN, PPPoE and DSA.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+ create mode 100644 drivers/net/ethernet/mediatek/mtk_ppe_offload.c
+
+--- a/drivers/net/ethernet/mediatek/Makefile
++++ b/drivers/net/ethernet/mediatek/Makefile
+@@ -4,5 +4,5 @@
+ #
+ 
+ obj-$(CONFIG_NET_MEDIATEK_SOC) += mtk_eth.o
+-mtk_eth-y := mtk_eth_soc.o mtk_sgmii.o mtk_eth_path.o mtk_ppe.o mtk_ppe_debugfs.o
++mtk_eth-y := mtk_eth_soc.o mtk_sgmii.o mtk_eth_path.o mtk_ppe.o mtk_ppe_debugfs.o mtk_ppe_offload.o
+ obj-$(CONFIG_NET_MEDIATEK_STAR_EMAC) += mtk_star_emac.o
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -2834,6 +2834,7 @@ static const struct net_device_ops mtk_n
+ #ifdef CONFIG_NET_POLL_CONTROLLER
+ 	.ndo_poll_controller	= mtk_poll_controller,
+ #endif
++	.ndo_setup_tc		= mtk_eth_setup_tc,
+ };
+ 
+ static int mtk_add_mac(struct mtk_eth *eth, struct device_node *np)
+@@ -3092,6 +3093,10 @@ static int mtk_probe(struct platform_dev
+ 				   eth->base + MTK_ETH_PPE_BASE, 2);
+ 		if (err)
+ 			goto err_free_dev;
++
++		err = mtk_eth_offload_init(eth);
++		if (err)
++			goto err_free_dev;
+ 	}
+ 
+ 	for (i = 0; i < MTK_MAX_DEVS; i++) {
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.h
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.h
+@@ -15,6 +15,7 @@
+ #include <linux/u64_stats_sync.h>
+ #include <linux/refcount.h>
+ #include <linux/phylink.h>
++#include <linux/rhashtable.h>
+ #include "mtk_ppe.h"
+ 
+ #define MTK_QDMA_PAGE_SIZE	2048
+@@ -40,7 +41,8 @@
+ 				 NETIF_F_HW_VLAN_CTAG_RX | \
+ 				 NETIF_F_SG | NETIF_F_TSO | \
+ 				 NETIF_F_TSO6 | \
+-				 NETIF_F_IPV6_CSUM)
++				 NETIF_F_IPV6_CSUM |\
++				 NETIF_F_HW_TC)
+ #define MTK_HW_FEATURES_MT7628	(NETIF_F_SG | NETIF_F_RXCSUM)
+ #define NEXT_DESP_IDX(X, Y)	(((X) + 1) & ((Y) - 1))
+ 
+@@ -929,6 +931,7 @@ struct mtk_eth {
+ 	int				ip_align;
+ 
+ 	struct mtk_ppe			ppe;
++	struct rhashtable		flow_table;
+ };
+ 
+ /* struct mtk_mac -	the structure that holds the info about the MACs of the
+@@ -973,4 +976,9 @@ int mtk_gmac_sgmii_path_setup(struct mtk
+ int mtk_gmac_gephy_path_setup(struct mtk_eth *eth, int mac_id);
+ int mtk_gmac_rgmii_path_setup(struct mtk_eth *eth, int mac_id);
+ 
++int mtk_eth_offload_init(struct mtk_eth *eth);
++int mtk_eth_setup_tc(struct net_device *dev, enum tc_setup_type type,
++		     void *type_data);
++
++
+ #endif /* MTK_ETH_H */
+--- /dev/null
++++ b/drivers/net/ethernet/mediatek/mtk_ppe_offload.c
+@@ -0,0 +1,485 @@
++// SPDX-License-Identifier: GPL-2.0-only
++/*
++ *  Copyright (C) 2020 Felix Fietkau <[email protected]>
++ */
++
++#include <linux/if_ether.h>
++#include <linux/rhashtable.h>
++#include <linux/if_ether.h>
++#include <linux/ip.h>
++#include <net/flow_offload.h>
++#include <net/pkt_cls.h>
++#include <net/dsa.h>
++#include "mtk_eth_soc.h"
++
++struct mtk_flow_data {
++	struct ethhdr eth;
++
++	union {
++		struct {
++			__be32 src_addr;
++			__be32 dst_addr;
++		} v4;
++	};
++
++	__be16 src_port;
++	__be16 dst_port;
++
++	struct {
++		u16 id;
++		__be16 proto;
++		u8 num;
++	} vlan;
++	struct {
++		u16 sid;
++		u8 num;
++	} pppoe;
++};
++
++struct mtk_flow_entry {
++	struct rhash_head node;
++	unsigned long cookie;
++	u16 hash;
++};
++
++static const struct rhashtable_params mtk_flow_ht_params = {
++	.head_offset = offsetof(struct mtk_flow_entry, node),
++	.head_offset = offsetof(struct mtk_flow_entry, cookie),
++	.key_len = sizeof(unsigned long),
++	.automatic_shrinking = true,
++};
++
++static u32
++mtk_eth_timestamp(struct mtk_eth *eth)
++{
++	return mtk_r32(eth, 0x0010) & MTK_FOE_IB1_BIND_TIMESTAMP;
++}
++
++static int
++mtk_flow_set_ipv4_addr(struct mtk_foe_entry *foe, struct mtk_flow_data *data,
++		       bool egress)
++{
++	return mtk_foe_entry_set_ipv4_tuple(foe, egress,
++					    data->v4.src_addr, data->src_port,
++					    data->v4.dst_addr, data->dst_port);
++}
++
++static void
++mtk_flow_offload_mangle_eth(const struct flow_action_entry *act, void *eth)
++{
++	void *dest = eth + act->mangle.offset;
++	const void *src = &act->mangle.val;
++
++	if (act->mangle.offset > 8)
++		return;
++
++	if (act->mangle.mask == 0xffff) {
++		src += 2;
++		dest += 2;
++	}
++
++	memcpy(dest, src, act->mangle.mask ? 2 : 4);
++}
++
++
++static int
++mtk_flow_mangle_ports(const struct flow_action_entry *act,
++		      struct mtk_flow_data *data)
++{
++	u32 val = ntohl(act->mangle.val);
++
++	switch (act->mangle.offset) {
++	case 0:
++		if (act->mangle.mask == ~htonl(0xffff))
++			data->dst_port = cpu_to_be16(val);
++		else
++			data->src_port = cpu_to_be16(val >> 16);
++		break;
++	case 2:
++		data->dst_port = cpu_to_be16(val);
++		break;
++	default:
++		return -EINVAL;
++	}
++
++	return 0;
++}
++
++static int
++mtk_flow_mangle_ipv4(const struct flow_action_entry *act,
++		     struct mtk_flow_data *data)
++{
++	__be32 *dest;
++
++	switch (act->mangle.offset) {
++	case offsetof(struct iphdr, saddr):
++		dest = &data->v4.src_addr;
++		break;
++	case offsetof(struct iphdr, daddr):
++		dest = &data->v4.dst_addr;
++		break;
++	default:
++		return -EINVAL;
++	}
++
++	memcpy(dest, &act->mangle.val, sizeof(u32));
++
++	return 0;
++}
++
++static int
++mtk_flow_get_dsa_port(struct net_device **dev)
++{
++#if IS_ENABLED(CONFIG_NET_DSA)
++	struct dsa_port *dp;
++
++	dp = dsa_port_from_netdev(*dev);
++	if (IS_ERR(dp))
++		return -ENODEV;
++
++	if (dp->cpu_dp->tag_ops->proto != DSA_TAG_PROTO_MTK)
++		return -ENODEV;
++
++	*dev = dp->cpu_dp->master;
++
++	return dp->index;
++#else
++	return -ENODEV;
++#endif
++}
++
++static int
++mtk_flow_set_output_device(struct mtk_eth *eth, struct mtk_foe_entry *foe,
++			   struct net_device *dev)
++{
++	int pse_port, dsa_port;
++
++	dsa_port = mtk_flow_get_dsa_port(&dev);
++	if (dsa_port >= 0)
++		mtk_foe_entry_set_dsa(foe, dsa_port);
++
++	if (dev == eth->netdev[0])
++		pse_port = 1;
++	else if (dev == eth->netdev[1])
++		pse_port = 2;
++	else
++		return -EOPNOTSUPP;
++
++	mtk_foe_entry_set_pse_port(foe, pse_port);
++
++	return 0;
++}
++
++static int
++mtk_flow_offload_replace(struct mtk_eth *eth, struct flow_cls_offload *f)
++{
++	struct flow_rule *rule = flow_cls_offload_flow_rule(f);
++	struct flow_action_entry *act;
++	struct mtk_flow_data data = {};
++	struct mtk_foe_entry foe;
++	struct net_device *odev = NULL;
++	struct mtk_flow_entry *entry;
++	int offload_type = 0;
++	u16 addr_type = 0;
++	u32 timestamp;
++	u8 l4proto = 0;
++	int err = 0;
++	int hash;
++	int i;
++
++	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_META)) {
++		struct flow_match_meta match;
++
++		flow_rule_match_meta(rule, &match);
++	} else {
++		return -EOPNOTSUPP;
++	}
++
++	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_CONTROL)) {
++		struct flow_match_control match;
++
++		flow_rule_match_control(rule, &match);
++		addr_type = match.key->addr_type;
++	} else {
++		return -EOPNOTSUPP;
++	}
++
++	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_BASIC)) {
++		struct flow_match_basic match;
++
++		flow_rule_match_basic(rule, &match);
++		l4proto = match.key->ip_proto;
++	} else {
++		return -EOPNOTSUPP;
++	}
++
++	flow_action_for_each(i, act, &rule->action) {
++		switch (act->id) {
++		case FLOW_ACTION_MANGLE:
++			if (act->mangle.htype == FLOW_ACT_MANGLE_HDR_TYPE_ETH)
++				mtk_flow_offload_mangle_eth(act, &data.eth);
++			break;
++		case FLOW_ACTION_REDIRECT:
++			odev = act->dev;
++			break;
++		case FLOW_ACTION_CSUM:
++			break;
++		case FLOW_ACTION_VLAN_PUSH:
++			if (data.vlan.num == 1 ||
++			    act->vlan.proto != htons(ETH_P_8021Q))
++				return -EOPNOTSUPP;
++
++			data.vlan.id = act->vlan.vid;
++			data.vlan.proto = act->vlan.proto;
++			data.vlan.num++;
++			break;
++		case FLOW_ACTION_PPPOE_PUSH:
++			if (data.pppoe.num == 1)
++				return -EOPNOTSUPP;
++
++			data.pppoe.sid = act->pppoe.sid;
++			data.pppoe.num++;
++			break;
++		default:
++			return -EOPNOTSUPP;
++		}
++	}
++
++	switch (addr_type) {
++	case FLOW_DISSECTOR_KEY_IPV4_ADDRS:
++		offload_type = MTK_PPE_PKT_TYPE_IPV4_HNAPT;
++		break;
++	default:
++		return -EOPNOTSUPP;
++	}
++
++	if (!is_valid_ether_addr(data.eth.h_source) ||
++	    !is_valid_ether_addr(data.eth.h_dest))
++		return -EINVAL;
++
++	err = mtk_foe_entry_prepare(&foe, offload_type, l4proto, 0,
++				    data.eth.h_source,
++				    data.eth.h_dest);
++	if (err)
++		return err;
++
++	if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_PORTS)) {
++		struct flow_match_ports ports;
++
++		flow_rule_match_ports(rule, &ports);
++		data.src_port = ports.key->src;
++		data.dst_port = ports.key->dst;
++	} else {
++		return -EOPNOTSUPP;
++	}
++
++	if (addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS) {
++		struct flow_match_ipv4_addrs addrs;
++
++		flow_rule_match_ipv4_addrs(rule, &addrs);
++
++		data.v4.src_addr = addrs.key->src;
++		data.v4.dst_addr = addrs.key->dst;
++
++		mtk_flow_set_ipv4_addr(&foe, &data, false);
++	}
++
++	flow_action_for_each(i, act, &rule->action) {
++		if (act->id != FLOW_ACTION_MANGLE)
++			continue;
++
++		switch (act->mangle.htype) {
++		case FLOW_ACT_MANGLE_HDR_TYPE_TCP:
++		case FLOW_ACT_MANGLE_HDR_TYPE_UDP:
++			err = mtk_flow_mangle_ports(act, &data);
++			break;
++		case FLOW_ACT_MANGLE_HDR_TYPE_IP4:
++			err = mtk_flow_mangle_ipv4(act, &data);
++			break;
++		case FLOW_ACT_MANGLE_HDR_TYPE_ETH:
++			/* handled earlier */
++			break;
++		default:
++			return -EOPNOTSUPP;
++		}
++
++		if (err)
++			return err;
++	}
++
++	if (addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS) {
++		err = mtk_flow_set_ipv4_addr(&foe, &data, true);
++		if (err)
++			return err;
++	}
++
++	if (data.vlan.num == 1) {
++		if (data.vlan.proto != htons(ETH_P_8021Q))
++			return -EOPNOTSUPP;
++
++		mtk_foe_entry_set_vlan(&foe, data.vlan.id);
++	}
++	if (data.pppoe.num == 1)
++		mtk_foe_entry_set_pppoe(&foe, data.pppoe.sid);
++
++	err = mtk_flow_set_output_device(eth, &foe, odev);
++	if (err)
++		return err;
++
++	entry = kzalloc(sizeof(*entry), GFP_KERNEL);
++	if (!entry)
++		return -ENOMEM;
++
++	entry->cookie = f->cookie;
++	timestamp = mtk_eth_timestamp(eth);
++	hash = mtk_foe_entry_commit(&eth->ppe, &foe, timestamp);
++	if (hash < 0) {
++		err = hash;
++		goto free;
++	}
++
++	entry->hash = hash;
++	err = rhashtable_insert_fast(&eth->flow_table, &entry->node,
++				     mtk_flow_ht_params);
++	if (err < 0)
++		goto clear_flow;
++
++	return 0;
++clear_flow:
++	mtk_foe_entry_clear(&eth->ppe, hash);
++free:
++	kfree(entry);
++	return err;
++}
++
++static int
++mtk_flow_offload_destroy(struct mtk_eth *eth, struct flow_cls_offload *f)
++{
++	struct mtk_flow_entry *entry;
++
++	entry = rhashtable_lookup(&eth->flow_table, &f->cookie,
++				  mtk_flow_ht_params);
++	if (!entry)
++		return -ENOENT;
++
++	mtk_foe_entry_clear(&eth->ppe, entry->hash);
++	rhashtable_remove_fast(&eth->flow_table, &entry->node,
++			       mtk_flow_ht_params);
++	kfree(entry);
++
++	return 0;
++}
++
++static int
++mtk_flow_offload_stats(struct mtk_eth *eth, struct flow_cls_offload *f)
++{
++	struct mtk_flow_entry *entry;
++	int timestamp;
++	u32 idle;
++
++	entry = rhashtable_lookup(&eth->flow_table, &f->cookie,
++				  mtk_flow_ht_params);
++	if (!entry)
++		return -ENOENT;
++
++	timestamp = mtk_foe_entry_timestamp(&eth->ppe, entry->hash);
++	if (timestamp < 0)
++		return -ETIMEDOUT;
++
++	idle = mtk_eth_timestamp(eth) - timestamp;
++	f->stats.lastused = jiffies - idle * HZ;
++
++	return 0;
++}
++
++static int
++mtk_eth_setup_tc_block_cb(enum tc_setup_type type, void *type_data, void *cb_priv)
++{
++	struct flow_cls_offload *cls = type_data;
++	struct net_device *dev = cb_priv;
++	struct mtk_mac *mac = netdev_priv(dev);
++	struct mtk_eth *eth = mac->hw;
++
++	if (!tc_can_offload(dev))
++		return -EOPNOTSUPP;
++
++	if (type != TC_SETUP_CLSFLOWER)
++		return -EOPNOTSUPP;
++
++	switch (cls->command) {
++	case FLOW_CLS_REPLACE:
++		return mtk_flow_offload_replace(eth, cls);
++	case FLOW_CLS_DESTROY:
++		return mtk_flow_offload_destroy(eth, cls);
++	case FLOW_CLS_STATS:
++		return mtk_flow_offload_stats(eth, cls);
++	default:
++		return -EOPNOTSUPP;
++	}
++
++	return 0;
++}
++
++static int
++mtk_eth_setup_tc_block(struct net_device *dev, struct flow_block_offload *f)
++{
++	struct mtk_mac *mac = netdev_priv(dev);
++	struct mtk_eth *eth = mac->hw;
++	static LIST_HEAD(block_cb_list);
++	struct flow_block_cb *block_cb;
++	flow_setup_cb_t *cb;
++
++	if (!eth->ppe.foe_table)
++		return -EOPNOTSUPP;
++
++	if (f->binder_type != FLOW_BLOCK_BINDER_TYPE_CLSACT_INGRESS)
++		return -EOPNOTSUPP;
++
++	cb = mtk_eth_setup_tc_block_cb;
++	f->driver_block_list = &block_cb_list;
++
++	switch (f->command) {
++	case FLOW_BLOCK_BIND:
++		block_cb = flow_block_cb_lookup(f->block, cb, dev);
++		if (block_cb) {
++			flow_block_cb_incref(block_cb);
++			return 0;
++		}
++		block_cb = flow_block_cb_alloc(cb, dev, dev, NULL);
++		if (IS_ERR(block_cb))
++			return PTR_ERR(block_cb);
++
++		flow_block_cb_add(block_cb, f);
++		list_add_tail(&block_cb->driver_list, &block_cb_list);
++		return 0;
++	case FLOW_BLOCK_UNBIND:
++		block_cb = flow_block_cb_lookup(f->block, cb, dev);
++		if (!block_cb)
++			return -ENOENT;
++
++		if (flow_block_cb_decref(block_cb)) {
++			flow_block_cb_remove(block_cb, f);
++			list_del(&block_cb->driver_list);
++		}
++		return 0;
++	default:
++		return -EOPNOTSUPP;
++	}
++}
++
++int mtk_eth_setup_tc(struct net_device *dev, enum tc_setup_type type,
++		     void *type_data)
++{
++	if (type == TC_SETUP_FT)
++		return mtk_eth_setup_tc_block(dev, type_data);
++
++	return -EOPNOTSUPP;
++}
++
++int mtk_eth_offload_init(struct mtk_eth *eth)
++{
++	if (!eth->ppe.foe_table)
++		return 0;
++
++	return rhashtable_init(&eth->flow_table, &mtk_flow_ht_params);
++}
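
Aside (not part of the patch): mtk_flow_offload_stats() above derives the FLOW_CLS_STATS "lastused" value from two hardware timestamps — the global counter read by mtk_eth_timestamp() and the per-entry bind timestamp — assuming the PPE timestamp ticks once per second (hence the idle * HZ conversion). A small illustrative helper with placeholder values:

/* e.g. hw_now = 1000, entry_ts = 970  ->  flow has been idle for ~30 s */
static unsigned long example_lastused(u32 hw_now, u32 entry_ts)
{
	u32 idle = hw_now - entry_ts;	/* both values already masked to 15 bits */

	return jiffies - (unsigned long)idle * HZ;
}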

+ 236 - 0
target/linux/generic/backport-5.15/610-v5.13-34-docs-nf_flowtable-update-documentation-with-enhancem.patch

@@ -0,0 +1,236 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Wed, 24 Mar 2021 02:30:55 +0100
+Subject: [PATCH] docs: nf_flowtable: update documentation with
+ enhancements
+
+This patch updates the flowtable documentation to describe recent
+enhancements:
+
+- Offload action is available after the first packets go through the
+  classic forwarding path.
+- IPv4 and IPv6 are supported. Only TCP and UDP layer 4 are supported at
+  this stage.
+- Tuple has been augmented to track VLAN id and PPPoE session id.
+- Bridge and IP forwarding integration, including bridge VLAN filtering
+  support.
+- Hardware offload support.
+- Describe the [OFFLOAD] and [HW_OFFLOAD] tags in the conntrack table
+  listing.
+- Replace 'flow offload' by 'flow add' in example rulesets (preferred
+  syntax).
+- Describe existing cache limitations.
+
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/Documentation/networking/nf_flowtable.rst
++++ b/Documentation/networking/nf_flowtable.rst
+@@ -4,35 +4,38 @@
+ Netfilter's flowtable infrastructure
+ ====================================
+ 
+-This documentation describes the software flowtable infrastructure available in
+-Netfilter since Linux kernel 4.16.
++This documentation describes the Netfilter flowtable infrastructure which allows
++you to define a fastpath through the flowtable datapath. This infrastructure
++also provides hardware offload support. The flowtable supports for the layer 3
++IPv4 and IPv6 and the layer 4 TCP and UDP protocols.
+ 
+ Overview
+ --------
+ 
+-Initial packets follow the classic forwarding path, once the flow enters the
+-established state according to the conntrack semantics (ie. we have seen traffic
+-in both directions), then you can decide to offload the flow to the flowtable
+-from the forward chain via the 'flow offload' action available in nftables.
+-
+-Packets that find an entry in the flowtable (ie. flowtable hit) are sent to the
+-output netdevice via neigh_xmit(), hence, they bypass the classic forwarding
+-path (the visible effect is that you do not see these packets from any of the
+-netfilter hooks coming after the ingress). In case of flowtable miss, the packet
+-follows the classic forward path.
+-
+-The flowtable uses a resizable hashtable, lookups are based on the following
+-7-tuple selectors: source, destination, layer 3 and layer 4 protocols, source
+-and destination ports and the input interface (useful in case there are several
+-conntrack zones in place).
+-
+-Flowtables are populated via the 'flow offload' nftables action, so the user can
+-selectively specify what flows are placed into the flow table. Hence, packets
+-follow the classic forwarding path unless the user explicitly instruct packets
+-to use this new alternative forwarding path via nftables policy.
++Once the first packet of the flow successfully goes through the IP forwarding
++path, from the second packet on, you might decide to offload the flow to the
++flowtable through your ruleset. The flowtable infrastructure provides a rule
++action that allows you to specify when to add a flow to the flowtable.
++
++A packet that finds a matching entry in the flowtable (ie. flowtable hit) is
++transmitted to the output netdevice via neigh_xmit(), hence, packets bypass the
++classic IP forwarding path (the visible effect is that you do not see these
++packets from any of the Netfilter hooks coming after ingress). In case that
++there is no matching entry in the flowtable (ie. flowtable miss), the packet
++follows the classic IP forwarding path.
++
++The flowtable uses a resizable hashtable. Lookups are based on the following
++n-tuple selectors: layer 2 protocol encapsulation (VLAN and PPPoE), layer 3
++source and destination, layer 4 source and destination ports and the input
++interface (useful in case there are several conntrack zones in place).
++
++The 'flow add' action allows you to populate the flowtable, the user selectively
++specifies what flows are placed into the flowtable. Hence, packets follow the
++classic IP forwarding path unless the user explicitly instruct flows to use this
++new alternative forwarding path via policy.
+ 
+-This is represented in Fig.1, which describes the classic forwarding path
+-including the Netfilter hooks and the flowtable fastpath bypass.
++The flowtable datapath is represented in Fig.1, which describes the classic IP
++forwarding path including the Netfilter hooks and the flowtable fastpath bypass.
+ 
+ ::
+ 
+@@ -67,11 +70,13 @@ including the Netfilter hooks and the fl
+ 	       Fig.1 Netfilter hooks and flowtable interactions
+ 
+ The flowtable entry also stores the NAT configuration, so all packets are
+-mangled according to the NAT policy that matches the initial packets that went
+-through the classic forwarding path. The TTL is decremented before calling
+-neigh_xmit(). Fragmented traffic is passed up to follow the classic forwarding
+-path given that the transport selectors are missing, therefore flowtable lookup
+-is not possible.
++mangled according to the NAT policy that is specified from the classic IP
++forwarding path. The TTL is decremented before calling neigh_xmit(). Fragmented
++traffic is passed up to follow the classic IP forwarding path given that the
++transport header is missing, in this case, flowtable lookups are not possible.
++TCP RST and FIN packets are also passed up to the classic IP forwarding path to
++release the flow gracefully. Packets that exceed the MTU are also passed up to
++the classic forwarding path to report packet-too-big ICMP errors to the sender.
+ 
+ Example configuration
+ ---------------------
+@@ -85,7 +90,7 @@ flowtable and add one rule to your forwa
+ 		}
+ 		chain y {
+ 			type filter hook forward priority 0; policy accept;
+-			ip protocol tcp flow offload @f
++			ip protocol tcp flow add @f
+ 			counter packets 0 bytes 0
+ 		}
+ 	}
+@@ -103,6 +108,117 @@ flow is offloaded, you will observe that
+ does not get updated for the packets that are being forwarded through the
+ forwarding bypass.
+ 
++You can identify offloaded flows through the [OFFLOAD] tag when listing your
++connection tracking table.
++
++::
++	# conntrack -L
++	tcp      6 src=10.141.10.2 dst=192.168.10.2 sport=52728 dport=5201 src=192.168.10.2 dst=192.168.10.1 sport=5201 dport=52728 [OFFLOAD] mark=0 use=2
++
++
++Layer 2 encapsulation
++---------------------
++
++Since Linux kernel 5.13, the flowtable infrastructure discovers the real
++netdevice behind VLAN and PPPoE netdevices. The flowtable software datapath
++parses the VLAN and PPPoE layer 2 headers to extract the ethertype and the
++VLAN ID / PPPoE session ID which are used for the flowtable lookups. The
++flowtable datapath also deals with layer 2 decapsulation.
++
++You do not need to add the PPPoE and the VLAN devices to your flowtable,
++instead the real device is sufficient for the flowtable to track your flows.
++
++Bridge and IP forwarding
++------------------------
++
++Since Linux kernel 5.13, you can add bridge ports to the flowtable. The
++flowtable infrastructure discovers the topology behind the bridge device. This
++allows the flowtable to define a fastpath bypass between the bridge ports
++(represented as eth1 and eth2 in the example figure below) and the gateway
++device (represented as eth0) in your switch/router.
++
++::
++                      fastpath bypass
++               .-------------------------.
++              /                           \
++              |           IP forwarding   |
++              |          /             \ \/
++              |       br0               eth0 ..... eth0
++              .       / \                          *host B*
++               -> eth1  eth2
++                   .           *switch/router*
++                   .
++                   .
++                 eth0
++               *host A*
++
++The flowtable infrastructure also supports for bridge VLAN filtering actions
++such as PVID and untagged. You can also stack a classic VLAN device on top of
++your bridge port.
++
++If you would like that your flowtable defines a fastpath between your bridge
++ports and your IP forwarding path, you have to add your bridge ports (as
++represented by the real netdevice) to your flowtable definition.
++
++Counters
++--------
++
++The flowtable can synchronize packet and byte counters with the existing
++connection tracking entry by specifying the counter statement in your flowtable
++definition, e.g.
++
++::
++	table inet x {
++		flowtable f {
++			hook ingress priority 0; devices = { eth0, eth1 };
++			counter
++		}
++		...
++	}
++
++Counter support is available since Linux kernel 5.7.
++
++Hardware offload
++----------------
++
++If your network device provides hardware offload support, you can turn it on by
++means of the 'offload' flag in your flowtable definition, e.g.
++
++::
++	table inet x {
++		flowtable f {
++			hook ingress priority 0; devices = { eth0, eth1 };
++			flags offload;
++		}
++		...
++	}
++
++There is a workqueue that adds the flows to the hardware. Note that a few
++packets might still run over the flowtable software path until the workqueue has
++a chance to offload the flow to the network device.
++
++You can identify hardware offloaded flows through the [HW_OFFLOAD] tag when
++listing your connection tracking table. Please, note that the [OFFLOAD] tag
++refers to the software offload mode, so there is a distinction between [OFFLOAD]
++which refers to the software flowtable fastpath and [HW_OFFLOAD] which refers
++to the hardware offload datapath being used by the flow.
++
++The flowtable hardware offload infrastructure also supports for the DSA
++(Distributed Switch Architecture).
++
++Limitations
++-----------
++
++The flowtable behaves like a cache. The flowtable entries might get stale if
++either the destination MAC address or the egress netdevice that is used for
++transmission changes.
++
++This might be a problem if:
++
++- You run the flowtable in software mode and you combine bridge and IP
++  forwarding in your setup.
++- Hardware offload is enabled.
++
+ More reading
+ ------------
+ 

+ 72 - 0
target/linux/generic/backport-5.15/610-v5.13-35-net-ethernet-mediatek-ppe-fix-busy-wait-loop.patch

@@ -0,0 +1,72 @@
+From c5d66587b8900201e1530b7c18d41e87bd5812f4 Mon Sep 17 00:00:00 2001
+From: Ilya Lipnitskiy <[email protected]>
+Date: Thu, 15 Apr 2021 17:37:48 -0700
+Subject: [PATCH] net: ethernet: mediatek: ppe: fix busy wait loop
+
+The intention is for the loop to timeout if the body does not succeed.
+The current logic calls time_is_before_jiffies(timeout) which is false
+until after the timeout, so the loop body never executes.
+
+Fix by using readl_poll_timeout as a more standard and less error-prone
+solution.
+
+Fixes: ba37b7caf1ed ("net: ethernet: mtk_eth_soc: add support for initializing the PPE")
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Cc: Felix Fietkau <[email protected]>
+Reviewed-by: Andrew Lunn <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_ppe.c | 20 +++++++++-----------
+ drivers/net/ethernet/mediatek/mtk_ppe.h |  1 +
+ 2 files changed, 10 insertions(+), 11 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_ppe.c
++++ b/drivers/net/ethernet/mediatek/mtk_ppe.c
+@@ -2,9 +2,8 @@
+ /* Copyright (C) 2020 Felix Fietkau <[email protected]> */
+ 
+ #include <linux/kernel.h>
+-#include <linux/jiffies.h>
+-#include <linux/delay.h>
+ #include <linux/io.h>
++#include <linux/iopoll.h>
+ #include <linux/etherdevice.h>
+ #include <linux/platform_device.h>
+ #include "mtk_ppe.h"
+@@ -44,18 +43,17 @@ static u32 ppe_clear(struct mtk_ppe *ppe
+ 
+ static int mtk_ppe_wait_busy(struct mtk_ppe *ppe)
+ {
+-	unsigned long timeout = jiffies + HZ;
+-
+-	while (time_is_before_jiffies(timeout)) {
+-		if (!(ppe_r32(ppe, MTK_PPE_GLO_CFG) & MTK_PPE_GLO_CFG_BUSY))
+-			return 0;
++	int ret;
++	u32 val;
+ 
+-		usleep_range(10, 20);
+-	}
++	ret = readl_poll_timeout(ppe->base + MTK_PPE_GLO_CFG, val,
++				 !(val & MTK_PPE_GLO_CFG_BUSY),
++				 20, MTK_PPE_WAIT_TIMEOUT_US);
+ 
+-	dev_err(ppe->dev, "PPE table busy");
++	if (ret)
++		dev_err(ppe->dev, "PPE table busy");
+ 
+-	return -ETIMEDOUT;
++	return ret;
+ }
+ 
+ static void mtk_ppe_cache_clear(struct mtk_ppe *ppe)
+--- a/drivers/net/ethernet/mediatek/mtk_ppe.h
++++ b/drivers/net/ethernet/mediatek/mtk_ppe.h
+@@ -12,6 +12,7 @@
+ #define MTK_PPE_ENTRIES_SHIFT		3
+ #define MTK_PPE_ENTRIES			(1024 << MTK_PPE_ENTRIES_SHIFT)
+ #define MTK_PPE_HASH_MASK		(MTK_PPE_ENTRIES - 1)
++#define MTK_PPE_WAIT_TIMEOUT_US		1000000
+ 
+ #define MTK_FOE_IB1_UNBIND_TIMESTAMP	GENMASK(7, 0)
+ #define MTK_FOE_IB1_UNBIND_PACKETS	GENMASK(23, 8)

+ 29 - 0
target/linux/generic/backport-5.15/610-v5.13-36-net-ethernet-mediatek-fix-a-typo-bug-in-flow-offload.patch

@@ -0,0 +1,29 @@
+From 6ecaf81d4ac6365f9284f9d68d74f7c209e74f98 Mon Sep 17 00:00:00 2001
+From: DENG Qingfang <[email protected]>
+Date: Sat, 17 Apr 2021 15:29:04 +0800
+Subject: [PATCH] net: ethernet: mediatek: fix a typo bug in flow offloading
+
+The issue was traffic problems after a while, with increased ping times, when
+flow offload is active. It turns out that key_offset with the cookie is
+needed in rhashtable_params, but it was assigned to head_offset instead.
+Fix the assignment.
+
+Fixes: 502e84e2382d ("net: ethernet: mtk_eth_soc: add flow offloading support")
+Signed-off-by: DENG Qingfang <[email protected]>
+Tested-by: Frank Wunderlich <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_ppe_offload.c | 2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_ppe_offload.c
++++ b/drivers/net/ethernet/mediatek/mtk_ppe_offload.c
+@@ -44,7 +44,7 @@ struct mtk_flow_entry {
+ 
+ static const struct rhashtable_params mtk_flow_ht_params = {
+ 	.head_offset = offsetof(struct mtk_flow_entry, node),
+-	.head_offset = offsetof(struct mtk_flow_entry, cookie),
++	.key_offset = offsetof(struct mtk_flow_entry, cookie),
+ 	.key_len = sizeof(unsigned long),
+ 	.automatic_shrinking = true,
+ };

+ 38 - 0
target/linux/generic/backport-5.15/610-v5.13-38-net-ethernet-mtk_eth_soc-unmap-RX-data-before-callin.patch

@@ -0,0 +1,38 @@
+From 5196c417854942e218a59ec87bf7d414b3bd581e Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:20:55 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: unmap RX data before calling
+ build_skb
+
+Since build_skb accesses the data area (for initializing shinfo), dma unmap
+needs to happen before that call
+
+Signed-off-by: Felix Fietkau <[email protected]>
+[Ilya: split build_skb cleanup fix into a separate commit]
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 5 +++--
+ 1 file changed, 3 insertions(+), 2 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -1319,6 +1319,9 @@ static int mtk_poll_rx(struct napi_struc
+ 			goto release_desc;
+ 		}
+ 
++		dma_unmap_single(eth->dev, trxd.rxd1,
++				 ring->buf_size, DMA_FROM_DEVICE);
++
+ 		/* receive data */
+ 		skb = build_skb(data, ring->frag_size);
+ 		if (unlikely(!skb)) {
+@@ -1328,8 +1331,6 @@ static int mtk_poll_rx(struct napi_struc
+ 		}
+ 		skb_reserve(skb, NET_SKB_PAD + NET_IP_ALIGN);
+ 
+-		dma_unmap_single(eth->dev, trxd.rxd1,
+-				 ring->buf_size, DMA_FROM_DEVICE);
+ 		pktlen = RX_DMA_GET_PLEN0(trxd.rxd2);
+ 		skb->dev = netdev;
+ 		skb_put(skb, pktlen);

+ 38 - 0
target/linux/generic/backport-5.15/610-v5.13-39-net-ethernet-mtk_eth_soc-fix-build_skb-cleanup.patch

@@ -0,0 +1,38 @@
+From 787082ab9f7be4711e52f67c388535eda74a1269 Mon Sep 17 00:00:00 2001
+From: Ilya Lipnitskiy <[email protected]>
+Date: Thu, 22 Apr 2021 22:20:56 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: fix build_skb cleanup
+
+In case build_skb fails, call skb_free_frag on the correct pointer. Also
+update the DMA structures with the new mapping before exiting, because
+the mapping was successful
+
+Suggested-by: Felix Fietkau <[email protected]>
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 5 +++--
+ 1 file changed, 3 insertions(+), 2 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -1325,9 +1325,9 @@ static int mtk_poll_rx(struct napi_struc
+ 		/* receive data */
+ 		skb = build_skb(data, ring->frag_size);
+ 		if (unlikely(!skb)) {
+-			skb_free_frag(new_data);
++			skb_free_frag(data);
+ 			netdev->stats.rx_dropped++;
+-			goto release_desc;
++			goto skip_rx;
+ 		}
+ 		skb_reserve(skb, NET_SKB_PAD + NET_IP_ALIGN);
+ 
+@@ -1347,6 +1347,7 @@ static int mtk_poll_rx(struct napi_struc
+ 		skb_record_rx_queue(skb, 0);
+ 		napi_gro_receive(napi, skb);
+ 
++skip_rx:
+ 		ring->data[idx] = new_data;
+ 		rxd->rxd1 = (unsigned int)dma_addr;
+ 

+ 77 - 0
target/linux/generic/backport-5.15/610-v5.13-40-net-ethernet-mtk_eth_soc-use-napi_consume_skb.patch

@@ -0,0 +1,77 @@
+From c30c4a82739090a2de4a4e3f245355ea4fb3ec14 Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:20:57 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: use napi_consume_skb
+
+Should improve performance, since it can use bulk free
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 19 ++++++++++++-------
+ 1 file changed, 12 insertions(+), 7 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -879,7 +879,8 @@ static int txd_to_idx(struct mtk_tx_ring
+ 	return ((void *)dma - (void *)ring->dma) / sizeof(*dma);
+ }
+ 
+-static void mtk_tx_unmap(struct mtk_eth *eth, struct mtk_tx_buf *tx_buf)
++static void mtk_tx_unmap(struct mtk_eth *eth, struct mtk_tx_buf *tx_buf,
++			 bool napi)
+ {
+ 	if (MTK_HAS_CAPS(eth->soc->caps, MTK_QDMA)) {
+ 		if (tx_buf->flags & MTK_TX_FLAGS_SINGLE0) {
+@@ -911,8 +912,12 @@ static void mtk_tx_unmap(struct mtk_eth
+ 
+ 	tx_buf->flags = 0;
+ 	if (tx_buf->skb &&
+-	    (tx_buf->skb != (struct sk_buff *)MTK_DMA_DUMMY_DESC))
+-		dev_kfree_skb_any(tx_buf->skb);
++	    (tx_buf->skb != (struct sk_buff *)MTK_DMA_DUMMY_DESC)) {
++		if (napi)
++			napi_consume_skb(tx_buf->skb, napi);
++		else
++			dev_kfree_skb_any(tx_buf->skb);
++	}
+ 	tx_buf->skb = NULL;
+ }
+ 
+@@ -1090,7 +1095,7 @@ err_dma:
+ 		tx_buf = mtk_desc_to_tx_buf(ring, itxd);
+ 
+ 		/* unmap dma */
+-		mtk_tx_unmap(eth, tx_buf);
++		mtk_tx_unmap(eth, tx_buf, false);
+ 
+ 		itxd->txd3 = TX_DMA_LS0 | TX_DMA_OWNER_CPU;
+ 		if (!MTK_HAS_CAPS(eth->soc->caps, MTK_QDMA))
+@@ -1409,7 +1414,7 @@ static int mtk_poll_tx_qdma(struct mtk_e
+ 			done[mac]++;
+ 			budget--;
+ 		}
+-		mtk_tx_unmap(eth, tx_buf);
++		mtk_tx_unmap(eth, tx_buf, true);
+ 
+ 		ring->last_free = desc;
+ 		atomic_inc(&ring->free_count);
+@@ -1446,7 +1451,7 @@ static int mtk_poll_tx_pdma(struct mtk_e
+ 			budget--;
+ 		}
+ 
+-		mtk_tx_unmap(eth, tx_buf);
++		mtk_tx_unmap(eth, tx_buf, true);
+ 
+ 		desc = &ring->dma[cpu];
+ 		ring->last_free = desc;
+@@ -1648,7 +1653,7 @@ static void mtk_tx_clean(struct mtk_eth
+ 
+ 	if (ring->buf) {
+ 		for (i = 0; i < MTK_DMA_SIZE; i++)
+-			mtk_tx_unmap(eth, &ring->buf[i]);
++			mtk_tx_unmap(eth, &ring->buf[i], false);
+ 		kfree(ring->buf);
+ 		ring->buf = NULL;
+ 	}

+ 30 - 0
target/linux/generic/backport-5.15/610-v5.13-41-net-ethernet-mtk_eth_soc-reduce-MDIO-bus-access-late.patch

@@ -0,0 +1,30 @@
+From 3630d519d7c3eab92567658690e44ffe0517d109 Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:20:58 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: reduce MDIO bus access latency
+
+usleep_range often ends up sleeping much longer than the 10-20us provided
+as a range here. This causes significant latency in mdio bus accesses,
+which easily adds multiple seconds to the boot time on MT7621 when polling
+DSA slave ports.
+Use cond_resched instead of usleep_range, since the MDIO access does not
+take much time
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -86,7 +86,7 @@ static int mtk_mdio_busy_wait(struct mtk
+ 			return 0;
+ 		if (time_after(jiffies, t_start + PHY_IAC_TIMEOUT))
+ 			break;
+-		usleep_range(10, 20);
++		cond_resched();
+ 	}
+ 
+ 	dev_err(eth->dev, "mdio: MDIO timeout\n");

+ 54 - 0
target/linux/generic/backport-5.15/610-v5.13-42-net-ethernet-mtk_eth_soc-remove-unnecessary-TX-queue.patch

@@ -0,0 +1,54 @@
+From 16ef670789b252b221700adc413497ed2f941d8a Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:20:59 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: remove unnecessary TX queue stops
+
+When running short on descriptors, only stop the queue for the netdev that
+tx was attempted for. By the time something tries to send on the other
+netdev, the ring might have some more room already.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 15 ++-------------
+ 1 file changed, 2 insertions(+), 13 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -1152,17 +1152,6 @@ static void mtk_wake_queue(struct mtk_et
+ 	}
+ }
+ 
+-static void mtk_stop_queue(struct mtk_eth *eth)
+-{
+-	int i;
+-
+-	for (i = 0; i < MTK_MAC_COUNT; i++) {
+-		if (!eth->netdev[i])
+-			continue;
+-		netif_stop_queue(eth->netdev[i]);
+-	}
+-}
+-
+ static netdev_tx_t mtk_start_xmit(struct sk_buff *skb, struct net_device *dev)
+ {
+ 	struct mtk_mac *mac = netdev_priv(dev);
+@@ -1183,7 +1172,7 @@ static netdev_tx_t mtk_start_xmit(struct
+ 
+ 	tx_num = mtk_cal_txd_req(skb);
+ 	if (unlikely(atomic_read(&ring->free_count) <= tx_num)) {
+-		mtk_stop_queue(eth);
++		netif_stop_queue(dev);
+ 		netif_err(eth, tx_queued, dev,
+ 			  "Tx Ring full when queue awake!\n");
+ 		spin_unlock(&eth->page_lock);
+@@ -1209,7 +1198,7 @@ static netdev_tx_t mtk_start_xmit(struct
+ 		goto drop;
+ 
+ 	if (unlikely(atomic_read(&ring->free_count) <= ring->thresh))
+-		mtk_stop_queue(eth);
++		netif_stop_queue(dev);
+ 
+ 	spin_unlock(&eth->page_lock);
+ 

+ 37 - 0
target/linux/generic/backport-5.15/610-v5.13-43-net-ethernet-mtk_eth_soc-use-larger-burst-size-for-Q.patch

@@ -0,0 +1,37 @@
+From 59555a8d0dd39bf60b7ca1ba5e7393d293f7398d Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:21:00 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: use larger burst size for QDMA TX
+
+Improves tx performance
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 2 +-
+ drivers/net/ethernet/mediatek/mtk_eth_soc.h | 2 +-
+ 2 files changed, 2 insertions(+), 2 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -2214,7 +2214,7 @@ static int mtk_start_dma(struct mtk_eth
+ 	if (MTK_HAS_CAPS(eth->soc->caps, MTK_QDMA)) {
+ 		mtk_w32(eth,
+ 			MTK_TX_WB_DDONE | MTK_TX_DMA_EN |
+-			MTK_DMA_SIZE_16DWORDS | MTK_NDP_CO_PRO |
++			MTK_TX_BT_32DWORDS | MTK_NDP_CO_PRO |
+ 			MTK_RX_DMA_EN | MTK_RX_2B_OFFSET |
+ 			MTK_RX_BT_32DWORDS,
+ 			MTK_QDMA_GLO_CFG);
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.h
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.h
+@@ -202,7 +202,7 @@
+ #define MTK_RX_BT_32DWORDS	(3 << 11)
+ #define MTK_NDP_CO_PRO		BIT(10)
+ #define MTK_TX_WB_DDONE		BIT(6)
+-#define MTK_DMA_SIZE_16DWORDS	(2 << 4)
++#define MTK_TX_BT_32DWORDS	(3 << 4)
+ #define MTK_RX_DMA_BUSY		BIT(3)
+ #define MTK_TX_DMA_BUSY		BIT(1)
+ #define MTK_RX_DMA_EN		BIT(2)

+ 26 - 0
target/linux/generic/backport-5.15/610-v5.13-44-net-ethernet-mtk_eth_soc-increase-DMA-ring-sizes.patch

@@ -0,0 +1,26 @@
+From 6b4423b258b91032c50a5efca15d3d9bb194ea1d Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:21:01 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: increase DMA ring sizes
+
+256 descriptors is not enough for multi-gigabit traffic under load on
+MT7622. Bump it to 512 to improve performance.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.h | 2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.h
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.h
+@@ -21,7 +21,7 @@
+ #define MTK_QDMA_PAGE_SIZE	2048
+ #define	MTK_MAX_RX_LENGTH	1536
+ #define MTK_TX_DMA_BUF_LEN	0x3fff
+-#define MTK_DMA_SIZE		256
++#define MTK_DMA_SIZE		512
+ #define MTK_NAPI_WEIGHT		64
+ #define MTK_MAC_COUNT		2
+ #define MTK_RX_ETH_HLEN		(VLAN_ETH_HLEN + VLAN_HLEN + ETH_FCS_LEN)

+ 313 - 0
target/linux/generic/backport-5.15/610-v5.13-45-net-ethernet-mtk_eth_soc-implement-dynamic-interrupt.patch

@@ -0,0 +1,313 @@
+From e9229ffd550b2d8c4997c67a501dbc3919fd4e26 Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:21:02 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: implement dynamic interrupt
+ moderation
+
+Reduces the number of interrupts under load
+
+Signed-off-by: Felix Fietkau <[email protected]>
+[Ilya: add documentation for new struct fields]
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/Kconfig       |  1 +
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 96 +++++++++++++++++++--
+ drivers/net/ethernet/mediatek/mtk_eth_soc.h | 41 +++++++--
+ 3 files changed, 124 insertions(+), 14 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/Kconfig
++++ b/drivers/net/ethernet/mediatek/Kconfig
+@@ -10,6 +10,7 @@ if NET_VENDOR_MEDIATEK
+ config NET_MEDIATEK_SOC
+ 	tristate "MediaTek SoC Gigabit Ethernet support"
+ 	select PHYLINK
++	select DIMLIB
+ 	help
+ 	  This driver supports the gigabit ethernet MACs in the
+ 	  MediaTek SoC family.
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -1254,12 +1254,13 @@ static void mtk_update_rx_cpu_idx(struct
+ static int mtk_poll_rx(struct napi_struct *napi, int budget,
+ 		       struct mtk_eth *eth)
+ {
++	struct dim_sample dim_sample = {};
+ 	struct mtk_rx_ring *ring;
+ 	int idx;
+ 	struct sk_buff *skb;
+ 	u8 *data, *new_data;
+ 	struct mtk_rx_dma *rxd, trxd;
+-	int done = 0;
++	int done = 0, bytes = 0;
+ 
+ 	while (done < budget) {
+ 		struct net_device *netdev;
+@@ -1333,6 +1334,7 @@ static int mtk_poll_rx(struct napi_struc
+ 		else
+ 			skb_checksum_none_assert(skb);
+ 		skb->protocol = eth_type_trans(skb, netdev);
++		bytes += pktlen;
+ 
+ 		if (netdev->features & NETIF_F_HW_VLAN_CTAG_RX &&
+ 		    (trxd.rxd2 & RX_DMA_VTAG))
+@@ -1365,6 +1367,12 @@ rx_done:
+ 		mtk_update_rx_cpu_idx(eth);
+ 	}
+ 
++	eth->rx_packets += done;
++	eth->rx_bytes += bytes;
++	dim_update_sample(eth->rx_events, eth->rx_packets, eth->rx_bytes,
++			  &dim_sample);
++	net_dim(&eth->rx_dim, dim_sample);
++
+ 	return done;
+ }
+ 
+@@ -1457,6 +1465,7 @@ static int mtk_poll_tx_pdma(struct mtk_e
+ static int mtk_poll_tx(struct mtk_eth *eth, int budget)
+ {
+ 	struct mtk_tx_ring *ring = &eth->tx_ring;
++	struct dim_sample dim_sample = {};
+ 	unsigned int done[MTK_MAX_DEVS];
+ 	unsigned int bytes[MTK_MAX_DEVS];
+ 	int total = 0, i;
+@@ -1474,8 +1483,14 @@ static int mtk_poll_tx(struct mtk_eth *e
+ 			continue;
+ 		netdev_completed_queue(eth->netdev[i], done[i], bytes[i]);
+ 		total += done[i];
++		eth->tx_packets += done[i];
++		eth->tx_bytes += bytes[i];
+ 	}
+ 
++	dim_update_sample(eth->tx_events, eth->tx_packets, eth->tx_bytes,
++			  &dim_sample);
++	net_dim(&eth->tx_dim, dim_sample);
++
+ 	if (mtk_queue_stopped(eth) &&
+ 	    (atomic_read(&ring->free_count) > ring->thresh))
+ 		mtk_wake_queue(eth);
+@@ -2150,6 +2165,7 @@ static irqreturn_t mtk_handle_irq_rx(int
+ {
+ 	struct mtk_eth *eth = _eth;
+ 
++	eth->rx_events++;
+ 	if (likely(napi_schedule_prep(&eth->rx_napi))) {
+ 		__napi_schedule(&eth->rx_napi);
+ 		mtk_rx_irq_disable(eth, MTK_RX_DONE_INT);
+@@ -2162,6 +2178,7 @@ static irqreturn_t mtk_handle_irq_tx(int
+ {
+ 	struct mtk_eth *eth = _eth;
+ 
++	eth->tx_events++;
+ 	if (likely(napi_schedule_prep(&eth->tx_napi))) {
+ 		__napi_schedule(&eth->tx_napi);
+ 		mtk_tx_irq_disable(eth, MTK_TX_DONE_INT);
+@@ -2346,6 +2363,9 @@ static int mtk_stop(struct net_device *d
+ 	napi_disable(&eth->tx_napi);
+ 	napi_disable(&eth->rx_napi);
+ 
++	cancel_work_sync(&eth->rx_dim.work);
++	cancel_work_sync(&eth->tx_dim.work);
++
+ 	if (MTK_HAS_CAPS(eth->soc->caps, MTK_QDMA))
+ 		mtk_stop_dma(eth, MTK_QDMA_GLO_CFG);
+ 	mtk_stop_dma(eth, MTK_PDMA_GLO_CFG);
+@@ -2398,6 +2418,64 @@ err_disable_clks:
+ 	return ret;
+ }
+ 
++static void mtk_dim_rx(struct work_struct *work)
++{
++	struct dim *dim = container_of(work, struct dim, work);
++	struct mtk_eth *eth = container_of(dim, struct mtk_eth, rx_dim);
++	struct dim_cq_moder cur_profile;
++	u32 val, cur;
++
++	cur_profile = net_dim_get_rx_moderation(eth->rx_dim.mode,
++						dim->profile_ix);
++	spin_lock_bh(&eth->dim_lock);
++
++	val = mtk_r32(eth, MTK_PDMA_DELAY_INT);
++	val &= MTK_PDMA_DELAY_TX_MASK;
++	val |= MTK_PDMA_DELAY_RX_EN;
++
++	cur = min_t(u32, DIV_ROUND_UP(cur_profile.usec, 20), MTK_PDMA_DELAY_PTIME_MASK);
++	val |= cur << MTK_PDMA_DELAY_RX_PTIME_SHIFT;
++
++	cur = min_t(u32, cur_profile.pkts, MTK_PDMA_DELAY_PINT_MASK);
++	val |= cur << MTK_PDMA_DELAY_RX_PINT_SHIFT;
++
++	mtk_w32(eth, val, MTK_PDMA_DELAY_INT);
++	mtk_w32(eth, val, MTK_QDMA_DELAY_INT);
++
++	spin_unlock_bh(&eth->dim_lock);
++
++	dim->state = DIM_START_MEASURE;
++}
++
++static void mtk_dim_tx(struct work_struct *work)
++{
++	struct dim *dim = container_of(work, struct dim, work);
++	struct mtk_eth *eth = container_of(dim, struct mtk_eth, tx_dim);
++	struct dim_cq_moder cur_profile;
++	u32 val, cur;
++
++	cur_profile = net_dim_get_tx_moderation(eth->tx_dim.mode,
++						dim->profile_ix);
++	spin_lock_bh(&eth->dim_lock);
++
++	val = mtk_r32(eth, MTK_PDMA_DELAY_INT);
++	val &= MTK_PDMA_DELAY_RX_MASK;
++	val |= MTK_PDMA_DELAY_TX_EN;
++
++	cur = min_t(u32, DIV_ROUND_UP(cur_profile.usec, 20), MTK_PDMA_DELAY_PTIME_MASK);
++	val |= cur << MTK_PDMA_DELAY_TX_PTIME_SHIFT;
++
++	cur = min_t(u32, cur_profile.pkts, MTK_PDMA_DELAY_PINT_MASK);
++	val |= cur << MTK_PDMA_DELAY_TX_PINT_SHIFT;
++
++	mtk_w32(eth, val, MTK_PDMA_DELAY_INT);
++	mtk_w32(eth, val, MTK_QDMA_DELAY_INT);
++
++	spin_unlock_bh(&eth->dim_lock);
++
++	dim->state = DIM_START_MEASURE;
++}
++
+ static int mtk_hw_init(struct mtk_eth *eth)
+ {
+ 	int i, val, ret;
+@@ -2419,9 +2497,6 @@ static int mtk_hw_init(struct mtk_eth *e
+ 			goto err_disable_pm;
+ 		}
+ 
+-		/* enable interrupt delay for RX */
+-		mtk_w32(eth, MTK_PDMA_DELAY_RX_DELAY, MTK_PDMA_DELAY_INT);
+-
+ 		/* disable delay and normal interrupt */
+ 		mtk_tx_irq_disable(eth, ~0);
+ 		mtk_rx_irq_disable(eth, ~0);
+@@ -2460,11 +2535,11 @@ static int mtk_hw_init(struct mtk_eth *e
+ 	/* Enable RX VLan Offloading */
+ 	mtk_w32(eth, 1, MTK_CDMP_EG_CTRL);
+ 
+-	/* enable interrupt delay for RX */
+-	mtk_w32(eth, MTK_PDMA_DELAY_RX_DELAY, MTK_PDMA_DELAY_INT);
++	/* set interrupt delays based on current Net DIM sample */
++	mtk_dim_rx(&eth->rx_dim.work);
++	mtk_dim_tx(&eth->tx_dim.work);
+ 
+ 	/* disable delay and normal interrupt */
+-	mtk_w32(eth, 0, MTK_QDMA_DELAY_INT);
+ 	mtk_tx_irq_disable(eth, ~0);
+ 	mtk_rx_irq_disable(eth, ~0);
+ 
+@@ -2969,6 +3044,13 @@ static int mtk_probe(struct platform_dev
+ 	spin_lock_init(&eth->page_lock);
+ 	spin_lock_init(&eth->tx_irq_lock);
+ 	spin_lock_init(&eth->rx_irq_lock);
++	spin_lock_init(&eth->dim_lock);
++
++	eth->rx_dim.mode = DIM_CQ_PERIOD_MODE_START_FROM_EQE;
++	INIT_WORK(&eth->rx_dim.work, mtk_dim_rx);
++
++	eth->tx_dim.mode = DIM_CQ_PERIOD_MODE_START_FROM_EQE;
++	INIT_WORK(&eth->tx_dim.work, mtk_dim_tx);
+ 
+ 	if (!MTK_HAS_CAPS(eth->soc->caps, MTK_SOC_MT7628)) {
+ 		eth->ethsys = syscon_regmap_lookup_by_phandle(pdev->dev.of_node,
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.h
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.h
+@@ -16,6 +16,7 @@
+ #include <linux/refcount.h>
+ #include <linux/phylink.h>
+ #include <linux/rhashtable.h>
++#include <linux/dim.h>
+ #include "mtk_ppe.h"
+ 
+ #define MTK_QDMA_PAGE_SIZE	2048
+@@ -136,13 +137,18 @@
+ 
+ /* PDMA Delay Interrupt Register */
+ #define MTK_PDMA_DELAY_INT		0xa0c
++#define MTK_PDMA_DELAY_RX_MASK		GENMASK(15, 0)
+ #define MTK_PDMA_DELAY_RX_EN		BIT(15)
+-#define MTK_PDMA_DELAY_RX_PINT		4
+ #define MTK_PDMA_DELAY_RX_PINT_SHIFT	8
+-#define MTK_PDMA_DELAY_RX_PTIME		4
+-#define MTK_PDMA_DELAY_RX_DELAY		\
+-	(MTK_PDMA_DELAY_RX_EN | MTK_PDMA_DELAY_RX_PTIME | \
+-	(MTK_PDMA_DELAY_RX_PINT << MTK_PDMA_DELAY_RX_PINT_SHIFT))
++#define MTK_PDMA_DELAY_RX_PTIME_SHIFT	0
++
++#define MTK_PDMA_DELAY_TX_MASK		GENMASK(31, 16)
++#define MTK_PDMA_DELAY_TX_EN		BIT(31)
++#define MTK_PDMA_DELAY_TX_PINT_SHIFT	24
++#define MTK_PDMA_DELAY_TX_PTIME_SHIFT	16
++
++#define MTK_PDMA_DELAY_PINT_MASK	0x7f
++#define MTK_PDMA_DELAY_PTIME_MASK	0xff
+ 
+ /* PDMA Interrupt Status Register */
+ #define MTK_PDMA_INT_STATUS	0xa20
+@@ -224,6 +230,7 @@
+ /* QDMA Interrupt Status Register */
+ #define MTK_QDMA_INT_STATUS	0x1A18
+ #define MTK_RX_DONE_DLY		BIT(30)
++#define MTK_TX_DONE_DLY		BIT(28)
+ #define MTK_RX_DONE_INT3	BIT(19)
+ #define MTK_RX_DONE_INT2	BIT(18)
+ #define MTK_RX_DONE_INT1	BIT(17)
+@@ -233,8 +240,7 @@
+ #define MTK_TX_DONE_INT1	BIT(1)
+ #define MTK_TX_DONE_INT0	BIT(0)
+ #define MTK_RX_DONE_INT		MTK_RX_DONE_DLY
+-#define MTK_TX_DONE_INT		(MTK_TX_DONE_INT0 | MTK_TX_DONE_INT1 | \
+-				 MTK_TX_DONE_INT2 | MTK_TX_DONE_INT3)
++#define MTK_TX_DONE_INT		MTK_TX_DONE_DLY
+ 
+ /* QDMA Interrupt grouping registers */
+ #define MTK_QDMA_INT_GRP1	0x1a20
+@@ -863,6 +869,7 @@ struct mtk_sgmii {
+  * @page_lock:		Make sure that register operations are atomic
+  * @tx_irq__lock:	Make sure that IRQ register operations are atomic
+  * @rx_irq__lock:	Make sure that IRQ register operations are atomic
++ * @dim_lock:		Make sure that Net DIM operations are atomic
+  * @dummy_dev:		we run 2 netdevs on 1 physical DMA ring and need a
+  *			dummy for NAPI to work
+  * @netdev:		The netdev instances
+@@ -881,6 +888,14 @@ struct mtk_sgmii {
+  * @rx_ring_qdma:	Pointer to the memory holding info about the QDMA RX ring
+  * @tx_napi:		The TX NAPI struct
+  * @rx_napi:		The RX NAPI struct
++ * @rx_events:		Net DIM RX event counter
++ * @rx_packets:		Net DIM RX packet counter
++ * @rx_bytes:		Net DIM RX byte counter
++ * @rx_dim:		Net DIM RX context
++ * @tx_events:		Net DIM TX event counter
++ * @tx_packets:		Net DIM TX packet counter
++ * @tx_bytes:		Net DIM TX byte counter
++ * @tx_dim:		Net DIM TX context
+  * @scratch_ring:	Newer SoCs need memory for a second HW managed TX ring
+  * @phy_scratch_ring:	physical address of scratch_ring
+  * @scratch_head:	The scratch memory that scratch_ring points to.
+@@ -925,6 +940,18 @@ struct mtk_eth {
+ 
+ 	const struct mtk_soc_data	*soc;
+ 
++	spinlock_t			dim_lock;
++
++	u32				rx_events;
++	u32				rx_packets;
++	u32				rx_bytes;
++	struct dim			rx_dim;
++
++	u32				tx_events;
++	u32				tx_packets;
++	u32				tx_bytes;
++	struct dim			tx_dim;
++
+ 	u32				tx_int_mask_reg;
+ 	u32				tx_int_status_reg;
+ 	u32				rx_dma_l4_valid;

+ 73 - 0
target/linux/generic/backport-5.15/610-v5.13-46-net-ethernet-mtk_eth_soc-cache-HW-pointer-of-last-fr.patch

@@ -0,0 +1,73 @@
+From 4e6bf609569c59b6bd6acf4a607c096cbd820d79 Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:21:03 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: cache HW pointer of last freed TX
+ descriptor
+
+The value is only updated by the CPU, so it is cheaper to access from the
+ring data structure than from a hardware register.
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 8 ++++----
+ drivers/net/ethernet/mediatek/mtk_eth_soc.h | 2 ++
+ 2 files changed, 6 insertions(+), 4 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -1385,7 +1385,7 @@ static int mtk_poll_tx_qdma(struct mtk_e
+ 	struct mtk_tx_buf *tx_buf;
+ 	u32 cpu, dma;
+ 
+-	cpu = mtk_r32(eth, MTK_QTX_CRX_PTR);
++	cpu = ring->last_free_ptr;
+ 	dma = mtk_r32(eth, MTK_QTX_DRX_PTR);
+ 
+ 	desc = mtk_qdma_phys_to_virt(ring, cpu);
+@@ -1419,6 +1419,7 @@ static int mtk_poll_tx_qdma(struct mtk_e
+ 		cpu = next_cpu;
+ 	}
+ 
++	ring->last_free_ptr = cpu;
+ 	mtk_w32(eth, cpu, MTK_QTX_CRX_PTR);
+ 
+ 	return budget;
+@@ -1619,6 +1620,7 @@ static int mtk_tx_alloc(struct mtk_eth *
+ 	atomic_set(&ring->free_count, MTK_DMA_SIZE - 2);
+ 	ring->next_free = &ring->dma[0];
+ 	ring->last_free = &ring->dma[MTK_DMA_SIZE - 1];
++	ring->last_free_ptr = (u32)(ring->phys + ((MTK_DMA_SIZE - 1) * sz));
+ 	ring->thresh = MAX_SKB_FRAGS;
+ 
+ 	/* make sure that all changes to the dma ring are flushed before we
+@@ -1632,9 +1634,7 @@ static int mtk_tx_alloc(struct mtk_eth *
+ 		mtk_w32(eth,
+ 			ring->phys + ((MTK_DMA_SIZE - 1) * sz),
+ 			MTK_QTX_CRX_PTR);
+-		mtk_w32(eth,
+-			ring->phys + ((MTK_DMA_SIZE - 1) * sz),
+-			MTK_QTX_DRX_PTR);
++		mtk_w32(eth, ring->last_free_ptr, MTK_QTX_DRX_PTR);
+ 		mtk_w32(eth, (QDMA_RES_THRES << 8) | QDMA_RES_THRES,
+ 			MTK_QTX_CFG(0));
+ 	} else {
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.h
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.h
+@@ -656,6 +656,7 @@ struct mtk_tx_buf {
+  * @phys:		The physical addr of tx_buf
+  * @next_free:		Pointer to the next free descriptor
+  * @last_free:		Pointer to the last free descriptor
++ * @last_free_ptr:	Hardware pointer value of the last free descriptor
+  * @thresh:		The threshold of minimum amount of free descriptors
+  * @free_count:		QDMA uses a linked list. Track how many free descriptors
+  *			are present
+@@ -666,6 +667,7 @@ struct mtk_tx_ring {
+ 	dma_addr_t phys;
+ 	struct mtk_tx_dma *next_free;
+ 	struct mtk_tx_dma *last_free;
++	u32 last_free_ptr;
+ 	u16 thresh;
+ 	atomic_t free_count;
+ 	int dma_size;

+ 49 - 0
target/linux/generic/backport-5.15/610-v5.13-47-net-ethernet-mtk_eth_soc-only-read-the-full-RX-descr.patch

@@ -0,0 +1,49 @@
+From 816ac3e6e67bdd78d86226c6eb53619780750e92 Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:21:04 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: only read the full RX descriptor
+ if DMA is done
+
+Uncached memory access is expensive, and there is no need to access all
+descriptor words if we can't process them anyway
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 12 ++++++++----
+ 1 file changed, 8 insertions(+), 4 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -798,13 +798,18 @@ static inline int mtk_max_buf_size(int f
+ 	return buf_size;
+ }
+ 
+-static inline void mtk_rx_get_desc(struct mtk_rx_dma *rxd,
++static inline bool mtk_rx_get_desc(struct mtk_rx_dma *rxd,
+ 				   struct mtk_rx_dma *dma_rxd)
+ {
+-	rxd->rxd1 = READ_ONCE(dma_rxd->rxd1);
+ 	rxd->rxd2 = READ_ONCE(dma_rxd->rxd2);
++	if (!(rxd->rxd2 & RX_DMA_DONE))
++		return false;
++
++	rxd->rxd1 = READ_ONCE(dma_rxd->rxd1);
+ 	rxd->rxd3 = READ_ONCE(dma_rxd->rxd3);
+ 	rxd->rxd4 = READ_ONCE(dma_rxd->rxd4);
++
++	return true;
+ }
+ 
+ /* the qdma core needs scratch memory to be setup */
+@@ -1276,8 +1281,7 @@ static int mtk_poll_rx(struct napi_struc
+ 		rxd = &ring->dma[idx];
+ 		data = ring->data[idx];
+ 
+-		mtk_rx_get_desc(&trxd, rxd);
+-		if (!(trxd.rxd2 & RX_DMA_DONE))
++		if (!mtk_rx_get_desc(&trxd, rxd))
+ 			break;
+ 
+ 		/* find out which mac the packet come from. values start at 1 */

+ 39 - 0
target/linux/generic/backport-5.15/610-v5.13-48-net-ethernet-mtk_eth_soc-reduce-unnecessary-interrup.patch

@@ -0,0 +1,39 @@
+From 16769a8923fad5a5377253bcd76b0e0d64976c73 Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:21:05 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: reduce unnecessary interrupts
+
+Avoid rearming interrupt if napi_complete returns false
+
+Signed-off-by: Felix Fietkau <[email protected]>
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 9 +++++----
+ 1 file changed, 5 insertions(+), 4 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -1540,8 +1540,8 @@ static int mtk_napi_tx(struct napi_struc
+ 	if (status & MTK_TX_DONE_INT)
+ 		return budget;
+ 
+-	napi_complete(napi);
+-	mtk_tx_irq_enable(eth, MTK_TX_DONE_INT);
++	if (napi_complete(napi))
++		mtk_tx_irq_enable(eth, MTK_TX_DONE_INT);
+ 
+ 	return tx_done;
+ }
+@@ -1574,8 +1574,9 @@ poll_again:
+ 		remain_budget -= rx_done;
+ 		goto poll_again;
+ 	}
+-	napi_complete(napi);
+-	mtk_rx_irq_enable(eth, MTK_RX_DONE_INT);
++
++	if (napi_complete(napi))
++		mtk_rx_irq_enable(eth, MTK_RX_DONE_INT);
+ 
+ 	return rx_done + budget - remain_budget;
+ }

+ 110 - 0
target/linux/generic/backport-5.15/610-v5.13-49-net-ethernet-mtk_eth_soc-rework-NAPI-callbacks.patch

@@ -0,0 +1,110 @@
+From db2c7b353db3b3f71b55f9ff4627d8a786446fbe Mon Sep 17 00:00:00 2001
+From: Ilya Lipnitskiy <[email protected]>
+Date: Thu, 22 Apr 2021 22:21:06 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: rework NAPI callbacks
+
+Use napi_complete_done to communicate total TX and RX work done to NAPI.
+Count total RX work up instead of remaining work down for clarity.
+Remove unneeded local variables for clarity. Use do {} while instead of
+goto for clarity.
+
+Suggested-by: Jakub Kicinski <[email protected]>
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 54 +++++++++------------
+ 1 file changed, 24 insertions(+), 30 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -1517,7 +1517,6 @@ static void mtk_handle_status_irq(struct
+ static int mtk_napi_tx(struct napi_struct *napi, int budget)
+ {
+ 	struct mtk_eth *eth = container_of(napi, struct mtk_eth, tx_napi);
+-	u32 status, mask;
+ 	int tx_done = 0;
+ 
+ 	if (MTK_HAS_CAPS(eth->soc->caps, MTK_QDMA))
+@@ -1526,21 +1525,19 @@ static int mtk_napi_tx(struct napi_struc
+ 	tx_done = mtk_poll_tx(eth, budget);
+ 
+ 	if (unlikely(netif_msg_intr(eth))) {
+-		status = mtk_r32(eth, eth->tx_int_status_reg);
+-		mask = mtk_r32(eth, eth->tx_int_mask_reg);
+ 		dev_info(eth->dev,
+-			 "done tx %d, intr 0x%08x/0x%x\n",
+-			 tx_done, status, mask);
++			 "done tx %d, intr 0x%08x/0x%x\n", tx_done,
++			 mtk_r32(eth, eth->tx_int_status_reg),
++			 mtk_r32(eth, eth->tx_int_mask_reg));
+ 	}
+ 
+ 	if (tx_done == budget)
+ 		return budget;
+ 
+-	status = mtk_r32(eth, eth->tx_int_status_reg);
+-	if (status & MTK_TX_DONE_INT)
++	if (mtk_r32(eth, eth->tx_int_status_reg) & MTK_TX_DONE_INT)
+ 		return budget;
+ 
+-	if (napi_complete(napi))
++	if (napi_complete_done(napi, tx_done))
+ 		mtk_tx_irq_enable(eth, MTK_TX_DONE_INT);
+ 
+ 	return tx_done;
+@@ -1549,36 +1546,33 @@ static int mtk_napi_tx(struct napi_struc
+ static int mtk_napi_rx(struct napi_struct *napi, int budget)
+ {
+ 	struct mtk_eth *eth = container_of(napi, struct mtk_eth, rx_napi);
+-	u32 status, mask;
+-	int rx_done = 0;
+-	int remain_budget = budget;
++	int rx_done_total = 0;
+ 
+ 	mtk_handle_status_irq(eth);
+ 
+-poll_again:
+-	mtk_w32(eth, MTK_RX_DONE_INT, MTK_PDMA_INT_STATUS);
+-	rx_done = mtk_poll_rx(napi, remain_budget, eth);
++	do {
++		int rx_done;
+ 
+-	if (unlikely(netif_msg_intr(eth))) {
+-		status = mtk_r32(eth, MTK_PDMA_INT_STATUS);
+-		mask = mtk_r32(eth, MTK_PDMA_INT_MASK);
+-		dev_info(eth->dev,
+-			 "done rx %d, intr 0x%08x/0x%x\n",
+-			 rx_done, status, mask);
+-	}
+-	if (rx_done == remain_budget)
+-		return budget;
++		mtk_w32(eth, MTK_RX_DONE_INT, MTK_PDMA_INT_STATUS);
++		rx_done = mtk_poll_rx(napi, budget - rx_done_total, eth);
++		rx_done_total += rx_done;
++
++		if (unlikely(netif_msg_intr(eth))) {
++			dev_info(eth->dev,
++				 "done rx %d, intr 0x%08x/0x%x\n", rx_done,
++				 mtk_r32(eth, MTK_PDMA_INT_STATUS),
++				 mtk_r32(eth, MTK_PDMA_INT_MASK));
++		}
+ 
+-	status = mtk_r32(eth, MTK_PDMA_INT_STATUS);
+-	if (status & MTK_RX_DONE_INT) {
+-		remain_budget -= rx_done;
+-		goto poll_again;
+-	}
++		if (rx_done_total == budget)
++			return budget;
++
++	} while (mtk_r32(eth, MTK_PDMA_INT_STATUS) & MTK_RX_DONE_INT);
+ 
+-	if (napi_complete(napi))
++	if (napi_complete_done(napi, rx_done_total))
+ 		mtk_rx_irq_enable(eth, MTK_RX_DONE_INT);
+ 
+-	return rx_done + budget - remain_budget;
++	return rx_done_total;
+ }
+ 
+ static int mtk_tx_alloc(struct mtk_eth *eth)

+ 47 - 0
target/linux/generic/backport-5.15/610-v5.13-50-net-ethernet-mtk_eth_soc-set-PPE-flow-hash-as-skb-ha.patch

@@ -0,0 +1,47 @@
+From fa817272c37ef78e25dc14e4760ac78a7043a18a Mon Sep 17 00:00:00 2001
+From: Felix Fietkau <[email protected]>
+Date: Thu, 22 Apr 2021 22:21:07 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: set PPE flow hash as skb hash if
+ present
+
+This improves GRO performance
+
+Signed-off-by: Felix Fietkau <[email protected]>
+[Ilya: Use MTK_RXD4_FOE_ENTRY instead of GENMASK(13, 0)]
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 8 ++++++++
+ 1 file changed, 8 insertions(+)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -19,6 +19,7 @@
+ #include <linux/interrupt.h>
+ #include <linux/pinctrl/devinfo.h>
+ #include <linux/phylink.h>
++#include <linux/jhash.h>
+ #include <net/dsa.h>
+ 
+ #include "mtk_eth_soc.h"
+@@ -1271,6 +1272,7 @@ static int mtk_poll_rx(struct napi_struc
+ 		struct net_device *netdev;
+ 		unsigned int pktlen;
+ 		dma_addr_t dma_addr;
++		u32 hash;
+ 		int mac;
+ 
+ 		ring = mtk_get_rx_ring(eth);
+@@ -1340,6 +1342,12 @@ static int mtk_poll_rx(struct napi_struc
+ 		skb->protocol = eth_type_trans(skb, netdev);
+ 		bytes += pktlen;
+ 
++		hash = trxd.rxd4 & MTK_RXD4_FOE_ENTRY;
++		if (hash != MTK_RXD4_FOE_ENTRY) {
++			hash = jhash_1word(hash, 0);
++			skb_set_hash(skb, hash, PKT_HASH_TYPE_L4);
++		}
++
+ 		if (netdev->features & NETIF_F_HW_VLAN_CTAG_RX &&
+ 		    (trxd.rxd2 & RX_DMA_VTAG))
+ 			__vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),

+ 71 - 0
target/linux/generic/backport-5.15/610-v5.13-51-net-ethernet-mtk_eth_soc-use-iopoll.h-macro-for-DMA-.patch

@@ -0,0 +1,71 @@
+From 3bc8e0aff23be0526af0dbc7973a8866a08d73f1 Mon Sep 17 00:00:00 2001
+From: Ilya Lipnitskiy <[email protected]>
+Date: Thu, 22 Apr 2021 22:21:08 -0700
+Subject: [PATCH] net: ethernet: mtk_eth_soc: use iopoll.h macro for DMA init
+
+Replace a tight busy-wait loop without a pause with a standard
+readx_poll_timeout_atomic routine with a 5 us poll period.
+
+Tested by booting a MT7621 device to ensure the driver initializes
+properly.
+
+Signed-off-by: Ilya Lipnitskiy <[email protected]>
+Reviewed-by: Andrew Lunn <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 29 +++++++++------------
+ drivers/net/ethernet/mediatek/mtk_eth_soc.h |  2 +-
+ 2 files changed, 14 insertions(+), 17 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -2054,25 +2054,22 @@ static int mtk_set_features(struct net_d
+ /* wait for DMA to finish whatever it is doing before we start using it again */
+ static int mtk_dma_busy_wait(struct mtk_eth *eth)
+ {
+-	unsigned long t_start = jiffies;
++	unsigned int reg;
++	int ret;
++	u32 val;
+ 
+-	while (1) {
+-		if (MTK_HAS_CAPS(eth->soc->caps, MTK_QDMA)) {
+-			if (!(mtk_r32(eth, MTK_QDMA_GLO_CFG) &
+-			      (MTK_RX_DMA_BUSY | MTK_TX_DMA_BUSY)))
+-				return 0;
+-		} else {
+-			if (!(mtk_r32(eth, MTK_PDMA_GLO_CFG) &
+-			      (MTK_RX_DMA_BUSY | MTK_TX_DMA_BUSY)))
+-				return 0;
+-		}
++	if (MTK_HAS_CAPS(eth->soc->caps, MTK_QDMA))
++		reg = MTK_QDMA_GLO_CFG;
++	else
++		reg = MTK_PDMA_GLO_CFG;
+ 
+-		if (time_after(jiffies, t_start + MTK_DMA_BUSY_TIMEOUT))
+-			break;
+-	}
++	ret = readx_poll_timeout_atomic(__raw_readl, eth->base + reg, val,
++					!(val & (MTK_RX_DMA_BUSY | MTK_TX_DMA_BUSY)),
++					5, MTK_DMA_BUSY_TIMEOUT_US);
++	if (ret)
++		dev_err(eth->dev, "DMA init timeout\n");
+ 
+-	dev_err(eth->dev, "DMA init timeout\n");
+-	return -1;
++	return ret;
+ }
+ 
+ static int mtk_dma_init(struct mtk_eth *eth)
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.h
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.h
+@@ -213,7 +213,7 @@
+ #define MTK_TX_DMA_BUSY		BIT(1)
+ #define MTK_RX_DMA_EN		BIT(2)
+ #define MTK_TX_DMA_EN		BIT(0)
+-#define MTK_DMA_BUSY_TIMEOUT	HZ
++#define MTK_DMA_BUSY_TIMEOUT_US	1000000
+ 
+ /* QDMA Reset Index Register */
+ #define MTK_QDMA_RST_IDX	0x1A08

+ 63 - 0
target/linux/generic/backport-5.15/610-v5.13-52-net-ethernet-mtk_eth_soc-missing-mutex.patch

@@ -0,0 +1,63 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Sun, 18 Apr 2021 23:11:44 +0200
+Subject: [PATCH] net: ethernet: mtk_eth_soc: missing mutex
+
+Patch 2ed37183abb7 ("netfilter: flowtable: separate replace, destroy and
+stats to different workqueues") splits the workqueue per event type. Add
+a mutex to serialize updates.
+
+Fixes: 502e84e2382d ("net: ethernet: mtk_eth_soc: add flow offloading support")
+Reported-by: Frank Wunderlich <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+
+--- a/drivers/net/ethernet/mediatek/mtk_ppe_offload.c
++++ b/drivers/net/ethernet/mediatek/mtk_ppe_offload.c
+@@ -392,6 +392,8 @@ mtk_flow_offload_stats(struct mtk_eth *e
+ 	return 0;
+ }
+ 
++static DEFINE_MUTEX(mtk_flow_offload_mutex);
++
+ static int
+ mtk_eth_setup_tc_block_cb(enum tc_setup_type type, void *type_data, void *cb_priv)
+ {
+@@ -399,6 +401,7 @@ mtk_eth_setup_tc_block_cb(enum tc_setup_
+ 	struct net_device *dev = cb_priv;
+ 	struct mtk_mac *mac = netdev_priv(dev);
+ 	struct mtk_eth *eth = mac->hw;
++	int err;
+ 
+ 	if (!tc_can_offload(dev))
+ 		return -EOPNOTSUPP;
+@@ -406,18 +409,24 @@ mtk_eth_setup_tc_block_cb(enum tc_setup_
+ 	if (type != TC_SETUP_CLSFLOWER)
+ 		return -EOPNOTSUPP;
+ 
++	mutex_lock(&mtk_flow_offload_mutex);
+ 	switch (cls->command) {
+ 	case FLOW_CLS_REPLACE:
+-		return mtk_flow_offload_replace(eth, cls);
++		err = mtk_flow_offload_replace(eth, cls);
++		break;
+ 	case FLOW_CLS_DESTROY:
+-		return mtk_flow_offload_destroy(eth, cls);
++		err = mtk_flow_offload_destroy(eth, cls);
++		break;
+ 	case FLOW_CLS_STATS:
+-		return mtk_flow_offload_stats(eth, cls);
++		err = mtk_flow_offload_stats(eth, cls);
++		break;
+ 	default:
+-		return -EOPNOTSUPP;
++		err = -EOPNOTSUPP;
++		break;
+ 	}
++	mutex_unlock(&mtk_flow_offload_mutex);
+ 
+-	return 0;
++	return err;
+ }
+ 
+ static int

+ 22 - 0
target/linux/generic/backport-5.15/610-v5.13-53-net-ethernet-mtk_eth_soc-handle-VLAN-pop-action.patch

@@ -0,0 +1,22 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Sun, 18 Apr 2021 23:11:45 +0200
+Subject: [PATCH] net: ethernet: mtk_eth_soc: handle VLAN pop action
+
+Do not hit EOPNOTSUPP when flowtable offload provides a VLAN pop action.
+
+Fixes: efce49dfe6a8 ("netfilter: flowtable: add vlan pop action offload support")
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+
+--- a/drivers/net/ethernet/mediatek/mtk_ppe_offload.c
++++ b/drivers/net/ethernet/mediatek/mtk_ppe_offload.c
+@@ -233,6 +233,8 @@ mtk_flow_offload_replace(struct mtk_eth
+ 			data.vlan.proto = act->vlan.proto;
+ 			data.vlan.num++;
+ 			break;
++		case FLOW_ACTION_VLAN_POP:
++			break;
+ 		case FLOW_ACTION_PPPOE_PUSH:
+ 			if (data.pppoe.num == 1)
+ 				return -EOPNOTSUPP;

+ 159 - 0
target/linux/generic/backport-5.15/610-v5.13-54-netfilter-flowtable-dst_check-from-garbage-collector.patch

@@ -0,0 +1,159 @@
+From: Pablo Neira Ayuso <[email protected]>
+Date: Sun, 28 Mar 2021 23:08:55 +0200
+Subject: [PATCH] netfilter: flowtable: dst_check() from garbage collector path
+
+Move dst_check() to the garbage collector path. Stale routes trigger the
+flow entry teardown state which makes affected flows go back to the
+classic forwarding path to re-evaluate flow offloading.
+
+IPv6 requires the dst cookie to work, so store it in the flow_tuple;
+otherwise dst_check() always fails.
+
+Fixes: e5075c0badaa ("netfilter: flowtable: call dst_check() to fall back to classic forwarding")
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -129,7 +129,10 @@ struct flow_offload_tuple {
+ 					in_vlan_ingress:2;
+ 	u16				mtu;
+ 	union {
+-		struct dst_entry	*dst_cache;
++		struct {
++			struct dst_entry *dst_cache;
++			u32		dst_cookie;
++		};
+ 		struct {
+ 			u32		ifidx;
+ 			u32		hw_ifidx;
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -74,6 +74,18 @@ err_ct_refcnt:
+ }
+ EXPORT_SYMBOL_GPL(flow_offload_alloc);
+ 
++static u32 flow_offload_dst_cookie(struct flow_offload_tuple *flow_tuple)
++{
++	const struct rt6_info *rt;
++
++	if (flow_tuple->l3proto == NFPROTO_IPV6) {
++		rt = (const struct rt6_info *)flow_tuple->dst_cache;
++		return rt6_get_cookie(rt);
++	}
++
++	return 0;
++}
++
+ static int flow_offload_fill_route(struct flow_offload *flow,
+ 				   const struct nf_flow_route *route,
+ 				   enum flow_offload_tuple_dir dir)
+@@ -116,6 +128,7 @@ static int flow_offload_fill_route(struc
+ 			return -1;
+ 
+ 		flow_tuple->dst_cache = dst;
++		flow_tuple->dst_cookie = flow_offload_dst_cookie(flow_tuple);
+ 		break;
+ 	}
+ 	flow_tuple->xmit_type = route->tuple[dir].xmit_type;
+@@ -389,11 +402,33 @@ nf_flow_table_iterate(struct nf_flowtabl
+ 	return err;
+ }
+ 
++static bool flow_offload_stale_dst(struct flow_offload_tuple *tuple)
++{
++	struct dst_entry *dst;
++
++	if (tuple->xmit_type == FLOW_OFFLOAD_XMIT_NEIGH ||
++	    tuple->xmit_type == FLOW_OFFLOAD_XMIT_XFRM) {
++		dst = tuple->dst_cache;
++		if (!dst_check(dst, tuple->dst_cookie))
++			return true;
++	}
++
++	return false;
++}
++
++static bool nf_flow_has_stale_dst(struct flow_offload *flow)
++{
++	return flow_offload_stale_dst(&flow->tuplehash[FLOW_OFFLOAD_DIR_ORIGINAL].tuple) ||
++	       flow_offload_stale_dst(&flow->tuplehash[FLOW_OFFLOAD_DIR_REPLY].tuple);
++}
++
+ static void nf_flow_offload_gc_step(struct flow_offload *flow, void *data)
+ {
+ 	struct nf_flowtable *flow_table = data;
+ 
+-	if (nf_flow_has_expired(flow) || nf_ct_is_dying(flow->ct))
++	if (nf_flow_has_expired(flow) ||
++	    nf_ct_is_dying(flow->ct) ||
++	    nf_flow_has_stale_dst(flow))
+ 		set_bit(NF_FLOW_TEARDOWN, &flow->flags);
+ 
+ 	if (test_bit(NF_FLOW_TEARDOWN, &flow->flags)) {
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -364,15 +364,6 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 	if (nf_flow_state_check(flow, iph->protocol, skb, thoff))
+ 		return NF_ACCEPT;
+ 
+-	if (tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_NEIGH ||
+-	    tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM) {
+-		rt = (struct rtable *)tuplehash->tuple.dst_cache;
+-		if (!dst_check(&rt->dst, 0)) {
+-			flow_offload_teardown(flow);
+-			return NF_ACCEPT;
+-		}
+-	}
+-
+ 	if (skb_try_make_writable(skb, thoff + hdrsize))
+ 		return NF_DROP;
+ 
+@@ -391,6 +382,7 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 		nf_ct_acct_update(flow->ct, tuplehash->tuple.dir, skb->len);
+ 
+ 	if (unlikely(tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM)) {
++		rt = (struct rtable *)tuplehash->tuple.dst_cache;
+ 		memset(skb->cb, 0, sizeof(struct inet_skb_parm));
+ 		IPCB(skb)->iif = skb->dev->ifindex;
+ 		IPCB(skb)->flags = IPSKB_FORWARDED;
+@@ -399,6 +391,7 @@ nf_flow_offload_ip_hook(void *priv, stru
+ 
+ 	switch (tuplehash->tuple.xmit_type) {
+ 	case FLOW_OFFLOAD_XMIT_NEIGH:
++		rt = (struct rtable *)tuplehash->tuple.dst_cache;
+ 		outdev = rt->dst.dev;
+ 		skb->dev = outdev;
+ 		nexthop = rt_nexthop(rt, flow->tuplehash[!dir].tuple.src_v4.s_addr);
+@@ -607,15 +600,6 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 	if (nf_flow_state_check(flow, ip6h->nexthdr, skb, thoff))
+ 		return NF_ACCEPT;
+ 
+-	if (tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_NEIGH ||
+-	    tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM) {
+-		rt = (struct rt6_info *)tuplehash->tuple.dst_cache;
+-		if (!dst_check(&rt->dst, 0)) {
+-			flow_offload_teardown(flow);
+-			return NF_ACCEPT;
+-		}
+-	}
+-
+ 	if (skb_try_make_writable(skb, thoff + hdrsize))
+ 		return NF_DROP;
+ 
+@@ -633,6 +617,7 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 		nf_ct_acct_update(flow->ct, tuplehash->tuple.dir, skb->len);
+ 
+ 	if (unlikely(tuplehash->tuple.xmit_type == FLOW_OFFLOAD_XMIT_XFRM)) {
++		rt = (struct rt6_info *)tuplehash->tuple.dst_cache;
+ 		memset(skb->cb, 0, sizeof(struct inet6_skb_parm));
+ 		IP6CB(skb)->iif = skb->dev->ifindex;
+ 		IP6CB(skb)->flags = IP6SKB_FORWARDED;
+@@ -641,6 +626,7 @@ nf_flow_offload_ipv6_hook(void *priv, st
+ 
+ 	switch (tuplehash->tuple.xmit_type) {
+ 	case FLOW_OFFLOAD_XMIT_NEIGH:
++		rt = (struct rt6_info *)tuplehash->tuple.dst_cache;
+ 		outdev = rt->dst.dev;
+ 		skb->dev = outdev;
+ 		nexthop = rt6_nexthop(rt, &flow->tuplehash[!dir].tuple.src_v6);

+ 94 - 0
target/linux/generic/backport-5.15/610-v5.13-55-netfilter-conntrack-Introduce-tcp-offload-timeout-co.patch

@@ -0,0 +1,94 @@
+From: Oz Shlomo <[email protected]>
+Date: Thu, 3 Jun 2021 15:12:33 +0300
+Subject: [PATCH] netfilter: conntrack: Introduce tcp offload timeout
+ configuration
+
+TCP connections may be offloaded from nf conntrack to nf flow table.
+Offloaded connections are aged after 30 seconds of inactivity.
+Once aged, ownership is returned to conntrack with a hard coded pickup
+time of 120 seconds, after which the connection may be deleted.
+The current aging intervals may be too aggressive for some users.
+
+Provide users with the ability to control the nf flow table offload
+aging and pickup time intervals via sysctl parameter as a pre-step for
+configuring the nf flow table GC timeout intervals.
+
+Signed-off-by: Oz Shlomo <[email protected]>
+Reviewed-by: Paul Blakey <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netns/conntrack.h
++++ b/include/net/netns/conntrack.h
+@@ -27,6 +27,10 @@ struct nf_tcp_net {
+ 	int tcp_loose;
+ 	int tcp_be_liberal;
+ 	int tcp_max_retrans;
++#if IS_ENABLED(CONFIG_NF_FLOW_TABLE)
++	unsigned int offload_timeout;
++	unsigned int offload_pickup;
++#endif
+ };
+ 
+ enum udp_conntrack {
+--- a/net/netfilter/nf_conntrack_proto_tcp.c
++++ b/net/netfilter/nf_conntrack_proto_tcp.c
+@@ -1438,6 +1438,11 @@ void nf_conntrack_tcp_init_net(struct ne
+ 	tn->tcp_loose = nf_ct_tcp_loose;
+ 	tn->tcp_be_liberal = nf_ct_tcp_be_liberal;
+ 	tn->tcp_max_retrans = nf_ct_tcp_max_retrans;
++
++#if IS_ENABLED(CONFIG_NF_FLOW_TABLE)
++	tn->offload_timeout = 30 * HZ;
++	tn->offload_pickup = 120 * HZ;
++#endif
+ }
+ 
+ const struct nf_conntrack_l4proto nf_conntrack_l4proto_tcp =
+--- a/net/netfilter/nf_conntrack_standalone.c
++++ b/net/netfilter/nf_conntrack_standalone.c
+@@ -567,6 +567,10 @@ enum nf_ct_sysctl_index {
+ 	NF_SYSCTL_CT_PROTO_TIMEOUT_TCP_CLOSE,
+ 	NF_SYSCTL_CT_PROTO_TIMEOUT_TCP_RETRANS,
+ 	NF_SYSCTL_CT_PROTO_TIMEOUT_TCP_UNACK,
++#if IS_ENABLED(CONFIG_NF_FLOW_TABLE)
++	NF_SYSCTL_CT_PROTO_TIMEOUT_TCP_OFFLOAD,
++	NF_SYSCTL_CT_PROTO_TIMEOUT_TCP_OFFLOAD_PICKUP,
++#endif
+ 	NF_SYSCTL_CT_PROTO_TCP_LOOSE,
+ 	NF_SYSCTL_CT_PROTO_TCP_LIBERAL,
+ 	NF_SYSCTL_CT_PROTO_TCP_MAX_RETRANS,
+@@ -758,6 +762,20 @@ static struct ctl_table nf_ct_sysctl_tab
+ 		.mode		= 0644,
+ 		.proc_handler	= proc_dointvec_jiffies,
+ 	},
++#if IS_ENABLED(CONFIG_NF_FLOW_TABLE)
++	[NF_SYSCTL_CT_PROTO_TIMEOUT_TCP_OFFLOAD] = {
++		.procname	= "nf_flowtable_tcp_timeout",
++		.maxlen		= sizeof(unsigned int),
++		.mode		= 0644,
++		.proc_handler	= proc_dointvec_jiffies,
++	},
++	[NF_SYSCTL_CT_PROTO_TIMEOUT_TCP_OFFLOAD_PICKUP] = {
++		.procname	= "nf_flowtable_tcp_pickup",
++		.maxlen		= sizeof(unsigned int),
++		.mode		= 0644,
++		.proc_handler	= proc_dointvec_jiffies,
++	},
++#endif
+ 	[NF_SYSCTL_CT_PROTO_TCP_LOOSE] = {
+ 		.procname	= "nf_conntrack_tcp_loose",
+ 		.maxlen		= sizeof(int),
+@@ -967,6 +985,12 @@ static void nf_conntrack_standalone_init
+ 	XASSIGN(LIBERAL, &tn->tcp_be_liberal);
+ 	XASSIGN(MAX_RETRANS, &tn->tcp_max_retrans);
+ #undef XASSIGN
++
++#if IS_ENABLED(CONFIG_NF_FLOW_TABLE)
++	table[NF_SYSCTL_CT_PROTO_TIMEOUT_TCP_OFFLOAD].data = &tn->offload_timeout;
++	table[NF_SYSCTL_CT_PROTO_TIMEOUT_TCP_OFFLOAD_PICKUP].data = &tn->offload_pickup;
++#endif
++
+ }
+ 
+ static void nf_conntrack_standalone_init_sctp_sysctl(struct net *net,

+ 92 - 0
target/linux/generic/backport-5.15/610-v5.13-56-netfilter-conntrack-Introduce-udp-offload-timeout-co.patch

@@ -0,0 +1,92 @@
+From: Oz Shlomo <[email protected]>
+Date: Thu, 3 Jun 2021 15:12:34 +0300
+Subject: [PATCH] netfilter: conntrack: Introduce udp offload timeout
+ configuration
+
+UDP connections may be offloaded from nf conntrack to nf flow table.
+Offloaded connections are aged after 30 seconds of inactivity.
+Once aged, ownership is returned to conntrack with a hard coded pickup
+time of 30 seconds, after which the connection may be deleted.
+The current aging intervals may be too aggressive for some users.
+
+Provide users with the ability to control the nf flow table offload
+aging and pickup time intervals via sysctl parameter as a pre-step for
+configuring the nf flow table GC timeout intervals.
+
+Signed-off-by: Oz Shlomo <[email protected]>
+Reviewed-by: Paul Blakey <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netns/conntrack.h
++++ b/include/net/netns/conntrack.h
+@@ -41,6 +41,10 @@ enum udp_conntrack {
+ 
+ struct nf_udp_net {
+ 	unsigned int timeouts[UDP_CT_MAX];
++#if IS_ENABLED(CONFIG_NF_FLOW_TABLE)
++	unsigned int offload_timeout;
++	unsigned int offload_pickup;
++#endif
+ };
+ 
+ struct nf_icmp_net {
+--- a/net/netfilter/nf_conntrack_proto_udp.c
++++ b/net/netfilter/nf_conntrack_proto_udp.c
+@@ -273,6 +273,11 @@ void nf_conntrack_udp_init_net(struct ne
+ 
+ 	for (i = 0; i < UDP_CT_MAX; i++)
+ 		un->timeouts[i] = udp_timeouts[i];
++
++#if IS_ENABLED(CONFIG_NF_FLOW_TABLE)
++	un->offload_timeout = 30 * HZ;
++	un->offload_pickup = 30 * HZ;
++#endif
+ }
+ 
+ const struct nf_conntrack_l4proto nf_conntrack_l4proto_udp =
+--- a/net/netfilter/nf_conntrack_standalone.c
++++ b/net/netfilter/nf_conntrack_standalone.c
+@@ -576,6 +576,10 @@ enum nf_ct_sysctl_index {
+ 	NF_SYSCTL_CT_PROTO_TCP_MAX_RETRANS,
+ 	NF_SYSCTL_CT_PROTO_TIMEOUT_UDP,
+ 	NF_SYSCTL_CT_PROTO_TIMEOUT_UDP_STREAM,
++#if IS_ENABLED(CONFIG_NF_FLOW_TABLE)
++	NF_SYSCTL_CT_PROTO_TIMEOUT_UDP_OFFLOAD,
++	NF_SYSCTL_CT_PROTO_TIMEOUT_UDP_OFFLOAD_PICKUP,
++#endif
+ 	NF_SYSCTL_CT_PROTO_TIMEOUT_ICMP,
+ 	NF_SYSCTL_CT_PROTO_TIMEOUT_ICMPV6,
+ #ifdef CONFIG_NF_CT_PROTO_SCTP
+@@ -810,6 +814,20 @@ static struct ctl_table nf_ct_sysctl_tab
+ 		.mode		= 0644,
+ 		.proc_handler	= proc_dointvec_jiffies,
+ 	},
++#if IS_ENABLED(CONFIG_NFT_FLOW_OFFLOAD)
++	[NF_SYSCTL_CT_PROTO_TIMEOUT_UDP_OFFLOAD] = {
++		.procname	= "nf_flowtable_udp_timeout",
++		.maxlen		= sizeof(unsigned int),
++		.mode		= 0644,
++		.proc_handler	= proc_dointvec_jiffies,
++	},
++	[NF_SYSCTL_CT_PROTO_TIMEOUT_UDP_OFFLOAD_PICKUP] = {
++		.procname	= "nf_flowtable_udp_pickup",
++		.maxlen		= sizeof(unsigned int),
++		.mode		= 0644,
++		.proc_handler	= proc_dointvec_jiffies,
++	},
++#endif
+ 	[NF_SYSCTL_CT_PROTO_TIMEOUT_ICMP] = {
+ 		.procname	= "nf_conntrack_icmp_timeout",
+ 		.maxlen		= sizeof(unsigned int),
+@@ -1078,6 +1096,10 @@ static int nf_conntrack_standalone_init_
+ 	table[NF_SYSCTL_CT_PROTO_TIMEOUT_ICMPV6].data = &nf_icmpv6_pernet(net)->timeout;
+ 	table[NF_SYSCTL_CT_PROTO_TIMEOUT_UDP].data = &un->timeouts[UDP_CT_UNREPLIED];
+ 	table[NF_SYSCTL_CT_PROTO_TIMEOUT_UDP_STREAM].data = &un->timeouts[UDP_CT_REPLIED];
++#if IS_ENABLED(CONFIG_NF_FLOW_TABLE)
++	table[NF_SYSCTL_CT_PROTO_TIMEOUT_UDP_OFFLOAD].data = &un->offload_timeout;
++	table[NF_SYSCTL_CT_PROTO_TIMEOUT_UDP_OFFLOAD_PICKUP].data = &un->offload_pickup;
++#endif
+ 
+ 	nf_conntrack_standalone_init_tcp_sysctl(net, table);
+ 	nf_conntrack_standalone_init_sctp_sysctl(net, table);

+ 134 - 0
target/linux/generic/backport-5.15/610-v5.13-57-netfilter-flowtable-Set-offload-timeouts-according-t.patch

@@ -0,0 +1,134 @@
+From: Oz Shlomo <[email protected]>
+Date: Thu, 3 Jun 2021 15:12:35 +0300
+Subject: [PATCH] netfilter: flowtable: Set offload timeouts according to proto
+ values
+
+Currently the aging period for tcp/udp connections is hard coded to
+30 seconds. Aged tcp/udp connections configure a hard coded 120/30
+seconds pickup timeout for conntrack.
+This configuration may be too aggressive or permissive for some users.
+
+Dynamically configure the nf flow table GC timeout intervals according
+to the user defined values.
+
+Signed-off-by: Oz Shlomo <[email protected]>
+Reviewed-by: Paul Blakey <[email protected]>
+Signed-off-by: Pablo Neira Ayuso <[email protected]>
+---
+
+--- a/include/net/netfilter/nf_flow_table.h
++++ b/include/net/netfilter/nf_flow_table.h
+@@ -174,6 +174,8 @@ struct flow_offload {
+ #define NF_FLOW_TIMEOUT (30 * HZ)
+ #define nf_flowtable_time_stamp	(u32)jiffies
+ 
++unsigned long flow_offload_get_timeout(struct flow_offload *flow);
++
+ static inline __s32 nf_flow_timeout_delta(unsigned int timeout)
+ {
+ 	return (__s32)(timeout - nf_flowtable_time_stamp);
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -175,12 +175,10 @@ static void flow_offload_fixup_tcp(struc
+ 	tcp->seen[1].td_maxwin = 0;
+ }
+ 
+-#define NF_FLOWTABLE_TCP_PICKUP_TIMEOUT	(120 * HZ)
+-#define NF_FLOWTABLE_UDP_PICKUP_TIMEOUT	(30 * HZ)
+-
+ static void flow_offload_fixup_ct_timeout(struct nf_conn *ct)
+ {
+ 	const struct nf_conntrack_l4proto *l4proto;
++	struct net *net = nf_ct_net(ct);
+ 	int l4num = nf_ct_protonum(ct);
+ 	unsigned int timeout;
+ 
+@@ -188,12 +186,17 @@ static void flow_offload_fixup_ct_timeou
+ 	if (!l4proto)
+ 		return;
+ 
+-	if (l4num == IPPROTO_TCP)
+-		timeout = NF_FLOWTABLE_TCP_PICKUP_TIMEOUT;
+-	else if (l4num == IPPROTO_UDP)
+-		timeout = NF_FLOWTABLE_UDP_PICKUP_TIMEOUT;
+-	else
++	if (l4num == IPPROTO_TCP) {
++		struct nf_tcp_net *tn = nf_tcp_pernet(net);
++
++		timeout = tn->offload_pickup;
++	} else if (l4num == IPPROTO_UDP) {
++		struct nf_udp_net *tn = nf_udp_pernet(net);
++
++		timeout = tn->offload_pickup;
++	} else {
+ 		return;
++	}
+ 
+ 	if (nf_flow_timeout_delta(READ_ONCE(ct->timeout)) > (__s32)timeout)
+ 		WRITE_ONCE(ct->timeout, nfct_time_stamp + timeout);
+@@ -265,11 +268,35 @@ static const struct rhashtable_params nf
+ 	.automatic_shrinking	= true,
+ };
+ 
++unsigned long flow_offload_get_timeout(struct flow_offload *flow)
++{
++	const struct nf_conntrack_l4proto *l4proto;
++	unsigned long timeout = NF_FLOW_TIMEOUT;
++	struct net *net = nf_ct_net(flow->ct);
++	int l4num = nf_ct_protonum(flow->ct);
++
++	l4proto = nf_ct_l4proto_find(l4num);
++	if (!l4proto)
++		return timeout;
++
++	if (l4num == IPPROTO_TCP) {
++		struct nf_tcp_net *tn = nf_tcp_pernet(net);
++
++		timeout = tn->offload_timeout;
++	} else if (l4num == IPPROTO_UDP) {
++		struct nf_udp_net *tn = nf_udp_pernet(net);
++
++		timeout = tn->offload_timeout;
++	}
++
++	return timeout;
++}
++
+ int flow_offload_add(struct nf_flowtable *flow_table, struct flow_offload *flow)
+ {
+ 	int err;
+ 
+-	flow->timeout = nf_flowtable_time_stamp + NF_FLOW_TIMEOUT;
++	flow->timeout = nf_flowtable_time_stamp + flow_offload_get_timeout(flow);
+ 
+ 	err = rhashtable_insert_fast(&flow_table->rhashtable,
+ 				     &flow->tuplehash[0].node,
+@@ -301,7 +328,7 @@ EXPORT_SYMBOL_GPL(flow_offload_add);
+ void flow_offload_refresh(struct nf_flowtable *flow_table,
+ 			  struct flow_offload *flow)
+ {
+-	flow->timeout = nf_flowtable_time_stamp + NF_FLOW_TIMEOUT;
++	flow->timeout = nf_flowtable_time_stamp + flow_offload_get_timeout(flow);
+ 
+ 	if (likely(!nf_flowtable_hw_offload(flow_table)))
+ 		return;
+--- a/net/netfilter/nf_flow_table_offload.c
++++ b/net/netfilter/nf_flow_table_offload.c
+@@ -885,7 +885,7 @@ static void flow_offload_work_stats(stru
+ 
+ 	lastused = max_t(u64, stats[0].lastused, stats[1].lastused);
+ 	offload->flow->timeout = max_t(u64, offload->flow->timeout,
+-				       lastused + NF_FLOW_TIMEOUT);
++				       lastused + flow_offload_get_timeout(offload->flow));
+ 
+ 	if (offload->flowtable->flags & NF_FLOWTABLE_COUNTER) {
+ 		if (stats[0].pkts)
+@@ -989,7 +989,7 @@ void nf_flow_offload_stats(struct nf_flo
+ 	__s32 delta;
+ 
+ 	delta = nf_flow_timeout_delta(flow->timeout);
+-	if ((delta >= (9 * NF_FLOW_TIMEOUT) / 10))
++	if ((delta >= (9 * flow_offload_get_timeout(flow)) / 10))
+ 		return;
+ 
+ 	offload = nf_flow_offload_work_alloc(flowtable, flow, FLOW_CLS_STATS);

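To sketch what this changes at runtime: flow_offload_get_timeout() now returns the per-protocol offload_timeout (falling back to the old 30 * HZ NF_FLOW_TIMEOUT for anything that is neither TCP nor UDP), flow_offload_add() and flow_offload_refresh() stamp the flow with that value, and nf_flow_offload_stats() keeps skipping the hardware stats refresh while at least 9/10 of that timeout still remains. Below is a stand-alone C model of that selection, with made-up field names and sample values rather than the kernel structures.

/* Stand-alone model of the timeout selection above; HZ, the struct and
 * the sample values are placeholders, not the kernel definitions. */
#include <stdio.h>

#define HZ 100

struct flow_model {
	int l4proto;			/* IPPROTO_TCP = 6, IPPROTO_UDP = 17 */
	unsigned long tcp_offload_timeout;
	unsigned long udp_offload_timeout;
};

static unsigned long model_get_timeout(const struct flow_model *f)
{
	unsigned long timeout = 30 * HZ;	/* old fixed NF_FLOW_TIMEOUT */

	if (f->l4proto == 6)
		timeout = f->tcp_offload_timeout;
	else if (f->l4proto == 17)
		timeout = f->udp_offload_timeout;
	return timeout;
}

int main(void)
{
	struct flow_model udp_flow = { 17, 300 * HZ, 120 * HZ };
	unsigned long t = model_get_timeout(&udp_flow);

	/* Mirrors the stats-path check: refresh work is skipped while the
	 * remaining time is still >= 9/10 of the configured timeout. */
	printf("UDP GC timeout: %lu jiffies, refresh once below %lu jiffies\n",
	       t, (9 * t) / 10);
	return 0;
}
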
+ 138 - 0
target/linux/generic/backport-5.15/611-v5.12-net-ethernet-mediatek-support-setting-MTU.patch

@@ -0,0 +1,138 @@
+From 4fd59792097a6b2fb949d41264386a7ecade469e Mon Sep 17 00:00:00 2001
+From: DENG Qingfang <[email protected]>
+Date: Mon, 25 Jan 2021 12:20:46 +0800
+Subject: [PATCH] net: ethernet: mediatek: support setting MTU
+
+MT762x HW, except for MT7628, supports frame length up to 2048
+(maximum length on GDM), so allow setting MTU up to 2030.
+
+Also set the default frame length to the hardware default 1518.
+
+Signed-off-by: DENG Qingfang <[email protected]>
+Reviewed-by: Andrew Lunn <[email protected]>
+Link: https://lore.kernel.org/r/[email protected]
+Signed-off-by: Jakub Kicinski <[email protected]>
+---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.c | 43 ++++++++++++++++++---
+ drivers/net/ethernet/mediatek/mtk_eth_soc.h | 12 ++++--
+ 2 files changed, 47 insertions(+), 8 deletions(-)
+
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.c
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.c
+@@ -355,7 +355,7 @@ static void mtk_mac_config(struct phylin
+ 	/* Setup gmac */
+ 	mcr_cur = mtk_r32(mac->hw, MTK_MAC_MCR(mac->id));
+ 	mcr_new = mcr_cur;
+-	mcr_new |= MAC_MCR_MAX_RX_1536 | MAC_MCR_IPG_CFG | MAC_MCR_FORCE_MODE |
++	mcr_new |= MAC_MCR_IPG_CFG | MAC_MCR_FORCE_MODE |
+ 		   MAC_MCR_BACKOFF_EN | MAC_MCR_BACKPR_EN | MAC_MCR_FORCE_LINK;
+ 
+ 	/* Only update control register when needed! */
+@@ -782,8 +782,8 @@ static void mtk_get_stats64(struct net_d
+ static inline int mtk_max_frag_size(int mtu)
+ {
+ 	/* make sure buf_size will be at least MTK_MAX_RX_LENGTH */
+-	if (mtu + MTK_RX_ETH_HLEN < MTK_MAX_RX_LENGTH)
+-		mtu = MTK_MAX_RX_LENGTH - MTK_RX_ETH_HLEN;
++	if (mtu + MTK_RX_ETH_HLEN < MTK_MAX_RX_LENGTH_2K)
++		mtu = MTK_MAX_RX_LENGTH_2K - MTK_RX_ETH_HLEN;
+ 
+ 	return SKB_DATA_ALIGN(MTK_RX_HLEN + mtu) +
+ 		SKB_DATA_ALIGN(sizeof(struct skb_shared_info));
+@@ -794,7 +794,7 @@ static inline int mtk_max_buf_size(int f
+ 	int buf_size = frag_size - NET_SKB_PAD - NET_IP_ALIGN -
+ 		       SKB_DATA_ALIGN(sizeof(struct skb_shared_info));
+ 
+-	WARN_ON(buf_size < MTK_MAX_RX_LENGTH);
++	WARN_ON(buf_size < MTK_MAX_RX_LENGTH_2K);
+ 
+ 	return buf_size;
+ }
+@@ -2606,6 +2606,35 @@ static void mtk_uninit(struct net_device
+ 	mtk_rx_irq_disable(eth, ~0);
+ }
+ 
++static int mtk_change_mtu(struct net_device *dev, int new_mtu)
++{
++	int length = new_mtu + MTK_RX_ETH_HLEN;
++	struct mtk_mac *mac = netdev_priv(dev);
++	struct mtk_eth *eth = mac->hw;
++	u32 mcr_cur, mcr_new;
++
++	if (!MTK_HAS_CAPS(eth->soc->caps, MTK_SOC_MT7628)) {
++		mcr_cur = mtk_r32(mac->hw, MTK_MAC_MCR(mac->id));
++		mcr_new = mcr_cur & ~MAC_MCR_MAX_RX_MASK;
++
++		if (length <= 1518)
++			mcr_new |= MAC_MCR_MAX_RX(MAC_MCR_MAX_RX_1518);
++		else if (length <= 1536)
++			mcr_new |= MAC_MCR_MAX_RX(MAC_MCR_MAX_RX_1536);
++		else if (length <= 1552)
++			mcr_new |= MAC_MCR_MAX_RX(MAC_MCR_MAX_RX_1552);
++		else
++			mcr_new |= MAC_MCR_MAX_RX(MAC_MCR_MAX_RX_2048);
++
++		if (mcr_new != mcr_cur)
++			mtk_w32(mac->hw, mcr_new, MTK_MAC_MCR(mac->id));
++	}
++
++	dev->mtu = new_mtu;
++
++	return 0;
++}
++
+ static int mtk_do_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
+ {
+ 	struct mtk_mac *mac = netdev_priv(dev);
+@@ -2902,6 +2931,7 @@ static const struct net_device_ops mtk_n
+ 	.ndo_set_mac_address	= mtk_set_mac_address,
+ 	.ndo_validate_addr	= eth_validate_addr,
+ 	.ndo_do_ioctl		= mtk_do_ioctl,
++	.ndo_change_mtu		= mtk_change_mtu,
+ 	.ndo_tx_timeout		= mtk_tx_timeout,
+ 	.ndo_get_stats64        = mtk_get_stats64,
+ 	.ndo_fix_features	= mtk_fix_features,
+@@ -3004,7 +3034,10 @@ static int mtk_add_mac(struct mtk_eth *e
+ 	eth->netdev[id]->irq = eth->irq[0];
+ 	eth->netdev[id]->dev.of_node = np;
+ 
+-	eth->netdev[id]->max_mtu = MTK_MAX_RX_LENGTH - MTK_RX_ETH_HLEN;
++	if (MTK_HAS_CAPS(eth->soc->caps, MTK_SOC_MT7628))
++		eth->netdev[id]->max_mtu = MTK_MAX_RX_LENGTH - MTK_RX_ETH_HLEN;
++	else
++		eth->netdev[id]->max_mtu = MTK_MAX_RX_LENGTH_2K - MTK_RX_ETH_HLEN;
+ 
+ 	return 0;
+ 
+--- a/drivers/net/ethernet/mediatek/mtk_eth_soc.h
++++ b/drivers/net/ethernet/mediatek/mtk_eth_soc.h
+@@ -20,12 +20,13 @@
+ #include "mtk_ppe.h"
+ 
+ #define MTK_QDMA_PAGE_SIZE	2048
+-#define	MTK_MAX_RX_LENGTH	1536
++#define MTK_MAX_RX_LENGTH	1536
++#define MTK_MAX_RX_LENGTH_2K	2048
+ #define MTK_TX_DMA_BUF_LEN	0x3fff
+ #define MTK_DMA_SIZE		512
+ #define MTK_NAPI_WEIGHT		64
+ #define MTK_MAC_COUNT		2
+-#define MTK_RX_ETH_HLEN		(VLAN_ETH_HLEN + VLAN_HLEN + ETH_FCS_LEN)
++#define MTK_RX_ETH_HLEN		(ETH_HLEN + ETH_FCS_LEN)
+ #define MTK_RX_HLEN		(NET_SKB_PAD + MTK_RX_ETH_HLEN + NET_IP_ALIGN)
+ #define MTK_DMA_DUMMY_DESC	0xffffffff
+ #define MTK_DEFAULT_MSG_ENABLE	(NETIF_MSG_DRV | \
+@@ -352,7 +353,12 @@
+ 
+ /* Mac control registers */
+ #define MTK_MAC_MCR(x)		(0x10100 + (x * 0x100))
+-#define MAC_MCR_MAX_RX_1536	BIT(24)
++#define MAC_MCR_MAX_RX_MASK	GENMASK(25, 24)
++#define MAC_MCR_MAX_RX(_x)	(MAC_MCR_MAX_RX_MASK & ((_x) << 24))
++#define MAC_MCR_MAX_RX_1518	0x0
++#define MAC_MCR_MAX_RX_1536	0x1
++#define MAC_MCR_MAX_RX_1552	0x2
++#define MAC_MCR_MAX_RX_2048	0x3
+ #define MAC_MCR_IPG_CFG		(BIT(18) | BIT(16))
+ #define MAC_MCR_FORCE_MODE	BIT(15)
+ #define MAC_MCR_TX_EN		BIT(14)

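The length thresholds in mtk_change_mtu() can be read off directly: the requested MTU plus MTK_RX_ETH_HLEN (now ETH_HLEN + ETH_FCS_LEN, 18 bytes) selects one of four MAX_RX encodings in bits 25:24 of MAC_MCR, and the largest 2048-byte setting is what yields the 2030-byte MTU ceiling mentioned in the commit message. A stand-alone sketch of that mapping (not driver code, no register access):

/* Stand-alone sketch of the MAX_RX selection in mtk_change_mtu();
 * the constants mirror the header changes above, nothing touches hw. */
#include <stdio.h>

#define RX_ETH_HLEN	18		/* ETH_HLEN (14) + ETH_FCS_LEN (4) */
#define MAX_RX_MASK	(0x3u << 24)	/* GENMASK(25, 24) */
#define MAX_RX(x)	(MAX_RX_MASK & ((unsigned int)(x) << 24))

static unsigned int max_rx_field(int mtu)
{
	int length = mtu + RX_ETH_HLEN;

	if (length <= 1518)
		return MAX_RX(0x0);	/* MAC_MCR_MAX_RX_1518 */
	if (length <= 1536)
		return MAX_RX(0x1);	/* MAC_MCR_MAX_RX_1536 */
	if (length <= 1552)
		return MAX_RX(0x2);	/* MAC_MCR_MAX_RX_1552 */
	return MAX_RX(0x3);		/* MAC_MCR_MAX_RX_2048 */
}

int main(void)
{
	printf("max_mtu = %d\n", 2048 - RX_ETH_HLEN);	/* 2030 */
	printf("MAX_RX bits for MTU 1500: 0x%08x\n", max_rx_field(1500));
	printf("MAX_RX bits for MTU 2030: 0x%08x\n", max_rx_field(2030));
	return 0;
}
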
+ 108 - 0
target/linux/generic/backport-5.15/705-net-phy-at803x-select-correct-page-on-config-init.patch

@@ -0,0 +1,108 @@
+From c329e5afb42ff0a88285eb4d8a391a18793e4777 Mon Sep 17 00:00:00 2001
+From: David Bauer <[email protected]>
+Date: Thu, 15 Apr 2021 03:26:50 +0200
+Subject: [PATCH] net: phy: at803x: select correct page on config init
+
+The Atheros AR8031 and AR8033 expose different registers for SGMII/Fiber
+as well as the copper side of the PHY depending on the BT_BX_REG_SEL bit
+in the chip configure register.
+
+The driver assumes the copper side is selected on probe, but this might
+not be the case depending which page was last selected by the
+bootloader. Notably, Ubiquiti UniFi bootloaders show this behavior.
+
+Select the copper page when probing to circumvent this.
+
+Signed-off-by: David Bauer <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/phy/at803x.c | 50 +++++++++++++++++++++++++++++++++++++++-
+ 1 file changed, 49 insertions(+), 1 deletion(-)
+
+--- a/drivers/net/phy/at803x.c
++++ b/drivers/net/phy/at803x.c
+@@ -139,6 +139,9 @@
+ #define ATH8035_PHY_ID 0x004dd072
+ #define AT8030_PHY_ID_MASK			0xffffffef
+ 
++#define AT803X_PAGE_FIBER		0
++#define AT803X_PAGE_COPPER		1
++
+ MODULE_DESCRIPTION("Qualcomm Atheros AR803x PHY driver");
+ MODULE_AUTHOR("Matus Ujhelyi");
+ MODULE_LICENSE("GPL");
+@@ -190,6 +193,35 @@ static int at803x_debug_reg_mask(struct
+ 	return phy_write(phydev, AT803X_DEBUG_DATA, val);
+ }
+ 
++static int at803x_write_page(struct phy_device *phydev, int page)
++{
++	int mask;
++	int set;
++
++	if (page == AT803X_PAGE_COPPER) {
++		set = AT803X_BT_BX_REG_SEL;
++		mask = 0;
++	} else {
++		set = 0;
++		mask = AT803X_BT_BX_REG_SEL;
++	}
++
++	return __phy_modify(phydev, AT803X_REG_CHIP_CONFIG, mask, set);
++}
++
++static int at803x_read_page(struct phy_device *phydev)
++{
++	int ccr = __phy_read(phydev, AT803X_REG_CHIP_CONFIG);
++
++	if (ccr < 0)
++		return ccr;
++
++	if (ccr & AT803X_BT_BX_REG_SEL)
++		return AT803X_PAGE_COPPER;
++
++	return AT803X_PAGE_FIBER;
++}
++
+ static int at803x_enable_rx_delay(struct phy_device *phydev)
+ {
+ 	return at803x_debug_reg_mask(phydev, AT803X_DEBUG_REG_0, 0,
+@@ -508,6 +540,7 @@ static int at803x_probe(struct phy_devic
+ {
+ 	struct device *dev = &phydev->mdio.dev;
+ 	struct at803x_priv *priv;
++	int ret;
+ 
+ 	priv = devm_kzalloc(dev, sizeof(*priv), GFP_KERNEL);
+ 	if (!priv)
+@@ -515,7 +548,20 @@ static int at803x_probe(struct phy_devic
+ 
+ 	phydev->priv = priv;
+ 
+-	return at803x_parse_dt(phydev);
++	ret = at803x_parse_dt(phydev);
++	if (ret)
++		return ret;
++
++	/* Some bootloaders leave the fiber page selected.
++	 * Switch to the copper page, as otherwise we read
++	 * the PHY capabilities from the fiber side.
++	 */
++	if (at803x_match_phy_id(phydev, ATH8031_PHY_ID)) {
++		ret = phy_select_page(phydev, AT803X_PAGE_COPPER);
++		ret = phy_restore_page(phydev, AT803X_PAGE_COPPER, ret);
++	}
++
++	return ret;
+ }
+ 
+ static void at803x_remove(struct phy_device *phydev)
+@@ -1097,6 +1143,8 @@ static struct phy_driver at803x_driver[]
+ 	.get_wol		= at803x_get_wol,
+ 	.suspend		= at803x_suspend,
+ 	.resume			= at803x_resume,
++	.read_page		= at803x_read_page,
++	.write_page		= at803x_write_page,
+ 	/* PHY_GBIT_FEATURES */
+ 	.read_status		= at803x_read_status,
+ 	.aneg_done		= at803x_aneg_done,

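Behind the new read_page/write_page callbacks sits a single selector bit: BT_BX_REG_SEL in the chip configuration register decides whether the usual register window shows the copper side or the SGMII/fiber side, so selecting a page amounts to setting or clearing that bit (the real driver does this through __phy_modify on the MDIO bus). A stand-alone model of the toggle follows; the 0x8000 bit value and the fake register are assumptions for illustration only.

/* Stand-alone model of the BT_BX_REG_SEL page switch; the variable
 * below stands in for AT803X_REG_CHIP_CONFIG, no MDIO access involved. */
#include <stdio.h>

#define BT_BX_REG_SEL	0x8000		/* assumed bit value, illustration only */
#define PAGE_FIBER	0
#define PAGE_COPPER	1

static unsigned int chip_config;	/* fake chip configuration register */

static void model_write_page(int page)
{
	if (page == PAGE_COPPER)
		chip_config |= BT_BX_REG_SEL;	/* copper registers visible */
	else
		chip_config &= ~BT_BX_REG_SEL;	/* fiber/SGMII registers visible */
}

static int model_read_page(void)
{
	return (chip_config & BT_BX_REG_SEL) ? PAGE_COPPER : PAGE_FIBER;
}

int main(void)
{
	model_write_page(PAGE_COPPER);	/* what probe now does on AR8031/AR8033 */
	printf("selected page: %s\n",
	       model_read_page() == PAGE_COPPER ? "copper" : "fiber");
	return 0;
}
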
+ 73 - 0
target/linux/generic/backport-5.15/706-net-phy-at803x-fix-probe-error-if-copper-page-is-sel.patch

@@ -0,0 +1,73 @@
+From 8f7e876273e294b732b42af2e5e6bba91d798954 Mon Sep 17 00:00:00 2001
+From: Michael Walle <[email protected]>
+Date: Tue, 20 Apr 2021 12:29:29 +0200
+Subject: [PATCH] net: phy: at803x: fix probe error if copper page is selected
+
+The commit c329e5afb42f ("net: phy: at803x: select correct page on
+config init") selects the copper page during probe. This fails if the
+copper page was already selected. In this case, the value of the copper
+page (which is 1) is propagated through phy_restore_page() and is
+finally returned for at803x_probe(). Fix it, by just using the
+at803x_page_write() directly.
+
+Also in case of an error, the regulator is not disabled and leads to a
+WARN_ON() when the probe fails. This couldn't happen before, because
+at803x_parse_dt() was the last call in at803x_probe(). It is hard to
+see, that the parse_dt() actually enables the regulator. Thus move the
+regulator_enable() to the probe function and undo it in case of an
+error.
+
+Fixes: c329e5afb42f ("net: phy: at803x: select correct page on config init")
+Signed-off-by: Michael Walle <[email protected]>
+Reviewed-by: David Bauer <[email protected]>
+Signed-off-by: David S. Miller <[email protected]>
+---
+ drivers/net/phy/at803x.c | 23 +++++++++++++++++------
+ 1 file changed, 17 insertions(+), 6 deletions(-)
+
+--- a/drivers/net/phy/at803x.c
++++ b/drivers/net/phy/at803x.c
+@@ -527,10 +527,6 @@ static int at803x_parse_dt(struct phy_de
+ 			phydev_err(phydev, "failed to get VDDIO regulator\n");
+ 			return PTR_ERR(priv->vddio);
+ 		}
+-
+-		ret = regulator_enable(priv->vddio);
+-		if (ret < 0)
+-			return ret;
+ 	}
+ 
+ 	return 0;
+@@ -552,15 +548,30 @@ static int at803x_probe(struct phy_devic
+ 	if (ret)
+ 		return ret;
+ 
++	if (priv->vddio) {
++		ret = regulator_enable(priv->vddio);
++		if (ret < 0)
++			return ret;
++	}
++
+ 	/* Some bootloaders leave the fiber page selected.
+ 	 * Switch to the copper page, as otherwise we read
+ 	 * the PHY capabilities from the fiber side.
+ 	 */
+ 	if (at803x_match_phy_id(phydev, ATH8031_PHY_ID)) {
+-		ret = phy_select_page(phydev, AT803X_PAGE_COPPER);
+-		ret = phy_restore_page(phydev, AT803X_PAGE_COPPER, ret);
++		phy_lock_mdio_bus(phydev);
++		ret = at803x_write_page(phydev, AT803X_PAGE_COPPER);
++		phy_unlock_mdio_bus(phydev);
++		if (ret)
++			goto err;
+ 	}
+ 
++	return 0;
++
++err:
++	if (priv->vddio)
++		regulator_disable(priv->vddio);
++
+ 	return ret;
+ }
+ 

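The failure mode being fixed is a return-value leak: phy_select_page() hands back the previously selected page on success, and the old probe code let that value (1 when the copper page was already active) escape as the probe result, so a perfectly healthy PHY looked like a failed probe. The sketch below models this with deliberately simplified semantics; the "fixed" variant merely normalises the return value for illustration, whereas the actual patch avoids the select/restore helpers and writes the page register directly under the MDIO bus lock.

/* Simplified illustration of the return-value leak; these helpers only
 * mimic the shape of the real phylib calls, not their implementation. */
#include <stdio.h>

static int current_page = 1;		/* copper page already selected */

static int model_select_page(int page)
{
	int oldpage = current_page;	/* success: previous page, >= 0 */

	current_page = page;
	return oldpage;
}

static int buggy_probe(void)
{
	return model_select_page(1);	/* returns 1, caller sees "error" */
}

static int fixed_probe(void)
{
	int ret = model_select_page(1);

	return ret < 0 ? ret : 0;	/* only propagate real errors */
}

int main(void)
{
	printf("buggy probe: %d, fixed probe: %d\n",
	       buggy_probe(), fixed_probe());
	return 0;
}
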
+ 56 - 0
target/linux/generic/backport-5.15/710-v5.12-net-phy-Add-100-base-x-mode.patch

@@ -0,0 +1,56 @@
+From b1ae3587d16a8c8fc9453e147c8708d6f006ffbb Mon Sep 17 00:00:00 2001
+From: Bjarni Jonasson <[email protected]>
+Date: Wed, 13 Jan 2021 12:56:25 +0100
+Subject: [PATCH] net: phy: Add 100 base-x mode
+
+Sparx-5 supports this mode and it is missing in the PHY core.
+
+Signed-off-by: Bjarni Jonasson <[email protected]>
+Reviewed-by: Russell King <[email protected]>
+Signed-off-by: Jakub Kicinski <[email protected]>
+---
+ Documentation/networking/phy.rst | 5 +++++
+ include/linux/phy.h              | 4 ++++
+ 2 files changed, 9 insertions(+)
+
+--- a/Documentation/networking/phy.rst
++++ b/Documentation/networking/phy.rst
+@@ -286,6 +286,11 @@ Some of the interface modes are describe
+     Note: due to legacy usage, some 10GBASE-R usage incorrectly makes
+     use of this definition.
+ 
++``PHY_INTERFACE_MODE_100BASEX``
++    This defines IEEE 802.3 Clause 24.  The link operates at a fixed data
++    rate of 125Mpbs using a 4B/5B encoding scheme, resulting in an underlying
++    data rate of 100Mpbs.
++
+ Pause frames / flow control
+ ===========================
+ 
+--- a/include/linux/phy.h
++++ b/include/linux/phy.h
+@@ -104,6 +104,7 @@ extern const int phy_10gbit_features_arr
+  * @PHY_INTERFACE_MODE_MOCA: Multimedia over Coax
+  * @PHY_INTERFACE_MODE_QSGMII: Quad SGMII
+  * @PHY_INTERFACE_MODE_TRGMII: Turbo RGMII
++ * @PHY_INTERFACE_MODE_100BASEX: 100 BaseX
+  * @PHY_INTERFACE_MODE_1000BASEX: 1000 BaseX
+  * @PHY_INTERFACE_MODE_2500BASEX: 2500 BaseX
+  * @PHY_INTERFACE_MODE_RXAUI: Reduced XAUI
+@@ -135,6 +136,7 @@ typedef enum {
+ 	PHY_INTERFACE_MODE_MOCA,
+ 	PHY_INTERFACE_MODE_QSGMII,
+ 	PHY_INTERFACE_MODE_TRGMII,
++	PHY_INTERFACE_MODE_100BASEX,
+ 	PHY_INTERFACE_MODE_1000BASEX,
+ 	PHY_INTERFACE_MODE_2500BASEX,
+ 	PHY_INTERFACE_MODE_RXAUI,
+@@ -217,6 +219,8 @@ static inline const char *phy_modes(phy_
+ 		return "usxgmii";
+ 	case PHY_INTERFACE_MODE_10GKR:
+ 		return "10gbase-kr";
++	case PHY_INTERFACE_MODE_100BASEX:
++		return "100base-x";
+ 	default:
+ 		return "unknown";
+ 	}

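The two rates quoted in the documentation hunk are tied together by the 4B/5B code: every four payload bits are transmitted as a five-bit code group, so 100 Mbit/s of data corresponds to a 125 MBd signalling rate on the wire. A one-line check of that ratio:

/* 4B/5B overhead: line rate = data rate * 5/4. */
#include <stdio.h>

int main(void)
{
	int data_mbps = 100;
	int line_mbd = data_mbps * 5 / 4;	/* 125 */

	printf("100BASE-X: %d Mbit/s data over a %d MBd line\n",
	       data_mbps, line_mbd);
	return 0;
}
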
+ 40 - 0
target/linux/generic/backport-5.15/711-v5.12-sfp-add-support-for-100-base-x-SFPs.patch

@@ -0,0 +1,40 @@
+From 6e12f35cef6b8a458d7ecf507ae330e0bffaad8c Mon Sep 17 00:00:00 2001
+From: Bjarni Jonasson <[email protected]>
+Date: Wed, 13 Jan 2021 12:56:26 +0100
+Subject: [PATCH] sfp: add support for 100 base-x SFPs
+
+Add support for 100Base-FX, 100Base-LX, 100Base-PX and 100Base-BX10 modules
+This is needed for Sparx-5 switch.
+
+Signed-off-by: Bjarni Jonasson <[email protected]>
+Reviewed-by: Russell King <[email protected]>
+Signed-off-by: Jakub Kicinski <[email protected]>
+---
+ drivers/net/phy/sfp-bus.c | 9 +++++++++
+ 1 file changed, 9 insertions(+)
+
+--- a/drivers/net/phy/sfp-bus.c
++++ b/drivers/net/phy/sfp-bus.c
+@@ -280,6 +280,12 @@ void sfp_parse_support(struct sfp_bus *b
+ 	    br_min <= 1300 && br_max >= 1200)
+ 		phylink_set(modes, 1000baseX_Full);
+ 
++	/* 100Base-FX, 100Base-LX, 100Base-PX, 100Base-BX10 */
++	if (id->base.e100_base_fx || id->base.e100_base_lx)
++		phylink_set(modes, 100baseFX_Full);
++	if ((id->base.e_base_px || id->base.e_base_bx10) && br_nom == 100)
++		phylink_set(modes, 100baseFX_Full);
++
+ 	/* For active or passive cables, select the link modes
+ 	 * based on the bit rates and the cable compliance bytes.
+ 	 */
+@@ -399,6 +405,9 @@ phy_interface_t sfp_select_interface(str
+ 	if (phylink_test(link_modes, 1000baseX_Full))
+ 		return PHY_INTERFACE_MODE_1000BASEX;
+ 
++	if (phylink_test(link_modes, 100baseFX_Full))
++		return PHY_INTERFACE_MODE_100BASEX;
++
+ 	dev_warn(bus->sfp_dev, "Unable to ascertain link mode\n");
+ 
+ 	return PHY_INTERFACE_MODE_NA;

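The sfp-bus hunks boil down to one predicate: offer the 100baseFX_Full link mode when the module's compliance bytes advertise 100Base-FX/LX, or when the PX/BX10 bits are set and the nominal bit rate is 100 Mb/s, and then have sfp_select_interface() map that mode to PHY_INTERFACE_MODE_100BASEX. A stand-alone sketch of that predicate follows; the struct is a simplified stand-in for the real sfp_eeprom_id fields, not the actual EEPROM layout.

/* Simplified stand-in for the SFP compliance bits used above; the field
 * names loosely follow the kernel's sfp_eeprom_id, the layout does not. */
#include <stdbool.h>
#include <stdio.h>

struct sfp_id_model {
	bool e100_base_fx;
	bool e100_base_lx;
	bool e_base_px;
	bool e_base_bx10;
	unsigned int br_nom;	/* nominal bit rate in Mb/s */
};

static bool supports_100basefx(const struct sfp_id_model *id)
{
	if (id->e100_base_fx || id->e100_base_lx)
		return true;
	/* PX / BX10 modules only qualify at a 100 Mb/s nominal rate */
	return (id->e_base_px || id->e_base_bx10) && id->br_nom == 100;
}

int main(void)
{
	struct sfp_id_model fx = { .e100_base_fx = true };
	struct sfp_id_model bx = { .e_base_bx10 = true, .br_nom = 100 };

	printf("100Base-FX module -> 100baseFX_Full: %d\n",
	       supports_100basefx(&fx));
	printf("BX10 @ 100 Mb/s   -> 100baseFX_Full: %d\n",
	       supports_100basefx(&bx));
	return 0;
}
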
Some files were not shown in this diff because too many files have changed.