kernel: backport flow offload fixes
author Ritaro Takenaka <ritarot634@gmail.com>
Tue, 24 May 2022 17:51:19 +0000 (02:51 +0900)
committer Hauke Mehrtens <hauke@hauke-m.de>
Fri, 27 May 2022 12:15:43 +0000 (14:15 +0200)
Some dst entries in the IPv6 flow offload table become invalid after the table is created.
So a dst_check() call is needed in the packet path.

Signed-off-by: Ritaro Takenaka <ritarot634@gmail.com>
[Add patch for kernel 5.15 too and rename file]
Signed-off-by: Hauke Mehrtens <hauke@hauke-m.de>
target/linux/generic/backport-5.10/610-v5.18-netfilter-flowtable-move-dst_check-to-packet-path.patch [new file with mode: 0644]
target/linux/generic/backport-5.15/610-v5.18-netfilter-flowtable-move-dst_check-to-packet-path.patch [new file with mode: 0644]
target/linux/generic/hack-5.10/650-netfilter-add-xt_FLOWOFFLOAD-target.patch
target/linux/generic/hack-5.15/650-netfilter-add-xt_FLOWOFFLOAD-target.patch

diff --git a/target/linux/generic/backport-5.10/610-v5.18-netfilter-flowtable-move-dst_check-to-packet-path.patch b/target/linux/generic/backport-5.10/610-v5.18-netfilter-flowtable-move-dst_check-to-packet-path.patch
new file mode 100644 (file)
index 0000000..99e40b9
--- /dev/null
@@ -0,0 +1,99 @@
+From 2738d9d963bd1f06d5114c2b4fa5771a95703991 Mon Sep 17 00:00:00 2001
+From: Ritaro Takenaka <ritarot634@gmail.com>
+Date: Tue, 17 May 2022 12:55:30 +0200
+Subject: [PATCH] netfilter: flowtable: move dst_check to packet path
+
+Fixes sporadic IPv6 packet loss when flow offloading is enabled.
+
+IPv6 route GC and flowtable GC are not synchronized.
+When dst_cache becomes stale and a packet passes through the flow before
+the flowtable GC teardowns it, the packet can be dropped.
+So, it is necessary to check dst every time in packet path.
+
+Fixes: 227e1e4d0d6c ("netfilter: nf_flowtable: skip device lookup from interface index")
+Signed-off-by: Ritaro Takenaka <ritarot634@gmail.com>
+Signed-off-by: Pablo Neira Ayuso <pablo@netfilter.org>
+---
+ net/netfilter/nf_flow_table_core.c | 23 +----------------------
+ net/netfilter/nf_flow_table_ip.c   | 19 +++++++++++++++++++
+ 2 files changed, 20 insertions(+), 22 deletions(-)
+
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -433,33 +433,12 @@ nf_flow_table_iterate(struct nf_flowtabl
+       return err;
+ }
+-static bool flow_offload_stale_dst(struct flow_offload_tuple *tuple)
+-{
+-      struct dst_entry *dst;
+-
+-      if (tuple->xmit_type == FLOW_OFFLOAD_XMIT_NEIGH ||
+-          tuple->xmit_type == FLOW_OFFLOAD_XMIT_XFRM) {
+-              dst = tuple->dst_cache;
+-              if (!dst_check(dst, tuple->dst_cookie))
+-                      return true;
+-      }
+-
+-      return false;
+-}
+-
+-static bool nf_flow_has_stale_dst(struct flow_offload *flow)
+-{
+-      return flow_offload_stale_dst(&flow->tuplehash[FLOW_OFFLOAD_DIR_ORIGINAL].tuple) ||
+-             flow_offload_stale_dst(&flow->tuplehash[FLOW_OFFLOAD_DIR_REPLY].tuple);
+-}
+-
+ static void nf_flow_offload_gc_step(struct flow_offload *flow, void *data)
+ {
+       struct nf_flowtable *flow_table = data;
+       if (nf_flow_has_expired(flow) ||
+-          nf_ct_is_dying(flow->ct) ||
+-          nf_flow_has_stale_dst(flow))
++          nf_ct_is_dying(flow->ct))
+               set_bit(NF_FLOW_TEARDOWN, &flow->flags);
+       if (test_bit(NF_FLOW_TEARDOWN, &flow->flags)) {
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -229,6 +229,15 @@ static bool nf_flow_exceeds_mtu(const st
+       return true;
+ }
++static inline bool nf_flow_dst_check(struct flow_offload_tuple *tuple)
++{
++      if (tuple->xmit_type != FLOW_OFFLOAD_XMIT_NEIGH &&
++          tuple->xmit_type != FLOW_OFFLOAD_XMIT_XFRM)
++              return true;
++
++      return dst_check(tuple->dst_cache, tuple->dst_cookie);
++}
++
+ static unsigned int nf_flow_xmit_xfrm(struct sk_buff *skb,
+                                     const struct nf_hook_state *state,
+                                     struct dst_entry *dst)
+@@ -364,6 +373,11 @@ nf_flow_offload_ip_hook(void *priv, stru
+       if (nf_flow_state_check(flow, iph->protocol, skb, thoff))
+               return NF_ACCEPT;
++      if (!nf_flow_dst_check(&tuplehash->tuple)) {
++              flow_offload_teardown(flow);
++              return NF_ACCEPT;
++      }
++
+       if (skb_try_make_writable(skb, thoff + hdrsize))
+               return NF_DROP;
+@@ -600,6 +614,11 @@ nf_flow_offload_ipv6_hook(void *priv, st
+       if (nf_flow_state_check(flow, ip6h->nexthdr, skb, thoff))
+               return NF_ACCEPT;
++      if (!nf_flow_dst_check(&tuplehash->tuple)) {
++              flow_offload_teardown(flow);
++              return NF_ACCEPT;
++      }
++
+       if (skb_try_make_writable(skb, thoff + hdrsize))
+               return NF_DROP;
diff --git a/target/linux/generic/backport-5.15/610-v5.18-netfilter-flowtable-move-dst_check-to-packet-path.patch b/target/linux/generic/backport-5.15/610-v5.18-netfilter-flowtable-move-dst_check-to-packet-path.patch
new file mode 100644 (file)
index 0000000..8d35531
--- /dev/null
@@ -0,0 +1,99 @@
+From 2738d9d963bd1f06d5114c2b4fa5771a95703991 Mon Sep 17 00:00:00 2001
+From: Ritaro Takenaka <ritarot634@gmail.com>
+Date: Tue, 17 May 2022 12:55:30 +0200
+Subject: [PATCH] netfilter: flowtable: move dst_check to packet path
+
+Fixes sporadic IPv6 packet loss when flow offloading is enabled.
+
+IPv6 route GC and flowtable GC are not synchronized.
+When dst_cache becomes stale and a packet passes through the flow before
+the flowtable GC teardowns it, the packet can be dropped.
+So, it is necessary to check dst every time in packet path.
+
+Fixes: 227e1e4d0d6c ("netfilter: nf_flowtable: skip device lookup from interface index")
+Signed-off-by: Ritaro Takenaka <ritarot634@gmail.com>
+Signed-off-by: Pablo Neira Ayuso <pablo@netfilter.org>
+---
+ net/netfilter/nf_flow_table_core.c | 23 +----------------------
+ net/netfilter/nf_flow_table_ip.c   | 19 +++++++++++++++++++
+ 2 files changed, 20 insertions(+), 22 deletions(-)
+
+--- a/net/netfilter/nf_flow_table_core.c
++++ b/net/netfilter/nf_flow_table_core.c
+@@ -431,33 +431,12 @@ nf_flow_table_iterate(struct nf_flowtabl
+       return err;
+ }
+-static bool flow_offload_stale_dst(struct flow_offload_tuple *tuple)
+-{
+-      struct dst_entry *dst;
+-
+-      if (tuple->xmit_type == FLOW_OFFLOAD_XMIT_NEIGH ||
+-          tuple->xmit_type == FLOW_OFFLOAD_XMIT_XFRM) {
+-              dst = tuple->dst_cache;
+-              if (!dst_check(dst, tuple->dst_cookie))
+-                      return true;
+-      }
+-
+-      return false;
+-}
+-
+-static bool nf_flow_has_stale_dst(struct flow_offload *flow)
+-{
+-      return flow_offload_stale_dst(&flow->tuplehash[FLOW_OFFLOAD_DIR_ORIGINAL].tuple) ||
+-             flow_offload_stale_dst(&flow->tuplehash[FLOW_OFFLOAD_DIR_REPLY].tuple);
+-}
+-
+ static void nf_flow_offload_gc_step(struct flow_offload *flow, void *data)
+ {
+       struct nf_flowtable *flow_table = data;
+       if (nf_flow_has_expired(flow) ||
+-          nf_ct_is_dying(flow->ct) ||
+-          nf_flow_has_stale_dst(flow))
++          nf_ct_is_dying(flow->ct))
+               set_bit(NF_FLOW_TEARDOWN, &flow->flags);
+       if (test_bit(NF_FLOW_TEARDOWN, &flow->flags)) {
+--- a/net/netfilter/nf_flow_table_ip.c
++++ b/net/netfilter/nf_flow_table_ip.c
+@@ -227,6 +227,15 @@ static bool nf_flow_exceeds_mtu(const st
+       return true;
+ }
++static inline bool nf_flow_dst_check(struct flow_offload_tuple *tuple)
++{
++      if (tuple->xmit_type != FLOW_OFFLOAD_XMIT_NEIGH &&
++          tuple->xmit_type != FLOW_OFFLOAD_XMIT_XFRM)
++              return true;
++
++      return dst_check(tuple->dst_cache, tuple->dst_cookie);
++}
++
+ static unsigned int nf_flow_xmit_xfrm(struct sk_buff *skb,
+                                     const struct nf_hook_state *state,
+                                     struct dst_entry *dst)
+@@ -346,6 +355,11 @@ nf_flow_offload_ip_hook(void *priv, stru
+       if (nf_flow_state_check(flow, iph->protocol, skb, thoff))
+               return NF_ACCEPT;
++      if (!nf_flow_dst_check(&tuplehash->tuple)) {
++              flow_offload_teardown(flow);
++              return NF_ACCEPT;
++      }
++
+       if (skb_try_make_writable(skb, thoff + hdrsize))
+               return NF_DROP;
+@@ -582,6 +596,11 @@ nf_flow_offload_ipv6_hook(void *priv, st
+       if (nf_flow_state_check(flow, ip6h->nexthdr, skb, thoff))
+               return NF_ACCEPT;
++      if (!nf_flow_dst_check(&tuplehash->tuple)) {
++              flow_offload_teardown(flow);
++              return NF_ACCEPT;
++      }
++
+       if (skb_try_make_writable(skb, thoff + hdrsize))
+               return NF_DROP;
index 8435ae71cd148fe4474129121427f65e14321244..6252f9a41847a14626b9eb39144eb087c470700a 100644 (file)
@@ -837,7 +837,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
  }
 +EXPORT_SYMBOL_GPL(nf_flow_table_iterate);
  
- static bool flow_offload_stale_dst(struct flow_offload_tuple *tuple)
+ static void nf_flow_offload_gc_step(struct flow_offload *flow, void *data)
  {
 --- /dev/null
 +++ b/include/uapi/linux/netfilter/xt_FLOWOFFLOAD.h
index 0eca9f8d8f2d11876d156824625264b0ff2b5d11..81432bbeab9f26ca2d9bccb43df5ea98f3fa7b58 100644 (file)
@@ -819,7 +819,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
  }
 +EXPORT_SYMBOL_GPL(nf_flow_table_iterate);
  
- static bool flow_offload_stale_dst(struct flow_offload_tuple *tuple)
+ static void nf_flow_offload_gc_step(struct flow_offload *flow, void *data)
  {
 --- /dev/null
 +++ b/include/uapi/linux/netfilter/xt_FLOWOFFLOAD.h