git.ipfire.org Git - thirdparty/linux.git/commitdiff
netfilter: nf_nat: remove bogus direction check
author Florian Westphal <fw@strlen.de>
Mon, 8 Dec 2025 15:00:34 +0000 (16:00 +0100)
committer Florian Westphal <fw@strlen.de>
Thu, 11 Dec 2025 12:08:37 +0000 (13:08 +0100)
Jakub reports spurious failures of the 'conntrack_reverse_clash.sh'
selftest.  A bogus test makes nat core resort to port rewrite even
though there is no need for this.

When the test is made, nf_nat_used_tuple() would already have caused us
to return if no other CPU had added a colliding entry.
Moreover, nf_nat_used_tuple() would have ignored the colliding entry if
their origin tuples had been the same.

All that is left to check is whether the colliding entry in the hash table
is subject to NAT, and, if it's not, whether our entry matches in the reverse
direction, e.g. hash table has

addr1:1234 -> addr2:80, and we want to commit
addr2:80   -> addr1:1234.

Because we already checked that neither the new nor the committed entry is
subject to NAT we only have to check origin vs. reply tuple:
for non-nat entries, the reply tuple is always the inverted original.

Just in case there are more problems, extend the error reporting
in the selftest while at it, and dump the conntrack table/stats on error.

Reported-by: Jakub Kicinski <kuba@kernel.org>
Closes: https://lore.kernel.org/netdev/20251206175135.4a56591b@kernel.org/
Fixes: d8f84a9bc7c4 ("netfilter: nf_nat: don't try nat source port reallocation for reverse dir clash")
Signed-off-by: Florian Westphal <fw@strlen.de>
net/netfilter/nf_nat_core.c
tools/testing/selftests/net/netfilter/conntrack_reverse_clash.c
tools/testing/selftests/net/netfilter/conntrack_reverse_clash.sh

index 78a61dac4ade82322ab21f4f1eecf5bc48b98179..e6b24586d2fed546ddb534fd41c7f03c332ce2b7 100644 (file)
@@ -294,25 +294,13 @@ nf_nat_used_tuple_new(const struct nf_conntrack_tuple *tuple,
 
        ct = nf_ct_tuplehash_to_ctrack(thash);
 
-       /* NB: IP_CT_DIR_ORIGINAL should be impossible because
-        * nf_nat_used_tuple() handles origin collisions.
-        *
-        * Handle remote chance other CPU confirmed its ct right after.
-        */
-       if (thash->tuple.dst.dir != IP_CT_DIR_REPLY)
-               goto out;
-
        /* clashing connection subject to NAT? Retry with new tuple. */
        if (READ_ONCE(ct->status) & uses_nat)
                goto out;
 
        if (nf_ct_tuple_equal(&ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple,
-                             &ignored_ct->tuplehash[IP_CT_DIR_REPLY].tuple) &&
-           nf_ct_tuple_equal(&ct->tuplehash[IP_CT_DIR_REPLY].tuple,
-                             &ignored_ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple)) {
+                             &ignored_ct->tuplehash[IP_CT_DIR_REPLY].tuple))
                taken = false;
-               goto out;
-       }
 out:
        nf_ct_put(ct);
        return taken;
index 507930cee8cb698ec9ddefd3ac5508d6ce271cce..462d628cc3bdba7bb79d655d1c571ed640b65f4f 100644 (file)
@@ -33,9 +33,14 @@ static void die(const char *e)
        exit(111);
 }
 
-static void die_port(uint16_t got, uint16_t want)
+static void die_port(const struct sockaddr_in *sin, uint16_t want)
 {
-       fprintf(stderr, "Port number changed, wanted %d got %d\n", want, ntohs(got));
+       uint16_t got = ntohs(sin->sin_port);
+       char str[INET_ADDRSTRLEN];
+
+       inet_ntop(AF_INET, &sin->sin_addr, str, sizeof(str));
+
+       fprintf(stderr, "Port number changed, wanted %d got %d from %s\n", want, got, str);
        exit(1);
 }
 
@@ -100,7 +105,7 @@ int main(int argc, char *argv[])
                                die("child recvfrom");
 
                        if (peer.sin_port != htons(PORT))
-                               die_port(peer.sin_port, PORT);
+                               die_port(&peer, PORT);
                } else {
                        if (sendto(s2, buf, LEN, 0, (struct sockaddr *)&sa1, sizeof(sa1)) != LEN)
                                continue;
@@ -109,7 +114,7 @@ int main(int argc, char *argv[])
                                die("parent recvfrom");
 
                        if (peer.sin_port != htons((PORT + 1)))
-                               die_port(peer.sin_port, PORT + 1);
+                               die_port(&peer, PORT + 1);
                }
        }
 
index a24c896347a889619a6b66ad58bd98d93c1865cf..dc7e9d6da0624c8c6f649dce9f1f6a2048b8793e 100755 (executable)
@@ -45,6 +45,8 @@ if ip netns exec "$ns0" ./conntrack_reverse_clash; then
        echo "PASS: No SNAT performed for null bindings"
 else
        echo "ERROR: SNAT performed without any matching snat rule"
+       ip netns exec "$ns0" conntrack -L
+       ip netns exec "$ns0" conntrack -S
        exit 1
 fi