]> git.ipfire.org Git - thirdparty/kernel/linux.git/commitdiff
xfrm: delete x->tunnel as we delete x
authorSabrina Dubroca <sd@queasysnail.net>
Fri, 4 Jul 2025 14:54:33 +0000 (16:54 +0200)
committerSteffen Klassert <steffen.klassert@secunet.com>
Tue, 8 Jul 2025 11:28:27 +0000 (13:28 +0200)
The ipcomp fallback tunnels currently get deleted (from the various
lists and hashtables) as the last user state that needed that fallback
is destroyed (not deleted). If a reference to that user state still
exists, the fallback state will remain on the hashtables/lists,
triggering the WARN in xfrm_state_fini. Because of those remaining
references, the fix in commit f75a2804da39 ("xfrm: destroy xfrm_state
synchronously on net exit path") is not complete.

We recently fixed one such situation in TCP due to defered freeing of
skbs (commit 9b6412e6979f ("tcp: drop secpath at the same time as we
currently drop dst")). This can also happen due to IP reassembly: skbs
with a secpath remain on the reassembly queue until netns
destruction. If we can't guarantee that the queues are flushed by the
time xfrm_state_fini runs, there may still be references to a (user)
xfrm_state, preventing the timely deletion of the corresponding
fallback state.

Instead of chasing each instance of skbs holding a secpath one by one,
this patch fixes the issue directly within xfrm, by deleting the
fallback state as soon as the last user state depending on it has been
deleted. Destruction will still happen when the final reference is
dropped.

A separate lockdep class for the fallback state is required since
we're going to lock x->tunnel while x is locked.

Fixes: 9d4139c76905 ("netns xfrm: per-netns xfrm_state_all list")
Signed-off-by: Sabrina Dubroca <sd@queasysnail.net>
Signed-off-by: Steffen Klassert <steffen.klassert@secunet.com>
include/net/xfrm.h
net/ipv4/ipcomp.c
net/ipv6/ipcomp6.c
net/ipv6/xfrm6_tunnel.c
net/xfrm/xfrm_ipcomp.c
net/xfrm/xfrm_state.c

index e45a275fca26d760d39bdd478406ed33bfab8512..91d52a380e373fd524f75d3a494aa24cbc6daf6f 100644 (file)
@@ -441,7 +441,6 @@ int xfrm_input_register_afinfo(const struct xfrm_input_afinfo *afinfo);
 int xfrm_input_unregister_afinfo(const struct xfrm_input_afinfo *afinfo);
 
 void xfrm_flush_gc(void);
-void xfrm_state_delete_tunnel(struct xfrm_state *x);
 
 struct xfrm_type {
        struct module           *owner;
index 5a4fb2539b08b60212a42638a8e6c4e39eaa472c..9a45aed508d193de4f443a58a4d41cc8f6f93c85 100644 (file)
@@ -54,6 +54,7 @@ static int ipcomp4_err(struct sk_buff *skb, u32 info)
 }
 
 /* We always hold one tunnel user reference to indicate a tunnel */
+static struct lock_class_key xfrm_state_lock_key;
 static struct xfrm_state *ipcomp_tunnel_create(struct xfrm_state *x)
 {
        struct net *net = xs_net(x);
@@ -62,6 +63,7 @@ static struct xfrm_state *ipcomp_tunnel_create(struct xfrm_state *x)
        t = xfrm_state_alloc(net);
        if (!t)
                goto out;
+       lockdep_set_class(&t->lock, &xfrm_state_lock_key);
 
        t->id.proto = IPPROTO_IPIP;
        t->id.spi = x->props.saddr.a4;
index 72d4858dec18a0b985171c7ddda70e073aa0ac9d..8607569de34f3af5aa6354bec28746388b5d0c0f 100644 (file)
@@ -71,6 +71,7 @@ static int ipcomp6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
        return 0;
 }
 
+static struct lock_class_key xfrm_state_lock_key;
 static struct xfrm_state *ipcomp6_tunnel_create(struct xfrm_state *x)
 {
        struct net *net = xs_net(x);
@@ -79,6 +80,7 @@ static struct xfrm_state *ipcomp6_tunnel_create(struct xfrm_state *x)
        t = xfrm_state_alloc(net);
        if (!t)
                goto out;
+       lockdep_set_class(&t->lock, &xfrm_state_lock_key);
 
        t->id.proto = IPPROTO_IPV6;
        t->id.spi = xfrm6_tunnel_alloc_spi(net, (xfrm_address_t *)&x->props.saddr);
index bf140ef781c1f29db655ea75f44214cbd3da1826..7fd8bc08e6eb1a8df31c54d7614b62dd22acff3f 100644 (file)
@@ -334,8 +334,8 @@ static void __net_exit xfrm6_tunnel_net_exit(struct net *net)
        struct xfrm6_tunnel_net *xfrm6_tn = xfrm6_tunnel_pernet(net);
        unsigned int i;
 
-       xfrm_flush_gc();
        xfrm_state_flush(net, 0, false, true);
+       xfrm_flush_gc();
 
        for (i = 0; i < XFRM6_TUNNEL_SPI_BYADDR_HSIZE; i++)
                WARN_ON_ONCE(!hlist_empty(&xfrm6_tn->spi_byaddr[i]));
index a38545413b80152ae39515f6cf0b093902e921fa..43fdc6ed8dd178e4987138da5a46072325d0dc7f 100644 (file)
@@ -313,7 +313,6 @@ void ipcomp_destroy(struct xfrm_state *x)
        struct ipcomp_data *ipcd = x->data;
        if (!ipcd)
                return;
-       xfrm_state_delete_tunnel(x);
        ipcomp_free_data(ipcd);
        kfree(ipcd);
 }
index c7e6472c623dcbe5893256f5dfd0145439086867..f7110a6588972b0f5e60c18add2cfb719afbc38f 100644 (file)
@@ -811,6 +811,7 @@ void __xfrm_state_destroy(struct xfrm_state *x, bool sync)
 }
 EXPORT_SYMBOL(__xfrm_state_destroy);
 
+static void xfrm_state_delete_tunnel(struct xfrm_state *x);
 int __xfrm_state_delete(struct xfrm_state *x)
 {
        struct net *net = xs_net(x);
@@ -838,6 +839,8 @@ int __xfrm_state_delete(struct xfrm_state *x)
 
                xfrm_dev_state_delete(x);
 
+               xfrm_state_delete_tunnel(x);
+
                /* All xfrm_state objects are created by xfrm_state_alloc.
                 * The xfrm_state_alloc call gives a reference, and that
                 * is what we are dropping here.
@@ -941,10 +944,7 @@ restart:
                                err = xfrm_state_delete(x);
                                xfrm_audit_state_delete(x, err ? 0 : 1,
                                                        task_valid);
-                               if (sync)
-                                       xfrm_state_put_sync(x);
-                               else
-                                       xfrm_state_put(x);
+                               xfrm_state_put(x);
                                if (!err)
                                        cnt++;
 
@@ -3068,20 +3068,17 @@ void xfrm_flush_gc(void)
 }
 EXPORT_SYMBOL(xfrm_flush_gc);
 
-/* Temporarily located here until net/xfrm/xfrm_tunnel.c is created */
-void xfrm_state_delete_tunnel(struct xfrm_state *x)
+static void xfrm_state_delete_tunnel(struct xfrm_state *x)
 {
        if (x->tunnel) {
                struct xfrm_state *t = x->tunnel;
 
-               if (atomic_read(&t->tunnel_users) == 2)
+               if (atomic_dec_return(&t->tunnel_users) == 1)
                        xfrm_state_delete(t);
-               atomic_dec(&t->tunnel_users);
-               xfrm_state_put_sync(t);
+               xfrm_state_put(t);
                x->tunnel = NULL;
        }
 }
-EXPORT_SYMBOL(xfrm_state_delete_tunnel);
 
 u32 xfrm_state_mtu(struct xfrm_state *x, int mtu)
 {
@@ -3286,8 +3283,8 @@ void xfrm_state_fini(struct net *net)
        unsigned int sz;
 
        flush_work(&net->xfrm.state_hash_work);
-       flush_work(&xfrm_state_gc_work);
        xfrm_state_flush(net, 0, false, true);
+       flush_work(&xfrm_state_gc_work);
 
        WARN_ON(!list_empty(&net->xfrm.state_all));