tcp: avoid premature drops in tcp_add_backlog()

author Eric Dumazet <edumazet@google.com>
Tue, 23 Apr 2024 12:56:20 +0000 (12:56 +0000)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Sun, 16 Jun 2024 11:28:35 +0000 (13:28 +0200)
diff --git a/net/ipv4/tcp_ipv4.c b/net/ipv4/tcp_ipv4.c
index d29d4b8192643849432a6ccfb5c253db17ccf464..c18ad443ca7db7aad4a86a6b869719cdfff49ced 100644
--- a/net/ipv4/tcp_ipv4.c
+++ b/net/ipv4/tcp_ipv4.c
@@ -1678,7 +1678,7 @@ int tcp_v4_early_demux(struct sk_buff *skb)
  
  bool tcp_add_backlog(struct sock *sk, struct sk_buff *skb)
  {
-       u32 limit, tail_gso_size, tail_gso_segs;
+       u32 tail_gso_size, tail_gso_segs;
         struct skb_shared_info *shinfo;
         const struct tcphdr *th;
         struct tcphdr *thtail;
@@ -1687,6 +1687,7 @@ bool tcp_add_backlog(struct sock *sk, struct sk_buff *skb)
         bool fragstolen;
         u32 gso_segs;
         u32 gso_size;
+       u64 limit;
         int delta;
  
         /* In case all data was pulled from skb frags (in __pskb_pull_tail()),
@@ -1781,7 +1782,13 @@ bool tcp_add_backlog(struct sock *sk, struct sk_buff *skb)
         __skb_push(skb, hdrlen);
  
  no_coalesce:
-       limit = (u32)READ_ONCE(sk->sk_rcvbuf) + (u32)(READ_ONCE(sk->sk_sndbuf) >> 1);
+       /* sk->sk_backlog.len is reset only at the end of __release_sock().
+        * Both sk->sk_backlog.len and sk->sk_rmem_alloc could reach
+        * sk_rcvbuf in normal conditions.
+        */
+       limit = ((u64)READ_ONCE(sk->sk_rcvbuf)) << 1;
+
+       limit += ((u32)READ_ONCE(sk->sk_sndbuf)) >> 1;
  
         /* Only socket owner can try to collapse/prune rx queues
          * to reduce memory overhead, so add a little headroom here.
@@ -1789,6 +1796,8 @@ no_coalesce:
          */
         limit += 64 * 1024;
  
+       limit = min_t(u64, limit, UINT_MAX);
+
         if (unlikely(sk_add_backlog(sk, skb, limit))) {
                 bh_unlock_sock(sk);
                 __NET_INC_STATS(sock_net(sk), LINUX_MIB_TCPBACKLOGDROP);
author	Eric Dumazet <edumazet@google.com>
	Tue, 23 Apr 2024 12:56:20 +0000 (12:56 +0000)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Sun, 16 Jun 2024 11:28:35 +0000 (13:28 +0200)