bpf: Reject TCP_NODELAY in bpf-tcp-cc

author KaFai Wan <kafai.wan@linux.dev>

Tue, 21 Apr 2026 15:58:02 +0000 (23:58 +0800)

committer Martin KaFai Lau <martin.lau@kernel.org>

Wed, 22 Apr 2026 19:58:57 +0000 (12:58 -0700)
author KaFai Wan <kafai.wan@linux.dev>
Tue, 21 Apr 2026 15:58:02 +0000 (23:58 +0800)
committer Martin KaFai Lau <martin.lau@kernel.org>
Wed, 22 Apr 2026 19:58:57 +0000 (12:58 -0700)
diff --git a/include/linux/bpf.h b/include/linux/bpf.h

index b4b703c90ca94f2528f04d87a9d429b7c6b70d6e..01e20396489287269f4ed940a2593677e9c40d58 100644 (file)
--- a/include/linux/bpf.h
+++ b/include/linux/bpf.h
@@ -3725,6 +3725,7 @@ extern const struct bpf_func_proto bpf_for_each_map_elem_proto;
  extern const struct bpf_func_proto bpf_btf_find_by_name_kind_proto;
  extern const struct bpf_func_proto bpf_sk_setsockopt_proto;
  extern const struct bpf_func_proto bpf_sk_getsockopt_proto;
+extern const struct bpf_func_proto bpf_sk_setsockopt_nodelay_proto;
  extern const struct bpf_func_proto bpf_unlocked_sk_setsockopt_proto;
  extern const struct bpf_func_proto bpf_unlocked_sk_getsockopt_proto;
  extern const struct bpf_func_proto bpf_find_vma_proto;
diff --git a/net/core/filter.c b/net/core/filter.c

index 96849f4c1fbccdad06a2573a2ab52e38118042b3..2914f5330310d0026eec2e832aa03af7633b4de6 100644 (file)
--- a/net/core/filter.c
+++ b/net/core/filter.c
@@ -5688,6 +5688,30 @@ const struct bpf_func_proto bpf_sk_getsockopt_proto = {
         .arg5_type      = ARG_CONST_SIZE,
  };
  
+BPF_CALL_5(bpf_sk_setsockopt_nodelay, struct sock *, sk, int, level,
+          int, optname, char *, optval, int, optlen)
+{
+       /*
+        * TCP_NODELAY is refused: it triggers tcp_push_pending_frames() and
+        * re-enters CA_EVENT_TX_START in bpf_tcp_cc. Other options pass through.
+        */
+       if (level == SOL_TCP && optname == TCP_NODELAY)
+               return -EOPNOTSUPP;
+
+       return _bpf_setsockopt(sk, level, optname, optval, optlen);
+}
+
+const struct bpf_func_proto bpf_sk_setsockopt_nodelay_proto = {
+       .func           = bpf_sk_setsockopt_nodelay,
+       .gpl_only       = false,
+       .ret_type       = RET_INTEGER,
+       .arg1_type      = ARG_PTR_TO_BTF_ID_SOCK_COMMON,  /* sk */
+       .arg2_type      = ARG_ANYTHING,                   /* level */
+       .arg3_type      = ARG_ANYTHING,                   /* optname */
+       .arg4_type      = ARG_PTR_TO_MEM | MEM_RDONLY,    /* optval */
+       .arg5_type      = ARG_CONST_SIZE,                 /* optlen */
+};
+
  BPF_CALL_5(bpf_unlocked_sk_setsockopt, struct sock *, sk, int, level,
            int, optname, char *, optval, int, optlen)
  {
diff --git a/net/ipv4/bpf_tcp_ca.c b/net/ipv4/bpf_tcp_ca.c

index 008edc7f6688523dc86963d90485655e9fa8374e..791e15063237c909c555143aac4982cf1ada03c9 100644 (file)
--- a/net/ipv4/bpf_tcp_ca.c
+++ b/net/ipv4/bpf_tcp_ca.c
@@ -168,7 +168,7 @@ bpf_tcp_ca_get_func_proto(enum bpf_func_id func_id,
                  */
                 if (prog_ops_moff(prog) !=
                     offsetof(struct tcp_congestion_ops, release))
-                       return &bpf_sk_setsockopt_proto;
+                       return &bpf_sk_setsockopt_nodelay_proto;
                 return NULL;
         case BPF_FUNC_getsockopt:
                 /* Since get/setsockopt is usually expected to
author	KaFai Wan <kafai.wan@linux.dev>
	Tue, 21 Apr 2026 15:58:02 +0000 (23:58 +0800)
committer	Martin KaFai Lau <martin.lau@kernel.org>
	Wed, 22 Apr 2026 19:58:57 +0000 (12:58 -0700)
include/linux/bpf.h		patch \| blob \| blame \| history
net/core/filter.c		patch \| blob \| blame \| history
net/ipv4/bpf_tcp_ca.c		patch \| blob \| blame \| history