Add a new BPF command BPF_PROG_ASSOC_STRUCT_OPS to allow associating
a BPF program with a struct_ops map. The command takes file
descriptors of a struct_ops map and a BPF program and sets
prog->aux->st_ops_assoc to point to the struct_ops map.

The command accepts neither a struct_ops program nor a non-struct_ops
map. Programs of a struct_ops map are automatically associated with the
map during map update. If a program is shared between two struct_ops
maps, prog->aux->st_ops_assoc will be poisoned to indicate that the
associated struct_ops is ambiguous. The pointer, once poisoned, cannot
be reset, since we have lost track of the associated struct_ops. For
other program types, the associated struct_ops map, once set, cannot be
changed later. This restriction may be lifted in the future if there is
a use case.
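
For illustration, a minimal userspace sketch of invoking the new
command directly through the bpf() syscall (the wrapper name is
hypothetical):

  #include <string.h>
  #include <unistd.h>
  #include <sys/syscall.h>
  #include <linux/bpf.h>

  /* Hypothetical wrapper: associate prog_fd with struct_ops map_fd */
  static int prog_assoc_struct_ops_fd(int prog_fd, int map_fd)
  {
          union bpf_attr attr;

          memset(&attr, 0, sizeof(attr));
          attr.prog_assoc_struct_ops.map_fd = map_fd;
          attr.prog_assoc_struct_ops.prog_fd = prog_fd;
          attr.prog_assoc_struct_ops.flags = 0; /* must be zero */

          /* 0 on success; -1 with errno set otherwise, e.g. EINVAL
           * for a struct_ops program or a non-struct_ops map, or
           * EBUSY if the program is already associated with a
           * different struct_ops map.
           */
          return syscall(__NR_bpf, BPF_PROG_ASSOC_STRUCT_OPS,
                         &attr, sizeof(attr));
  }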

A kernel helper bpf_prog_get_assoc_struct_ops() can be used to retrieve
the associated struct_ops pointer. The returned pointer, if not NULL, is
guaranteed to be valid and point to a fully updated struct_ops struct.
For a struct_ops program reused in multiple struct_ops maps, the helper
returns NULL.

prog->aux->st_ops_assoc is protected by a map refcount for
non-struct_ops programs and by RCU for struct_ops programs. Since it
would be inefficient for a struct_ops map to track the programs
associated with it, every non-struct_ops program instead bumps the
refcount of the map to make sure st_ops_assoc stays valid. For a
struct_ops program, the pointer is protected by RCU, as map_free waits
for an RCU grace period before disassociating the program from the map.
The helper must be called in BPF program context or within an RCU
read-side critical section.

struct_ops implementers should note that the returned struct_ops may
not be initialized or attached yet. The implementer is responsible for
tracking and checking the state of the associated struct_ops map if the
use case expects an initialized or attached struct_ops.
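
As a sketch of the kernel-side consumer, a subsystem that holds a
bpf_prog pointer could look up the associated instance as below; the
my_ops type and function names are hypothetical:

  /* Hypothetical struct_ops type; names are illustrative only */
  struct my_ops {
          int (*handle_event)(int cpu);
  };

  static int my_subsys_dispatch(struct bpf_prog *prog, int cpu)
  {
          struct my_ops *ops;
          int ret = -ENOENT;

          /* The helper requires BPF program context or RCU */
          rcu_read_lock();
          ops = bpf_prog_get_assoc_struct_ops(prog->aux);
          /* NULL if nothing is associated, or if the association
           * is ambiguous (program reused across struct_ops maps)
           */
          if (ops && ops->handle_event)
                  ret = ops->handle_event(cpu);
          rcu_read_unlock();

          return ret;
  }
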
Signed-off-by: Amery Hung <ameryhung@gmail.com>
Signed-off-by: Andrii Nakryiko <andrii@kernel.org>
Acked-by: Andrii Nakryiko <andrii@kernel.org>
Acked-by: Martin KaFai Lau <martin.lau@kernel.org>
Link: https://lore.kernel.org/bpf/20251203233748.668365-3-ameryhung@gmail.com
struct rcu_head rcu;
};
struct bpf_stream stream[2];
+ struct mutex st_ops_assoc_mutex;
+ struct bpf_map __rcu *st_ops_assoc;
};
struct bpf_prog {
module_put(owner);
}
int bpf_struct_ops_link_create(union bpf_attr *attr);
+int bpf_prog_assoc_struct_ops(struct bpf_prog *prog, struct bpf_map *map);
+void bpf_prog_disassoc_struct_ops(struct bpf_prog *prog);
+void *bpf_prog_get_assoc_struct_ops(const struct bpf_prog_aux *aux);
u32 bpf_struct_ops_id(const void *kdata);
#ifdef CONFIG_NET
{
return -EOPNOTSUPP;
}
+static inline int bpf_prog_assoc_struct_ops(struct bpf_prog *prog, struct bpf_map *map)
+{
+ return -EOPNOTSUPP;
+}
+static inline void bpf_prog_disassoc_struct_ops(struct bpf_prog *prog)
+{
+}
+static inline void *bpf_prog_get_assoc_struct_ops(const struct bpf_prog_aux *aux)
+{
+ return NULL;
+}
static inline void bpf_map_struct_ops_info_fill(struct bpf_map_info *info, struct bpf_map *map)
{
}
* Number of bytes read from the stream on success, or -1 if an
* error occurred (in which case, *errno* is set appropriately).
*
+ * BPF_PROG_ASSOC_STRUCT_OPS
+ * Description
+ * Associate a BPF program with a struct_ops map. The struct_ops
+ * map is identified by *map_fd* and the BPF program is
+ * identified by *prog_fd*.
+ *
+ * Return
+ * 0 on success or -1 if an error occurred (in which case,
+ * *errno* is set appropriately).
+ *
* NOTES
* eBPF objects (maps and programs) can be shared between processes.
*
BPF_PROG_BIND_MAP,
BPF_TOKEN_CREATE,
BPF_PROG_STREAM_READ_BY_FD,
+ BPF_PROG_ASSOC_STRUCT_OPS,
__MAX_BPF_CMD,
};
__u32 prog_fd;
} prog_stream_read;
+ struct {
+ __u32 map_fd;
+ __u32 prog_fd;
+ __u32 flags;
+ } prog_assoc_struct_ops;
+
} __attribute__((aligned(8)));
/* The description below is an attempt at providing documentation to eBPF
}
}
+static void bpf_struct_ops_map_dissoc_progs(struct bpf_struct_ops_map *st_map)
+{
+ u32 i;
+
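+ /* links[] is populated contiguously during map update; stop at the first empty slot */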
+ for (i = 0; i < st_map->funcs_cnt; i++) {
+ if (!st_map->links[i])
+ break;
+ bpf_prog_disassoc_struct_ops(st_map->links[i]->prog);
+ }
+}
+
static void bpf_struct_ops_map_free_image(struct bpf_struct_ops_map *st_map)
{
int i;
goto reset_unlock;
}
+ /* On error, poison the pointer instead of returning the error to
+ * preserve backward compatibility */
+ bpf_prog_assoc_struct_ops(prog, &st_map->map);
+
link = kzalloc(sizeof(*link), GFP_USER);
if (!link) {
bpf_prog_put(prog);
if (btf_is_module(st_map->btf))
module_put(st_map->st_ops_desc->st_ops->owner);
+ bpf_struct_ops_map_dissoc_progs(st_map);
+
bpf_struct_ops_map_del_ksyms(st_map);
/* The struct_ops's function may switch to another struct_ops.
return err;
}
+int bpf_prog_assoc_struct_ops(struct bpf_prog *prog, struct bpf_map *map)
+{
+ struct bpf_map *st_ops_assoc;
+
+ guard(mutex)(&prog->aux->st_ops_assoc_mutex);
+
+ st_ops_assoc = rcu_dereference_protected(prog->aux->st_ops_assoc,
+ lockdep_is_held(&prog->aux->st_ops_assoc_mutex));
+ if (st_ops_assoc && st_ops_assoc == map)
+ return 0;
+
+ if (st_ops_assoc) {
+ if (prog->type != BPF_PROG_TYPE_STRUCT_OPS)
+ return -EBUSY;
+
+ rcu_assign_pointer(prog->aux->st_ops_assoc, BPF_PTR_POISON);
+ } else {
+ /*
+ * struct_ops map does not track associated non-struct_ops programs.
+ * Bump the refcount to make sure st_ops_assoc is always valid.
+ */
+ if (prog->type != BPF_PROG_TYPE_STRUCT_OPS)
+ bpf_map_inc(map);
+
+ rcu_assign_pointer(prog->aux->st_ops_assoc, map);
+ }
+
+ return 0;
+}
+
+void bpf_prog_disassoc_struct_ops(struct bpf_prog *prog)
+{
+ struct bpf_map *st_ops_assoc;
+
+ guard(mutex)(&prog->aux->st_ops_assoc_mutex);
+
+ st_ops_assoc = rcu_dereference_protected(prog->aux->st_ops_assoc,
+ lockdep_is_held(&prog->aux->st_ops_assoc_mutex));
+ if (!st_ops_assoc || st_ops_assoc == BPF_PTR_POISON)
+ return;
+
+ if (prog->type != BPF_PROG_TYPE_STRUCT_OPS)
+ bpf_map_put(st_ops_assoc);
+
+ RCU_INIT_POINTER(prog->aux->st_ops_assoc, NULL);
+}
+
+/*
+ * Get a reference to the struct_ops struct (i.e., kdata) associated with a
+ * program. Should only be called in BPF program context (e.g., in a kfunc)
+ * or within an RCU read-side critical section.
+ *
+ * If the returned pointer is not NULL, it is guaranteed to point to a valid
+ * struct_ops. The struct_ops map is not guaranteed to be initialized or
+ * attached.
+ * Kernel struct_ops implementers are responsible for tracking and checking
+ * the state of the struct_ops if the use case requires an initialized or
+ * attached struct_ops.
+ */
+void *bpf_prog_get_assoc_struct_ops(const struct bpf_prog_aux *aux)
+{
+ struct bpf_struct_ops_map *st_map;
+ struct bpf_map *st_ops_assoc;
+
+ st_ops_assoc = rcu_dereference_check(aux->st_ops_assoc, bpf_rcu_lock_held());
+ if (!st_ops_assoc || st_ops_assoc == BPF_PTR_POISON)
+ return NULL;
+
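+ /* struct bpf_map is the first member of struct bpf_struct_ops_map */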
+ st_map = (struct bpf_struct_ops_map *)st_ops_assoc;
+
+ return &st_map->kvalue.data;
+}
+EXPORT_SYMBOL_GPL(bpf_prog_get_assoc_struct_ops);
+
void bpf_map_struct_ops_info_fill(struct bpf_map_info *info, struct bpf_map *map)
{
struct bpf_struct_ops_map *st_map = (struct bpf_struct_ops_map *)map;
mutex_init(&fp->aux->used_maps_mutex);
mutex_init(&fp->aux->ext_mutex);
mutex_init(&fp->aux->dst_mutex);
+ mutex_init(&fp->aux->st_ops_assoc_mutex);
#ifdef CONFIG_BPF_SYSCALL
bpf_prog_stream_init(fp);
if (fp->aux) {
mutex_destroy(&fp->aux->used_maps_mutex);
mutex_destroy(&fp->aux->dst_mutex);
+ mutex_destroy(&fp->aux->st_ops_assoc_mutex);
kfree(fp->aux->poke_tab);
kfree(fp->aux);
}
#endif
bpf_free_used_maps(aux);
bpf_free_used_btfs(aux);
+ bpf_prog_disassoc_struct_ops(aux->prog);
if (bpf_prog_is_dev_bound(aux))
bpf_prog_dev_bound_destroy(aux->prog);
#ifdef CONFIG_PERF_EVENTS
return ret;
}
+#define BPF_PROG_ASSOC_STRUCT_OPS_LAST_FIELD prog_assoc_struct_ops.flags
+
+static int prog_assoc_struct_ops(union bpf_attr *attr)
+{
+ struct bpf_prog *prog;
+ struct bpf_map *map;
+ int ret;
+
+ if (CHECK_ATTR(BPF_PROG_ASSOC_STRUCT_OPS))
+ return -EINVAL;
+
+ if (attr->prog_assoc_struct_ops.flags)
+ return -EINVAL;
+
+ prog = bpf_prog_get(attr->prog_assoc_struct_ops.prog_fd);
+ if (IS_ERR(prog))
+ return PTR_ERR(prog);
+
+ if (prog->type == BPF_PROG_TYPE_STRUCT_OPS) {
+ ret = -EINVAL;
+ goto put_prog;
+ }
+
+ map = bpf_map_get(attr->prog_assoc_struct_ops.map_fd);
+ if (IS_ERR(map)) {
+ ret = PTR_ERR(map);
+ goto put_prog;
+ }
+
+ if (map->map_type != BPF_MAP_TYPE_STRUCT_OPS) {
+ ret = -EINVAL;
+ goto put_map;
+ }
+
+ ret = bpf_prog_assoc_struct_ops(prog, map);
+
+put_map:
+ bpf_map_put(map);
+put_prog:
+ bpf_prog_put(prog);
+ return ret;
+}
+
static int __sys_bpf(enum bpf_cmd cmd, bpfptr_t uattr, unsigned int size)
{
union bpf_attr attr;
case BPF_PROG_STREAM_READ_BY_FD:
err = prog_stream_read(&attr);
break;
+ case BPF_PROG_ASSOC_STRUCT_OPS:
+ err = prog_assoc_struct_ops(&attr);
+ break;
default:
err = -EINVAL;
break;
* Number of bytes read from the stream on success, or -1 if an
* error occurred (in which case, *errno* is set appropriately).
*
+ * BPF_PROG_ASSOC_STRUCT_OPS
+ * Description
+ * Associate a BPF program with a struct_ops map. The struct_ops
+ * map is identified by *map_fd* and the BPF program is
+ * identified by *prog_fd*.
+ *
+ * Return
+ * 0 on success or -1 if an error occurred (in which case,
+ * *errno* is set appropriately).
+ *
* NOTES
* eBPF objects (maps and programs) can be shared between processes.
*
BPF_PROG_BIND_MAP,
BPF_TOKEN_CREATE,
BPF_PROG_STREAM_READ_BY_FD,
+ BPF_PROG_ASSOC_STRUCT_OPS,
__MAX_BPF_CMD,
};
__u32 prog_fd;
} prog_stream_read;
+ struct {
+ __u32 map_fd;
+ __u32 prog_fd;
+ __u32 flags;
+ } prog_assoc_struct_ops;
+
} __attribute__((aligned(8)));
/* The description below is an attempt at providing documentation to eBPF