Skip to content

Commit b5709f6

Browse files
ameryhung authored and anakryiko committed
bpf: Support associating BPF program with struct_ops
Add a new BPF command BPF_PROG_ASSOC_STRUCT_OPS to allow associating a BPF program with a struct_ops map. This command takes the file descriptors of a struct_ops map and a BPF program and sets prog->aux->st_ops_assoc to the struct_ops map (whose kdata the helper described below returns). The command accepts neither a struct_ops program nor a non-struct_ops map. Programs of a struct_ops map are automatically associated with the map during map update. If a program is shared between two struct_ops maps, prog->aux->st_ops_assoc will be poisoned to indicate that the associated struct_ops is ambiguous. The pointer, once poisoned, cannot be reset since we have lost track of the associated struct_ops. For other program types, the associated struct_ops map, once set, cannot be changed later. This restriction may be lifted in the future if there is a use case. A kernel helper bpf_prog_get_assoc_struct_ops() can be used to retrieve the associated struct_ops pointer. The returned pointer, if not NULL, is guaranteed to be valid and point to a fully updated struct_ops struct. For a struct_ops program reused in multiple struct_ops maps, the return value will be NULL. prog->aux->st_ops_assoc is protected by bumping the refcount for non-struct_ops programs and by RCU for struct_ops programs. Since it would be inefficient to track programs associated with a struct_ops map, every non-struct_ops program will bump the refcount of the map to make sure st_ops_assoc stays valid. For a struct_ops program, it is protected by RCU as map_free will wait for an RCU grace period before disassociating the program from the map. The helper must be called in BPF program context or in an RCU read-side critical section. struct_ops implementers should note that the struct_ops returned may be neither initialized nor attached yet. The struct_ops implementer will be responsible for tracking and checking the state of the associated struct_ops map if the use case expects an initialized or attached struct_ops. 
Signed-off-by: Amery Hung <[email protected]> Signed-off-by: Andrii Nakryiko <[email protected]> Acked-by: Andrii Nakryiko <[email protected]> Acked-by: Martin KaFai Lau <[email protected]> Link: https://lore.kernel.org/bpf/[email protected]
1 parent 1588c81 commit b5709f6

File tree

6 files changed

+187
-0
lines changed

6 files changed

+187
-0
lines changed

include/linux/bpf.h

Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1739,6 +1739,8 @@ struct bpf_prog_aux {
17391739
struct rcu_head rcu;
17401740
};
17411741
struct bpf_stream stream[2];
1742+
struct mutex st_ops_assoc_mutex;
1743+
struct bpf_map __rcu *st_ops_assoc;
17421744
};
17431745

17441746
struct bpf_prog {
@@ -2041,6 +2043,9 @@ static inline void bpf_module_put(const void *data, struct module *owner)
20412043
module_put(owner);
20422044
}
20432045
int bpf_struct_ops_link_create(union bpf_attr *attr);
2046+
int bpf_prog_assoc_struct_ops(struct bpf_prog *prog, struct bpf_map *map);
2047+
void bpf_prog_disassoc_struct_ops(struct bpf_prog *prog);
2048+
void *bpf_prog_get_assoc_struct_ops(const struct bpf_prog_aux *aux);
20442049
u32 bpf_struct_ops_id(const void *kdata);
20452050

20462051
#ifdef CONFIG_NET
@@ -2088,6 +2093,17 @@ static inline int bpf_struct_ops_link_create(union bpf_attr *attr)
20882093
{
20892094
return -EOPNOTSUPP;
20902095
}
2096+
/*
 * Inline fallback for bpf_prog_assoc_struct_ops(): no association is made and
 * the caller is told the operation is unsupported.
 * NOTE(review): presumably selected when struct_ops support is compiled out;
 * confirm against the enclosing #if, which is outside this hunk.
 */
static inline int bpf_prog_assoc_struct_ops(struct bpf_prog *prog, struct bpf_map *map)
{
	return -EOPNOTSUPP;
}
2100+
/*
 * Inline fallback for bpf_prog_disassoc_struct_ops(): intentionally a no-op,
 * since the matching fallback for association never records anything.
 */
static inline void bpf_prog_disassoc_struct_ops(struct bpf_prog *prog)
{
}
2103+
/*
 * Inline fallback for bpf_prog_get_assoc_struct_ops(): there is never an
 * associated struct_ops to report, so always return NULL.
 */
static inline void *bpf_prog_get_assoc_struct_ops(const struct bpf_prog_aux *aux)
{
	return NULL;
}
20912107
static inline void bpf_map_struct_ops_info_fill(struct bpf_map_info *info, struct bpf_map *map)
20922108
{
20932109
}

include/uapi/linux/bpf.h

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -918,6 +918,16 @@ union bpf_iter_link_info {
918918
* Number of bytes read from the stream on success, or -1 if an
919919
* error occurred (in which case, *errno* is set appropriately).
920920
*
921+
* BPF_PROG_ASSOC_STRUCT_OPS
922+
* Description
923+
* Associate a BPF program with a struct_ops map. The struct_ops
924+
* map is identified by *map_fd* and the BPF program is
925+
* identified by *prog_fd*.
926+
*
927+
* Return
928+
* 0 on success or -1 if an error occurred (in which case,
929+
* *errno* is set appropriately).
930+
*
921931
* NOTES
922932
* eBPF objects (maps and programs) can be shared between processes.
923933
*
@@ -974,6 +984,7 @@ enum bpf_cmd {
974984
BPF_PROG_BIND_MAP,
975985
BPF_TOKEN_CREATE,
976986
BPF_PROG_STREAM_READ_BY_FD,
987+
BPF_PROG_ASSOC_STRUCT_OPS,
977988
__MAX_BPF_CMD,
978989
};
979990

@@ -1894,6 +1905,12 @@ union bpf_attr {
18941905
__u32 prog_fd;
18951906
} prog_stream_read;
18961907

1908+
struct {
1909+
__u32 map_fd;
1910+
__u32 prog_fd;
1911+
__u32 flags;
1912+
} prog_assoc_struct_ops;
1913+
18971914
} __attribute__((aligned(8)));
18981915

18991916
/* The description below is an attempt at providing documentation to eBPF

kernel/bpf/bpf_struct_ops.c

Lines changed: 88 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -533,6 +533,17 @@ static void bpf_struct_ops_map_put_progs(struct bpf_struct_ops_map *st_map)
533533
}
534534
}
535535

536+
static void bpf_struct_ops_map_dissoc_progs(struct bpf_struct_ops_map *st_map)
537+
{
538+
u32 i;
539+
540+
for (i = 0; i < st_map->funcs_cnt; i++) {
541+
if (!st_map->links[i])
542+
break;
543+
bpf_prog_disassoc_struct_ops(st_map->links[i]->prog);
544+
}
545+
}
546+
536547
static void bpf_struct_ops_map_free_image(struct bpf_struct_ops_map *st_map)
537548
{
538549
int i;
@@ -801,6 +812,9 @@ static long bpf_struct_ops_map_update_elem(struct bpf_map *map, void *key,
801812
goto reset_unlock;
802813
}
803814

815+
/* Poison the pointer on error instead of returning the error, for backward compatibility */
816+
bpf_prog_assoc_struct_ops(prog, &st_map->map);
817+
804818
link = kzalloc(sizeof(*link), GFP_USER);
805819
if (!link) {
806820
bpf_prog_put(prog);
@@ -980,6 +994,8 @@ static void bpf_struct_ops_map_free(struct bpf_map *map)
980994
if (btf_is_module(st_map->btf))
981995
module_put(st_map->st_ops_desc->st_ops->owner);
982996

997+
bpf_struct_ops_map_dissoc_progs(st_map);
998+
983999
bpf_struct_ops_map_del_ksyms(st_map);
9841000

9851001
/* The struct_ops's function may switch to another struct_ops.
@@ -1396,6 +1412,78 @@ int bpf_struct_ops_link_create(union bpf_attr *attr)
13961412
return err;
13971413
}
13981414

1415+
int bpf_prog_assoc_struct_ops(struct bpf_prog *prog, struct bpf_map *map)
1416+
{
1417+
struct bpf_map *st_ops_assoc;
1418+
1419+
guard(mutex)(&prog->aux->st_ops_assoc_mutex);
1420+
1421+
st_ops_assoc = rcu_dereference_protected(prog->aux->st_ops_assoc,
1422+
lockdep_is_held(&prog->aux->st_ops_assoc_mutex));
1423+
if (st_ops_assoc && st_ops_assoc == map)
1424+
return 0;
1425+
1426+
if (st_ops_assoc) {
1427+
if (prog->type != BPF_PROG_TYPE_STRUCT_OPS)
1428+
return -EBUSY;
1429+
1430+
rcu_assign_pointer(prog->aux->st_ops_assoc, BPF_PTR_POISON);
1431+
} else {
1432+
/*
1433+
* struct_ops map does not track associated non-struct_ops programs.
1434+
* Bump the refcount to make sure st_ops_assoc is always valid.
1435+
*/
1436+
if (prog->type != BPF_PROG_TYPE_STRUCT_OPS)
1437+
bpf_map_inc(map);
1438+
1439+
rcu_assign_pointer(prog->aux->st_ops_assoc, map);
1440+
}
1441+
1442+
return 0;
1443+
}
1444+
1445+
void bpf_prog_disassoc_struct_ops(struct bpf_prog *prog)
1446+
{
1447+
struct bpf_map *st_ops_assoc;
1448+
1449+
guard(mutex)(&prog->aux->st_ops_assoc_mutex);
1450+
1451+
st_ops_assoc = rcu_dereference_protected(prog->aux->st_ops_assoc,
1452+
lockdep_is_held(&prog->aux->st_ops_assoc_mutex));
1453+
if (!st_ops_assoc || st_ops_assoc == BPF_PTR_POISON)
1454+
return;
1455+
1456+
if (prog->type != BPF_PROG_TYPE_STRUCT_OPS)
1457+
bpf_map_put(st_ops_assoc);
1458+
1459+
RCU_INIT_POINTER(prog->aux->st_ops_assoc, NULL);
1460+
}
1461+
1462+
/*
1463+
* Get a reference to the struct_ops struct (i.e., kdata) associated with a
1464+
* program. Should only be called in BPF program context (e.g., in a kfunc).
1465+
*
1466+
* If the returned pointer is not NULL, it must points to a valid struct_ops.
1467+
* The struct_ops map is not guaranteed to be initialized nor attached.
1468+
* Kernel struct_ops implementers are responsible for tracking and checking
1469+
* the state of the struct_ops if the use case requires an initialized or
1470+
* attached struct_ops.
1471+
*/
1472+
void *bpf_prog_get_assoc_struct_ops(const struct bpf_prog_aux *aux)
1473+
{
1474+
struct bpf_struct_ops_map *st_map;
1475+
struct bpf_map *st_ops_assoc;
1476+
1477+
st_ops_assoc = rcu_dereference_check(aux->st_ops_assoc, bpf_rcu_lock_held());
1478+
if (!st_ops_assoc || st_ops_assoc == BPF_PTR_POISON)
1479+
return NULL;
1480+
1481+
st_map = (struct bpf_struct_ops_map *)st_ops_assoc;
1482+
1483+
return &st_map->kvalue.data;
1484+
}
1485+
EXPORT_SYMBOL_GPL(bpf_prog_get_assoc_struct_ops);
1486+
13991487
void bpf_map_struct_ops_info_fill(struct bpf_map_info *info, struct bpf_map *map)
14001488
{
14011489
struct bpf_struct_ops_map *st_map = (struct bpf_struct_ops_map *)map;

kernel/bpf/core.c

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -136,6 +136,7 @@ struct bpf_prog *bpf_prog_alloc_no_stats(unsigned int size, gfp_t gfp_extra_flag
136136
mutex_init(&fp->aux->used_maps_mutex);
137137
mutex_init(&fp->aux->ext_mutex);
138138
mutex_init(&fp->aux->dst_mutex);
139+
mutex_init(&fp->aux->st_ops_assoc_mutex);
139140

140141
#ifdef CONFIG_BPF_SYSCALL
141142
bpf_prog_stream_init(fp);
@@ -286,6 +287,7 @@ void __bpf_prog_free(struct bpf_prog *fp)
286287
if (fp->aux) {
287288
mutex_destroy(&fp->aux->used_maps_mutex);
288289
mutex_destroy(&fp->aux->dst_mutex);
290+
mutex_destroy(&fp->aux->st_ops_assoc_mutex);
289291
kfree(fp->aux->poke_tab);
290292
kfree(fp->aux);
291293
}
@@ -2896,6 +2898,7 @@ static void bpf_prog_free_deferred(struct work_struct *work)
28962898
#endif
28972899
bpf_free_used_maps(aux);
28982900
bpf_free_used_btfs(aux);
2901+
bpf_prog_disassoc_struct_ops(aux->prog);
28992902
if (bpf_prog_is_dev_bound(aux))
29002903
bpf_prog_dev_bound_destroy(aux->prog);
29012904
#ifdef CONFIG_PERF_EVENTS

kernel/bpf/syscall.c

Lines changed: 46 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -6122,6 +6122,49 @@ static int prog_stream_read(union bpf_attr *attr)
61226122
return ret;
61236123
}
61246124

6125+
#define BPF_PROG_ASSOC_STRUCT_OPS_LAST_FIELD prog_assoc_struct_ops.prog_fd
6126+
6127+
static int prog_assoc_struct_ops(union bpf_attr *attr)
6128+
{
6129+
struct bpf_prog *prog;
6130+
struct bpf_map *map;
6131+
int ret;
6132+
6133+
if (CHECK_ATTR(BPF_PROG_ASSOC_STRUCT_OPS))
6134+
return -EINVAL;
6135+
6136+
if (attr->prog_assoc_struct_ops.flags)
6137+
return -EINVAL;
6138+
6139+
prog = bpf_prog_get(attr->prog_assoc_struct_ops.prog_fd);
6140+
if (IS_ERR(prog))
6141+
return PTR_ERR(prog);
6142+
6143+
if (prog->type == BPF_PROG_TYPE_STRUCT_OPS) {
6144+
ret = -EINVAL;
6145+
goto put_prog;
6146+
}
6147+
6148+
map = bpf_map_get(attr->prog_assoc_struct_ops.map_fd);
6149+
if (IS_ERR(map)) {
6150+
ret = PTR_ERR(map);
6151+
goto put_prog;
6152+
}
6153+
6154+
if (map->map_type != BPF_MAP_TYPE_STRUCT_OPS) {
6155+
ret = -EINVAL;
6156+
goto put_map;
6157+
}
6158+
6159+
ret = bpf_prog_assoc_struct_ops(prog, map);
6160+
6161+
put_map:
6162+
bpf_map_put(map);
6163+
put_prog:
6164+
bpf_prog_put(prog);
6165+
return ret;
6166+
}
6167+
61256168
static int __sys_bpf(enum bpf_cmd cmd, bpfptr_t uattr, unsigned int size)
61266169
{
61276170
union bpf_attr attr;
@@ -6261,6 +6304,9 @@ static int __sys_bpf(enum bpf_cmd cmd, bpfptr_t uattr, unsigned int size)
62616304
case BPF_PROG_STREAM_READ_BY_FD:
62626305
err = prog_stream_read(&attr);
62636306
break;
6307+
case BPF_PROG_ASSOC_STRUCT_OPS:
6308+
err = prog_assoc_struct_ops(&attr);
6309+
break;
62646310
default:
62656311
err = -EINVAL;
62666312
break;

tools/include/uapi/linux/bpf.h

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -918,6 +918,16 @@ union bpf_iter_link_info {
918918
* Number of bytes read from the stream on success, or -1 if an
919919
* error occurred (in which case, *errno* is set appropriately).
920920
*
921+
* BPF_PROG_ASSOC_STRUCT_OPS
922+
* Description
923+
* Associate a BPF program with a struct_ops map. The struct_ops
924+
* map is identified by *map_fd* and the BPF program is
925+
* identified by *prog_fd*.
926+
*
927+
* Return
928+
* 0 on success or -1 if an error occurred (in which case,
929+
* *errno* is set appropriately).
930+
*
921931
* NOTES
922932
* eBPF objects (maps and programs) can be shared between processes.
923933
*
@@ -974,6 +984,7 @@ enum bpf_cmd {
974984
BPF_PROG_BIND_MAP,
975985
BPF_TOKEN_CREATE,
976986
BPF_PROG_STREAM_READ_BY_FD,
987+
BPF_PROG_ASSOC_STRUCT_OPS,
977988
__MAX_BPF_CMD,
978989
};
979990

@@ -1894,6 +1905,12 @@ union bpf_attr {
18941905
__u32 prog_fd;
18951906
} prog_stream_read;
18961907

1908+
struct {
1909+
__u32 map_fd;
1910+
__u32 prog_fd;
1911+
__u32 flags;
1912+
} prog_assoc_struct_ops;
1913+
18971914
} __attribute__((aligned(8)));
18981915

18991916
/* The description below is an attempt at providing documentation to eBPF

0 commit comments

Comments
 (0)