Skip to content

Commit 81e0d45

Browse files
ameryhungKernel Patches Daemon
authored andcommitted
bpf: Support associating BPF program with struct_ops
Add a new BPF command, BPF_PROG_ASSOC_STRUCT_OPS, to allow associating a BPF program with a struct_ops map. This command takes the file descriptors of a struct_ops map and a BPF program and sets prog->aux->st_ops_assoc to the kdata of the struct_ops map. The command accepts neither a struct_ops program nor a non-struct_ops map. Programs of a struct_ops map are automatically associated with the map during map update. If a program is shared between two struct_ops maps, prog->aux->st_ops_assoc will be poisoned to indicate that the associated struct_ops is ambiguous. The pointer, once poisoned, cannot be reset, since we have lost track of the associated struct_ops. For other program types, the associated struct_ops map, once set, cannot be changed later. This restriction may be lifted in the future if there is a use case. A kernel helper, bpf_prog_get_assoc_struct_ops(), can be used to retrieve the associated struct_ops pointer. The returned pointer, if not NULL, is guaranteed to be valid and to point to a fully updated struct_ops struct. For a struct_ops program reused in multiple struct_ops maps, the return value will be NULL. To make sure the returned pointer is valid, the command increases the refcount of the map for every associated non-struct_ops program. For struct_ops programs, the destruction of a struct_ops map already waits for its BPF programs to finish running. A later patch will further make sure the map will not be freed while an async callback scheduled from a struct_ops program is running. struct_ops implementers should note that the struct_ops returned may or may not be attached. The struct_ops implementer is responsible for tracking and checking the state of the associated struct_ops map if the use case requires an attached struct_ops. Signed-off-by: Amery Hung <[email protected]>
1 parent 9fe8bf2 commit 81e0d45

File tree

6 files changed

+189
-0
lines changed

6 files changed

+189
-0
lines changed

include/linux/bpf.h

Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1726,6 +1726,8 @@ struct bpf_prog_aux {
17261726
struct rcu_head rcu;
17271727
};
17281728
struct bpf_stream stream[2];
1729+
struct mutex st_ops_assoc_mutex;
1730+
struct bpf_map *st_ops_assoc;
17291731
};
17301732

17311733
struct bpf_prog {
@@ -2026,6 +2028,9 @@ static inline void bpf_module_put(const void *data, struct module *owner)
20262028
module_put(owner);
20272029
}
20282030
int bpf_struct_ops_link_create(union bpf_attr *attr);
2031+
int bpf_prog_assoc_struct_ops(struct bpf_prog *prog, struct bpf_map *map);
2032+
void bpf_prog_disassoc_struct_ops(struct bpf_prog *prog);
2033+
void *bpf_prog_get_assoc_struct_ops(const struct bpf_prog_aux *aux);
20292034
u32 bpf_struct_ops_id(const void *kdata);
20302035

20312036
#ifdef CONFIG_NET
@@ -2073,6 +2078,17 @@ static inline int bpf_struct_ops_link_create(union bpf_attr *attr)
20732078
{
20742079
return -EOPNOTSUPP;
20752080
}
2081+
/* Stub variant: performs no association and always reports -EOPNOTSUPP. */
static inline int bpf_prog_assoc_struct_ops(struct bpf_prog *prog, struct bpf_map *map)
{
	return -EOPNOTSUPP;
}
2085+
/* Stub variant: there is nothing to undo, so this is a no-op. */
static inline void bpf_prog_disassoc_struct_ops(struct bpf_prog *prog)
{
}
2088+
/* Stub variant: never has an associated struct_ops, so always yields NULL. */
static inline void *bpf_prog_get_assoc_struct_ops(const struct bpf_prog_aux *aux)
{
	return NULL;
}
20762092
static inline void bpf_map_struct_ops_info_fill(struct bpf_map_info *info, struct bpf_map *map)
20772093
{
20782094
}

include/uapi/linux/bpf.h

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -918,6 +918,16 @@ union bpf_iter_link_info {
918918
* Number of bytes read from the stream on success, or -1 if an
919919
* error occurred (in which case, *errno* is set appropriately).
920920
*
921+
* BPF_PROG_ASSOC_STRUCT_OPS
922+
* Description
923+
* Associate a BPF program with a struct_ops map. The struct_ops
924+
* map is identified by *map_fd* and the BPF program is
925+
* identified by *prog_fd*.
926+
*
927+
* Return
928+
* 0 on success or -1 if an error occurred (in which case,
929+
* *errno* is set appropriately).
930+
*
921931
* NOTES
922932
* eBPF objects (maps and programs) can be shared between processes.
923933
*
@@ -974,6 +984,7 @@ enum bpf_cmd {
974984
BPF_PROG_BIND_MAP,
975985
BPF_TOKEN_CREATE,
976986
BPF_PROG_STREAM_READ_BY_FD,
987+
BPF_PROG_ASSOC_STRUCT_OPS,
977988
__MAX_BPF_CMD,
978989
};
979990

@@ -1893,6 +1904,12 @@ union bpf_attr {
18931904
__u32 prog_fd;
18941905
} prog_stream_read;
18951906

1907+
struct {
1908+
__u32 map_fd;
1909+
__u32 prog_fd;
1910+
__u32 flags;
1911+
} prog_assoc_struct_ops;
1912+
18961913
} __attribute__((aligned(8)));
18971914

18981915
/* The description below is an attempt at providing documentation to eBPF

kernel/bpf/bpf_struct_ops.c

Lines changed: 90 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -533,6 +533,17 @@ static void bpf_struct_ops_map_put_progs(struct bpf_struct_ops_map *st_map)
533533
}
534534
}
535535

536+
static void bpf_struct_ops_map_dissoc_progs(struct bpf_struct_ops_map *st_map)
537+
{
538+
u32 i;
539+
540+
for (i = 0; i < st_map->funcs_cnt; i++) {
541+
if (!st_map->links[i])
542+
break;
543+
bpf_prog_disassoc_struct_ops(st_map->links[i]->prog);
544+
}
545+
}
546+
536547
static void bpf_struct_ops_map_free_image(struct bpf_struct_ops_map *st_map)
537548
{
538549
int i;
@@ -801,6 +812,12 @@ static long bpf_struct_ops_map_update_elem(struct bpf_map *map, void *key,
801812
goto reset_unlock;
802813
}
803814

815+
err = bpf_prog_assoc_struct_ops(prog, &st_map->map);
816+
if (err) {
817+
bpf_prog_put(prog);
818+
goto reset_unlock;
819+
}
820+
804821
link = kzalloc(sizeof(*link), GFP_USER);
805822
if (!link) {
806823
bpf_prog_put(prog);
@@ -980,6 +997,8 @@ static void bpf_struct_ops_map_free(struct bpf_map *map)
980997
if (btf_is_module(st_map->btf))
981998
module_put(st_map->st_ops_desc->st_ops->owner);
982999

1000+
bpf_struct_ops_map_dissoc_progs(st_map);
1001+
9831002
bpf_struct_ops_map_del_ksyms(st_map);
9841003

9851004
/* The struct_ops's function may switch to another struct_ops.
@@ -1394,6 +1413,77 @@ int bpf_struct_ops_link_create(union bpf_attr *attr)
13941413
return err;
13951414
}
13961415

1416+
int bpf_prog_assoc_struct_ops(struct bpf_prog *prog, struct bpf_map *map)
1417+
{
1418+
struct bpf_map *st_ops_assoc;
1419+
1420+
guard(mutex)(&prog->aux->st_ops_assoc_mutex);
1421+
1422+
st_ops_assoc = prog->aux->st_ops_assoc;
1423+
1424+
if (st_ops_assoc && st_ops_assoc == map)
1425+
return 0;
1426+
1427+
if (st_ops_assoc) {
1428+
if (prog->type != BPF_PROG_TYPE_STRUCT_OPS)
1429+
return -EBUSY;
1430+
1431+
WRITE_ONCE(prog->aux->st_ops_assoc, BPF_PTR_POISON);
1432+
} else {
1433+
if (prog->type != BPF_PROG_TYPE_STRUCT_OPS)
1434+
bpf_map_inc(map);
1435+
1436+
WRITE_ONCE(prog->aux->st_ops_assoc, map);
1437+
}
1438+
1439+
return 0;
1440+
}
1441+
1442+
void bpf_prog_disassoc_struct_ops(struct bpf_prog *prog)
1443+
{
1444+
struct bpf_map *st_ops_assoc;
1445+
1446+
guard(mutex)(&prog->aux->st_ops_assoc_mutex);
1447+
1448+
st_ops_assoc = prog->aux->st_ops_assoc;
1449+
1450+
if (!st_ops_assoc || st_ops_assoc == BPF_PTR_POISON)
1451+
return;
1452+
1453+
if (prog->type != BPF_PROG_TYPE_STRUCT_OPS)
1454+
bpf_map_put(st_ops_assoc);
1455+
1456+
WRITE_ONCE(prog->aux->st_ops_assoc, NULL);
1457+
}
1458+
1459+
/*
1460+
* Get a reference to the struct_ops struct (i.e., kdata) associated with a
1461+
* program.
1462+
*
1463+
* If the returned pointer is not NULL, it must points to a valid and
1464+
* initialized struct_ops. The struct_ops may or may not be attached.
1465+
* Kernel struct_ops implementers are responsible for tracking and checking
1466+
* the state of the struct_ops if the use case requires an attached struct_ops.
1467+
*/
1468+
void *bpf_prog_get_assoc_struct_ops(const struct bpf_prog_aux *aux)
1469+
{
1470+
struct bpf_map *st_ops_assoc = READ_ONCE(aux->st_ops_assoc);
1471+
struct bpf_struct_ops_map *st_map;
1472+
1473+
if (!st_ops_assoc || st_ops_assoc == BPF_PTR_POISON)
1474+
return NULL;
1475+
1476+
st_map = (struct bpf_struct_ops_map *)st_ops_assoc;
1477+
1478+
if (smp_load_acquire(&st_map->kvalue.common.state) == BPF_STRUCT_OPS_STATE_INIT) {
1479+
bpf_map_put(st_ops_assoc);
1480+
return NULL;
1481+
}
1482+
1483+
return &st_map->kvalue.data;
1484+
}
1485+
EXPORT_SYMBOL_GPL(bpf_prog_get_assoc_struct_ops);
1486+
13971487
void bpf_map_struct_ops_info_fill(struct bpf_map_info *info, struct bpf_map *map)
13981488
{
13991489
struct bpf_struct_ops_map *st_map = (struct bpf_struct_ops_map *)map;

kernel/bpf/core.c

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -136,6 +136,7 @@ struct bpf_prog *bpf_prog_alloc_no_stats(unsigned int size, gfp_t gfp_extra_flag
136136
mutex_init(&fp->aux->used_maps_mutex);
137137
mutex_init(&fp->aux->ext_mutex);
138138
mutex_init(&fp->aux->dst_mutex);
139+
mutex_init(&fp->aux->st_ops_assoc_mutex);
139140

140141
#ifdef CONFIG_BPF_SYSCALL
141142
bpf_prog_stream_init(fp);
@@ -286,6 +287,7 @@ void __bpf_prog_free(struct bpf_prog *fp)
286287
if (fp->aux) {
287288
mutex_destroy(&fp->aux->used_maps_mutex);
288289
mutex_destroy(&fp->aux->dst_mutex);
290+
mutex_destroy(&fp->aux->st_ops_assoc_mutex);
289291
kfree(fp->aux->poke_tab);
290292
kfree(fp->aux);
291293
}
@@ -2875,6 +2877,7 @@ static void bpf_prog_free_deferred(struct work_struct *work)
28752877
#endif
28762878
bpf_free_used_maps(aux);
28772879
bpf_free_used_btfs(aux);
2880+
bpf_prog_disassoc_struct_ops(aux->prog);
28782881
if (bpf_prog_is_dev_bound(aux))
28792882
bpf_prog_dev_bound_destroy(aux->prog);
28802883
#ifdef CONFIG_PERF_EVENTS

kernel/bpf/syscall.c

Lines changed: 46 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -6107,6 +6107,49 @@ static int prog_stream_read(union bpf_attr *attr)
61076107
return ret;
61086108
}
61096109

6110+
#define BPF_PROG_ASSOC_STRUCT_OPS_LAST_FIELD prog_assoc_struct_ops.prog_fd
6111+
6112+
static int prog_assoc_struct_ops(union bpf_attr *attr)
6113+
{
6114+
struct bpf_prog *prog;
6115+
struct bpf_map *map;
6116+
int ret;
6117+
6118+
if (CHECK_ATTR(BPF_PROG_ASSOC_STRUCT_OPS))
6119+
return -EINVAL;
6120+
6121+
if (attr->prog_assoc_struct_ops.flags)
6122+
return -EINVAL;
6123+
6124+
prog = bpf_prog_get(attr->prog_assoc_struct_ops.prog_fd);
6125+
if (IS_ERR(prog))
6126+
return PTR_ERR(prog);
6127+
6128+
if (prog->type == BPF_PROG_TYPE_STRUCT_OPS) {
6129+
ret = -EINVAL;
6130+
goto put_prog;
6131+
}
6132+
6133+
map = bpf_map_get(attr->prog_assoc_struct_ops.map_fd);
6134+
if (IS_ERR(map)) {
6135+
ret = PTR_ERR(map);
6136+
goto put_prog;
6137+
}
6138+
6139+
if (map->map_type != BPF_MAP_TYPE_STRUCT_OPS) {
6140+
ret = -EINVAL;
6141+
goto put_map;
6142+
}
6143+
6144+
ret = bpf_prog_assoc_struct_ops(prog, map);
6145+
6146+
put_map:
6147+
bpf_map_put(map);
6148+
put_prog:
6149+
bpf_prog_put(prog);
6150+
return ret;
6151+
}
6152+
61106153
static int __sys_bpf(enum bpf_cmd cmd, bpfptr_t uattr, unsigned int size)
61116154
{
61126155
union bpf_attr attr;
@@ -6246,6 +6289,9 @@ static int __sys_bpf(enum bpf_cmd cmd, bpfptr_t uattr, unsigned int size)
62466289
case BPF_PROG_STREAM_READ_BY_FD:
62476290
err = prog_stream_read(&attr);
62486291
break;
6292+
case BPF_PROG_ASSOC_STRUCT_OPS:
6293+
err = prog_assoc_struct_ops(&attr);
6294+
break;
62496295
default:
62506296
err = -EINVAL;
62516297
break;

tools/include/uapi/linux/bpf.h

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -918,6 +918,16 @@ union bpf_iter_link_info {
918918
* Number of bytes read from the stream on success, or -1 if an
919919
* error occurred (in which case, *errno* is set appropriately).
920920
*
921+
* BPF_PROG_ASSOC_STRUCT_OPS
922+
* Description
923+
* Associate a BPF program with a struct_ops map. The struct_ops
924+
* map is identified by *map_fd* and the BPF program is
925+
* identified by *prog_fd*.
926+
*
927+
* Return
928+
* 0 on success or -1 if an error occurred (in which case,
929+
* *errno* is set appropriately).
930+
*
921931
* NOTES
922932
* eBPF objects (maps and programs) can be shared between processes.
923933
*
@@ -974,6 +984,7 @@ enum bpf_cmd {
974984
BPF_PROG_BIND_MAP,
975985
BPF_TOKEN_CREATE,
976986
BPF_PROG_STREAM_READ_BY_FD,
987+
BPF_PROG_ASSOC_STRUCT_OPS,
977988
__MAX_BPF_CMD,
978989
};
979990

@@ -1893,6 +1904,12 @@ union bpf_attr {
18931904
__u32 prog_fd;
18941905
} prog_stream_read;
18951906

1907+
struct {
1908+
__u32 map_fd;
1909+
__u32 prog_fd;
1910+
__u32 flags;
1911+
} prog_assoc_struct_ops;
1912+
18961913
} __attribute__((aligned(8)));
18971914

18981915
/* The description below is an attempt at providing documentation to eBPF

0 commit comments

Comments
 (0)