Skip to content

Commit 0a78cf7

Browse files
q2ven authored and kuba-moo committed
raw: Fix NULL deref in raw_get_next().
Dae R. Jeong reported a NULL deref in raw_get_next() [0].

It seems that the repro was running these sequences in parallel so that one thread was iterating on a socket that was being freed in another netns.

  unshare(0x40060200)
  r0 = syz_open_procfs(0x0, &(0x7f0000002080)='net/raw\x00')
  socket$inet_icmp_raw(0x2, 0x3, 0x1)
  pread64(r0, &(0x7f0000000000)=""/10, 0xa, 0x10000000007f)

After commit 0daf07e ("raw: convert raw sockets to RCU"), we use RCU and hlist_nulls_for_each_entry() to iterate over SOCK_RAW sockets. However, we should use spinlock for slow paths to avoid the NULL deref.

Also, SOCK_RAW does not use SLAB_TYPESAFE_BY_RCU, and the slab object is not reused during iteration in the grace period. In fact, the lockless readers do not check the nulls marker with get_nulls_value(). So, SOCK_RAW should use hlist instead of hlist_nulls.

Instead of adding an unnecessary barrier by sk_nulls_for_each_rcu(), let's convert hlist_nulls to hlist and use sk_for_each_rcu() for fast paths and sk_for_each() and spinlock for /proc/net/raw.
[0]: general protection fault, probably for non-canonical address 0xdffffc0000000005: 0000 [#1] PREEMPT SMP KASAN KASAN: null-ptr-deref in range [0x0000000000000028-0x000000000000002f] CPU: 2 PID: 20952 Comm: syz-executor.0 Not tainted 6.2.0-g048ec869bafd-dirty #7 Hardware name: QEMU Standard PC (i440FX + PIIX, 1996), BIOS rel-1.14.0-0-g155821a1990b-prebuilt.qemu.org 04/01/2014 RIP: 0010:read_pnet include/net/net_namespace.h:383 [inline] RIP: 0010:sock_net include/net/sock.h:649 [inline] RIP: 0010:raw_get_next net/ipv4/raw.c:974 [inline] RIP: 0010:raw_get_idx net/ipv4/raw.c:986 [inline] RIP: 0010:raw_seq_start+0x431/0x800 net/ipv4/raw.c:995 Code: ef e8 33 3d 94 f7 49 8b 6d 00 4c 89 ef e8 b7 65 5f f7 49 89 ed 49 83 c5 98 0f 84 9a 00 00 00 48 83 c5 c8 48 89 e8 48 c1 e8 03 <42> 80 3c 30 00 74 08 48 89 ef e8 00 3d 94 f7 4c 8b 7d 00 48 89 ef RSP: 0018:ffffc9001154f9b0 EFLAGS: 00010206 RAX: 0000000000000005 RBX: 1ffff1100302c8fd RCX: 0000000000000000 RDX: 0000000000000028 RSI: ffffc9001154f988 RDI: ffffc9000f77a338 RBP: 0000000000000029 R08: ffffffff8a50ffb4 R09: fffffbfff24b6bd9 R10: fffffbfff24b6bd9 R11: 0000000000000000 R12: ffff88801db73b78 R13: fffffffffffffff9 R14: dffffc0000000000 R15: 0000000000000030 FS: 00007f843ae8e700(0000) GS:ffff888063700000(0000) knlGS:0000000000000000 CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 CR2: 000055bb9614b35f CR3: 000000003c672000 CR4: 00000000003506e0 DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000 DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400 Call Trace: <TASK> seq_read_iter+0x4c6/0x10f0 fs/seq_file.c:225 seq_read+0x224/0x320 fs/seq_file.c:162 pde_read fs/proc/inode.c:316 [inline] proc_reg_read+0x23f/0x330 fs/proc/inode.c:328 vfs_read+0x31e/0xd30 fs/read_write.c:468 ksys_pread64 fs/read_write.c:665 [inline] __do_sys_pread64 fs/read_write.c:675 [inline] __se_sys_pread64 fs/read_write.c:672 [inline] __x64_sys_pread64+0x1e9/0x280 fs/read_write.c:672 do_syscall_x64 arch/x86/entry/common.c:51 
[inline] do_syscall_64+0x4e/0xa0 arch/x86/entry/common.c:82 entry_SYSCALL_64_after_hwframe+0x63/0xcd RIP: 0033:0x478d29 Code: f7 d8 64 89 02 b8 ff ff ff ff c3 66 0f 1f 44 00 00 48 89 f8 48 89 f7 48 89 d6 48 89 ca 4d 89 c2 4d 89 c8 4c 8b 4c 24 08 0f 05 <48> 3d 01 f0 ff ff 73 01 c3 48 c7 c1 bc ff ff ff f7 d8 64 89 01 48 RSP: 002b:00007f843ae8dbe8 EFLAGS: 00000246 ORIG_RAX: 0000000000000011 RAX: ffffffffffffffda RBX: 0000000000791408 RCX: 0000000000478d29 RDX: 000000000000000a RSI: 0000000020000000 RDI: 0000000000000003 RBP: 00000000f477909a R08: 0000000000000000 R09: 0000000000000000 R10: 000010000000007f R11: 0000000000000246 R12: 0000000000791740 R13: 0000000000791414 R14: 0000000000791408 R15: 00007ffc2eb48a50 </TASK> Modules linked in: ---[ end trace 0000000000000000 ]--- RIP: 0010:read_pnet include/net/net_namespace.h:383 [inline] RIP: 0010:sock_net include/net/sock.h:649 [inline] RIP: 0010:raw_get_next net/ipv4/raw.c:974 [inline] RIP: 0010:raw_get_idx net/ipv4/raw.c:986 [inline] RIP: 0010:raw_seq_start+0x431/0x800 net/ipv4/raw.c:995 Code: ef e8 33 3d 94 f7 49 8b 6d 00 4c 89 ef e8 b7 65 5f f7 49 89 ed 49 83 c5 98 0f 84 9a 00 00 00 48 83 c5 c8 48 89 e8 48 c1 e8 03 <42> 80 3c 30 00 74 08 48 89 ef e8 00 3d 94 f7 4c 8b 7d 00 48 89 ef RSP: 0018:ffffc9001154f9b0 EFLAGS: 00010206 RAX: 0000000000000005 RBX: 1ffff1100302c8fd RCX: 0000000000000000 RDX: 0000000000000028 RSI: ffffc9001154f988 RDI: ffffc9000f77a338 RBP: 0000000000000029 R08: ffffffff8a50ffb4 R09: fffffbfff24b6bd9 R10: fffffbfff24b6bd9 R11: 0000000000000000 R12: ffff88801db73b78 R13: fffffffffffffff9 R14: dffffc0000000000 R15: 0000000000000030 FS: 00007f843ae8e700(0000) GS:ffff888063700000(0000) knlGS:0000000000000000 CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 CR2: 00007f92ff166000 CR3: 000000003c672000 CR4: 00000000003506e0 DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000 DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400 Fixes: 0daf07e ("raw: convert raw sockets to 
RCU")
Reported-by: syzbot <[email protected]>
Reported-by: Dae R. Jeong <[email protected]>
Link: https://lore.kernel.org/netdev/ZCA2mGV_cmq7lIfV@dragonet/
Signed-off-by: Kuniyuki Iwashima <[email protected]>
Reviewed-by: Eric Dumazet <[email protected]>
Signed-off-by: Jakub Kicinski <[email protected]>
1 parent 218c597 commit 0a78cf7

File tree

4 files changed

+29
-31
lines changed

4 files changed

+29
-31
lines changed

include/net/raw.h

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -37,7 +37,7 @@ int raw_rcv(struct sock *, struct sk_buff *);
3737
struct raw_hashinfo {
3838
spinlock_t lock;
3939

40-
struct hlist_nulls_head ht[RAW_HTABLE_SIZE] ____cacheline_aligned;
40+
struct hlist_head ht[RAW_HTABLE_SIZE] ____cacheline_aligned;
4141
};
4242

4343
static inline u32 raw_hashfunc(const struct net *net, u32 proto)
@@ -51,7 +51,7 @@ static inline void raw_hashinfo_init(struct raw_hashinfo *hashinfo)
5151

5252
spin_lock_init(&hashinfo->lock);
5353
for (i = 0; i < RAW_HTABLE_SIZE; i++)
54-
INIT_HLIST_NULLS_HEAD(&hashinfo->ht[i], i);
54+
INIT_HLIST_HEAD(&hashinfo->ht[i]);
5555
}
5656

5757
#ifdef CONFIG_PROC_FS

net/ipv4/raw.c

Lines changed: 19 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -91,12 +91,12 @@ EXPORT_SYMBOL_GPL(raw_v4_hashinfo);
9191
int raw_hash_sk(struct sock *sk)
9292
{
9393
struct raw_hashinfo *h = sk->sk_prot->h.raw_hash;
94-
struct hlist_nulls_head *hlist;
94+
struct hlist_head *hlist;
9595

9696
hlist = &h->ht[raw_hashfunc(sock_net(sk), inet_sk(sk)->inet_num)];
9797

9898
spin_lock(&h->lock);
99-
__sk_nulls_add_node_rcu(sk, hlist);
99+
sk_add_node_rcu(sk, hlist);
100100
sock_set_flag(sk, SOCK_RCU_FREE);
101101
spin_unlock(&h->lock);
102102
sock_prot_inuse_add(sock_net(sk), sk->sk_prot, 1);
@@ -110,7 +110,7 @@ void raw_unhash_sk(struct sock *sk)
110110
struct raw_hashinfo *h = sk->sk_prot->h.raw_hash;
111111

112112
spin_lock(&h->lock);
113-
if (__sk_nulls_del_node_init_rcu(sk))
113+
if (sk_del_node_init_rcu(sk))
114114
sock_prot_inuse_add(sock_net(sk), sk->sk_prot, -1);
115115
spin_unlock(&h->lock);
116116
}
@@ -163,16 +163,15 @@ static int icmp_filter(const struct sock *sk, const struct sk_buff *skb)
163163
static int raw_v4_input(struct net *net, struct sk_buff *skb,
164164
const struct iphdr *iph, int hash)
165165
{
166-
struct hlist_nulls_head *hlist;
167-
struct hlist_nulls_node *hnode;
168166
int sdif = inet_sdif(skb);
167+
struct hlist_head *hlist;
169168
int dif = inet_iif(skb);
170169
int delivered = 0;
171170
struct sock *sk;
172171

173172
hlist = &raw_v4_hashinfo.ht[hash];
174173
rcu_read_lock();
175-
sk_nulls_for_each(sk, hnode, hlist) {
174+
sk_for_each_rcu(sk, hlist) {
176175
if (!raw_v4_match(net, sk, iph->protocol,
177176
iph->saddr, iph->daddr, dif, sdif))
178177
continue;
@@ -264,10 +263,9 @@ static void raw_err(struct sock *sk, struct sk_buff *skb, u32 info)
264263
void raw_icmp_error(struct sk_buff *skb, int protocol, u32 info)
265264
{
266265
struct net *net = dev_net(skb->dev);
267-
struct hlist_nulls_head *hlist;
268-
struct hlist_nulls_node *hnode;
269266
int dif = skb->dev->ifindex;
270267
int sdif = inet_sdif(skb);
268+
struct hlist_head *hlist;
271269
const struct iphdr *iph;
272270
struct sock *sk;
273271
int hash;
@@ -276,7 +274,7 @@ void raw_icmp_error(struct sk_buff *skb, int protocol, u32 info)
276274
hlist = &raw_v4_hashinfo.ht[hash];
277275

278276
rcu_read_lock();
279-
sk_nulls_for_each(sk, hnode, hlist) {
277+
sk_for_each_rcu(sk, hlist) {
280278
iph = (const struct iphdr *)skb->data;
281279
if (!raw_v4_match(net, sk, iph->protocol,
282280
iph->daddr, iph->saddr, dif, sdif))
@@ -950,14 +948,13 @@ static struct sock *raw_get_first(struct seq_file *seq, int bucket)
950948
{
951949
struct raw_hashinfo *h = pde_data(file_inode(seq->file));
952950
struct raw_iter_state *state = raw_seq_private(seq);
953-
struct hlist_nulls_head *hlist;
954-
struct hlist_nulls_node *hnode;
951+
struct hlist_head *hlist;
955952
struct sock *sk;
956953

957954
for (state->bucket = bucket; state->bucket < RAW_HTABLE_SIZE;
958955
++state->bucket) {
959956
hlist = &h->ht[state->bucket];
960-
sk_nulls_for_each(sk, hnode, hlist) {
957+
sk_for_each(sk, hlist) {
961958
if (sock_net(sk) == seq_file_net(seq))
962959
return sk;
963960
}
@@ -970,7 +967,7 @@ static struct sock *raw_get_next(struct seq_file *seq, struct sock *sk)
970967
struct raw_iter_state *state = raw_seq_private(seq);
971968

972969
do {
973-
sk = sk_nulls_next(sk);
970+
sk = sk_next(sk);
974971
} while (sk && sock_net(sk) != seq_file_net(seq));
975972

976973
if (!sk)
@@ -989,9 +986,12 @@ static struct sock *raw_get_idx(struct seq_file *seq, loff_t pos)
989986
}
990987

991988
void *raw_seq_start(struct seq_file *seq, loff_t *pos)
992-
__acquires(RCU)
989+
__acquires(&h->lock)
993990
{
994-
rcu_read_lock();
991+
struct raw_hashinfo *h = pde_data(file_inode(seq->file));
992+
993+
spin_lock(&h->lock);
994+
995995
return *pos ? raw_get_idx(seq, *pos - 1) : SEQ_START_TOKEN;
996996
}
997997
EXPORT_SYMBOL_GPL(raw_seq_start);
@@ -1010,9 +1010,11 @@ void *raw_seq_next(struct seq_file *seq, void *v, loff_t *pos)
10101010
EXPORT_SYMBOL_GPL(raw_seq_next);
10111011

10121012
void raw_seq_stop(struct seq_file *seq, void *v)
1013-
__releases(RCU)
1013+
__releases(&h->lock)
10141014
{
1015-
rcu_read_unlock();
1015+
struct raw_hashinfo *h = pde_data(file_inode(seq->file));
1016+
1017+
spin_unlock(&h->lock);
10161018
}
10171019
EXPORT_SYMBOL_GPL(raw_seq_stop);
10181020

net/ipv4/raw_diag.c

Lines changed: 4 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -57,8 +57,7 @@ static bool raw_lookup(struct net *net, struct sock *sk,
5757
static struct sock *raw_sock_get(struct net *net, const struct inet_diag_req_v2 *r)
5858
{
5959
struct raw_hashinfo *hashinfo = raw_get_hashinfo(r);
60-
struct hlist_nulls_head *hlist;
61-
struct hlist_nulls_node *hnode;
60+
struct hlist_head *hlist;
6261
struct sock *sk;
6362
int slot;
6463

@@ -68,7 +67,7 @@ static struct sock *raw_sock_get(struct net *net, const struct inet_diag_req_v2
6867
rcu_read_lock();
6968
for (slot = 0; slot < RAW_HTABLE_SIZE; slot++) {
7069
hlist = &hashinfo->ht[slot];
71-
sk_nulls_for_each(sk, hnode, hlist) {
70+
sk_for_each_rcu(sk, hlist) {
7271
if (raw_lookup(net, sk, r)) {
7372
/*
7473
* Grab it and keep until we fill
@@ -142,9 +141,8 @@ static void raw_diag_dump(struct sk_buff *skb, struct netlink_callback *cb,
142141
struct raw_hashinfo *hashinfo = raw_get_hashinfo(r);
143142
struct net *net = sock_net(skb->sk);
144143
struct inet_diag_dump_data *cb_data;
145-
struct hlist_nulls_head *hlist;
146-
struct hlist_nulls_node *hnode;
147144
int num, s_num, slot, s_slot;
145+
struct hlist_head *hlist;
148146
struct sock *sk = NULL;
149147
struct nlattr *bc;
150148

@@ -161,7 +159,7 @@ static void raw_diag_dump(struct sk_buff *skb, struct netlink_callback *cb,
161159
num = 0;
162160

163161
hlist = &hashinfo->ht[slot];
164-
sk_nulls_for_each(sk, hnode, hlist) {
162+
sk_for_each_rcu(sk, hlist) {
165163
struct inet_sock *inet = inet_sk(sk);
166164

167165
if (!net_eq(sock_net(sk), net))

net/ipv6/raw.c

Lines changed: 4 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -141,10 +141,9 @@ EXPORT_SYMBOL(rawv6_mh_filter_unregister);
141141
static bool ipv6_raw_deliver(struct sk_buff *skb, int nexthdr)
142142
{
143143
struct net *net = dev_net(skb->dev);
144-
struct hlist_nulls_head *hlist;
145-
struct hlist_nulls_node *hnode;
146144
const struct in6_addr *saddr;
147145
const struct in6_addr *daddr;
146+
struct hlist_head *hlist;
148147
struct sock *sk;
149148
bool delivered = false;
150149
__u8 hash;
@@ -155,7 +154,7 @@ static bool ipv6_raw_deliver(struct sk_buff *skb, int nexthdr)
155154
hash = raw_hashfunc(net, nexthdr);
156155
hlist = &raw_v6_hashinfo.ht[hash];
157156
rcu_read_lock();
158-
sk_nulls_for_each(sk, hnode, hlist) {
157+
sk_for_each_rcu(sk, hlist) {
159158
int filtered;
160159

161160
if (!raw_v6_match(net, sk, nexthdr, daddr, saddr,
@@ -333,15 +332,14 @@ void raw6_icmp_error(struct sk_buff *skb, int nexthdr,
333332
u8 type, u8 code, int inner_offset, __be32 info)
334333
{
335334
struct net *net = dev_net(skb->dev);
336-
struct hlist_nulls_head *hlist;
337-
struct hlist_nulls_node *hnode;
335+
struct hlist_head *hlist;
338336
struct sock *sk;
339337
int hash;
340338

341339
hash = raw_hashfunc(net, nexthdr);
342340
hlist = &raw_v6_hashinfo.ht[hash];
343341
rcu_read_lock();
344-
sk_nulls_for_each(sk, hnode, hlist) {
342+
sk_for_each_rcu(sk, hlist) {
345343
/* Note: ipv6_hdr(skb) != skb->data */
346344
const struct ipv6hdr *ip6h = (const struct ipv6hdr *)skb->data;
347345

0 commit comments

Comments
 (0)