Skip to content

Commit f70d24c

Browse files
committed
Merge tag 'vfs-6.17-rc1.nsfs' of git://git.kernel.org/pub/scm/linux/kernel/git/vfs/vfs
Pull namespace updates from Christian Brauner: "This contains namespace updates. This time specifically for nsfs: - Userspace heavily relies on the root inode numbers for namespaces to identify the initial namespaces. That's already a hard dependency. So we cannot change that anymore. Move the initial inode numbers to a public header and align the only two namespaces that currently don't do that with all the other namespaces. - The root inode of /proc having a fixed inode number has been part of the core kernel ABI since its inception, and recently some userspace programs (mainly container runtimes) have started to explicitly depend on this behaviour. The main reason this is useful to userspace is that by checking that a suspect /proc handle has fstype PROC_SUPER_MAGIC and is PROCFS_ROOT_INO, they can then use openat2() together with RESOLVE_{NO_{XDEV,MAGICLINK},BENEATH} to ensure that there isn't a bind-mount that replaces some procfs file with a different one. This kind of attack has lead to security issues in container runtimes in the past (such as CVE-2019-19921) and libraries like libpathrs[1] use this feature of procfs to provide safe procfs handling functions" * tag 'vfs-6.17-rc1.nsfs' of git://git.kernel.org/pub/scm/linux/kernel/git/vfs/vfs: uapi: export PROCFS_ROOT_INO mntns: use stable inode number for initial mount ns netns: use stable inode number for initial mount ns nsfs: move root inode number to uapi
2 parents 934600d + 76fdb7e commit f70d24c

File tree

6 files changed

+47
-13
lines changed

6 files changed

+47
-13
lines changed

fs/namespace.c

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6090,9 +6090,11 @@ static void __init init_mount_tree(void)
60906090
if (IS_ERR(mnt))
60916091
panic("Can't create rootfs");
60926092

6093-
ns = alloc_mnt_ns(&init_user_ns, false);
6093+
ns = alloc_mnt_ns(&init_user_ns, true);
60946094
if (IS_ERR(ns))
60956095
panic("Can't allocate initial namespace");
6096+
ns->seq = atomic64_inc_return(&mnt_ns_seq);
6097+
ns->ns.inum = PROC_MNT_INIT_INO;
60966098
m = real_mount(mnt);
60976099
ns->root = m;
60986100
ns->nr_mounts = 1;

fs/proc/root.c

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -363,12 +363,12 @@ static const struct inode_operations proc_root_inode_operations = {
363363
* This is the root "inode" in the /proc tree..
364364
*/
365365
struct proc_dir_entry proc_root = {
366-
.low_ino = PROC_ROOT_INO,
367-
.namelen = 5,
368-
.mode = S_IFDIR | S_IRUGO | S_IXUGO,
369-
.nlink = 2,
366+
.low_ino = PROCFS_ROOT_INO,
367+
.namelen = 5,
368+
.mode = S_IFDIR | S_IRUGO | S_IXUGO,
369+
.nlink = 2,
370370
.refcnt = REFCOUNT_INIT(1),
371-
.proc_iops = &proc_root_inode_operations,
371+
.proc_iops = &proc_root_inode_operations,
372372
.proc_dir_ops = &proc_root_operations,
373373
.parent = &proc_root,
374374
.subdir = RB_ROOT,

include/linux/proc_ns.h

Lines changed: 9 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,7 @@
66
#define _LINUX_PROC_NS_H
77

88
#include <linux/ns_common.h>
9+
#include <uapi/linux/nsfs.h>
910

1011
struct pid_namespace;
1112
struct nsset;
@@ -39,13 +40,14 @@ extern const struct proc_ns_operations timens_for_children_operations;
3940
* We always define these enumerators
4041
*/
4142
enum {
42-
PROC_ROOT_INO = 1,
43-
PROC_IPC_INIT_INO = 0xEFFFFFFFU,
44-
PROC_UTS_INIT_INO = 0xEFFFFFFEU,
45-
PROC_USER_INIT_INO = 0xEFFFFFFDU,
46-
PROC_PID_INIT_INO = 0xEFFFFFFCU,
47-
PROC_CGROUP_INIT_INO = 0xEFFFFFFBU,
48-
PROC_TIME_INIT_INO = 0xEFFFFFFAU,
43+
PROC_IPC_INIT_INO = IPC_NS_INIT_INO,
44+
PROC_UTS_INIT_INO = UTS_NS_INIT_INO,
45+
PROC_USER_INIT_INO = USER_NS_INIT_INO,
46+
PROC_PID_INIT_INO = PID_NS_INIT_INO,
47+
PROC_CGROUP_INIT_INO = CGROUP_NS_INIT_INO,
48+
PROC_TIME_INIT_INO = TIME_NS_INIT_INO,
49+
PROC_NET_INIT_INO = NET_NS_INIT_INO,
50+
PROC_MNT_INIT_INO = MNT_NS_INIT_INO,
4951
};
5052

5153
#ifdef CONFIG_PROC_FS

include/uapi/linux/fs.h

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -60,6 +60,17 @@
6060
#define RENAME_EXCHANGE (1 << 1) /* Exchange source and dest */
6161
#define RENAME_WHITEOUT (1 << 2) /* Whiteout source */
6262

63+
/*
64+
* The root inode of procfs is guaranteed to always have the same inode number.
65+
* For programs that make heavy use of procfs, verifying that the root is a
66+
* real procfs root and using openat2(RESOLVE_{NO_{XDEV,MAGICLINKS},BENEATH})
67+
* will allow you to make sure you are never tricked into operating on the
68+
* wrong procfs file.
69+
*/
70+
enum procfs_ino {
71+
PROCFS_ROOT_INO = 1,
72+
};
73+
6374
struct file_clone_range {
6475
__s64 src_fd;
6576
__u64 src_offset;

include/uapi/linux/nsfs.h

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -42,4 +42,15 @@ struct mnt_ns_info {
4242
/* Get previous namespace. */
4343
#define NS_MNT_GET_PREV _IOR(NSIO, 12, struct mnt_ns_info)
4444

45+
enum init_ns_ino {
46+
IPC_NS_INIT_INO = 0xEFFFFFFFU,
47+
UTS_NS_INIT_INO = 0xEFFFFFFEU,
48+
USER_NS_INIT_INO = 0xEFFFFFFDU,
49+
PID_NS_INIT_INO = 0xEFFFFFFCU,
50+
CGROUP_NS_INIT_INO = 0xEFFFFFFBU,
51+
TIME_NS_INIT_INO = 0xEFFFFFFAU,
52+
NET_NS_INIT_INO = 0xEFFFFFF9U,
53+
MNT_NS_INIT_INO = 0xEFFFFFF8U,
54+
};
55+
4556
#endif /* __LINUX_NSFS_H */

net/core/net_namespace.c

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -796,11 +796,19 @@ static __net_init int net_ns_net_init(struct net *net)
796796
#ifdef CONFIG_NET_NS
797797
net->ns.ops = &netns_operations;
798798
#endif
799+
if (net == &init_net) {
800+
net->ns.inum = PROC_NET_INIT_INO;
801+
return 0;
802+
}
799803
return ns_alloc_inum(&net->ns);
800804
}
801805

802806
static __net_exit void net_ns_net_exit(struct net *net)
803807
{
808+
/*
809+
* Initial network namespace doesn't exit so we don't need any
810+
* special checks here.
811+
*/
804812
ns_free_inum(&net->ns);
805813
}
806814

0 commit comments

Comments
 (0)