From: Christian Brauner <brauner@kernel.org>
To: linux-fsdevel@vger.kernel.org, Josef Bacik <josef@toxicpanda.com>,
Jeff Layton <jlayton@kernel.org>
Cc: "Jann Horn" <jannh@google.com>, "Mike Yuan" <me@yhndnzj.com>,
"Zbigniew Jędrzejewski-Szmek" <zbyszek@in.waw.pl>,
"Lennart Poettering" <mzxreary@0pointer.de>,
"Daan De Meyer" <daan.j.demeyer@gmail.com>,
"Aleksa Sarai" <cyphar@cyphar.com>,
"Amir Goldstein" <amir73il@gmail.com>,
"Tejun Heo" <tj@kernel.org>,
"Johannes Weiner" <hannes@cmpxchg.org>,
"Thomas Gleixner" <tglx@linutronix.de>,
"Alexander Viro" <viro@zeniv.linux.org.uk>,
"Jan Kara" <jack@suse.cz>,
linux-kernel@vger.kernel.org, cgroups@vger.kernel.org,
bpf@vger.kernel.org, "Eric Dumazet" <edumazet@google.com>,
"Jakub Kicinski" <kuba@kernel.org>,
netdev@vger.kernel.org, "Arnd Bergmann" <arnd@arndb.de>,
"Christian Brauner" <brauner@kernel.org>
Subject: [PATCH v4 13/72] nstree: introduce a unified tree
Date: Wed, 29 Oct 2025 13:20:26 +0100 [thread overview]
Message-ID: <20251029-work-namespace-nstree-listns-v4-13-2e6f823ebdc0@kernel.org> (raw)
In-Reply-To: <20251029-work-namespace-nstree-listns-v4-0-2e6f823ebdc0@kernel.org>
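Add a single rbtree that contains all namespaces keyed by their ns_id,
next to the existing per-type trees, and protect all of them with one
global seqlock instead of one seqlock per type.
This will allow userspace to look up and stat a namespace simply by its
identifier without having to know what type of namespace it is.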
Signed-off-by: Christian Brauner <brauner@kernel.org>
---
include/linux/ns_common.h | 4 ++
kernel/nscommon.c | 1 +
kernel/nstree.c | 114 ++++++++++++++++++++++++++++++++++++----------
3 files changed, 95 insertions(+), 24 deletions(-)
diff --git a/include/linux/ns_common.h b/include/linux/ns_common.h
index adc3542042af..88f27b678b4e 100644
--- a/include/linux/ns_common.h
+++ b/include/linux/ns_common.h
@@ -109,6 +109,10 @@ struct ns_common {
union {
struct {
u64 ns_id;
+ struct /* global namespace rbtree and list */ {
+ struct rb_node ns_unified_tree_node;
+ struct list_head ns_unified_list_node;
+ };
struct /* per type rbtree and list */ {
struct rb_node ns_tree_node;
struct list_head ns_list_node;
diff --git a/kernel/nscommon.c b/kernel/nscommon.c
index 1935f640f05a..98a237be64bc 100644
--- a/kernel/nscommon.c
+++ b/kernel/nscommon.c
@@ -61,6 +61,7 @@ int __ns_common_init(struct ns_common *ns, u32 ns_type, const struct proc_ns_ope
ns->ns_id = 0;
ns->ns_type = ns_type;
RB_CLEAR_NODE(&ns->ns_tree_node);
+ RB_CLEAR_NODE(&ns->ns_unified_tree_node);
INIT_LIST_HEAD(&ns->ns_list_node);
#ifdef CONFIG_DEBUG_VFS
diff --git a/kernel/nstree.c b/kernel/nstree.c
index a231cd2e9368..dbe4fb18f021 100644
--- a/kernel/nstree.c
+++ b/kernel/nstree.c
@@ -4,75 +4,86 @@
#include <linux/proc_ns.h>
#include <linux/vfsdebug.h>
+__cacheline_aligned_in_smp DEFINE_SEQLOCK(ns_tree_lock);
+static struct rb_root ns_unified_tree = RB_ROOT; /* protected by ns_tree_lock */
+
/**
* struct ns_tree - Namespace tree
* @ns_tree: Rbtree of namespaces of a particular type
* @ns_list: Sequentially walkable list of all namespaces of this type
- * @ns_tree_lock: Seqlock to protect the tree and list
* @type: type of namespaces in this tree
*/
struct ns_tree {
- struct rb_root ns_tree;
- struct list_head ns_list;
- seqlock_t ns_tree_lock;
- int type;
+ struct rb_root ns_tree;
+ struct list_head ns_list;
+#ifdef CONFIG_DEBUG_VFS
+ int type;
+#endif
};
struct ns_tree mnt_ns_tree = {
.ns_tree = RB_ROOT,
.ns_list = LIST_HEAD_INIT(mnt_ns_tree.ns_list),
- .ns_tree_lock = __SEQLOCK_UNLOCKED(mnt_ns_tree.ns_tree_lock),
+#ifdef CONFIG_DEBUG_VFS
.type = CLONE_NEWNS,
+#endif
};
struct ns_tree net_ns_tree = {
.ns_tree = RB_ROOT,
.ns_list = LIST_HEAD_INIT(net_ns_tree.ns_list),
- .ns_tree_lock = __SEQLOCK_UNLOCKED(net_ns_tree.ns_tree_lock),
+#ifdef CONFIG_DEBUG_VFS
.type = CLONE_NEWNET,
+#endif
};
EXPORT_SYMBOL_GPL(net_ns_tree);
struct ns_tree uts_ns_tree = {
.ns_tree = RB_ROOT,
.ns_list = LIST_HEAD_INIT(uts_ns_tree.ns_list),
- .ns_tree_lock = __SEQLOCK_UNLOCKED(uts_ns_tree.ns_tree_lock),
+#ifdef CONFIG_DEBUG_VFS
.type = CLONE_NEWUTS,
+#endif
};
struct ns_tree user_ns_tree = {
.ns_tree = RB_ROOT,
.ns_list = LIST_HEAD_INIT(user_ns_tree.ns_list),
- .ns_tree_lock = __SEQLOCK_UNLOCKED(user_ns_tree.ns_tree_lock),
+#ifdef CONFIG_DEBUG_VFS
.type = CLONE_NEWUSER,
+#endif
};
struct ns_tree ipc_ns_tree = {
.ns_tree = RB_ROOT,
.ns_list = LIST_HEAD_INIT(ipc_ns_tree.ns_list),
- .ns_tree_lock = __SEQLOCK_UNLOCKED(ipc_ns_tree.ns_tree_lock),
+#ifdef CONFIG_DEBUG_VFS
.type = CLONE_NEWIPC,
+#endif
};
struct ns_tree pid_ns_tree = {
.ns_tree = RB_ROOT,
.ns_list = LIST_HEAD_INIT(pid_ns_tree.ns_list),
- .ns_tree_lock = __SEQLOCK_UNLOCKED(pid_ns_tree.ns_tree_lock),
+#ifdef CONFIG_DEBUG_VFS
.type = CLONE_NEWPID,
+#endif
};
struct ns_tree cgroup_ns_tree = {
.ns_tree = RB_ROOT,
.ns_list = LIST_HEAD_INIT(cgroup_ns_tree.ns_list),
- .ns_tree_lock = __SEQLOCK_UNLOCKED(cgroup_ns_tree.ns_tree_lock),
+#ifdef CONFIG_DEBUG_VFS
.type = CLONE_NEWCGROUP,
+#endif
};
struct ns_tree time_ns_tree = {
.ns_tree = RB_ROOT,
.ns_list = LIST_HEAD_INIT(time_ns_tree.ns_list),
- .ns_tree_lock = __SEQLOCK_UNLOCKED(time_ns_tree.ns_tree_lock),
+#ifdef CONFIG_DEBUG_VFS
.type = CLONE_NEWTIME,
+#endif
};
DEFINE_COOKIE(namespace_cookie);
@@ -84,6 +95,13 @@ static inline struct ns_common *node_to_ns(const struct rb_node *node)
return rb_entry(node, struct ns_common, ns_tree_node);
}
+static inline struct ns_common *node_to_ns_unified(const struct rb_node *node)
+{
+ if (!node)
+ return NULL;
+ return rb_entry(node, struct ns_common, ns_unified_tree_node);
+}
+
static inline int ns_cmp(struct rb_node *a, const struct rb_node *b)
{
struct ns_common *ns_a = node_to_ns(a);
@@ -98,15 +116,27 @@ static inline int ns_cmp(struct rb_node *a, const struct rb_node *b)
return 0;
}
+static inline int ns_cmp_unified(struct rb_node *a, const struct rb_node *b)
+{
+ struct ns_common *ns_a = node_to_ns_unified(a);
+ struct ns_common *ns_b = node_to_ns_unified(b);
+ u64 ns_id_a = ns_a->ns_id;
+ u64 ns_id_b = ns_b->ns_id;
+
+ if (ns_id_a < ns_id_b)
+ return -1;
+ if (ns_id_a > ns_id_b)
+ return 1;
+ return 0;
+}
+
void __ns_tree_add_raw(struct ns_common *ns, struct ns_tree *ns_tree)
{
struct rb_node *node, *prev;
VFS_WARN_ON_ONCE(!ns->ns_id);
- write_seqlock(&ns_tree->ns_tree_lock);
-
- VFS_WARN_ON_ONCE(ns->ns_type != ns_tree->type);
+ write_seqlock(&ns_tree_lock);
node = rb_find_add_rcu(&ns->ns_tree_node, &ns_tree->ns_tree, ns_cmp);
/*
@@ -119,7 +149,8 @@ void __ns_tree_add_raw(struct ns_common *ns, struct ns_tree *ns_tree)
else
list_add_rcu(&ns->ns_list_node, &node_to_ns(prev)->ns_list_node);
- write_sequnlock(&ns_tree->ns_tree_lock);
+ rb_find_add_rcu(&ns->ns_unified_tree_node, &ns_unified_tree, ns_cmp_unified);
+ write_sequnlock(&ns_tree_lock);
VFS_WARN_ON_ONCE(node);
@@ -138,11 +169,12 @@ void __ns_tree_remove(struct ns_common *ns, struct ns_tree *ns_tree)
VFS_WARN_ON_ONCE(list_empty(&ns->ns_list_node));
VFS_WARN_ON_ONCE(ns->ns_type != ns_tree->type);
- write_seqlock(&ns_tree->ns_tree_lock);
+ write_seqlock(&ns_tree_lock);
rb_erase(&ns->ns_tree_node, &ns_tree->ns_tree);
+ rb_erase(&ns->ns_unified_tree_node, &ns_unified_tree);
list_bidir_del_rcu(&ns->ns_list_node);
RB_CLEAR_NODE(&ns->ns_tree_node);
- write_sequnlock(&ns_tree->ns_tree_lock);
+ write_sequnlock(&ns_tree_lock);
}
EXPORT_SYMBOL_GPL(__ns_tree_remove);
@@ -158,6 +190,17 @@ static int ns_find(const void *key, const struct rb_node *node)
return 0;
}
+static int ns_find_unified(const void *key, const struct rb_node *node)
+{
+ const u64 ns_id = *(u64 *)key;
+ const struct ns_common *ns = node_to_ns_unified(node);
+
+ if (ns_id < ns->ns_id)
+ return -1;
+ if (ns_id > ns->ns_id)
+ return 1;
+ return 0;
+}
static struct ns_tree *ns_tree_from_type(int ns_type)
{
@@ -183,28 +226,51 @@ static struct ns_tree *ns_tree_from_type(int ns_type)
return NULL;
}
-struct ns_common *ns_tree_lookup_rcu(u64 ns_id, int ns_type)
+static struct ns_common *__ns_unified_tree_lookup_rcu(u64 ns_id)
{
- struct ns_tree *ns_tree;
struct rb_node *node;
unsigned int seq;
- RCU_LOCKDEP_WARN(!rcu_read_lock_held(), "suspicious ns_tree_lookup_rcu() usage");
+ do {
+ seq = read_seqbegin(&ns_tree_lock);
+ node = rb_find_rcu(&ns_id, &ns_unified_tree, ns_find_unified);
+ if (node)
+ break;
+ } while (read_seqretry(&ns_tree_lock, seq));
+
+ return node_to_ns_unified(node);
+}
+
+static struct ns_common *__ns_tree_lookup_rcu(u64 ns_id, int ns_type)
+{
+ struct ns_tree *ns_tree;
+ struct rb_node *node;
+ unsigned int seq;
ns_tree = ns_tree_from_type(ns_type);
if (!ns_tree)
return NULL;
do {
- seq = read_seqbegin(&ns_tree->ns_tree_lock);
+ seq = read_seqbegin(&ns_tree_lock);
node = rb_find_rcu(&ns_id, &ns_tree->ns_tree, ns_find);
if (node)
break;
- } while (read_seqretry(&ns_tree->ns_tree_lock, seq));
+ } while (read_seqretry(&ns_tree_lock, seq));
return node_to_ns(node);
}
+struct ns_common *ns_tree_lookup_rcu(u64 ns_id, int ns_type)
+{
+ RCU_LOCKDEP_WARN(!rcu_read_lock_held(), "suspicious ns_tree_lookup_rcu() usage");
+
+ if (ns_type)
+ return __ns_tree_lookup_rcu(ns_id, ns_type);
+
+ return __ns_unified_tree_lookup_rcu(ns_id);
+}
+
/**
* ns_tree_adjoined_rcu - find the next/previous namespace in the same
* tree
--
2.47.3
next prev parent reply other threads:[~2025-10-29 12:21 UTC|newest]
Thread overview: 78+ messages / expand[flat|nested] mbox.gz Atom feed top
2025-10-29 12:20 [PATCH v4 00/72] nstree: listns() Christian Brauner
2025-10-29 12:20 ` [PATCH v4 01/72] libfs: allow to specify s_d_flags Christian Brauner
2025-10-29 12:20 ` [PATCH v4 02/72] nsfs: use inode_just_drop() Christian Brauner
2025-10-29 12:20 ` [PATCH v4 03/72] nsfs: raise DCACHE_DONTCACHE explicitly Christian Brauner
2025-10-29 12:20 ` [PATCH v4 04/72] pidfs: " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 05/72] nsfs: raise SB_I_NODEV and SB_I_NOEXEC Christian Brauner
2025-10-29 12:20 ` [PATCH v4 06/72] cgroup: add cgroup namespace to tree after owner is set Christian Brauner
2025-10-29 12:20 ` [PATCH v4 07/72] nstree: simplify return Christian Brauner
2025-10-29 12:20 ` [PATCH v4 08/72] ns: initialize ns_list_node for initial namespaces Christian Brauner
2025-10-29 12:20 ` [PATCH v4 09/72] ns: add __ns_ref_read() Christian Brauner
2025-10-29 12:20 ` [PATCH v4 10/72] ns: rename to exit_nsproxy_namespaces() Christian Brauner
2025-10-29 12:20 ` [PATCH v4 11/72] ns: add active reference count Christian Brauner
2025-10-29 12:20 ` [PATCH v4 12/72] ns: use anonymous struct to group list member Christian Brauner
2025-10-29 12:20 ` Christian Brauner [this message]
2025-10-29 14:44 ` [PATCH v4 13/72] nstree: introduce a unified tree kernel test robot
2025-10-29 14:55 ` kernel test robot
2025-10-29 12:20 ` [PATCH v4 14/72] nstree: allow lookup solely based on inode Christian Brauner
2025-10-29 12:20 ` [PATCH v4 15/72] nstree: assign fixed ids to the initial namespaces Christian Brauner
2025-10-29 12:20 ` [PATCH v4 16/72] nstree: maintain list of owned namespaces Christian Brauner
2025-10-29 12:20 ` [PATCH v4 17/72] nstree: simplify rbtree comparison helpers Christian Brauner
2025-10-30 13:48 ` Jeff Layton
2025-10-29 12:20 ` [PATCH v4 18/72] nstree: add unified namespace list Christian Brauner
2025-11-01 19:20 ` Thomas Gleixner
2025-11-03 11:21 ` Christian Brauner
2025-10-29 12:20 ` [PATCH v4 19/72] nstree: add listns() Christian Brauner
2025-10-29 12:20 ` [PATCH v4 20/72] arch: hookup listns() system call Christian Brauner
2025-10-29 12:20 ` [PATCH v4 21/72] nsfs: update tools header Christian Brauner
2025-10-29 12:20 ` [PATCH v4 22/72] selftests/filesystems: remove CLONE_NEWPIDNS from setup_userns() helper Christian Brauner
2025-10-29 12:20 ` [PATCH v4 23/72] selftests/namespaces: first active reference count tests Christian Brauner
2025-10-29 12:20 ` [PATCH v4 24/72] selftests/namespaces: second " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 25/72] selftests/namespaces: third " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 26/72] selftests/namespaces: fourth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 27/72] selftests/namespaces: fifth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 28/72] selftests/namespaces: sixth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 29/72] selftests/namespaces: seventh " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 30/72] selftests/namespaces: eigth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 31/72] selftests/namespaces: ninth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 32/72] selftests/namespaces: tenth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 33/72] selftests/namespaces: eleventh " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 34/72] selftests/namespaces: twelth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 35/72] selftests/namespaces: thirteenth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 36/72] selftests/namespaces: fourteenth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 37/72] selftests/namespaces: fifteenth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 38/72] selftests/namespaces: add listns() wrapper Christian Brauner
2025-10-29 12:20 ` [PATCH v4 39/72] selftests/namespaces: first listns() test Christian Brauner
2025-10-29 12:20 ` [PATCH v4 40/72] selftests/namespaces: second " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 41/72] selftests/namespaces: third " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 42/72] selftests/namespaces: fourth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 43/72] selftests/namespaces: fifth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 44/72] selftests/namespaces: sixth " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 45/72] selftests/namespaces: seventh " Christian Brauner
2025-10-29 12:20 ` [PATCH v4 46/72] selftests/namespaces: eigth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 47/72] selftests/namespaces: ninth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 48/72] selftests/namespaces: first listns() permission test Christian Brauner
2025-10-29 12:21 ` [PATCH v4 49/72] selftests/namespaces: second " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 50/72] selftests/namespaces: third " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 51/72] selftests/namespaces: fourth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 52/72] selftests/namespaces: fifth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 53/72] selftests/namespaces: sixth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 54/72] selftests/namespaces: seventh " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 55/72] selftests/namespaces: first inactive namespace resurrection test Christian Brauner
2025-10-29 12:21 ` [PATCH v4 56/72] selftests/namespaces: second " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 57/72] selftests/namespaces: third " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 58/72] selftests/namespaces: fourth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 59/72] selftests/namespaces: fifth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 60/72] selftests/namespaces: sixth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 61/72] selftests/namespaces: seventh " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 62/72] selftests/namespaces: eigth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 63/72] selftests/namespaces: ninth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 64/72] selftests/namespaces: tenth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 65/72] selftests/namespaces: eleventh " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 66/72] selftests/namespaces: twelth " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 67/72] selftests/namespace: first threaded active reference count test Christian Brauner
2025-10-29 12:21 ` [PATCH v4 68/72] selftests/namespace: second " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 69/72] selftests/namespace: third " Christian Brauner
2025-10-29 12:21 ` [PATCH v4 70/72] selftests/namespace: commit_creds() active reference tests Christian Brauner
2025-10-29 12:21 ` [PATCH v4 71/72] selftests/namespace: add stress test Christian Brauner
2025-10-29 12:21 ` [PATCH v4 72/72] selftests/namespace: test listns() pagination Christian Brauner
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20251029-work-namespace-nstree-listns-v4-13-2e6f823ebdc0@kernel.org \
--to=brauner@kernel.org \
--cc=amir73il@gmail.com \
--cc=arnd@arndb.de \
--cc=bpf@vger.kernel.org \
--cc=cgroups@vger.kernel.org \
--cc=cyphar@cyphar.com \
--cc=daan.j.demeyer@gmail.com \
--cc=edumazet@google.com \
--cc=hannes@cmpxchg.org \
--cc=jack@suse.cz \
--cc=jannh@google.com \
--cc=jlayton@kernel.org \
--cc=josef@toxicpanda.com \
--cc=kuba@kernel.org \
--cc=linux-fsdevel@vger.kernel.org \
--cc=linux-kernel@vger.kernel.org \
--cc=me@yhndnzj.com \
--cc=mzxreary@0pointer.de \
--cc=netdev@vger.kernel.org \
--cc=tglx@linutronix.de \
--cc=tj@kernel.org \
--cc=viro@zeniv.linux.org.uk \
--cc=zbyszek@in.waw.pl \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).