Aleksa Sarai writes: > > Felix reported weird behaviour on 4.16.0-rc6 with regards to mqueue[1], > which was introduced by 36735a6a2b5e ("mqueue: switch to on-demand > creation of internal mount"). > > Basically, the reproducer boils down to being able to mount mqueue if > you create a new user namespace, even if you don't unshare the IPC > namespace. > > Previously this was not possible, and you would get an -EPERM. The mount > is the *host* mqueue mount, which is being cached and just returned from > mqueue_mount(). To be honest, I'm not sure if this is safe or not (or if > it was intentional -- since I'm not familiar with mqueue). > > To me it looks like there is a missing permission check. I've included a > patch below that I've compile-tested, and should block the above case. > Can someone please tell me if I'm missing something? Is this actually > safe? > > > [1]: https://github.com/docker/docker/issues/36674 After examination of the code it might be safe by chance but it is definitely wrong. The missing permission checks are needed in the general case, and sb->s_user_ns needs to be set to ns->user_ns to give root in the user namespace the appropriate permissions over the filesystem. Fixes: 36735a6a2b5e ("mqueue: switch to on-demand creation of internal mount") Reported-by: Felix Abecassis <fabecassis@xxxxxxxxxx> Reported-by: Aleksa Sarai <asarai@xxxxxxx> Signed-off-by: "Eric W. Biederman" <ebiederm@xxxxxxxxxxxx> --- Unless there are objections I will push these fixes to Linus in a day or so. ipc/mqueue.c | 21 +++++++-------------- 1 file changed, 7 insertions(+), 14 deletions(-) diff --git a/ipc/mqueue.c b/ipc/mqueue.c index d7f309f74dec..832c1ec21318 100644 --- a/ipc/mqueue.c +++ b/ipc/mqueue.c @@ -325,9 +325,8 @@ static struct inode *mqueue_get_inode(struct super_block *sb, static int mqueue_fill_super(struct super_block *sb, void *data, int silent) { struct inode *inode; - struct ipc_namespace *ns = data; + struct ipc_namespace *ns = sb->s_fs_info; - sb->s_fs_info = ns; sb->s_iflags |= SB_I_NOEXEC | SB_I_NODEV; sb->s_blocksize = PAGE_SIZE; sb->s_blocksize_bits = PAGE_SHIFT; @@ -349,9 +348,9 @@ static struct file_system_type mqueue_fs_type; * Return value is pinned only by reference in ->mq_mnt; it will * live until ipcns dies. Caller does not need to drop it. */ -static struct vfsmount *mq_internal_mount(void) +static struct vfsmount *mq_internal_mount(void *nsp) { - struct ipc_namespace *ns = current->nsproxy->ipc_ns; + struct ipc_namespace *ns = nsp; struct vfsmount *m = ns->mq_mnt; if (m) return m; @@ -373,15 +372,9 @@ static struct dentry *mqueue_mount(struct file_system_type *fs_type, int flags, const char *dev_name, void *data) { - struct vfsmount *m; - if (flags & SB_KERNMOUNT) - return mount_nodev(fs_type, flags, data, mqueue_fill_super); - m = mq_internal_mount(); - if (IS_ERR(m)) - return ERR_CAST(m); - atomic_inc(&m->mnt_sb->s_active); - down_write(&m->mnt_sb->s_umount); - return dget(m->mnt_root); + struct ipc_namespace *ns = current->nsproxy->ipc_ns; + return mount_ns(fs_type, flags, data, ns, ns->user_ns, + mq_internal_mount, mqueue_fill_super); } static void init_once(void *foo) @@ -771,7 +764,7 @@ static int prepare_open(struct dentry *dentry, int oflag, int ro, static int do_mq_open(const char __user *u_name, int oflag, umode_t mode, struct mq_attr *attr) { - struct vfsmount *mnt = mq_internal_mount(); + struct vfsmount *mnt = mq_internal_mount(current->nsproxy->ipc_ns); struct dentry *root; struct filename *name; struct path path; -- 2.14.1 _______________________________________________ Containers mailing list Containers@xxxxxxxxxxxxxxxxxxxxxxxxxx https://lists.linuxfoundation.org/mailman/listinfo/containers