In rare cases a directory can be renamed out from under a bind mount. In those cases without special handling it becomes possible to walk up the directory tree to the root dentry of the filesystem and down from the root dentry to every other file or directory on the filesystem. Like division by zero .. from an unconnected path can not be given a useful semantic as there is no predicting at which path component the code will realize it is unconnected. We certainly can not match the current behavior as the current behavior is a security hole. Therefore when encounting .. when following an unconnected path return -ENOENT. - Add a function path_connected to verify nd->path.dentry is reachable from nd->path.mnt.mnt_root. AKA to validate that rename did not do something nasty to the bind mount. To avoid races path_connected must be called after following a path component to it's next path component. Signed-off-by: "Eric W. Biederman" <ebiederm@xxxxxxxxxxxx> --- fs/namei.c | 35 ++++++++++++++++++++++++++++++++--- 1 file changed, 32 insertions(+), 3 deletions(-) diff --git a/fs/namei.c b/fs/namei.c index ae4e4c18b2ac..bccd3810ff60 100644 --- a/fs/namei.c +++ b/fs/namei.c @@ -560,6 +560,27 @@ static int __nd_alloc_stack(struct nameidata *nd) return 0; } +/** + * path_connected - Verify that a nd->path.dentry is below nd->path.mnt->mnt.mnt_root + * @nd: nameidate to verify + * + * Rename can sometimes move a file or directory outside of a bind + * mount, path_connected allows those cases to be detected. + */ +static bool path_connected(struct nameidata *nd) +{ + struct vfsmount *mnt = nd->path.mnt; + unsigned escape_count = read_mnt_escape_count(mnt); + + if (likely(escape_count == 0)) + return true; + + if (!is_subdir(nd->path.dentry, mnt->mnt_root)) + return false; + + return true; +} + static inline int nd_alloc_stack(struct nameidata *nd) { if (likely(nd->depth != EMBEDDED_LEVELS)) @@ -1294,6 +1315,8 @@ static int follow_dotdot_rcu(struct nameidata *nd) seq = read_seqcount_begin(&parent->d_seq); if (unlikely(read_seqcount_retry(&old->d_seq, nd->seq))) return -ECHILD; + if (unlikely(!path_connected(nd))) + return -ENOENT; nd->path.dentry = parent; nd->seq = seq; break; @@ -1396,7 +1419,7 @@ static void follow_mount(struct path *path) } } -static void follow_dotdot(struct nameidata *nd) +static int follow_dotdot(struct nameidata *nd) { if (!nd->root.mnt) set_root(nd); @@ -1410,7 +1433,12 @@ static void follow_dotdot(struct nameidata *nd) } if (nd->path.dentry != nd->path.mnt->mnt_root) { /* rare case of legitimate dget_parent()... */ - nd->path.dentry = dget_parent(nd->path.dentry); + struct dentry *parent = dget_parent(nd->path.dentry); + if (unlikely(!path_connected(nd))) { + dput(parent); + return -ENOENT; + } + nd->path.dentry = parent; dput(old); break; } @@ -1419,6 +1447,7 @@ static void follow_dotdot(struct nameidata *nd) } follow_mount(&nd->path); nd->inode = nd->path.dentry->d_inode; + return 0; } /* @@ -1634,7 +1663,7 @@ static inline int handle_dots(struct nameidata *nd, int type) if (nd->flags & LOOKUP_RCU) { return follow_dotdot_rcu(nd); } else - follow_dotdot(nd); + return follow_dotdot(nd); } return 0; } -- 2.2.1 -- To unsubscribe from this list: send the line "unsubscribe linux-fsdevel" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html