[Devel] [PATCH] hook_ct: mount devtmpfs in CT

Andrew Vagin avagin at parallels.com
Wed Jan 22 23:07:10 PST 2014


On Wed, Jan 22, 2014 at 05:12:12PM -0800, Kir Kolyshkin wrote:
> On 01/22/2014 02:37 AM, Andrey Vagin wrote:
> >All modern distributions require devtmpfs in /dev. devtmpfs can't
> >be mounted from userns. This patch bind-mounts the host /dev.
> >It's secure, because permissions are handled according with uid and
> >gid maps for the user namespace.
> >
> >This patch removes old hacks about devices. They are not required any more.
> >
> >Signed-off-by: Andrey Vagin <avagin at openvz.org>
> 
> Applied, thanks. See a question below.
> 
> >---
> >  etc/dists/scripts/prestart.sh |  4 ---
> >  src/lib/hooks_ct.c            | 66 +++++++++++--------------------------------
> >  2 files changed, 16 insertions(+), 54 deletions(-)
> >
> >diff --git a/etc/dists/scripts/prestart.sh b/etc/dists/scripts/prestart.sh
> >index 5ab7895..8b2a0a3 100755
> >--- a/etc/dists/scripts/prestart.sh
> >+++ b/etc/dists/scripts/prestart.sh
> >@@ -41,10 +41,6 @@ fixup_udev()
> >  		fi
> >  		break
> >  	done
> >-
> >-	umount /dev/pts
> >-	umount /dev/shm
> >-	umount /dev -l
> >  }
> >  fixup_loginuid()
> >diff --git a/src/lib/hooks_ct.c b/src/lib/hooks_ct.c
> >index 2a0b54c..ab2f4fd 100644
> >--- a/src/lib/hooks_ct.c
> >+++ b/src/lib/hooks_ct.c
> >@@ -10,6 +10,7 @@
> >  #include <fcntl.h>
> >  #include <sched.h>
> >  #include <dirent.h>
> >+#include <sys/vfs.h>
> 
> What is the reason for this include?

It is a part of the previous version. Could you remove it from here?
Or I can send a patch.

> 
> >  #include "vzerror.h"
> >  #include "env.h"
> >@@ -108,7 +109,7 @@ int ct_chroot(const char *root)
> >  	 * Linux kernel commit 5ff9d8a6
> >  	 * "vfs: Lock in place mounts from more privileged users"
> >  	 */
> >-	if (mount(root, root, NULL, MS_BIND, NULL)) {
> >+	if (mount(root, root, NULL, MS_BIND | MS_REC, NULL)) {
> >  		logger(-1, errno, "Can't bind-mount root %s", root);
> >  		return ret;
> >  	}
> >@@ -269,51 +270,6 @@ out:
> >  	return ret;
> >  }
> >-/*
> >- * Those devices should exist in the container, and be valid device nodes with
> >- * user access permission. But we need to be absolutely sure this is the case,
> >- * so we will provide our own versions. That could actually happen since some
> >- * distributions may come with emptied /dev's, waiting for udev to populate them.
> >- * That won't happen, we do it ourselves.
> >- */
> >-static void create_devices(vps_handler *h, envid_t veid, const char *root)
> >-{
> >-	unsigned int i;
> >-	char *devices[] = {
> >-		"/dev/null",
> >-		"/dev/zero",
> >-		"/dev/random",
> >-		"/dev/urandom",
> >-	};
> >-
> >-	/*
> >-	 * We will tolerate errors, and keep the container running, because it is
> >-	 * likely we will be able to boot it to a barely functional state. But
> >-	 * be vocal about it
> >-	 */
> >-	for (i = 0; i < ARRAY_SIZE(devices); i++) {
> >-		char ct_devname[STR_SIZE];
> >-		int ret;
> >-
> >-		snprintf(ct_devname, sizeof(ct_devname), "%s%s", root, devices[i]);
> >-
> >-		/*
> >-		 * No need to be crazy about file flags. When we bind mount, the
> >-		 * source permissions will be inherited.
> >-		 */
> >-		ret = open(ct_devname, O_RDWR|O_CREAT, 0);
> >-		if (ret < 0) {
> >-			logger(-1, errno, "Could not touch device %s", devices[i]);
> >-			continue;
> >-		}
> >-		close(ret);
> >-
> >-		ret = mount(devices[i], ct_devname, "", MS_BIND, 0);
> >-		if (ret < 0)
> >-			logger(-1, errno, "Could not bind mount device %s", devices[i]);
> >-	}
> >-}
> >-
> >  static int _env_create(void *data)
> >  {
> >  	struct arg_start *arg = data;
> >@@ -338,10 +294,6 @@ static int _env_create(void *data)
> >  	if (arg->userns_p != -1)
> >  		close(arg->userns_p);
> >-	if (arg->h->can_join_userns) {
> >-		create_devices(arg->h, arg->veid, arg->res->fs.root);
> >-	}
> >-
> >  	ret = ct_chroot(arg->res->fs.root);
> >  	/* Probably means chroot failed */
> >  	if (ret)
> >@@ -400,11 +352,25 @@ static int ct_env_create_real(struct arg_start *arg)
> >  		userns_p[0] = userns_p[1] = -1;
> >  	} else {
> >+		char devpath[PATH_MAX];
> >+
> >  		clone_flags |= CLONE_NEWUSER;
> >  		if (pipe(userns_p) < 0) {
> >  			logger(-1, errno, "Can not create userns pipe");
> >  			return VZ_RESOURCE_ERROR;
> >  		}
> >+
> >+		/* Unshare mntns to not affect the host system */
> >+		if (unshare(CLONE_NEWNS)) {
> >+			logger(-1, errno, "Can not unshare mount namespace");
> >+			return VZ_RESOURCE_ERROR;
> >+		}
> >+
> >+		snprintf(devpath, sizeof(devpath), "%s/dev", arg->res->fs.root);
> >+		if (mount("dev", devpath, "devtmpfs", 0, NULL)) {
> >+			logger(-1, errno, "Can not mount devtmpfs");
> >+			return VZ_RESOURCE_ERROR;
> >+		}
> >  	}
> >  	arg->userns_p = userns_p[0];
> 



More information about the Devel mailing list