[CRIU] [PATCH 5/6] mnt: try to split a mount tree to restore over-mounted mounts
Pavel Emelyanov
xemul at virtuozzo.com
Wed Sep 21 00:37:10 PDT 2016
On 09/13/2016 07:19 AM, Andrei Vagin wrote:
> From: Andrei Vagin <avagin at virtuozzo.com>
>
> If a mount overmounts something else, we can try to restore it
> separately and then move it to the right places after restoring
> all mounts.
Hm... Why not simply tune can_mount_new() to refuse mounting the
top-mounts until their sub-mounts are mounted?
> In this patch if we see that a mount overmounts something,
> we create a new directory in the root yard and restore this
> mount and its sub-tree in this directory.
>
> https://bugs.openvz.org/browse/OVZ-6778
> Signed-off-by: Andrei Vagin <avagin at virtuozzo.com>
> ---
> criu/include/mount.h | 1 +
> criu/mount.c | 160 +++++++++++++++++++++++++++++++++++++++++++++++++--
> 2 files changed, 157 insertions(+), 4 deletions(-)
>
> diff --git a/criu/include/mount.h b/criu/include/mount.h
> index a266cd0..d9b1521 100644
> --- a/criu/include/mount.h
> +++ b/criu/include/mount.h
> @@ -65,6 +65,7 @@ struct mount_info {
> bool need_plugin;
> bool is_ns_root;
> bool deleted;
> + bool remap;
Unused.
> struct mount_info *next;
> struct ns_id *nsid;
>
> diff --git a/criu/mount.c b/criu/mount.c
> index e568249..6d61219 100644
> --- a/criu/mount.c
> +++ b/criu/mount.c
> @@ -2718,7 +2718,146 @@ static int do_umount_one(struct mount_info *mi)
> return 0;
> }
>
> -static int cr_pivot_root(char *root)
> +static struct mount_info *roots_mp = NULL;
This thing was moved from populate_mnt_ns(). This name is OK for the
on-stack variable, but for the file-wide one it's no longer nice.
> +
> +static inline int print_ns_root(struct ns_id *ns, int remap_id, char *buf, int bs);
> +static int get_mp_mountpoint(char *mountpoint, struct mount_info *mi, char *root, int root_len);
> +
> +static LIST_HEAD(mnt_remap_list);
> +static int remap_id;
> +
> +struct mnt_remap_entry {
> + struct mount_info *parent, *child;
> + struct list_head node;
Please, document the parent and child fields of this struct.
> +};
> +
> +/*
> + * If a mount overmounts other mounts, it is restored
> + * separetly and then moved to the right place.
> + * All these mounts are moved into the root yard.
> + */
> +static int do_mnt_remap(struct mount_info *m)
> +{
> + int len;
> +
> + if (m->nsid->type == NS_OTHER) {
> + /* A path in root_yard has a fixed size, so it can be replaced. */
> + len = print_ns_root(m->nsid, remap_id, m->mountpoint, PATH_MAX);
> + m->mountpoint[len] = '/';
> + } else {
Else what? type == NS_ROOT? And why are root's mounts __that__ special?
> + char root[PATH_MAX], *mp, *ns_mp;
> + int len, ret;
> +
> + /* Add a root_yard path */
Please, write a MORE descriptive comment showing what is changed into what.
> + mp = m->mountpoint;
> + ns_mp = m->ns_mountpoint;
> +
> + len = print_ns_root(m->nsid, remap_id, root, PATH_MAX);
> +
> + ret = get_mp_mountpoint(ns_mp, m, root, len);
> + if (ret < 0)
> + return ret;
> + xfree(mp);
> + }
> + return 0;
> +}
> +
> +static int remap_mnt(struct mount_info *m)
> +{
> + struct mnt_remap_entry *r;
> +
> + if (!does_mnt_overmount(m))
> + return 0;
> +
> + BUG_ON(!m->parent || !list_empty(&m->parent->mnt_share));
> +
> + r = xmalloc(sizeof(struct mnt_remap_entry));
> + if (!r)
> + return -1;
> +
> + r->child = m;
> + list_add(&r->node, &mnt_remap_list);
> +
> + return 0;
> +}
> +
> +static int handle_overmounts(struct mount_info *root)
> +{
> + struct mnt_remap_entry *r;
> + struct mount_info *m;
> +
> + /*
> + * Mark mounts which have to be restored separetly,
> + * because it's imposiable to remove them from
> + * a tree without interrupting enumeration.
> + */
> + if (mnt_tree_for_each(root, remap_mnt))
> + return -1;
> +
> + /* Move remapped mounts to root_yard */
> + list_for_each_entry(r, &mnt_remap_list, node) {
> + m = r->child;
> + r->parent = m->parent;
> + m->parent = roots_mp;
> + list_del(&m->siblings);
> + list_add(&m->siblings, &roots_mp->children);
list_move()?
Why not do all of the above in remap_mnt()?
> +
> + remap_id++;
> + mnt_tree_for_each(m, do_mnt_remap);
> + pr_debug("Restore the %d mount in %s\n", m->mnt_id, m->mountpoint);
> + }
> +
> + return 0;
> +}
> +
> +/* Move remapped mounts to places where they have to be */
> +static int handle_mnt_remaps(int nsid, char *put_root)
Two handle_ routines in one patch :) Too generic names, can we come up with better ones?
> +{
> + struct mnt_remap_entry *r;
> + int cwd, exit_code = -1;
> +
> + cwd = open(".", O_PATH);
> + if (cwd < 0) {
> + pr_perror("Unable to open \".\"\n");
> + return -1;
> + }
> +
> + if (nsid != root_item->ids->mnt_ns_id && chdir(put_root)) {
What for?
> + pr_perror("Unable to change working directory");
> + return -1;
> + }
> +
> + list_for_each_entry(r, &mnt_remap_list, node) {
> + struct mount_info *m = r->child;
> +
> + if (r->child->nsid->id != nsid)
> + continue;
Where's the guarantee that mnt_remap_list is empty at the end?
> +
> + pr_debug("Move mount %s -> %s\n", m->mountpoint, m->ns_mountpoint);
> + if (mount(m->mountpoint, m->ns_mountpoint, NULL, MS_MOVE, NULL)) {
> + pr_perror("Unable to move mount %s -> %s", m->mountpoint, m->ns_mountpoint);
> + goto err;
> + }
> +
> + list_del(&r->child->siblings);
> + list_add(&r->child->siblings, &r->parent->children);
> + r->child->parent = r->parent;
Worth having 'reparent_mount()' helper? The same code is in handle_overmounts().
> + }
> +
> + exit_code = 0;
> +err:
> + if (fchdir(cwd)) {
> + pr_perror("Unable to change working directory");
> + close(cwd);
> + return -1;
> + }
> + close(cwd);
> +
> + return exit_code;
> +}
> +
> +
> +static int cr_pivot_root(char *root, int nsid)
> {
> char tmp_dir_tmpl[] = "crtools-put-root.XXXXXX";
> bool tmp_dir = false;
> @@ -2759,6 +2898,9 @@ static int cr_pivot_root(char *root)
> goto err_tmpfs;
> }
>
> + if (nsid > 0 && handle_mnt_remaps(nsid, put_root))
> + return -1;
> +
> if (mount("none", put_root, "none", MS_REC|MS_SLAVE, NULL)) {
> pr_perror("Can't remount root with MS_PRIVATE");
> return -1;
> @@ -3196,6 +3338,7 @@ void fini_restore_mntns(void)
> */
> static int populate_roots_yard(void)
> {
> + struct mnt_remap_entry *r;
> char path[PATH_MAX];
> struct ns_id *nsid;
>
> @@ -3216,6 +3359,13 @@ static int populate_roots_yard(void)
> }
> }
>
> + list_for_each_entry(r, &mnt_remap_list, node) {
> + if (mkdirpat(AT_FDCWD, r->child->mountpoint)) {
You mkdir() with names from image for all the namespaces found. What if names conflict?
> + pr_perror("Unable to create %s", r->child->mountpoint);
> + return -1;
> + }
> + }
> +
> return 0;
> }
>
> @@ -3223,7 +3373,6 @@ static int populate_mnt_ns(void)
> {
> struct mount_info *pms;
> struct ns_id *nsid;
> - struct mount_info *roots_mp = NULL;
> int ret;
>
> if (mnt_roots) {
> @@ -3258,6 +3407,9 @@ static int populate_mnt_ns(void)
> if (validate_mounts(mntinfo, false))
> return -1;
>
> + if (handle_overmounts(pms))
> + return -1;
> +
> /*
> * Set properties for the root before mounting a root yard,
> * otherwise the root yard can be propagated into the host
> @@ -3462,7 +3614,7 @@ int prepare_mnt_ns(void)
>
> ret = populate_mnt_ns();
> if (!ret && opts.root)
> - ret = cr_pivot_root(NULL);
> + ret = cr_pivot_root(NULL, root_item->ids->mnt_ns_id);
> if (ret)
> return -1;
>
> @@ -3495,7 +3647,7 @@ int prepare_mnt_ns(void)
> /* Set its root */
> path[0] = '/';
> print_ns_root(nsid, 0, path + 1, sizeof(path) - 1);
> - if (cr_pivot_root(path))
> + if (cr_pivot_root(path, nsid->id))
> goto err;
>
> /* Pin one with a file descriptor */
>
More information about the CRIU
mailing list