[CRIU] [PATCH] [POC] zdtm: check lazy-pages
Adrian Reber
areber at redhat.com
Wed Jun 15 06:30:55 PDT 2016
On Wed, Jun 15, 2016 at 03:47:21AM +0300, Andrey Vagin wrote:
> From: Andrew Vagin <avagin at virtuozzo.com>
>
> [root at fc22-vm criu]# python test/zdtm.py run -t zdtm/static/unlink_fstat04 --lazy-pages
> === Run 1/1 ================
>
> ===================== Run zdtm/static/unlink_fstat04 in h ======================
> Makefile:299: target 'mnt_enablefs.pid' given more than once in the same rule
> Start test
> Test is SUID
> Makefile:299: target 'mnt_enablefs.pid' given more than once in the same rule
> ./unlink_fstat04 --pidfile=unlink_fstat04.pid --outfile=unlink_fstat04.out --dirname=unlink_fstat04.test
> Run criu dump
> Run criu lazy-pages
> Run criu restore
> Wait for zdtm/static/unlink_fstat04 to die for 0.100000
> Removing dump/zdtm/static/unlink_fstat04/24
> ===================== Test zdtm/static/unlink_fstat04 PASS =====================
>
> ===================== Run zdtm/static/unlink_fstat04 in ns =====================
> Makefile:299: target 'mnt_enablefs.pid' given more than once in the same rule
> Start test
> Test is SUID
> Makefile:299: target 'mnt_enablefs.pid' given more than once in the same rule
> ./unlink_fstat04 --pidfile=unlink_fstat04.pid --outfile=unlink_fstat04.out --dirname=unlink_fstat04.test
> Run criu dump
> Run criu lazy-pages
> Run criu restore
> =[log]=> dump/zdtm/static/unlink_fstat04/54/1/restore.log
> ------------------------ grep Error ------------------------
> (00.183478) 1: Error (uffd.c:142): lazy-pages: connect to userfault.socket failed: No such file or directory
> (00.183623) 4: Error (uffd.c:142): lazy-pages: connect to userfault.socket failed: No such file or directory
> (00.191785) Error (cr-restore.c:992): 77 killed by signal 9: Killed
> (00.191807) Error (cr-restore.c:1877): Restoring FAILED.
> ------------------------ ERROR OVER ------------------------
Thanks, Andrew. Writing tests sounds like a good idea. Looking at the
output, I am not entirely sure what the second message means. Does it
mean that restoring in a namespace didn't work? Before running the tests
with lazy-pages, we would also need to make sure the kernel supports it.
Adrian
> Cc: Adrian Reber <areber at redhat.com>
> Cc: Mike Rapoport <rppt at linux.vnet.ibm.com>
> Signed-off-by: Andrew Vagin <avagin at virtuozzo.com>
> ---
> test/zdtm.py | 19 ++++++++++++++++++-
> 1 file changed, 18 insertions(+), 1 deletion(-)
>
> diff --git a/test/zdtm.py b/test/zdtm.py
> index d24429a..98345a4 100755
> --- a/test/zdtm.py
> +++ b/test/zdtm.py
> @@ -645,6 +645,7 @@ class criu_cli:
> self.__iter = 0
> self.__prev_dump_iter = None
> self.__page_server = (opts['page_server'] and True or False)
> + self.__lazy_pages = (opts['lazy_pages'] and True or False)
> self.__restore_sibling = (opts['sibling'] and True or False)
> self.__join_ns = (opts['join_ns'] and True or False)
> self.__unshare = (opts['unshare'] and True or False)
> @@ -687,6 +688,8 @@ class criu_cli:
> print "Forcing %s fault" % fault
> env = dict(os.environ, CRIU_FAULT = fault)
> cr = subprocess.Popen(strace + [criu_bin, action] + args, env = env, preexec_fn = preexec)
> + if action == "lazy-pages":
> + return cr
> return cr.wait()
>
> def set_user_id(self):
> @@ -721,6 +724,8 @@ class criu_cli:
> __ddir = self.__ddir()
>
> ret = self.__criu(action, s_args, self.__fault, strace, preexec)
> + if action == "lazy-pages":
> + return ret
> grep_errors(os.path.join(__ddir, log))
> if ret != 0:
> if self.__fault and int(self.__fault) < 128:
> @@ -801,8 +806,19 @@ class criu_cli:
> if os.getenv("GCOV"):
> r_opts.append("--ext-mount-map")
> r_opts.append("zdtm:%s" % criu_dir)
> +
> + lazy_pages_p = None
> + if self.__lazy_pages:
> + addr = "userfault.socket"
> + self.lazy_pages_p = self.__criu_act("lazy-pages", opts = ["--address", addr])
> + r_opts += ["--lazy-pages", "--address", addr]
> + time.sleep(1) # FIXME wait user fault fd socket
> +
> self.__criu_act("restore", opts = r_opts + ["--restore-detached"])
>
> + if lazy_pages_p and lazy_pages_p.wait():
> + raise test_fail_exc("CRIU lazy-pages")
> +
> @staticmethod
> def check(feature):
> return criu_cli.__criu("check", ["-v0", "--feature", feature]) == 0
> @@ -1146,7 +1162,7 @@ class launcher:
>
> nd = ('nocr', 'norst', 'pre', 'iters', 'page_server', 'sibling', 'unshare',
> 'fault', 'keep_img', 'report', 'snaps', 'sat', 'script',
> - 'join_ns', 'dedup', 'sbs', 'freezecg', 'user', 'dry_run', 'noauto_dedup')
> + 'join_ns', 'dedup', 'sbs', 'freezecg', 'user', 'dry_run', 'noauto_dedup', 'lazy_pages')
> arg = repr((name, desc, flavor, {d: self.__opts[d] for d in nd}))
>
> if self.__use_log:
> @@ -1603,6 +1619,7 @@ rp.add_argument("-k", "--keep-img", help = "Whether or not to keep images after
> choices = ['always', 'never', 'failed'], default = 'failed')
> rp.add_argument("--report", help = "Generate summary report in directory")
> rp.add_argument("--keep-going", help = "Keep running tests in spite of failures", action = 'store_true')
> +rp.add_argument("--lazy-pages", help = "restore pages on demand", action = 'store_true')
>
> lp = sp.add_parser("list", help = "List tests")
> lp.set_defaults(action = list_tests)
> --
> 2.7.4
>
More information about the CRIU
mailing list