[Devel] Re: [PATCH] user-cr: eclone x86-64 wrapper
Oren Laadan
orenl at cs.columbia.edu
Sun Dec 6 12:35:36 PST 2009
To test this, you need to update the kernel headers for user-cr
$ scripts/extract_headers -s PATH_TO_CR_KERNEL
Oren.
Oren Laadan wrote:
> Signed-off-by: Oren Laadan <orenl at cs.columbia.edu>
> ---
> clone_x86_64.c | 88 ++++++++++++++++++++++++++++++++++++++++++++++++++++++++
> 1 files changed, 88 insertions(+), 0 deletions(-)
> create mode 100644 clone_x86_64.c
>
> diff --git a/clone_x86_64.c b/clone_x86_64.c
> new file mode 100644
> index 0000000..d6d7e6f
> --- /dev/null
> +++ b/clone_x86_64.c
> @@ -0,0 +1,88 @@
> +/*
> + * clone_x86_64.c: support for eclone() on x86_64
> + *
> + * Copyright (C) Oren Laadan <orenl at cs.columbia.edu>
> + * Copyright (C) Dave Hansen <daveh at linux.vnet.ibm.com>
> + *
> + * This file is subject to the terms and conditions of the GNU General Public
> + * License. See the file COPYING in the main directory of the Linux
> + * distribution for more details.
> + */
> +
> +#define _GNU_SOURCE
> +
> +#include <unistd.h>
> +#include <errno.h>
> +#include <sys/types.h>
> +#include <sys/syscall.h>
> +#include <asm/unistd.h>
> +
> +/*
> + * libc doesn't support eclone() yet...
> + * below is arch-dependent code to use the syscall
> + */
> +#include <linux/checkpoint.h>
> +
> +#include "eclone.h"
> +
> +#ifndef __NR_eclone
> +#define __NR_eclone 299
> +#endif
> +
> +int eclone(int (*fn)(void *), void *fn_arg, int clone_flags_low,
> + struct clone_args *clone_args, pid_t *pids)
> +{
> + struct clone_args my_args;
> + long retval;
> + void **newstack;
> +
> + if (clone_args->child_stack) {
> + /*
> + * Set up the stack for child:
> + * - fn_arg will be the argument for the child function
> + * - the fn pointer will be loaded into ebx after the clone
> + */
> + newstack = (void **)(unsigned long)(clone_args->child_stack +
> + clone_args->child_stack_size);
> + *--newstack = fn_arg;
> + *--newstack = fn;
> + } else
> + newstack = (void **)0;
> +
> + my_args = *clone_args;
> + my_args.child_stack = (unsigned long)newstack;
> + my_args.child_stack_size = 0;
> +
> + __asm__ __volatile__(
> + "movq %6, %%r10\n\t" /* pids in r10*/
> + "syscall\n\t" /* Linux/x86_64 system call */
> + "testq %0,%0\n\t" /* check return value */
> + "jne 1f\n\t" /* jump if parent */
> + "popq %%rax\n\t" /* get subthread function */
> + "popq %%rdi\n\t" /* get the subthread function arg */
> + "call *%%rax\n\t" /* start subthread function */
> + "movq %2,%0\n\t"
> + "syscall\n" /* exit system call: exit subthread */
> + "1:\n\t"
> + :"=a" (retval)
> + :"0" (__NR_eclone), "i" (__NR_exit),
> + "D" (clone_flags_low), /* rdi */
> + "S" (&my_args), /* rsi */
> + "d" (sizeof(my_args)), /* rdx */
> + "m" (pids) /* gets moved to r10 */
> + :"rcx", "r10", "r11", "cc"
> + );
> + /*
> + * glibc lists 'cc' as clobbered, so we might as
> + * well do it too. 'r11' and 'rcx' are clobbered
> + * by the 'syscall' instruction itself. 'r8' and
> + * 'r9' are clobbered by the clone, but that
> + * thread will exit before getting back out to C.
> + */
> +
> + if (retval < 0) {
> + errno = -retval;
> + retval = -1;
> + }
> + return retval;
> +}
_______________________________________________
Containers mailing list
Containers at lists.linux-foundation.org
https://lists.linux-foundation.org/mailman/listinfo/containers
More information about the Devel
mailing list