[PATCH v2 05/11] powerpc64: Add the clone3 wrapper
Paul E Murphy
murphyp@linux.ibm.com
Mon Nov 28 16:38:22 GMT 2022
On 11/4/22 2:01 PM, Adhemerval Zanella via Libc-alpha wrote:
> It follows the internal signature:
>
> extern int clone3 (struct clone_args *__cl_args, size_t __size,
> int (*__func) (void *__arg), void *__arg);
>
> The powerpc64 ABI requires an initial stackframe so the child can
> store/restore the TOC. Iit is create prior calling clone3 by
trivial nit, s/Iit/It/.
> adjusting the stack size (since kernel will compute the stack as
> stack plus size).
>
> Checked on powerpc64-linux-gnu (power8, kernel 6.0) and
> powerpc64le-linux-gnu (power9, kernel 4.18).
> ---
> .../sysv/linux/powerpc/powerpc64/clone3.S | 152 ++++++++++++++++++
> sysdeps/unix/sysv/linux/powerpc/sysdep.h | 1 +
> 2 files changed, 153 insertions(+)
> create mode 100644 sysdeps/unix/sysv/linux/powerpc/powerpc64/clone3.S
>
> diff --git a/sysdeps/unix/sysv/linux/powerpc/powerpc64/clone3.S b/sysdeps/unix/sysv/linux/powerpc/powerpc64/clone3.S
> new file mode 100644
> index 0000000000..0fe2fe91db
> --- /dev/null
> +++ b/sysdeps/unix/sysv/linux/powerpc/powerpc64/clone3.S
> @@ -0,0 +1,152 @@
> +/* The clone3 syscall wrapper. Linux/powerpc64 version.
> + Copyright (C) 2022 Free Software Foundation, Inc.
> +
> + This file is part of the GNU C Library.
> +
> + The GNU C Library is free software; you can redistribute it and/or
> + modify it under the terms of the GNU Lesser General Public
> + License as published by the Free Software Foundation; either
> + version 2.1 of the License, or (at your option) any later version.
> +
> + The GNU C Library is distributed in the hope that it will be useful,
> + but WITHOUT ANY WARRANTY; without even the implied warranty of
> + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
> + Lesser General Public License for more details.
> +
> + You should have received a copy of the GNU Lesser General Public
> + License along with the GNU C Library; if not, see
> + <https://www.gnu.org/licenses/>. */
> +
> +#include <sysdep.h>
> +#define _ERRNO_H 1
> +#include <bits/errno.h>
> +
> +/* The userland implementation is:
> + int clone3 (struct clone_args *cl_args, size_t size,
> + int (*func)(void *arg), void *arg);
> +
> + the kernel entry is:
> + int clone3 (struct clone_args *cl_args, size_t size);
> +
> + The parameters are passed in registers from userland:
> + r3: cl_args
> + r4: size
> + r5: func
> + r6: arg */
> +
> + .text
> +ENTRY(__clone3)
> + CALL_MCOUNT 4
> +
> + /* Sanity checks args. */
> + cmpdi cr0, r3, 0
> + cmpdi cr1, r5, 0
> + cror cr0*4+eq, cr1*4+eq, cr0*4+eq
> + beq cr0,L(badargs)
> +
> + /* Save some regs in the "red zone". */
Is there a reason to avoid explicitly stacking a frame here? Also, does
the red zone exist on ELFv1?
> +#ifdef USE_PPC_SCV
> + std r28, -24(r1)
> + cfi_offset (r28, -24)
> +#endif
> + std r29, -16(r1)
> + std r30, -8(r1)
> + cfi_offset (r29, -16)
> + cfi_offset (r30, -8)
> +
> + /* Save fn and args across syscall. */
trivial nit, s/fn/func/ s/args/arg/.
> + mr r30, r5 /* Function in r30. */
> + mr r29, r6 /* Argument in r29. */
> +
> + /* End FDE now, because in the child the unwind info will be
> + wrong. */
> + cfi_endproc
> +
> + /* Setup a minimum stack fram for child. It needs to first calculate
s/fram/frame/.
> + the effective stack address, write the start NULL frame-pointer,
> + and update the frame size in the input cl_args. */
> + ld r7, 40(r3) /* Load stack value. */
> + ld r8, 48(r3) /* Load stack_size value. */
> + li r10, 0
> + add r7, r7, r8 /* Calculate effective stack address. */
> + std r10, -FRAME_MIN_SIZE_PARM(r7)
Is this clearing the back chain pointer? Maybe add a small comment here.
> + addi r8, r8, -FRAME_MIN_SIZE_PARM
> + std r8, 48(r3)
> +
> + /* Do the system call, the kernel expects:
> + r0: system call numer
> + r3: cl_args
> + r4: size */
> + li r0, SYS_ify(clone3)
> +#ifdef USE_PPC_SCV
> + CHECK_SCV_SUPPORT r28 0f
> + /* This is equivalent to DO_CALL_SCV, but we cannot use the macro here
> + because it uses CFI directives and we just called cfi_endproc. */
> + mflr r9
> + std r9, FRAME_LR_SAVE(r1)
> + .machine "push"
> + .machine "power9"
> + scv 0
> + .machine "pop"
> + ld r9, FRAME_LR_SAVE(r1)
> + mtlr r9
> +
> + /* When using scv, error is indicated by negative r3. */
With scv, an error is a value -4095 <= x < 0. This test should be
more specific.
> + cmpdi cr1, r3, 0
> + b 1f
> +#endif
> +0: DO_CALL_SC
> +
> + /* With sc, error is indicated by cr0.SO. */
> + cmpdi cr1, r3, 0
> + crandc cr1*4+eq, cr1*4+eq, cr0*4+so
> +
> +1: bne- cr1,L(parent)
> +
> + /* Child, load the function and arguments. */
> + std r2, FRAME_TOC_SAVE(r1)
> + PPC64_LOAD_FUNCPTR r30
> + mr r3, r29
> + bctrl
> + ld r2, FRAME_TOC_SAVE(r1)
> +
> + li r0, SYS_ify(exit)
> + DO_CALL_SC
Minor nit, this should also use scv if supported.
> + /* We won't ever get here but provide a nop so that the linker
> + will insert a toc adjusting stub if necessary. */
> + nop
> +
> +L(badargs):
> + cfi_startproc
> + li r3, EINVAL
> + TAIL_CALL_SYSCALL_ERROR
> +
> +L(parent):
> + /* Check if svc is available. */
s/svc/scv/.
> + cmpdi cr1, r28, 0
> +
> + /* Parent. Restore registers & return. */
> +#ifdef USE_PPC_SCV
> + cfi_offset (r28, -24)
> + ld r28, -24(r1)
> + cfi_restore (r28)
> +#endif
> + cfi_offset (r29,-16)
> + cfi_offset (r30,-8)
> + ld r29, -16(r1)
> + ld r30, -8(r1)
> + cfi_restore (r29)
> + cfi_restore (r30)
> +
> +#ifdef USE_PPC_SCV
> + beq cr1, 0f
> + RET_SCV
> + b 1f
> +#endif
> +0: RET_SC
> +1: TAIL_CALL_SYSCALL_ERROR
> +
> +PSEUDO_END (__clone3)
> +
> +libc_hidden_def (__clone3)
> +weak_alias (__clone3, clone3)
> diff --git a/sysdeps/unix/sysv/linux/powerpc/sysdep.h b/sysdeps/unix/sysv/linux/powerpc/sysdep.h
> index 9e44818978..af63b3974b 100644
> --- a/sysdeps/unix/sysv/linux/powerpc/sysdep.h
> +++ b/sysdeps/unix/sysv/linux/powerpc/sysdep.h
> @@ -214,6 +214,7 @@
> #if defined(__PPC64__) || defined(__powerpc64__)
> #define HAVE_CLOCK_GETRES64_VSYSCALL "__kernel_clock_getres"
> #define HAVE_CLOCK_GETTIME64_VSYSCALL "__kernel_clock_gettime"
> +#define HAVE_CLONE3_WRAPPER 1
> #else
> #define HAVE_CLOCK_GETRES_VSYSCALL "__kernel_clock_getres"
> #define HAVE_CLOCK_GETTIME_VSYSCALL "__kernel_clock_gettime"
More information about the Libc-alpha
mailing list