在2022年6月1日六月 上午10:59,Huacai Chen写道:
> Add system call support and related uaccess.h for LoongArch.
>
> Q: Why keep _ARCH_WANT_SYS_CLONE definition while there is clone3:
> A: The latest glibc release has some basic support for clone3 but it is
> not complete. E.g., pthread_create() and spawni() have converted to
> use clone3 but fork() will still use clone. Moreover, some seccomp
> related applications can still not work perfectly with clone3. E.g.,
> Chromium sandbox cannot work at all and there is no solution for it,
> which is more terrible than the fork() story [1].
>
> [1] https://chromium-review.googlesource.com/c/chromium/src/+/2936184
>
> Reviewed-by: WANG Xuerui <[email protected]>
> Signed-off-by: Huacai Chen <[email protected]>
Reviewed-by: Jiaxun Yang <[email protected]>
> ---
> arch/loongarch/include/asm/seccomp.h | 20 ++
> arch/loongarch/include/asm/syscall.h | 74 +++++++
> arch/loongarch/include/asm/uaccess.h | 269 +++++++++++++++++++++++
> arch/loongarch/include/asm/unistd.h | 11 +
> arch/loongarch/include/uapi/asm/unistd.h | 5 +
> arch/loongarch/kernel/entry.S | 89 ++++++++
> arch/loongarch/kernel/syscall.c | 63 ++++++
> 7 files changed, 531 insertions(+)
> create mode 100644 arch/loongarch/include/asm/seccomp.h
> create mode 100644 arch/loongarch/include/asm/syscall.h
> create mode 100644 arch/loongarch/include/asm/uaccess.h
> create mode 100644 arch/loongarch/include/asm/unistd.h
> create mode 100644 arch/loongarch/include/uapi/asm/unistd.h
> create mode 100644 arch/loongarch/kernel/entry.S
> create mode 100644 arch/loongarch/kernel/syscall.c
>
> diff --git a/arch/loongarch/include/asm/seccomp.h
> b/arch/loongarch/include/asm/seccomp.h
> new file mode 100644
> index 000000000000..31d6ab42e43e
> --- /dev/null
> +++ b/arch/loongarch/include/asm/seccomp.h
> @@ -0,0 +1,20 @@
> +/* SPDX-License-Identifier: GPL-2.0 */
> +
> +#ifndef _ASM_SECCOMP_H
> +#define _ASM_SECCOMP_H
> +
> +#include <asm/unistd.h>
> +
> +#include <asm-generic/seccomp.h>
> +
> +#ifdef CONFIG_32BIT
> +# define SECCOMP_ARCH_NATIVE AUDIT_ARCH_LOONGARCH32
> +# define SECCOMP_ARCH_NATIVE_NR NR_syscalls
> +# define SECCOMP_ARCH_NATIVE_NAME "loongarch32"
> +#else
> +# define SECCOMP_ARCH_NATIVE AUDIT_ARCH_LOONGARCH64
> +# define SECCOMP_ARCH_NATIVE_NR NR_syscalls
> +# define SECCOMP_ARCH_NATIVE_NAME "loongarch64"
> +#endif
> +
> +#endif /* _ASM_SECCOMP_H */
> diff --git a/arch/loongarch/include/asm/syscall.h
> b/arch/loongarch/include/asm/syscall.h
> new file mode 100644
> index 000000000000..e286dc58476e
> --- /dev/null
> +++ b/arch/loongarch/include/asm/syscall.h
> @@ -0,0 +1,74 @@
> +/* SPDX-License-Identifier: GPL-2.0+ */
> +/*
> + * Author: Hanlu Li <[email protected]>
> + * Huacai Chen <[email protected]>
> + *
> + * Copyright (C) 2020-2022 Loongson Technology Corporation Limited
> + */
> +
> +#ifndef __ASM_LOONGARCH_SYSCALL_H
> +#define __ASM_LOONGARCH_SYSCALL_H
> +
> +#include <linux/compiler.h>
> +#include <uapi/linux/audit.h>
> +#include <linux/elf-em.h>
> +#include <linux/kernel.h>
> +#include <linux/sched.h>
> +#include <linux/uaccess.h>
> +#include <asm/ptrace.h>
> +#include <asm/unistd.h>
> +
> +extern void *sys_call_table[];
> +
> +static inline long syscall_get_nr(struct task_struct *task,
> + struct pt_regs *regs)
> +{
> + return regs->regs[11];
> +}
> +
> +static inline void syscall_rollback(struct task_struct *task,
> + struct pt_regs *regs)
> +{
> + regs->regs[4] = regs->orig_a0;
> +}
> +
> +static inline long syscall_get_error(struct task_struct *task,
> + struct pt_regs *regs)
> +{
> + unsigned long error = regs->regs[4];
> +
> + return IS_ERR_VALUE(error) ? error : 0;
> +}
> +
> +static inline long syscall_get_return_value(struct task_struct *task,
> + struct pt_regs *regs)
> +{
> + return regs->regs[4];
> +}
> +
> +static inline void syscall_set_return_value(struct task_struct *task,
> + struct pt_regs *regs,
> + int error, long val)
> +{
> + regs->regs[4] = (long) error ? error : val;
> +}
> +
> +static inline void syscall_get_arguments(struct task_struct *task,
> + struct pt_regs *regs,
> + unsigned long *args)
> +{
> + args[0] = regs->orig_a0;
> + memcpy(&args[1], ®s->regs[5], 5 * sizeof(long));
> +}
> +
> +static inline int syscall_get_arch(struct task_struct *task)
> +{
> + return AUDIT_ARCH_LOONGARCH64;
> +}
> +
> +static inline bool arch_syscall_is_vdso_sigreturn(struct pt_regs *regs)
> +{
> + return false;
> +}
> +
> +#endif /* __ASM_LOONGARCH_SYSCALL_H */
> diff --git a/arch/loongarch/include/asm/uaccess.h
> b/arch/loongarch/include/asm/uaccess.h
> new file mode 100644
> index 000000000000..217c6a3727b1
> --- /dev/null
> +++ b/arch/loongarch/include/asm/uaccess.h
> @@ -0,0 +1,269 @@
> +/* SPDX-License-Identifier: GPL-2.0 */
> +/*
> + * Copyright (C) 2020-2022 Loongson Technology Corporation Limited
> + *
> + * Derived from MIPS:
> + * Copyright (C) 1996, 1997, 1998, 1999, 2000, 03, 04 by Ralf Baechle
> + * Copyright (C) 1999, 2000 Silicon Graphics, Inc.
> + * Copyright (C) 2007 Maciej W. Rozycki
> + * Copyright (C) 2014, Imagination Technologies Ltd.
> + */
> +#ifndef _ASM_UACCESS_H
> +#define _ASM_UACCESS_H
> +
> +#include <linux/kernel.h>
> +#include <linux/string.h>
> +#include <linux/extable.h>
> +#include <asm/pgtable.h>
> +#include <asm-generic/extable.h>
> +#include <asm-generic/access_ok.h>
> +
> +extern u64 __ua_limit;
> +
> +#define __UA_ADDR ".dword"
> +#define __UA_LA "la.abs"
> +#define __UA_LIMIT __ua_limit
> +
> +/*
> + * get_user: - Get a simple variable from user space.
> + * @x: Variable to store result.
> + * @ptr: Source address, in user space.
> + *
> + * Context: User context only. This function may sleep if pagefaults
> are
> + * enabled.
> + *
> + * This macro copies a single simple variable from user space to kernel
> + * space. It supports simple types like char and int, but not larger
> + * data types like structures or arrays.
> + *
> + * @ptr must have pointer-to-simple-variable type, and the result of
> + * dereferencing @ptr must be assignable to @x without a cast.
> + *
> + * Returns zero on success, or -EFAULT on error.
> + * On error, the variable @x is set to zero.
> + */
> +#define get_user(x, ptr) \
> +({ \
> + const __typeof__(*(ptr)) __user *__p = (ptr); \
> + \
> + might_fault(); \
> + access_ok(__p, sizeof(*__p)) ? __get_user((x), __p) : \
> + ((x) = 0, -EFAULT); \
> +})
> +
> +/*
> + * put_user: - Write a simple value into user space.
> + * @x: Value to copy to user space.
> + * @ptr: Destination address, in user space.
> + *
> + * Context: User context only. This function may sleep if pagefaults
> are
> + * enabled.
> + *
> + * This macro copies a single simple value from kernel space to user
> + * space. It supports simple types like char and int, but not larger
> + * data types like structures or arrays.
> + *
> + * @ptr must have pointer-to-simple-variable type, and @x must be
> assignable
> + * to the result of dereferencing @ptr.
> + *
> + * Returns zero on success, or -EFAULT on error.
> + */
> +#define put_user(x, ptr) \
> +({ \
> + __typeof__(*(ptr)) __user *__p = (ptr); \
> + \
> + might_fault(); \
> + access_ok(__p, sizeof(*__p)) ? __put_user((x), __p) : -EFAULT; \
> +})
> +
> +/*
> + * __get_user: - Get a simple variable from user space, with less
> checking.
> + * @x: Variable to store result.
> + * @ptr: Source address, in user space.
> + *
> + * Context: User context only. This function may sleep if pagefaults
> are
> + * enabled.
> + *
> + * This macro copies a single simple variable from user space to kernel
> + * space. It supports simple types like char and int, but not larger
> + * data types like structures or arrays.
> + *
> + * @ptr must have pointer-to-simple-variable type, and the result of
> + * dereferencing @ptr must be assignable to @x without a cast.
> + *
> + * Caller must check the pointer with access_ok() before calling this
> + * function.
> + *
> + * Returns zero on success, or -EFAULT on error.
> + * On error, the variable @x is set to zero.
> + */
> +#define __get_user(x, ptr) \
> +({ \
> + int __gu_err = 0; \
> + \
> + __chk_user_ptr(ptr); \
> + __get_user_common((x), sizeof(*(ptr)), ptr); \
> + __gu_err; \
> +})
> +
> +/*
> + * __put_user: - Write a simple value into user space, with less
> checking.
> + * @x: Value to copy to user space.
> + * @ptr: Destination address, in user space.
> + *
> + * Context: User context only. This function may sleep if pagefaults
> are
> + * enabled.
> + *
> + * This macro copies a single simple value from kernel space to user
> + * space. It supports simple types like char and int, but not larger
> + * data types like structures or arrays.
> + *
> + * @ptr must have pointer-to-simple-variable type, and @x must be
> assignable
> + * to the result of dereferencing @ptr.
> + *
> + * Caller must check the pointer with access_ok() before calling this
> + * function.
> + *
> + * Returns zero on success, or -EFAULT on error.
> + */
> +#define __put_user(x, ptr) \
> +({ \
> + int __pu_err = 0; \
> + __typeof__(*(ptr)) __pu_val; \
> + \
> + __pu_val = (x); \
> + __chk_user_ptr(ptr); \
> + __put_user_common(ptr, sizeof(*(ptr))); \
> + __pu_err; \
> +})
> +
> +struct __large_struct { unsigned long buf[100]; };
> +#define __m(x) (*(struct __large_struct __user *)(x))
> +
> +#define __get_user_common(val, size, ptr) \
> +do { \
> + switch (size) { \
> + case 1: __get_data_asm(val, "ld.b", ptr); break; \
> + case 2: __get_data_asm(val, "ld.h", ptr); break; \
> + case 4: __get_data_asm(val, "ld.w", ptr); break; \
> + case 8: __get_data_asm(val, "ld.d", ptr); break; \
> + default: BUILD_BUG(); break; \
> + } \
> +} while (0)
> +
> +#define __get_kernel_common(val, size, ptr) __get_user_common(val,
> size, ptr)
> +
> +#define __get_data_asm(val, insn, ptr) \
> +{ \
> + long __gu_tmp; \
> + \
> + __asm__ __volatile__( \
> + "1: " insn " %1, %2 \n" \
> + "2: \n" \
> + " .section .fixup,\"ax\" \n" \
> + "3: li.w %0, %3 \n" \
> + " or %1, $r0, $r0 \n" \
> + " b 2b \n" \
> + " .previous \n" \
> + " .section __ex_table,\"a\" \n" \
> + " "__UA_ADDR "\t1b, 3b \n" \
> + " .previous \n" \
> + : "+r" (__gu_err), "=r" (__gu_tmp) \
> + : "m" (__m(ptr)), "i" (-EFAULT)); \
> + \
> + (val) = (__typeof__(*(ptr))) __gu_tmp; \
> +}
> +
> +#define __put_user_common(ptr, size) \
> +do { \
> + switch (size) { \
> + case 1: __put_data_asm("st.b", ptr); break; \
> + case 2: __put_data_asm("st.h", ptr); break; \
> + case 4: __put_data_asm("st.w", ptr); break; \
> + case 8: __put_data_asm("st.d", ptr); break; \
> + default: BUILD_BUG(); break; \
> + } \
> +} while (0)
> +
> +#define __put_kernel_common(ptr, size) __put_user_common(ptr, size)
> +
> +#define __put_data_asm(insn, ptr) \
> +{ \
> + __asm__ __volatile__( \
> + "1: " insn " %z2, %1 # __put_user_asm\n" \
> + "2: \n" \
> + " .section .fixup,\"ax\" \n" \
> + "3: li.w %0, %3 \n" \
> + " b 2b \n" \
> + " .previous \n" \
> + " .section __ex_table,\"a\" \n" \
> + " " __UA_ADDR " 1b, 3b \n" \
> + " .previous \n" \
> + : "+r" (__pu_err), "=m" (__m(ptr)) \
> + : "Jr" (__pu_val), "i" (-EFAULT)); \
> +}
> +
> +#define __get_kernel_nofault(dst, src, type, err_label) \
> +do { \
> + int __gu_err = 0; \
> + \
> + __get_kernel_common(*((type *)(dst)), sizeof(type), \
> + (__force type *)(src)); \
> + if (unlikely(__gu_err)) \
> + goto err_label; \
> +} while (0)
> +
> +#define __put_kernel_nofault(dst, src, type, err_label) \
> +do { \
> + type __pu_val; \
> + int __pu_err = 0; \
> + \
> + __pu_val = *(__force type *)(src); \
> + __put_kernel_common(((type *)(dst)), sizeof(type)); \
> + if (unlikely(__pu_err)) \
> + goto err_label; \
> +} while (0)
> +
> +extern unsigned long __copy_user(void *to, const void *from,
> __kernel_size_t n);
> +
> +static inline unsigned long __must_check
> +raw_copy_from_user(void *to, const void __user *from, unsigned long n)
> +{
> + return __copy_user(to, from, n);
> +}
> +
> +static inline unsigned long __must_check
> +raw_copy_to_user(void __user *to, const void *from, unsigned long n)
> +{
> + return __copy_user(to, from, n);
> +}
> +
> +#define INLINE_COPY_FROM_USER
> +#define INLINE_COPY_TO_USER
> +
> +/*
> + * __clear_user: - Zero a block of memory in user space, with less
> checking.
> + * @addr: Destination address, in user space.
> + * @size: Number of bytes to zero.
> + *
> + * Zero a block of memory in user space. Caller must check
> + * the specified block with access_ok() before calling this function.
> + *
> + * Returns number of bytes that could not be cleared.
> + * On success, this will be zero.
> + */
> +extern unsigned long __clear_user(void __user *addr, __kernel_size_t
> size);
> +
> +#define clear_user(addr, n) \
> +({ \
> + void __user *__cl_addr = (addr); \
> + unsigned long __cl_size = (n); \
> + if (__cl_size && access_ok(__cl_addr, __cl_size)) \
> + __cl_size = __clear_user(__cl_addr, __cl_size); \
> + __cl_size; \
> +})
> +
> +extern long strncpy_from_user(char *to, const char __user *from, long
> n);
> +extern long strnlen_user(const char __user *str, long n);
> +
> +#endif /* _ASM_UACCESS_H */
> diff --git a/arch/loongarch/include/asm/unistd.h
> b/arch/loongarch/include/asm/unistd.h
> new file mode 100644
> index 000000000000..cfddb0116a8c
> --- /dev/null
> +++ b/arch/loongarch/include/asm/unistd.h
> @@ -0,0 +1,11 @@
> +/* SPDX-License-Identifier: GPL-2.0+ */
> +/*
> + * Author: Hanlu Li <[email protected]>
> + * Huacai Chen <[email protected]>
> + *
> + * Copyright (C) 2020-2022 Loongson Technology Corporation Limited
> + */
> +
> +#include <uapi/asm/unistd.h>
> +
> +#define NR_syscalls (__NR_syscalls)
> diff --git a/arch/loongarch/include/uapi/asm/unistd.h
> b/arch/loongarch/include/uapi/asm/unistd.h
> new file mode 100644
> index 000000000000..fcb668984f03
> --- /dev/null
> +++ b/arch/loongarch/include/uapi/asm/unistd.h
> @@ -0,0 +1,5 @@
> +/* SPDX-License-Identifier: GPL-2.0 WITH Linux-syscall-note */
> +#define __ARCH_WANT_SYS_CLONE
> +#define __ARCH_WANT_SYS_CLONE3
> +
> +#include <asm-generic/unistd.h>
> diff --git a/arch/loongarch/kernel/entry.S
> b/arch/loongarch/kernel/entry.S
> new file mode 100644
> index 000000000000..d5b3dbcf5425
> --- /dev/null
> +++ b/arch/loongarch/kernel/entry.S
> @@ -0,0 +1,89 @@
> +/* SPDX-License-Identifier: GPL-2.0 */
> +/*
> + * Copyright (C) 2020-2022 Loongson Technology Corporation Limited
> + *
> + * Derived from MIPS:
> + * Copyright (C) 1994 - 2000, 2001, 2003 Ralf Baechle
> + * Copyright (C) 1999, 2000 Silicon Graphics, Inc.
> + * Copyright (C) 2001 MIPS Technologies, Inc.
> + */
> +
> +#include <asm/asm.h>
> +#include <asm/asmmacro.h>
> +#include <asm/loongarch.h>
> +#include <asm/regdef.h>
> +#include <asm/stackframe.h>
> +#include <asm/thread_info.h>
> +
> + .text
> + .cfi_sections .debug_frame
> + .align 5
> +SYM_FUNC_START(handle_syscall)
> + csrrd t0, PERCPU_BASE_KS
> + la.abs t1, kernelsp
> + add.d t1, t1, t0
> + move t2, sp
> + ld.d sp, t1, 0
> +
> + addi.d sp, sp, -PT_SIZE
> + cfi_st t2, PT_R3
> + cfi_rel_offset sp, PT_R3
> + st.d zero, sp, PT_R0
> + csrrd t2, LOONGARCH_CSR_PRMD
> + st.d t2, sp, PT_PRMD
> + csrrd t2, LOONGARCH_CSR_CRMD
> + st.d t2, sp, PT_CRMD
> + csrrd t2, LOONGARCH_CSR_EUEN
> + st.d t2, sp, PT_EUEN
> + csrrd t2, LOONGARCH_CSR_ECFG
> + st.d t2, sp, PT_ECFG
> + csrrd t2, LOONGARCH_CSR_ESTAT
> + st.d t2, sp, PT_ESTAT
> + cfi_st ra, PT_R1
> + cfi_st a0, PT_R4
> + cfi_st a1, PT_R5
> + cfi_st a2, PT_R6
> + cfi_st a3, PT_R7
> + cfi_st a4, PT_R8
> + cfi_st a5, PT_R9
> + cfi_st a6, PT_R10
> + cfi_st a7, PT_R11
> + csrrd ra, LOONGARCH_CSR_ERA
> + st.d ra, sp, PT_ERA
> + cfi_rel_offset ra, PT_ERA
> +
> + cfi_st tp, PT_R2
> + cfi_st u0, PT_R21
> + cfi_st fp, PT_R22
> +
> + SAVE_STATIC
> +
> + move u0, t0
> + li.d tp, ~_THREAD_MASK
> + and tp, tp, sp
> +
> + move a0, sp
> + bl do_syscall
> +
> + RESTORE_ALL_AND_RET
> +SYM_FUNC_END(handle_syscall)
> +
> +SYM_CODE_START(ret_from_fork)
> + bl schedule_tail # a0 = struct task_struct *prev
> + move a0, sp
> + bl syscall_exit_to_user_mode
> + RESTORE_STATIC
> + RESTORE_SOME
> + RESTORE_SP_AND_RET
> +SYM_CODE_END(ret_from_fork)
> +
> +SYM_CODE_START(ret_from_kernel_thread)
> + bl schedule_tail # a0 = struct task_struct *prev
> + move a0, s1
> + jirl ra, s0, 0
> + move a0, sp
> + bl syscall_exit_to_user_mode
> + RESTORE_STATIC
> + RESTORE_SOME
> + RESTORE_SP_AND_RET
> +SYM_CODE_END(ret_from_kernel_thread)
> diff --git a/arch/loongarch/kernel/syscall.c
> b/arch/loongarch/kernel/syscall.c
> new file mode 100644
> index 000000000000..3fc4211db989
> --- /dev/null
> +++ b/arch/loongarch/kernel/syscall.c
> @@ -0,0 +1,63 @@
> +// SPDX-License-Identifier: GPL-2.0+
> +/*
> + * Author: Hanlu Li <[email protected]>
> + * Huacai Chen <[email protected]>
> + *
> + * Copyright (C) 2020-2022 Loongson Technology Corporation Limited
> + */
> +#include <linux/capability.h>
> +#include <linux/entry-common.h>
> +#include <linux/errno.h>
> +#include <linux/linkage.h>
> +#include <linux/syscalls.h>
> +#include <linux/unistd.h>
> +
> +#include <asm/asm.h>
> +#include <asm/signal.h>
> +#include <asm/switch_to.h>
> +#include <asm-generic/syscalls.h>
> +
> +#undef __SYSCALL
> +#define __SYSCALL(nr, call) [nr] = (call),
> +
> +SYSCALL_DEFINE6(mmap, unsigned long, addr, unsigned long, len,
> unsigned long,
> + prot, unsigned long, flags, unsigned long, fd, off_t, offset)
> +{
> + if (offset & ~PAGE_MASK)
> + return -EINVAL;
> +
> + return ksys_mmap_pgoff(addr, len, prot, flags, fd, offset >>
> PAGE_SHIFT);
> +}
> +
> +void *sys_call_table[__NR_syscalls] = {
> + [0 ... __NR_syscalls - 1] = sys_ni_syscall,
> +#include <asm/unistd.h>
> +};
> +
> +typedef long (*sys_call_fn)(unsigned long, unsigned long,
> + unsigned long, unsigned long, unsigned long, unsigned long);
> +
> +void noinstr do_syscall(struct pt_regs *regs)
> +{
> + unsigned long nr;
> + sys_call_fn syscall_fn;
> +
> + nr = regs->regs[11];
> + /* Set for syscall restarting */
> + if (nr < NR_syscalls)
> + regs->regs[0] = nr + 1;
> +
> + regs->csr_era += 4;
> + regs->orig_a0 = regs->regs[4];
> + regs->regs[4] = -ENOSYS;
> +
> + nr = syscall_enter_from_user_mode(regs, nr);
> +
> + if (nr < NR_syscalls) {
> + syscall_fn = sys_call_table[nr];
> + regs->regs[4] = syscall_fn(regs->orig_a0, regs->regs[5],
> regs->regs[6],
> + regs->regs[7], regs->regs[8], regs->regs[9]);
> + }
> +
> + syscall_exit_to_user_mode(regs);
> +}
> --
> 2.27.0
--
- Jiaxun