12952b6bbd
1, Allow usage of LSX/LASX in the kernel; 2, Add SIMD-optimized RAID5/RAID6 routines; 3, Add Loongson Binary Translation (LBT) extension support; 4, Add basic KGDB & KDB support; 5, Add building with kcov coverage; 6, Add KFENCE (Kernel Electric-Fence) support; 7, Add KASAN (Kernel Address Sanitizer) support; 8, Some bug fixes and other small changes; 9, Update the default config file. -----BEGIN PGP SIGNATURE----- iQJKBAABCAA0FiEEzOlt8mkP+tbeiYy5AoYrw/LiJnoFAmT5TfMWHGNoZW5odWFj YWlAa2VybmVsLm9yZwAKCRAChivD8uImeqd3EACjqCaHNlp33kwufSPpGuQw9a8I F7JW1KzBOoWELch5nFRjfQClROBWRmM4jN5YnxENBQ5K2F1K6gfxdkfjew+KV2mn ki9ByamCfFVJDZXo9wavUD2LBrVakEFmLT+SyXBxdWwJ3fDivHjF6A0qs9ltp7dq Bttq4bkw1mZsU6MnViRwPKVROtNUVrd9mwYSTq0iXviVEbWhPHQQTxRizNra9Z6X 7XWxO0ODHl0WVvdOJU+F16mBRS3Bs1g/HHAIDc41yrYEHFFOeFCEUAQSF/4Nj5wj BAfAB8WOa9+vPH8fTnrpCt2RtGJmkz71TM49DdXB7jpGaWIyc4WDi9MXeeBiJ0wE vQg8IECc9POC1sH4/6BMwq2qkrWRj2PYFYof0fP66iWNjmodtNUf7GOVHy8MTQan xHWizJFAdY/u/bwbF9tRQ+EVeot/844CkjtZxkgTfV8shN6kCMEVAamwBItZ7TXN g/oc1ORM6nsKHBDQF3r2LSY0Gbf3OSfMJVL8SLEQ9hAhgGhotmJ36B4bdvyO7T0Q gNn//U+p4IIMFRKRxreEz9P0KjTOJrHAAxNzu1oZebhGZd5WI+i0PHYkkBDKZTXc 7qaEdM2cX8Wd0ePIXOHQnSItwYO7ilrviHyeCM8wd/g2/W/00jvnpF3J+2rk7eJO rcfAr8+V5ylYBQzp6Q== =NXy2 -----END PGP SIGNATURE----- Merge tag 'loongarch-6.6' of git://git.kernel.org/pub/scm/linux/kernel/git/chenhuacai/linux-loongson Pull LoongArch updates from Huacai Chen: - Allow usage of LSX/LASX in the kernel, and use them for SIMD-optimized RAID5/RAID6 routines - Add Loongson Binary Translation (LBT) extension support - Add basic KGDB & KDB support - Add building with kcov coverage - Add KFENCE (Kernel Electric-Fence) support - Add KASAN (Kernel Address Sanitizer) support - Some bug fixes and other small changes - Update the default config file * tag 'loongarch-6.6' of git://git.kernel.org/pub/scm/linux/kernel/git/chenhuacai/linux-loongson: (25 commits) LoongArch: Update Loongson-3 default config file LoongArch: Add KASAN (Kernel Address Sanitizer) support 
LoongArch: Simplify the processing of jumping new kernel for KASLR kasan: Add (pmd|pud)_init for LoongArch zero_(pud|p4d)_populate process kasan: Add __HAVE_ARCH_SHADOW_MAP to support arch specific mapping LoongArch: Add KFENCE (Kernel Electric-Fence) support LoongArch: Get partial stack information when providing regs parameter LoongArch: mm: Add page table mapped mode support for virt_to_page() kfence: Defer the assignment of the local variable addr LoongArch: Allow building with kcov coverage LoongArch: Provide kaslr_offset() to get kernel offset LoongArch: Add basic KGDB & KDB support LoongArch: Add Loongson Binary Translation (LBT) extension support raid6: Add LoongArch SIMD recovery implementation raid6: Add LoongArch SIMD syndrome calculation LoongArch: Add SIMD-optimized XOR routines LoongArch: Allow usage of LSX/LASX in the kernel LoongArch: Define symbol 'fault' as a local label in fpu.S LoongArch: Adjust {copy, clear}_user exception handler behavior LoongArch: Use static defined zero page rather than allocated ...
374 lines
9.1 KiB
C
374 lines
9.1 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
/*
|
|
* Author: Huacai Chen <chenhuacai@loongson.cn>
|
|
* Copyright (C) 2020-2022 Loongson Technology Corporation Limited
|
|
*
|
|
* Derived from MIPS:
|
|
* Copyright (C) 1994 - 1999, 2000 by Ralf Baechle and others.
|
|
* Copyright (C) 2005, 2006 by Ralf Baechle (ralf@linux-mips.org)
|
|
* Copyright (C) 1999, 2000 Silicon Graphics, Inc.
|
|
* Copyright (C) 2004 Thiemo Seufer
|
|
* Copyright (C) 2013 Imagination Technologies Ltd.
|
|
*/
|
|
#include <linux/cpu.h>
|
|
#include <linux/init.h>
|
|
#include <linux/kernel.h>
|
|
#include <linux/errno.h>
|
|
#include <linux/sched.h>
|
|
#include <linux/sched/debug.h>
|
|
#include <linux/sched/task.h>
|
|
#include <linux/sched/task_stack.h>
|
|
#include <linux/hw_breakpoint.h>
|
|
#include <linux/mm.h>
|
|
#include <linux/stddef.h>
|
|
#include <linux/unistd.h>
|
|
#include <linux/export.h>
|
|
#include <linux/ptrace.h>
|
|
#include <linux/mman.h>
|
|
#include <linux/personality.h>
|
|
#include <linux/sys.h>
|
|
#include <linux/completion.h>
|
|
#include <linux/kallsyms.h>
|
|
#include <linux/random.h>
|
|
#include <linux/prctl.h>
|
|
#include <linux/nmi.h>
|
|
|
|
#include <asm/asm.h>
|
|
#include <asm/bootinfo.h>
|
|
#include <asm/cpu.h>
|
|
#include <asm/elf.h>
|
|
#include <asm/fpu.h>
|
|
#include <asm/lbt.h>
|
|
#include <asm/io.h>
|
|
#include <asm/irq.h>
|
|
#include <asm/irq_regs.h>
|
|
#include <asm/loongarch.h>
|
|
#include <asm/pgtable.h>
|
|
#include <asm/processor.h>
|
|
#include <asm/reg.h>
|
|
#include <asm/unwind.h>
|
|
#include <asm/vdso.h>
|
|
|
|
#ifdef CONFIG_STACKPROTECTOR
#include <linux/stackprotector.h>

/*
 * Guard word for the stack protector. It is defined and exported here
 * only when CONFIG_STACKPROTECTOR is enabled.
 */
unsigned long __stack_chk_guard __read_mostly;
EXPORT_SYMBOL(__stack_chk_guard);
#endif /* CONFIG_STACKPROTECTOR */
|
|
|
|
/*
|
|
* Idle related variables and functions
|
|
*/
|
|
|
|
unsigned long boot_option_idle_override = IDLE_NO_OVERRIDE;
|
|
EXPORT_SYMBOL(boot_option_idle_override);
|
|
|
|
/*
 * Entry points that copy_thread() installs as the saved return address
 * of a new task. They are only declared in this file.
 */
asmlinkage void ret_from_kernel_thread(void);
asmlinkage void ret_from_fork(void);
|
|
|
|
void start_thread(struct pt_regs *regs, unsigned long pc, unsigned long sp)
|
|
{
|
|
unsigned long crmd;
|
|
unsigned long prmd;
|
|
unsigned long euen;
|
|
|
|
/* New thread loses kernel privileges. */
|
|
crmd = regs->csr_crmd & ~(PLV_MASK);
|
|
crmd |= PLV_USER;
|
|
regs->csr_crmd = crmd;
|
|
|
|
prmd = regs->csr_prmd & ~(PLV_MASK);
|
|
prmd |= PLV_USER;
|
|
regs->csr_prmd = prmd;
|
|
|
|
euen = regs->csr_euen & ~(CSR_EUEN_FPEN);
|
|
regs->csr_euen = euen;
|
|
lose_fpu(0);
|
|
lose_lbt(0);
|
|
|
|
clear_thread_flag(TIF_LSX_CTX_LIVE);
|
|
clear_thread_flag(TIF_LASX_CTX_LIVE);
|
|
clear_thread_flag(TIF_LBT_CTX_LIVE);
|
|
clear_used_math();
|
|
regs->csr_era = pc;
|
|
regs->regs[3] = sp;
|
|
}
|
|
|
|
void flush_thread(void)
|
|
{
|
|
flush_ptrace_hw_breakpoint(current);
|
|
}
|
|
|
|
/* Intentionally empty: nothing is done here for @tsk. */
void exit_thread(struct task_struct *tsk)
{
}
|
|
|
|
int arch_dup_task_struct(struct task_struct *dst, struct task_struct *src)
|
|
{
|
|
/*
|
|
* Save any process state which is live in hardware registers to the
|
|
* parent context prior to duplication. This prevents the new child
|
|
* state becoming stale if the parent is preempted before copy_thread()
|
|
* gets a chance to save the parent's live hardware registers to the
|
|
* child context.
|
|
*/
|
|
preempt_disable();
|
|
|
|
if (is_fpu_owner()) {
|
|
if (is_lasx_enabled())
|
|
save_lasx(current);
|
|
else if (is_lsx_enabled())
|
|
save_lsx(current);
|
|
else
|
|
save_fp(current);
|
|
}
|
|
|
|
preempt_enable();
|
|
|
|
if (!used_math())
|
|
memcpy(dst, src, offsetof(struct task_struct, thread.fpu.fpr));
|
|
else
|
|
memcpy(dst, src, offsetof(struct task_struct, thread.lbt.scr0));
|
|
|
|
#ifdef CONFIG_CPU_HAS_LBT
|
|
memcpy(&dst->thread.lbt, &src->thread.lbt, sizeof(struct loongarch_lbt));
|
|
#endif
|
|
|
|
return 0;
|
|
}
|
|
|
|
/*
|
|
* Copy architecture-specific thread state
|
|
*/
|
|
int copy_thread(struct task_struct *p, const struct kernel_clone_args *args)
|
|
{
|
|
unsigned long childksp;
|
|
unsigned long tls = args->tls;
|
|
unsigned long usp = args->stack;
|
|
unsigned long clone_flags = args->flags;
|
|
struct pt_regs *childregs, *regs = current_pt_regs();
|
|
|
|
childksp = (unsigned long)task_stack_page(p) + THREAD_SIZE;
|
|
|
|
/* set up new TSS. */
|
|
childregs = (struct pt_regs *) childksp - 1;
|
|
/* Put the stack after the struct pt_regs. */
|
|
childksp = (unsigned long) childregs;
|
|
p->thread.sched_cfa = 0;
|
|
p->thread.csr_euen = 0;
|
|
p->thread.csr_crmd = csr_read32(LOONGARCH_CSR_CRMD);
|
|
p->thread.csr_prmd = csr_read32(LOONGARCH_CSR_PRMD);
|
|
p->thread.csr_ecfg = csr_read32(LOONGARCH_CSR_ECFG);
|
|
if (unlikely(args->fn)) {
|
|
/* kernel thread */
|
|
p->thread.reg03 = childksp;
|
|
p->thread.reg23 = (unsigned long)args->fn;
|
|
p->thread.reg24 = (unsigned long)args->fn_arg;
|
|
p->thread.reg01 = (unsigned long)ret_from_kernel_thread;
|
|
p->thread.sched_ra = (unsigned long)ret_from_kernel_thread;
|
|
memset(childregs, 0, sizeof(struct pt_regs));
|
|
childregs->csr_euen = p->thread.csr_euen;
|
|
childregs->csr_crmd = p->thread.csr_crmd;
|
|
childregs->csr_prmd = p->thread.csr_prmd;
|
|
childregs->csr_ecfg = p->thread.csr_ecfg;
|
|
goto out;
|
|
}
|
|
|
|
/* user thread */
|
|
*childregs = *regs;
|
|
childregs->regs[4] = 0; /* Child gets zero as return value */
|
|
if (usp)
|
|
childregs->regs[3] = usp;
|
|
|
|
p->thread.reg03 = (unsigned long) childregs;
|
|
p->thread.reg01 = (unsigned long) ret_from_fork;
|
|
p->thread.sched_ra = (unsigned long) ret_from_fork;
|
|
|
|
/*
|
|
* New tasks lose permission to use the fpu. This accelerates context
|
|
* switching for most programs since they don't use the fpu.
|
|
*/
|
|
childregs->csr_euen = 0;
|
|
|
|
if (clone_flags & CLONE_SETTLS)
|
|
childregs->regs[2] = tls;
|
|
|
|
out:
|
|
ptrace_hw_copy_thread(p);
|
|
clear_tsk_thread_flag(p, TIF_USEDFPU);
|
|
clear_tsk_thread_flag(p, TIF_USEDSIMD);
|
|
clear_tsk_thread_flag(p, TIF_USEDLBT);
|
|
clear_tsk_thread_flag(p, TIF_LSX_CTX_LIVE);
|
|
clear_tsk_thread_flag(p, TIF_LASX_CTX_LIVE);
|
|
clear_tsk_thread_flag(p, TIF_LBT_CTX_LIVE);
|
|
|
|
return 0;
|
|
}
|
|
|
|
unsigned long __get_wchan(struct task_struct *task)
|
|
{
|
|
unsigned long pc = 0;
|
|
struct unwind_state state;
|
|
|
|
if (!try_get_task_stack(task))
|
|
return 0;
|
|
|
|
for (unwind_start(&state, task, NULL);
|
|
!unwind_done(&state); unwind_next_frame(&state)) {
|
|
pc = unwind_get_return_address(&state);
|
|
if (!pc)
|
|
break;
|
|
if (in_sched_functions(pc))
|
|
continue;
|
|
break;
|
|
}
|
|
|
|
put_task_stack(task);
|
|
|
|
return pc;
|
|
}
|
|
|
|
bool in_irq_stack(unsigned long stack, struct stack_info *info)
|
|
{
|
|
unsigned long nextsp;
|
|
unsigned long begin = (unsigned long)this_cpu_read(irq_stack);
|
|
unsigned long end = begin + IRQ_STACK_START;
|
|
|
|
if (stack < begin || stack >= end)
|
|
return false;
|
|
|
|
nextsp = *(unsigned long *)end;
|
|
if (nextsp & (SZREG - 1))
|
|
return false;
|
|
|
|
info->begin = begin;
|
|
info->end = end;
|
|
info->next_sp = nextsp;
|
|
info->type = STACK_TYPE_IRQ;
|
|
|
|
return true;
|
|
}
|
|
|
|
bool in_task_stack(unsigned long stack, struct task_struct *task,
|
|
struct stack_info *info)
|
|
{
|
|
unsigned long begin = (unsigned long)task_stack_page(task);
|
|
unsigned long end = begin + THREAD_SIZE;
|
|
|
|
if (stack < begin || stack >= end)
|
|
return false;
|
|
|
|
info->begin = begin;
|
|
info->end = end;
|
|
info->next_sp = 0;
|
|
info->type = STACK_TYPE_TASK;
|
|
|
|
return true;
|
|
}
|
|
|
|
int get_stack_info(unsigned long stack, struct task_struct *task,
|
|
struct stack_info *info)
|
|
{
|
|
task = task ? : current;
|
|
|
|
if (!stack || stack & (SZREG - 1))
|
|
goto unknown;
|
|
|
|
if (in_task_stack(stack, task, info))
|
|
return 0;
|
|
|
|
if (task != current)
|
|
goto unknown;
|
|
|
|
if (in_irq_stack(stack, info))
|
|
return 0;
|
|
|
|
unknown:
|
|
info->type = STACK_TYPE_UNKNOWN;
|
|
return -EINVAL;
|
|
}
|
|
|
|
unsigned long stack_top(void)
|
|
{
|
|
unsigned long top = TASK_SIZE & PAGE_MASK;
|
|
|
|
/* Space for the VDSO & data page */
|
|
top -= PAGE_ALIGN(current->thread.vdso->size);
|
|
top -= VVAR_SIZE;
|
|
|
|
/* Space to randomize the VDSO base */
|
|
if (current->flags & PF_RANDOMIZE)
|
|
top -= VDSO_RANDOMIZE_SIZE;
|
|
|
|
return top;
|
|
}
|
|
|
|
/*
|
|
* Don't forget that the stack pointer must be aligned on a 8 bytes
|
|
* boundary for 32-bits ABI and 16 bytes for 64-bits ABI.
|
|
*/
|
|
unsigned long arch_align_stack(unsigned long sp)
|
|
{
|
|
if (!(current->personality & ADDR_NO_RANDOMIZE) && randomize_va_space)
|
|
sp -= get_random_u32_below(PAGE_SIZE);
|
|
|
|
return sp & STACK_ALIGN;
|
|
}
|
|
|
|
static DEFINE_PER_CPU(call_single_data_t, backtrace_csd);
|
|
static struct cpumask backtrace_csd_busy;
|
|
|
|
static void handle_backtrace(void *info)
|
|
{
|
|
nmi_cpu_backtrace(get_irq_regs());
|
|
cpumask_clear_cpu(smp_processor_id(), &backtrace_csd_busy);
|
|
}
|
|
|
|
/*
 * Queue handle_backtrace() asynchronously on every CPU in @mask, skipping
 * (with a warning) any CPU whose previous request is still marked busy.
 */
static void raise_backtrace(cpumask_t *mask)
{
	int cpu;

	for_each_cpu(cpu, mask) {
		call_single_data_t *csd;

		/*
		 * A bit that is still set in the busy mask means the target
		 * CPU never handled the IPI we sent it earlier, so its
		 * call_single_data_t must not be reused.
		 */
		if (cpumask_test_and_set_cpu(cpu, &backtrace_csd_busy)) {
			pr_warn("Unable to send backtrace IPI to CPU%u - perhaps it hung?\n",
				cpu);
		} else {
			csd = &per_cpu(backtrace_csd, cpu);
			csd->func = handle_backtrace;
			smp_call_function_single_async(cpu, csd);
		}
	}
}
|
|
|
|
void arch_trigger_cpumask_backtrace(const cpumask_t *mask, int exclude_cpu)
|
|
{
|
|
nmi_trigger_cpumask_backtrace(mask, exclude_cpu, raise_backtrace);
|
|
}
|
|
|
|
#ifdef CONFIG_64BIT
/*
 * Copy the contents of @regs into the array @uregs, which is indexed by
 * the LOONGARCH_EF_* constants. The slot at LOONGARCH_EF_R0 is not
 * written here.
 */
void loongarch_dump_regs64(u64 *uregs, const struct pt_regs *regs)
{
	unsigned int slot;

	/* General registers: slots R1 through R31. */
	for (slot = LOONGARCH_EF_R1; slot <= LOONGARCH_EF_R31; slot++)
		uregs[slot] = regs->regs[slot - LOONGARCH_EF_R0];

	/* orig_a0 and the saved CSR values. */
	uregs[LOONGARCH_EF_ORIG_A0] = regs->orig_a0;
	uregs[LOONGARCH_EF_CSR_ERA] = regs->csr_era;
	uregs[LOONGARCH_EF_CSR_BADV] = regs->csr_badvaddr;
	uregs[LOONGARCH_EF_CSR_CRMD] = regs->csr_crmd;
	uregs[LOONGARCH_EF_CSR_PRMD] = regs->csr_prmd;
	uregs[LOONGARCH_EF_CSR_EUEN] = regs->csr_euen;
	uregs[LOONGARCH_EF_CSR_ECFG] = regs->csr_ecfg;
	uregs[LOONGARCH_EF_CSR_ESTAT] = regs->csr_estat;
}
#endif /* CONFIG_64BIT */
|