x86/fred: FRED entry/exit and dispatch code
The code to actually handle kernel and event entry/exit using FRED. It is split up into two files thus: - entry_64_fred.S contains the actual entrypoints and exit code, and saves and restores registers. - entry_fred.c contains the two-level event dispatch code for FRED. The first-level dispatch is on the event type, and the second-level is on the event vector. [ bp: Fold in an allmodconfig clang build fix: https://lore.kernel.org/r/20240129064521.5168-1-xin3.li@intel.com and a CONFIG_IA32_EMULATION=n build fix: https://lore.kernel.org/r/20240127093728.1323-3-xin3.li@intel.com] Suggested-by: Thomas Gleixner <tglx@linutronix.de> Originally-by: Megha Dey <megha.dey@intel.com> Co-developed-by: Xin Li <xin3.li@intel.com> Signed-off-by: H. Peter Anvin (Intel) <hpa@zytor.com> Signed-off-by: Xin Li <xin3.li@intel.com> Signed-off-by: Thomas Gleixner <tglx@linutronix.de> Signed-off-by: Borislav Petkov (AMD) <bp@alien8.de> Tested-by: Shan Kang <shan.kang@intel.com> Link: https://lore.kernel.org/r/20231209214214.2932-1-xin3.li@intel.com
This commit is contained in:
parent
ffa4901f0e
commit
14619d912b
@ -18,6 +18,9 @@ obj-y += vdso/
|
|||||||
obj-y += vsyscall/
|
obj-y += vsyscall/
|
||||||
|
|
||||||
obj-$(CONFIG_PREEMPTION) += thunk_$(BITS).o
|
obj-$(CONFIG_PREEMPTION) += thunk_$(BITS).o
|
||||||
|
CFLAGS_entry_fred.o += -fno-stack-protector
|
||||||
|
CFLAGS_REMOVE_entry_fred.o += -pg $(CC_FLAGS_FTRACE)
|
||||||
|
obj-$(CONFIG_X86_FRED) += entry_64_fred.o entry_fred.o
|
||||||
|
|
||||||
obj-$(CONFIG_IA32_EMULATION) += entry_64_compat.o syscall_32.o
|
obj-$(CONFIG_IA32_EMULATION) += entry_64_compat.o syscall_32.o
|
||||||
obj-$(CONFIG_X86_X32_ABI) += syscall_x32.o
|
obj-$(CONFIG_X86_X32_ABI) += syscall_x32.o
|
||||||
|
|
||||||
|
50
arch/x86/entry/entry_64_fred.S
Normal file
50
arch/x86/entry/entry_64_fred.S
Normal file
@ -0,0 +1,50 @@
|
|||||||
|
/* SPDX-License-Identifier: GPL-2.0 */
|
||||||
|
/*
|
||||||
|
* The actual FRED entry points.
|
||||||
|
*/
|
||||||
|
|
||||||
|
#include <asm/fred.h>
|
||||||
|
|
||||||
|
#include "calling.h"
|
||||||
|
|
||||||
|
.code64
|
||||||
|
.section .noinstr.text, "ax"
|
||||||
|
|
||||||
|
.macro FRED_ENTER
|
||||||
|
UNWIND_HINT_END_OF_STACK
|
||||||
|
ENDBR
|
||||||
|
PUSH_AND_CLEAR_REGS
|
||||||
|
movq %rsp, %rdi /* %rdi -> pt_regs */
|
||||||
|
.endm
|
||||||
|
|
||||||
|
.macro FRED_EXIT
|
||||||
|
UNWIND_HINT_REGS
|
||||||
|
POP_REGS
|
||||||
|
.endm
|
||||||
|
|
||||||
|
/*
|
||||||
|
* The new RIP value that FRED event delivery establishes is
|
||||||
|
* IA32_FRED_CONFIG & ~FFFH for events that occur in ring 3.
|
||||||
|
* Thus the FRED ring 3 entry point must be 4K page aligned.
|
||||||
|
*/
|
||||||
|
.align 4096
|
||||||
|
|
||||||
|
SYM_CODE_START_NOALIGN(asm_fred_entrypoint_user)
|
||||||
|
FRED_ENTER
|
||||||
|
call fred_entry_from_user
|
||||||
|
FRED_EXIT
|
||||||
|
ERETU
|
||||||
|
SYM_CODE_END(asm_fred_entrypoint_user)
|
||||||
|
|
||||||
|
/*
|
||||||
|
* The new RIP value that FRED event delivery establishes is
|
||||||
|
* (IA32_FRED_CONFIG & ~FFFH) + 256 for events that occur in
|
||||||
|
* ring 0, i.e., asm_fred_entrypoint_user + 256.
|
||||||
|
*/
|
||||||
|
.org asm_fred_entrypoint_user + 256, 0xcc
|
||||||
|
SYM_CODE_START_NOALIGN(asm_fred_entrypoint_kernel)
|
||||||
|
FRED_ENTER
|
||||||
|
call fred_entry_from_kernel
|
||||||
|
FRED_EXIT
|
||||||
|
ERETS
|
||||||
|
SYM_CODE_END(asm_fred_entrypoint_kernel)
|
245
arch/x86/entry/entry_fred.c
Normal file
245
arch/x86/entry/entry_fred.c
Normal file
@ -0,0 +1,245 @@
|
|||||||
|
/* SPDX-License-Identifier: GPL-2.0 */
|
||||||
|
/*
|
||||||
|
* The FRED specific kernel/user entry functions which are invoked from
|
||||||
|
* assembly code and dispatch to the associated handlers.
|
||||||
|
*/
|
||||||
|
#include <linux/kernel.h>
|
||||||
|
#include <linux/kdebug.h>
|
||||||
|
#include <linux/nospec.h>
|
||||||
|
|
||||||
|
#include <asm/desc.h>
|
||||||
|
#include <asm/fred.h>
|
||||||
|
#include <asm/idtentry.h>
|
||||||
|
#include <asm/syscall.h>
|
||||||
|
#include <asm/trapnr.h>
|
||||||
|
#include <asm/traps.h>
|
||||||
|
|
||||||
|
/* FRED EVENT_TYPE_OTHER vector numbers */
|
||||||
|
#define FRED_SYSCALL 1
|
||||||
|
#define FRED_SYSENTER 2
|
||||||
|
|
||||||
|
static noinstr void fred_bad_type(struct pt_regs *regs, unsigned long error_code)
|
||||||
|
{
|
||||||
|
irqentry_state_t irq_state = irqentry_nmi_enter(regs);
|
||||||
|
|
||||||
|
instrumentation_begin();
|
||||||
|
|
||||||
|
/* Panic on events from a high stack level */
|
||||||
|
if (regs->fred_cs.sl > 0) {
|
||||||
|
pr_emerg("PANIC: invalid or fatal FRED event; event type %u "
|
||||||
|
"vector %u error 0x%lx aux 0x%lx at %04x:%016lx\n",
|
||||||
|
regs->fred_ss.type, regs->fred_ss.vector, regs->orig_ax,
|
||||||
|
fred_event_data(regs), regs->cs, regs->ip);
|
||||||
|
die("invalid or fatal FRED event", regs, regs->orig_ax);
|
||||||
|
panic("invalid or fatal FRED event");
|
||||||
|
} else {
|
||||||
|
unsigned long flags = oops_begin();
|
||||||
|
int sig = SIGKILL;
|
||||||
|
|
||||||
|
pr_alert("BUG: invalid or fatal FRED event; event type %u "
|
||||||
|
"vector %u error 0x%lx aux 0x%lx at %04x:%016lx\n",
|
||||||
|
regs->fred_ss.type, regs->fred_ss.vector, regs->orig_ax,
|
||||||
|
fred_event_data(regs), regs->cs, regs->ip);
|
||||||
|
|
||||||
|
if (__die("Invalid or fatal FRED event", regs, regs->orig_ax))
|
||||||
|
sig = 0;
|
||||||
|
|
||||||
|
oops_end(flags, regs, sig);
|
||||||
|
}
|
||||||
|
|
||||||
|
instrumentation_end();
|
||||||
|
irqentry_nmi_exit(regs, irq_state);
|
||||||
|
}
|
||||||
|
|
||||||
|
static noinstr void fred_intx(struct pt_regs *regs)
|
||||||
|
{
|
||||||
|
switch (regs->fred_ss.vector) {
|
||||||
|
/* Opcode 0xcd, 0x3, NOT INT3 (opcode 0xcc) */
|
||||||
|
case X86_TRAP_BP:
|
||||||
|
return exc_int3(regs);
|
||||||
|
|
||||||
|
/* Opcode 0xcd, 0x4, NOT INTO (opcode 0xce) */
|
||||||
|
case X86_TRAP_OF:
|
||||||
|
return exc_overflow(regs);
|
||||||
|
|
||||||
|
#ifdef CONFIG_IA32_EMULATION
|
||||||
|
/* INT80 */
|
||||||
|
case IA32_SYSCALL_VECTOR:
|
||||||
|
if (ia32_enabled())
|
||||||
|
return int80_emulation(regs);
|
||||||
|
fallthrough;
|
||||||
|
#endif
|
||||||
|
|
||||||
|
default:
|
||||||
|
return exc_general_protection(regs, 0);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
static __always_inline void fred_other(struct pt_regs *regs)
|
||||||
|
{
|
||||||
|
/* The compiler can fold these conditions into a single test */
|
||||||
|
if (likely(regs->fred_ss.vector == FRED_SYSCALL && regs->fred_ss.lm)) {
|
||||||
|
regs->orig_ax = regs->ax;
|
||||||
|
regs->ax = -ENOSYS;
|
||||||
|
do_syscall_64(regs, regs->orig_ax);
|
||||||
|
return;
|
||||||
|
} else if (ia32_enabled() &&
|
||||||
|
likely(regs->fred_ss.vector == FRED_SYSENTER && !regs->fred_ss.lm)) {
|
||||||
|
regs->orig_ax = regs->ax;
|
||||||
|
regs->ax = -ENOSYS;
|
||||||
|
do_fast_syscall_32(regs);
|
||||||
|
return;
|
||||||
|
} else {
|
||||||
|
exc_invalid_op(regs);
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#define SYSVEC(_vector, _function) [_vector - FIRST_SYSTEM_VECTOR] = fred_sysvec_##_function
|
||||||
|
|
||||||
|
static idtentry_t sysvec_table[NR_SYSTEM_VECTORS] __ro_after_init = {
|
||||||
|
SYSVEC(ERROR_APIC_VECTOR, error_interrupt),
|
||||||
|
SYSVEC(SPURIOUS_APIC_VECTOR, spurious_apic_interrupt),
|
||||||
|
SYSVEC(LOCAL_TIMER_VECTOR, apic_timer_interrupt),
|
||||||
|
SYSVEC(X86_PLATFORM_IPI_VECTOR, x86_platform_ipi),
|
||||||
|
|
||||||
|
SYSVEC(RESCHEDULE_VECTOR, reschedule_ipi),
|
||||||
|
SYSVEC(CALL_FUNCTION_SINGLE_VECTOR, call_function_single),
|
||||||
|
SYSVEC(CALL_FUNCTION_VECTOR, call_function),
|
||||||
|
SYSVEC(REBOOT_VECTOR, reboot),
|
||||||
|
|
||||||
|
SYSVEC(THRESHOLD_APIC_VECTOR, threshold),
|
||||||
|
SYSVEC(DEFERRED_ERROR_VECTOR, deferred_error),
|
||||||
|
SYSVEC(THERMAL_APIC_VECTOR, thermal),
|
||||||
|
|
||||||
|
SYSVEC(IRQ_WORK_VECTOR, irq_work),
|
||||||
|
|
||||||
|
SYSVEC(POSTED_INTR_VECTOR, kvm_posted_intr_ipi),
|
||||||
|
SYSVEC(POSTED_INTR_WAKEUP_VECTOR, kvm_posted_intr_wakeup_ipi),
|
||||||
|
SYSVEC(POSTED_INTR_NESTED_VECTOR, kvm_posted_intr_nested_ipi),
|
||||||
|
};
|
||||||
|
|
||||||
|
static noinstr void fred_extint(struct pt_regs *regs)
|
||||||
|
{
|
||||||
|
unsigned int vector = regs->fred_ss.vector;
|
||||||
|
unsigned int index = array_index_nospec(vector - FIRST_SYSTEM_VECTOR,
|
||||||
|
NR_SYSTEM_VECTORS);
|
||||||
|
|
||||||
|
if (WARN_ON_ONCE(vector < FIRST_EXTERNAL_VECTOR))
|
||||||
|
return;
|
||||||
|
|
||||||
|
if (likely(vector >= FIRST_SYSTEM_VECTOR)) {
|
||||||
|
irqentry_state_t state = irqentry_enter(regs);
|
||||||
|
|
||||||
|
instrumentation_begin();
|
||||||
|
sysvec_table[index](regs);
|
||||||
|
instrumentation_end();
|
||||||
|
irqentry_exit(regs, state);
|
||||||
|
} else {
|
||||||
|
common_interrupt(regs, vector);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
static noinstr void fred_hwexc(struct pt_regs *regs, unsigned long error_code)
|
||||||
|
{
|
||||||
|
/* Optimize for #PF. That's the only exception which matters performance wise */
|
||||||
|
if (likely(regs->fred_ss.vector == X86_TRAP_PF))
|
||||||
|
return exc_page_fault(regs, error_code);
|
||||||
|
|
||||||
|
switch (regs->fred_ss.vector) {
|
||||||
|
case X86_TRAP_DE: return exc_divide_error(regs);
|
||||||
|
case X86_TRAP_DB: return fred_exc_debug(regs);
|
||||||
|
case X86_TRAP_BR: return exc_bounds(regs);
|
||||||
|
case X86_TRAP_UD: return exc_invalid_op(regs);
|
||||||
|
case X86_TRAP_NM: return exc_device_not_available(regs);
|
||||||
|
case X86_TRAP_DF: return exc_double_fault(regs, error_code);
|
||||||
|
case X86_TRAP_TS: return exc_invalid_tss(regs, error_code);
|
||||||
|
case X86_TRAP_NP: return exc_segment_not_present(regs, error_code);
|
||||||
|
case X86_TRAP_SS: return exc_stack_segment(regs, error_code);
|
||||||
|
case X86_TRAP_GP: return exc_general_protection(regs, error_code);
|
||||||
|
case X86_TRAP_MF: return exc_coprocessor_error(regs);
|
||||||
|
case X86_TRAP_AC: return exc_alignment_check(regs, error_code);
|
||||||
|
case X86_TRAP_XF: return exc_simd_coprocessor_error(regs);
|
||||||
|
|
||||||
|
#ifdef CONFIG_X86_MCE
|
||||||
|
case X86_TRAP_MC: return fred_exc_machine_check(regs);
|
||||||
|
#endif
|
||||||
|
#ifdef CONFIG_INTEL_TDX_GUEST
|
||||||
|
case X86_TRAP_VE: return exc_virtualization_exception(regs);
|
||||||
|
#endif
|
||||||
|
#ifdef CONFIG_X86_CET
|
||||||
|
case X86_TRAP_CP: return exc_control_protection(regs, error_code);
|
||||||
|
#endif
|
||||||
|
default: return fred_bad_type(regs, error_code);
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
static noinstr void fred_swexc(struct pt_regs *regs, unsigned long error_code)
|
||||||
|
{
|
||||||
|
switch (regs->fred_ss.vector) {
|
||||||
|
case X86_TRAP_BP: return exc_int3(regs);
|
||||||
|
case X86_TRAP_OF: return exc_overflow(regs);
|
||||||
|
default: return fred_bad_type(regs, error_code);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
__visible noinstr void fred_entry_from_user(struct pt_regs *regs)
|
||||||
|
{
|
||||||
|
unsigned long error_code = regs->orig_ax;
|
||||||
|
|
||||||
|
/* Invalidate orig_ax so that syscall_get_nr() works correctly */
|
||||||
|
regs->orig_ax = -1;
|
||||||
|
|
||||||
|
switch (regs->fred_ss.type) {
|
||||||
|
case EVENT_TYPE_EXTINT:
|
||||||
|
return fred_extint(regs);
|
||||||
|
case EVENT_TYPE_NMI:
|
||||||
|
if (likely(regs->fred_ss.vector == X86_TRAP_NMI))
|
||||||
|
return fred_exc_nmi(regs);
|
||||||
|
break;
|
||||||
|
case EVENT_TYPE_HWEXC:
|
||||||
|
return fred_hwexc(regs, error_code);
|
||||||
|
case EVENT_TYPE_SWINT:
|
||||||
|
return fred_intx(regs);
|
||||||
|
case EVENT_TYPE_PRIV_SWEXC:
|
||||||
|
if (likely(regs->fred_ss.vector == X86_TRAP_DB))
|
||||||
|
return fred_exc_debug(regs);
|
||||||
|
break;
|
||||||
|
case EVENT_TYPE_SWEXC:
|
||||||
|
return fred_swexc(regs, error_code);
|
||||||
|
case EVENT_TYPE_OTHER:
|
||||||
|
return fred_other(regs);
|
||||||
|
default: break;
|
||||||
|
}
|
||||||
|
|
||||||
|
return fred_bad_type(regs, error_code);
|
||||||
|
}
|
||||||
|
|
||||||
|
__visible noinstr void fred_entry_from_kernel(struct pt_regs *regs)
|
||||||
|
{
|
||||||
|
unsigned long error_code = regs->orig_ax;
|
||||||
|
|
||||||
|
/* Invalidate orig_ax so that syscall_get_nr() works correctly */
|
||||||
|
regs->orig_ax = -1;
|
||||||
|
|
||||||
|
switch (regs->fred_ss.type) {
|
||||||
|
case EVENT_TYPE_EXTINT:
|
||||||
|
return fred_extint(regs);
|
||||||
|
case EVENT_TYPE_NMI:
|
||||||
|
if (likely(regs->fred_ss.vector == X86_TRAP_NMI))
|
||||||
|
return fred_exc_nmi(regs);
|
||||||
|
break;
|
||||||
|
case EVENT_TYPE_HWEXC:
|
||||||
|
return fred_hwexc(regs, error_code);
|
||||||
|
case EVENT_TYPE_PRIV_SWEXC:
|
||||||
|
if (likely(regs->fred_ss.vector == X86_TRAP_DB))
|
||||||
|
return fred_exc_debug(regs);
|
||||||
|
break;
|
||||||
|
case EVENT_TYPE_SWEXC:
|
||||||
|
return fred_swexc(regs, error_code);
|
||||||
|
default: break;
|
||||||
|
}
|
||||||
|
|
||||||
|
return fred_bad_type(regs, error_code);
|
||||||
|
}
|
@ -12,6 +12,7 @@
|
|||||||
#include <asm/special_insns.h>
|
#include <asm/special_insns.h>
|
||||||
#include <asm/preempt.h>
|
#include <asm/preempt.h>
|
||||||
#include <asm/asm.h>
|
#include <asm/asm.h>
|
||||||
|
#include <asm/fred.h>
|
||||||
#include <asm/gsseg.h>
|
#include <asm/gsseg.h>
|
||||||
|
|
||||||
#ifndef CONFIG_X86_CMPXCHG64
|
#ifndef CONFIG_X86_CMPXCHG64
|
||||||
|
@ -60,6 +60,12 @@ static __always_inline unsigned long fred_event_data(struct pt_regs *regs)
|
|||||||
return fred_info(regs)->edata;
|
return fred_info(regs)->edata;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void asm_fred_entrypoint_user(void);
|
||||||
|
void asm_fred_entrypoint_kernel(void);
|
||||||
|
|
||||||
|
__visible void fred_entry_from_user(struct pt_regs *regs);
|
||||||
|
__visible void fred_entry_from_kernel(struct pt_regs *regs);
|
||||||
|
|
||||||
#else /* CONFIG_X86_FRED */
|
#else /* CONFIG_X86_FRED */
|
||||||
static __always_inline unsigned long fred_event_data(struct pt_regs *regs) { return 0; }
|
static __always_inline unsigned long fred_event_data(struct pt_regs *regs) { return 0; }
|
||||||
#endif /* CONFIG_X86_FRED */
|
#endif /* CONFIG_X86_FRED */
|
||||||
|
@ -69,7 +69,7 @@ extern void ia32_pick_mmap_layout(struct mm_struct *mm);
|
|||||||
|
|
||||||
extern bool __ia32_enabled;
|
extern bool __ia32_enabled;
|
||||||
|
|
||||||
static inline bool ia32_enabled(void)
|
static __always_inline bool ia32_enabled(void)
|
||||||
{
|
{
|
||||||
return __ia32_enabled;
|
return __ia32_enabled;
|
||||||
}
|
}
|
||||||
@ -81,7 +81,7 @@ static inline void ia32_disable(void)
|
|||||||
|
|
||||||
#else /* !CONFIG_IA32_EMULATION */
|
#else /* !CONFIG_IA32_EMULATION */
|
||||||
|
|
||||||
static inline bool ia32_enabled(void)
|
static __always_inline bool ia32_enabled(void)
|
||||||
{
|
{
|
||||||
return IS_ENABLED(CONFIG_X86_32);
|
return IS_ENABLED(CONFIG_X86_32);
|
||||||
}
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user