2019-06-04 10:11:33 +02:00
// SPDX-License-Identifier: GPL-2.0-only
2005-04-16 15:20:36 -07:00
/*
* linux/arch/arm/kernel/process.c
*
* Copyright (C) 1996-2000 Russell King - Converted to ARM.
* Original Copyright (C) 1995 Linus Torvalds
*/
# include <stdarg.h>
2011-07-22 10:58:34 -04:00
# include <linux/export.h>
2005-04-16 15:20:36 -07:00
# include <linux/sched.h>
2017-02-08 18:51:35 +01:00
# include <linux/sched/debug.h>
2017-02-08 18:51:36 +01:00
# include <linux/sched/task.h>
2017-02-08 18:51:37 +01:00
# include <linux/sched/task_stack.h>
2005-04-16 15:20:36 -07:00
# include <linux/kernel.h>
# include <linux/mm.h>
# include <linux/stddef.h>
# include <linux/unistd.h>
# include <linux/user.h>
# include <linux/interrupt.h>
# include <linux/init.h>
2006-03-15 23:17:23 +00:00
# include <linux/elfcore.h>
2006-06-19 19:57:12 +01:00
# include <linux/pm.h>
2007-03-14 17:33:24 +01:00
# include <linux/tick.h>
2007-06-18 14:59:45 +01:00
# include <linux/utsname.h>
2008-09-06 11:35:55 +01:00
# include <linux/uaccess.h>
2010-06-14 16:27:19 -04:00
# include <linux/random.h>
2010-09-03 10:42:55 +01:00
# include <linux/hw_breakpoint.h>
2012-03-14 02:26:56 +08:00
# include <linux/leds.h>
2005-04-16 15:20:36 -07:00
# include <asm/processor.h>
2006-06-21 13:31:52 +01:00
# include <asm/thread_notify.h>
2009-02-11 13:07:53 +01:00
# include <asm/stacktrace.h>
2014-04-06 16:17:39 +01:00
# include <asm/system_misc.h>
2005-06-27 14:04:05 +01:00
# include <asm/mach/time.h>
2013-06-18 23:23:26 +01:00
# include <asm/tls.h>
2015-04-01 17:02:45 +01:00
# include <asm/vdso.h>
2005-04-16 15:20:36 -07:00
2019-10-11 13:53:32 +01:00
# include "signal.h"
2018-12-06 09:32:57 +01:00
# if defined(CONFIG_STACKPROTECTOR) && !defined(CONFIG_STACKPROTECTOR_PER_TASK)
2010-05-24 23:55:42 -04:00
# include <linux/stackprotector.h>
/*
 * Global stack-protector guard word. Only built when CONFIG_STACKPROTECTOR
 * is enabled without CONFIG_STACKPROTECTOR_PER_TASK (see the enclosing #if),
 * and exported via EXPORT_SYMBOL.
 */
unsigned long __stack_chk_guard __read_mostly ;
EXPORT_SYMBOL ( __stack_chk_guard ) ;
# endif
2013-12-16 10:38:57 +01:00
/*
 * Printable processor mode names, looked up by __show_regs() with
 * processor_mode(regs) as the index. 32 entries: sixteen *_26 names
 * followed by sixteen *_32 names.
 *
 * NOTE(review): every literal carries a leading and trailing space, which
 * looks like an extraction artifact - confirm the intended spelling.
 */
static const char * processor_modes [ ] __maybe_unused = {
2007-01-09 12:57:37 +00:00
" USER_26 " , " FIQ_26 " , " IRQ_26 " , " SVC_26 " , " UK4_26 " , " UK5_26 " , " UK6_26 " , " UK7_26 " ,
" UK8_26 " , " UK9_26 " , " UK10_26 " , " UK11_26 " , " UK12_26 " , " UK13_26 " , " UK14_26 " , " UK15_26 " ,
2014-12-01 19:45:19 +01:00
" USER_32 " , " FIQ_32 " , " IRQ_32 " , " SVC_32 " , " UK4_32 " , " UK5_32 " , " MON_32 " , " ABT_32 " ,
" UK8_32 " , " UK9_32 " , " HYP_32 " , " UND_32 " , " UK12_32 " , " UK13_32 " , " UK14_32 " , " SYS_32 "
2007-01-09 12:57:37 +00:00
} ;
2013-12-16 10:38:57 +01:00
/*
 * Printable instruction-set names, looked up by __show_regs() with
 * isa_mode(regs) as the index (four entries).
 *
 * NOTE(review): the literals carry a leading and trailing space, which
 * looks like an extraction artifact - confirm the intended spelling.
 */
static const char * isa_modes [ ] __maybe_unused = {
2007-06-26 01:38:27 +01:00
" ARM " , " Thumb " , " Jazelle " , " ThumbEE "
} ;
2005-04-16 15:20:36 -07:00
/*
 * Optional idle handler hook. When it is non-NULL, arch_cpu_idle() calls
 * it instead of the default cpu_do_idle().
 */
2011-08-01 17:25:06 -04:00
void ( * arm_pm_idle ) ( void ) ;
2014-01-29 12:45:09 -05:00
/*
* Called from the core idle loop .
*/
void arch_cpu_idle ( void )
2005-04-16 15:20:36 -07:00
{
2011-08-01 17:25:06 -04:00
if ( arm_pm_idle )
arm_pm_idle ( ) ;
else
2011-12-19 03:03:58 -05:00
cpu_do_idle ( ) ;
2009-06-22 22:34:55 +01:00
local_irq_enable ( ) ;
2005-04-16 15:20:36 -07:00
}
2013-03-21 22:49:38 +01:00
/* Idle-preparation hook: the only work done here is local_fiq_enable(). */
void arch_cpu_idle_prepare(void)
{
	local_fiq_enable();
}
2005-04-16 15:20:36 -07:00
2013-03-21 22:49:38 +01:00
/*
 * Idle-entry hook: reports CPU_LED_IDLE_START to the CPU LED trigger and,
 * when built with CONFIG_PL310_ERRATA_769419, issues a write barrier.
 */
void arch_cpu_idle_enter(void)
{
	ledtrig_cpu(CPU_LED_IDLE_START);

#ifdef CONFIG_PL310_ERRATA_769419
	wmb();
#endif
}
2005-11-02 22:24:33 +00:00
2013-03-21 22:49:38 +01:00
/* Idle-exit hook: reports CPU_LED_IDLE_END to the CPU LED trigger. */
void arch_cpu_idle_exit(void)
{
	ledtrig_cpu(CPU_LED_IDLE_END);
}
2005-04-17 15:50:36 +01:00
void __show_regs ( struct pt_regs * regs )
2005-04-16 15:20:36 -07:00
{
2007-06-18 14:59:45 +01:00
unsigned long flags ;
char buf [ 64 ] ;
2015-12-03 14:34:45 +00:00
# ifndef CONFIG_CPU_V7M
2016-05-13 11:40:20 +01:00
unsigned int domain , fs ;
2015-12-03 14:34:45 +00:00
# ifdef CONFIG_CPU_SW_DOMAIN_PAN
/*
* Get the domain register for the parent context . In user
* mode , we don ' t save the DACR , so lets use what it should
* be . For other modes , we place it after the pt_regs struct .
*/
2016-05-13 11:40:20 +01:00
if ( user_mode ( regs ) ) {
2015-12-03 14:34:45 +00:00
domain = DACR_UACCESS_ENABLE ;
2016-05-13 11:40:20 +01:00
fs = get_fs ( ) ;
} else {
2016-05-13 10:26:10 +01:00
domain = to_svc_pt_regs ( regs ) - > dacr ;
2016-05-13 11:40:20 +01:00
fs = to_svc_pt_regs ( regs ) - > addr_limit ;
}
2015-12-03 14:34:45 +00:00
# else
domain = get_domain ( ) ;
2016-05-13 11:40:20 +01:00
fs = get_fs ( ) ;
2015-12-03 14:34:45 +00:00
# endif
# endif
2005-04-16 15:20:36 -07:00
dump_stack: unify debug information printed by show_regs()
show_regs() is inherently arch-dependent but it does make sense to print
generic debug information and some archs already do albeit in slightly
different forms. This patch introduces a generic function to print debug
information from show_regs() so that different archs print out the same
information and it's much easier to modify what's printed.
show_regs_print_info() prints out the same debug info as dump_stack()
does plus task and thread_info pointers.
* Archs which didn't print debug info now do.
alpha, arc, blackfin, c6x, cris, frv, h8300, hexagon, ia64, m32r,
metag, microblaze, mn10300, openrisc, parisc, score, sh64, sparc,
um, xtensa
* Already prints debug info. Replaced with show_regs_print_info().
The printed information is superset of what used to be there.
arm, arm64, avr32, mips, powerpc, sh32, tile, unicore32, x86
* s390 is special in that it used to print arch-specific information
along with generic debug info. Heiko and Martin think that the
arch-specific extra isn't worth keeping s390 specfic implementation.
Converted to use the generic version.
Note that now all archs print the debug info before actual register
dumps.
An example BUG() dump follows.
kernel BUG at /work/os/work/kernel/workqueue.c:4841!
invalid opcode: 0000 [#1] PREEMPT SMP DEBUG_PAGEALLOC
Modules linked in:
CPU: 0 PID: 1 Comm: swapper/0 Not tainted 3.9.0-rc1-work+ #7
Hardware name: empty empty/S3992, BIOS 080011 10/26/2007
task: ffff88007c85e040 ti: ffff88007c860000 task.ti: ffff88007c860000
RIP: 0010:[<ffffffff8234a07e>] [<ffffffff8234a07e>] init_workqueues+0x4/0x6
RSP: 0000:ffff88007c861ec8 EFLAGS: 00010246
RAX: ffff88007c861fd8 RBX: ffffffff824466a8 RCX: 0000000000000001
RDX: 0000000000000046 RSI: 0000000000000001 RDI: ffffffff8234a07a
RBP: ffff88007c861ec8 R08: 0000000000000000 R09: 0000000000000000
R10: 0000000000000001 R11: 0000000000000000 R12: ffffffff8234a07a
R13: 0000000000000000 R14: 0000000000000000 R15: 0000000000000000
FS: 0000000000000000(0000) GS:ffff88007dc00000(0000) knlGS:0000000000000000
CS: 0010 DS: 0000 ES: 0000 CR0: 000000008005003b
CR2: ffff88015f7ff000 CR3: 00000000021f1000 CR4: 00000000000007f0
DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400
Stack:
ffff88007c861ef8 ffffffff81000312 ffffffff824466a8 ffff88007c85e650
0000000000000003 0000000000000000 ffff88007c861f38 ffffffff82335e5d
ffff88007c862080 ffffffff8223d8c0 ffff88007c862080 ffffffff81c47760
Call Trace:
[<ffffffff81000312>] do_one_initcall+0x122/0x170
[<ffffffff82335e5d>] kernel_init_freeable+0x9b/0x1c8
[<ffffffff81c47760>] ? rest_init+0x140/0x140
[<ffffffff81c4776e>] kernel_init+0xe/0xf0
[<ffffffff81c6be9c>] ret_from_fork+0x7c/0xb0
[<ffffffff81c47760>] ? rest_init+0x140/0x140
...
v2: Typo fix in x86-32.
v3: CPU number dropped from show_regs_print_info() as
dump_stack_print_info() has been updated to print it. s390
specific implementation dropped as requested by s390 maintainers.
Signed-off-by: Tejun Heo <tj@kernel.org>
Acked-by: David S. Miller <davem@davemloft.net>
Acked-by: Jesper Nilsson <jesper.nilsson@axis.com>
Cc: Heiko Carstens <heiko.carstens@de.ibm.com>
Cc: Martin Schwidefsky <schwidefsky@de.ibm.com>
Cc: Bjorn Helgaas <bhelgaas@google.com>
Cc: Fengguang Wu <fengguang.wu@intel.com>
Cc: Mike Frysinger <vapier@gentoo.org>
Cc: Vineet Gupta <vgupta@synopsys.com>
Cc: Sam Ravnborg <sam@ravnborg.org>
Acked-by: Chris Metcalf <cmetcalf@tilera.com> [tile bits]
Acked-by: Richard Kuo <rkuo@codeaurora.org> [hexagon bits]
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2013-04-30 15:27:17 -07:00
show_regs_print_info ( KERN_DEFAULT ) ;
2017-12-11 21:50:13 +09:00
printk ( " PC is at %pS \n " , ( void * ) instruction_pointer ( regs ) ) ;
printk ( " LR is at %pS \n " , ( void * ) regs - > ARM_lr ) ;
2017-05-04 09:17:55 +01:00
printk ( " pc : [<%08lx>] lr : [<%08lx>] psr: %08lx \n " ,
regs - > ARM_pc , regs - > ARM_lr , regs - > ARM_cpsr ) ;
printk ( " sp : %08lx ip : %08lx fp : %08lx \n " ,
regs - > ARM_sp , regs - > ARM_ip , regs - > ARM_fp ) ;
2005-04-16 15:20:36 -07:00
printk ( " r10: %08lx r9 : %08lx r8 : %08lx \n " ,
regs - > ARM_r10 , regs - > ARM_r9 ,
regs - > ARM_r8 ) ;
printk ( " r7 : %08lx r6 : %08lx r5 : %08lx r4 : %08lx \n " ,
regs - > ARM_r7 , regs - > ARM_r6 ,
regs - > ARM_r5 , regs - > ARM_r4 ) ;
printk ( " r3 : %08lx r2 : %08lx r1 : %08lx r0 : %08lx \n " ,
regs - > ARM_r3 , regs - > ARM_r2 ,
regs - > ARM_r1 , regs - > ARM_r0 ) ;
2007-06-18 14:59:45 +01:00
flags = regs - > ARM_cpsr ;
buf [ 0 ] = flags & PSR_N_BIT ? ' N ' : ' n ' ;
buf [ 1 ] = flags & PSR_Z_BIT ? ' Z ' : ' z ' ;
buf [ 2 ] = flags & PSR_C_BIT ? ' C ' : ' c ' ;
buf [ 3 ] = flags & PSR_V_BIT ? ' V ' : ' v ' ;
buf [ 4 ] = ' \0 ' ;
2013-12-16 10:38:57 +01:00
# ifndef CONFIG_CPU_V7M
2015-08-19 20:40:41 +01:00
{
const char * segment ;
if ( ( domain & domain_mask ( DOMAIN_USER ) ) = =
domain_val ( DOMAIN_USER , DOMAIN_NOACCESS ) )
segment = " none " ;
2019-03-04 10:39:05 -08:00
else if ( fs = = KERNEL_DS )
2015-08-19 20:40:41 +01:00
segment = " kernel " ;
else
segment = " user " ;
printk ( " Flags: %s IRQs o%s FIQs o%s Mode %s ISA %s Segment %s \n " ,
buf , interrupts_enabled ( regs ) ? " n " : " ff " ,
fast_interrupts_enabled ( regs ) ? " n " : " ff " ,
processor_modes [ processor_mode ( regs ) ] ,
isa_modes [ isa_mode ( regs ) ] , segment ) ;
}
2013-12-16 10:38:57 +01:00
# else
printk ( " xPSR: %08lx \n " , regs - > ARM_cpsr ) ;
# endif
2007-06-18 14:59:45 +01:00
# ifdef CONFIG_CPU_CP15
2005-04-16 15:20:36 -07:00
{
2006-09-26 17:36:37 +09:00
unsigned int ctrl ;
2007-06-18 14:59:45 +01:00
buf [ 0 ] = ' \0 ' ;
2006-09-26 17:36:37 +09:00
# ifdef CONFIG_CPU_CP15_MMU
2007-06-18 14:59:45 +01:00
{
2015-12-03 14:34:45 +00:00
unsigned int transbase ;
2007-06-18 14:59:45 +01:00
asm ( " mrc p15, 0, %0, c2, c0 \n \t "
2015-08-19 21:23:48 +01:00
: " =r " ( transbase ) ) ;
2007-06-18 14:59:45 +01:00
snprintf ( buf , sizeof ( buf ) , " Table: %08x DAC: %08x " ,
2015-12-03 14:34:45 +00:00
transbase , domain ) ;
2007-06-18 14:59:45 +01:00
}
2006-09-26 17:36:37 +09:00
# endif
2007-06-18 14:59:45 +01:00
asm ( " mrc p15, 0, %0, c1, c0 \n " : " =r " ( ctrl ) ) ;
printk ( " Control: %08x%s \n " , ctrl , buf ) ;
}
2006-09-26 17:36:37 +09:00
# endif
2005-04-16 15:20:36 -07:00
}
2005-04-17 15:50:36 +01:00
/* Print the registers in @regs via __show_regs(), then a stack dump. */
void show_regs(struct pt_regs *regs)
{
	__show_regs(regs);

	dump_stack();
}
2009-12-18 14:34:43 +00:00
/*
 * Atomic notifier chain head for thread events; the thread_notify() calls
 * in this file pass THREAD_NOTIFY_EXIT, THREAD_NOTIFY_FLUSH and
 * THREAD_NOTIFY_COPY. Exported GPL-only.
 */
ATOMIC_NOTIFIER_HEAD ( thread_notify_head ) ;
EXPORT_SYMBOL_GPL ( thread_notify_head ) ;
2005-04-16 15:20:36 -07:00
/*
* Free current thread data structures etc . .
*/
2016-05-20 17:00:20 -07:00
void exit_thread ( struct task_struct * tsk )
2005-04-16 15:20:36 -07:00
{
2016-05-20 17:00:20 -07:00
thread_notify ( THREAD_NOTIFY_EXIT , task_thread_info ( tsk ) ) ;
2005-04-16 15:20:36 -07:00
}
void flush_thread ( void )
{
struct thread_info * thread = current_thread_info ( ) ;
struct task_struct * tsk = current ;
2010-09-03 10:42:55 +01:00
flush_ptrace_hw_breakpoint ( tsk ) ;
2005-04-16 15:20:36 -07:00
memset ( thread - > used_cp , 0 , sizeof ( thread - > used_cp ) ) ;
memset ( & tsk - > thread . debug , 0 , sizeof ( struct debug_info ) ) ;
2006-06-21 13:31:52 +01:00
memset ( & thread - > fpstate , 0 , sizeof ( union fp_state ) ) ;
2014-09-11 02:49:08 +01:00
flush_tls ( ) ;
2006-06-21 13:31:52 +01:00
thread_notify ( THREAD_NOTIFY_FLUSH , thread ) ;
2005-04-16 15:20:36 -07:00
}
/* Intentionally empty: nothing is done for @dead_task here. */
void release_thread(struct task_struct *dead_task)
{
}
/*
 * Code address that copy_thread() installs as the saved pc of a new
 * thread. The asm label binds the C name to the assembler symbol of the
 * same name, so the label must match that symbol exactly.
 */
asmlinkage void ret_from_fork(void) __asm__("ret_from_fork");
2020-06-11 11:04:15 +02:00
int copy_thread ( unsigned long clone_flags , unsigned long stack_start ,
unsigned long stk_sz , struct task_struct * p , unsigned long tls )
2005-04-16 15:20:36 -07:00
{
2006-01-12 01:05:57 -08:00
struct thread_info * thread = task_thread_info ( p ) ;
struct pt_regs * childregs = task_pt_regs ( p ) ;
2005-04-16 15:20:36 -07:00
memset ( & thread - > cpu_context , 0 , sizeof ( struct cpu_context_save ) ) ;
2012-09-09 21:31:07 -04:00
2015-09-09 21:19:49 +01:00
# ifdef CONFIG_CPU_USE_DOMAINS
2015-08-19 21:23:48 +01:00
/*
* Copy the initial value of the domain access control register
* from the current thread : thread - > addr_limit will have been
* copied from the current thread via setup_thread_stack ( ) in
* kernel / fork . c
*/
thread - > cpu_domain = get_domain ( ) ;
2015-09-09 21:19:49 +01:00
# endif
2015-08-19 21:23:48 +01:00
2012-10-21 15:54:27 -04:00
if ( likely ( ! ( p - > flags & PF_KTHREAD ) ) ) {
* childregs = * current_pt_regs ( ) ;
2012-09-09 21:31:07 -04:00
childregs - > ARM_r0 = 0 ;
2012-10-21 15:54:27 -04:00
if ( stack_start )
childregs - > ARM_sp = stack_start ;
2012-09-09 21:31:07 -04:00
} else {
2012-10-10 22:23:29 -04:00
memset ( childregs , 0 , sizeof ( struct pt_regs ) ) ;
2012-09-09 21:31:07 -04:00
thread - > cpu_context . r4 = stk_sz ;
thread - > cpu_context . r5 = stack_start ;
childregs - > ARM_cpsr = SVC_MODE ;
}
2012-10-10 22:23:29 -04:00
thread - > cpu_context . pc = ( unsigned long ) ret_from_fork ;
2005-04-16 15:20:36 -07:00
thread - > cpu_context . sp = ( unsigned long ) childregs ;
2010-09-03 10:42:55 +01:00
clear_ptrace_hw_breakpoint ( p ) ;
2005-04-16 15:20:36 -07:00
if ( clone_flags & CLONE_SETTLS )
2020-01-02 18:24:09 +01:00
thread - > tp_value [ 0 ] = tls ;
2013-06-18 23:23:26 +01:00
thread - > tp_value [ 1 ] = get_tpuser ( ) ;
2005-04-16 15:20:36 -07:00
2011-04-06 16:16:29 +01:00
thread_notify ( THREAD_NOTIFY_COPY , thread ) ;
2018-12-06 09:32:57 +01:00
# ifdef CONFIG_STACKPROTECTOR_PER_TASK
thread - > stack_canary = p - > stack_canary ;
# endif
2005-04-16 15:20:36 -07:00
return 0 ;
}
2009-10-13 08:54:30 +01:00
/*
 * Fill @elfregs with the saved user registers of task @t for a core dump.
 * Always returns 1.
 */
int dump_task_regs(struct task_struct *t, elf_gregset_t *elfregs)
{
	struct pt_regs *regs = task_pt_regs(t);

	elf_core_copy_regs(elfregs, regs);

	return 1;
}
2005-04-16 15:20:36 -07:00
unsigned long get_wchan ( struct task_struct * p )
{
2009-02-11 13:07:53 +01:00
struct stackframe frame ;
2013-12-05 14:21:36 +01:00
unsigned long stack_page ;
2005-04-16 15:20:36 -07:00
int count = 0 ;
if ( ! p | | p = = current | | p - > state = = TASK_RUNNING )
return 0 ;
2009-02-11 13:07:53 +01:00
frame . fp = thread_saved_fp ( p ) ;
frame . sp = thread_saved_sp ( p ) ;
frame . lr = 0 ; /* recovered from the stack */
frame . pc = thread_saved_pc ( p ) ;
2013-12-05 14:21:36 +01:00
stack_page = ( unsigned long ) task_stack_page ( p ) ;
2005-04-16 15:20:36 -07:00
do {
2013-12-05 14:21:36 +01:00
if ( frame . sp < stack_page | |
frame . sp > = stack_page + THREAD_SIZE | |
unwind_frame ( & frame ) < 0 )
2005-04-16 15:20:36 -07:00
return 0 ;
2009-02-11 13:07:53 +01:00
if ( ! in_sched_functions ( frame . pc ) )
return frame . pc ;
2005-04-16 15:20:36 -07:00
} while ( count + + < 16 ) ;
return 0 ;
}
2010-06-14 16:27:19 -04:00
2011-01-11 14:04:36 +01:00
# ifdef CONFIG_MMU
2013-07-31 21:58:56 +01:00
# ifdef CONFIG_KUSER_HELPERS
2010-08-26 23:10:50 -04:00
/*
 * The vectors page is always readable from user space for the
 * atomic helpers. Insert it into the gate_vma so that it is visible
 * through ptrace and /proc/<pid>/mem.
 */
2018-08-21 21:53:06 -07:00
static struct vm_area_struct gate_vma ;
2010-08-26 23:10:50 -04:00
2012-01-20 12:01:13 +01:00
/*
 * Initialise gate_vma as one page starting at 0xffff0000, readable and
 * executable (VM_READ | VM_EXEC | VM_MAYREAD | VM_MAYEXEC) with
 * PAGE_READONLY_EXEC protection. Registered as an arch initcall;
 * always returns 0.
 */
static int __init gate_vma_init(void)
{
	struct vm_area_struct *gate = &gate_vma;

	vma_init(gate, NULL);

	gate->vm_start = 0xffff0000;
	gate->vm_end = 0xffff0000 + PAGE_SIZE;
	gate->vm_flags = VM_READ | VM_EXEC | VM_MAYREAD | VM_MAYEXEC;
	gate->vm_page_prot = PAGE_READONLY_EXEC;

	return 0;
}
arch_initcall(gate_vma_init);
struct vm_area_struct * get_gate_vma ( struct mm_struct * mm )
{
return & gate_vma ;
}
/*
 * Return non-zero when @addr lies in [gate_vma.vm_start, gate_vma.vm_end),
 * zero otherwise. @mm is not consulted.
 */
int in_gate_area(struct mm_struct *mm, unsigned long addr)
{
	if (addr < gate_vma.vm_start)
		return 0;

	return addr < gate_vma.vm_end;
}
/* Same check as in_gate_area(), for callers that have no mm to pass. */
int in_gate_area_no_mm(unsigned long addr)
{
	struct mm_struct *no_mm = NULL;

	return in_gate_area(no_mm, addr);
}
2013-08-06 09:49:14 +01:00
/* True when @vma is the statically allocated gate_vma. */
# define is_gate_vma(vma) ((vma) == &gate_vma)
2013-07-31 21:58:56 +01:00
# else
/* Without CONFIG_KUSER_HELPERS there is no gate_vma, so never true. */
# define is_gate_vma(vma) 0
# endif
2010-08-26 23:10:50 -04:00
const char * arch_vma_name ( struct vm_area_struct * vma )
{
2014-09-22 22:08:42 +01:00
return is_gate_vma ( vma ) ? " [vectors] " : NULL ;
2013-07-24 00:29:18 +01:00
}
2014-09-22 22:12:35 +01:00
/* If possible, provide a placement hint at a random offset from the
ARM: 8331/1: VDSO initialization, mapping, and synchronization
Initialize the VDSO page list at boot, install the VDSO mapping at
exec time, and update the data page during timer ticks. This code is
not built if CONFIG_VDSO is not enabled.
Account for the VDSO length when randomizing the offset from the
stack. The [vdso] and [vvar] pages are placed immediately following
the sigpage with separate _install_special_mapping calls.
We want to "penalize" systems lacking the arch timer as little
as possible. Previous versions of this code installed the VDSO
unconditionally and unmodified, making it a measurably slower way for
glibc to invoke the real syscalls on such systems. E.g. calling
gettimeofday via glibc goes from ~560ns to ~630ns on i.MX6Q.
If we can indicate to glibc that the time-related APIs in the VDSO are
not accelerated, glibc can continue to invoke the syscalls directly
instead of dispatching through the VDSO only to fall back to the slow
path.
Thus, if the architected timer is unusable for whatever reason, patch
the VDSO at boot time so that symbol lookups for gettimeofday and
clock_gettime return NULL. (This is similar to what powerpc does and
borrows code from there.) This allows glibc to perform the syscall
directly instead of passing control to the VDSO, which minimizes the
penalty. In my measurements the time taken for a gettimeofday call
via glibc goes from ~560ns to ~580ns (again on i.MX6Q), and this is
solely due to adding a test and branch to glibc's gettimeofday syscall
wrapper.
An alternative to patching the VDSO at boot would be to not install
the VDSO at all when the arch timer isn't usable. Another alternative
is to include a separate "dummy" vdso.so without gettimeofday and
clock_gettime, which would be selected at boot time. Either of these
would get cumbersome if the VDSO were to gain support for an API such
as getcpu which is unrelated to arch timer support.
Signed-off-by: Nathan Lynch <nathan_lynch@mentor.com>
Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk>
2015-03-25 19:15:08 +01:00
* stack for the sigpage and vdso pages .
2014-09-22 22:12:35 +01:00
*/
static unsigned long sigpage_addr ( const struct mm_struct * mm ,
unsigned int npages )
{
unsigned long offset ;
unsigned long first ;
unsigned long last ;
unsigned long addr ;
unsigned int slots ;
first = PAGE_ALIGN ( mm - > start_stack ) ;
last = TASK_SIZE - ( npages < < PAGE_SHIFT ) ;
/* No room after stack? */
if ( first > last )
return 0 ;
/* Just enough room? */
if ( first = = last )
return first ;
slots = ( ( last - first ) > > PAGE_SHIFT ) + 1 ;
offset = get_random_int ( ) % slots ;
addr = first + ( offset < < PAGE_SHIFT ) ;
return addr ;
2013-07-24 00:29:18 +01:00
}
2013-08-03 10:30:05 +01:00
/*
 * Page backing the sigpage special mapping. Starts out NULL and is filled
 * in from get_signal_page() on first use by arch_setup_additional_pages().
 */
static struct page * signal_page ;
2013-07-24 00:29:18 +01:00
/*
 * Defined outside this file. The caller here treats a NULL return as an
 * out-of-memory failure.
 */
extern struct page * get_signal_page ( void ) ;
2017-06-19 17:32:42 +01:00
static int sigpage_mremap ( const struct vm_special_mapping * sm ,
struct vm_area_struct * new_vma )
{
current - > mm - > context . sigpage = new_vma - > vm_start ;
return 0 ;
}
2014-09-22 22:08:42 +01:00
/*
 * Special-mapping descriptor for the signal page: backed by signal_page,
 * with sigpage_mremap() as its mremap callback. Installed by
 * arch_setup_additional_pages().
 *
 * NOTE(review): the name literal carries a leading and trailing space,
 * which looks like an extraction artifact - confirm the intended name.
 */
static const struct vm_special_mapping sigpage_mapping = {
. name = " [sigpage] " ,
. pages = & signal_page ,
2017-06-19 17:32:42 +01:00
. mremap = sigpage_mremap ,
2014-09-22 22:08:42 +01:00
} ;
2013-07-24 00:29:18 +01:00
int arch_setup_additional_pages ( struct linux_binprm * bprm , int uses_interp )
{
struct mm_struct * mm = current - > mm ;
2014-09-22 22:08:42 +01:00
struct vm_area_struct * vma ;
ARM: 8331/1: VDSO initialization, mapping, and synchronization
Initialize the VDSO page list at boot, install the VDSO mapping at
exec time, and update the data page during timer ticks. This code is
not built if CONFIG_VDSO is not enabled.
Account for the VDSO length when randomizing the offset from the
stack. The [vdso] and [vvar] pages are placed immediately following
the sigpage with separate _install_special_mapping calls.
We want to "penalize" systems lacking the arch timer as little
as possible. Previous versions of this code installed the VDSO
unconditionally and unmodified, making it a measurably slower way for
glibc to invoke the real syscalls on such systems. E.g. calling
gettimeofday via glibc goes from ~560ns to ~630ns on i.MX6Q.
If we can indicate to glibc that the time-related APIs in the VDSO are
not accelerated, glibc can continue to invoke the syscalls directly
instead of dispatching through the VDSO only to fall back to the slow
path.
Thus, if the architected timer is unusable for whatever reason, patch
the VDSO at boot time so that symbol lookups for gettimeofday and
clock_gettime return NULL. (This is similar to what powerpc does and
borrows code from there.) This allows glibc to perform the syscall
directly instead of passing control to the VDSO, which minimizes the
penalty. In my measurements the time taken for a gettimeofday call
via glibc goes from ~560ns to ~580ns (again on i.MX6Q), and this is
solely due to adding a test and branch to glibc's gettimeofday syscall
wrapper.
An alternative to patching the VDSO at boot would be to not install
the VDSO at all when the arch timer isn't usable. Another alternative
is to include a separate "dummy" vdso.so without gettimeofday and
clock_gettime, which would be selected at boot time. Either of these
would get cumbersome if the VDSO were to gain support for an API such
as getcpu which is unrelated to arch timer support.
Signed-off-by: Nathan Lynch <nathan_lynch@mentor.com>
Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk>
2015-03-25 19:15:08 +01:00
unsigned long npages ;
2013-07-24 00:29:18 +01:00
unsigned long addr ;
2014-09-22 22:12:35 +01:00
unsigned long hint ;
2014-09-22 22:08:42 +01:00
int ret = 0 ;
2013-07-24 00:29:18 +01:00
2013-08-03 10:30:05 +01:00
if ( ! signal_page )
signal_page = get_signal_page ( ) ;
if ( ! signal_page )
2013-07-24 00:29:18 +01:00
return - ENOMEM ;
ARM: 8331/1: VDSO initialization, mapping, and synchronization
Initialize the VDSO page list at boot, install the VDSO mapping at
exec time, and update the data page during timer ticks. This code is
not built if CONFIG_VDSO is not enabled.
Account for the VDSO length when randomizing the offset from the
stack. The [vdso] and [vvar] pages are placed immediately following
the sigpage with separate _install_special_mapping calls.
We want to "penalize" systems lacking the arch timer as little
as possible. Previous versions of this code installed the VDSO
unconditionally and unmodified, making it a measurably slower way for
glibc to invoke the real syscalls on such systems. E.g. calling
gettimeofday via glibc goes from ~560ns to ~630ns on i.MX6Q.
If we can indicate to glibc that the time-related APIs in the VDSO are
not accelerated, glibc can continue to invoke the syscalls directly
instead of dispatching through the VDSO only to fall back to the slow
path.
Thus, if the architected timer is unusable for whatever reason, patch
the VDSO at boot time so that symbol lookups for gettimeofday and
clock_gettime return NULL. (This is similar to what powerpc does and
borrows code from there.) This allows glibc to perform the syscall
directly instead of passing control to the VDSO, which minimizes the
penalty. In my measurements the time taken for a gettimeofday call
via glibc goes from ~560ns to ~580ns (again on i.MX6Q), and this is
solely due to adding a test and branch to glibc's gettimeofday syscall
wrapper.
An alternative to patching the VDSO at boot would be to not install
the VDSO at all when the arch timer isn't usable. Another alternative
is to include a separate "dummy" vdso.so without gettimeofday and
clock_gettime, which would be selected at boot time. Either of these
would get cumbersome if the VDSO were to gain support for an API such
as getcpu which is unrelated to arch timer support.
Signed-off-by: Nathan Lynch <nathan_lynch@mentor.com>
Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk>
2015-03-25 19:15:08 +01:00
npages = 1 ; /* for sigpage */
npages + = vdso_total_pages ;
2020-06-08 21:33:25 -07:00
if ( mmap_write_lock_killable ( mm ) )
2016-05-23 16:25:54 -07:00
return - EINTR ;
ARM: 8331/1: VDSO initialization, mapping, and synchronization
Initialize the VDSO page list at boot, install the VDSO mapping at
exec time, and update the data page during timer ticks. This code is
not built if CONFIG_VDSO is not enabled.
Account for the VDSO length when randomizing the offset from the
stack. The [vdso] and [vvar] pages are placed immediately following
the sigpage with separate _install_special_mapping calls.
We want to "penalize" systems lacking the arch timer as little
as possible. Previous versions of this code installed the VDSO
unconditionally and unmodified, making it a measurably slower way for
glibc to invoke the real syscalls on such systems. E.g. calling
gettimeofday via glibc goes from ~560ns to ~630ns on i.MX6Q.
If we can indicate to glibc that the time-related APIs in the VDSO are
not accelerated, glibc can continue to invoke the syscalls directly
instead of dispatching through the VDSO only to fall back to the slow
path.
Thus, if the architected timer is unusable for whatever reason, patch
the VDSO at boot time so that symbol lookups for gettimeofday and
clock_gettime return NULL. (This is similar to what powerpc does and
borrows code from there.) This allows glibc to perform the syscall
directly instead of passing control to the VDSO, which minimizes the
penalty. In my measurements the time taken for a gettimeofday call
via glibc goes from ~560ns to ~580ns (again on i.MX6Q), and this is
solely due to adding a test and branch to glibc's gettimeofday syscall
wrapper.
An alternative to patching the VDSO at boot would be to not install
the VDSO at all when the arch timer isn't usable. Another alternative
is to include a separate "dummy" vdso.so without gettimeofday and
clock_gettime, which would be selected at boot time. Either of these
would get cumbersome if the VDSO were to gain support for an API such
as getcpu which is unrelated to arch timer support.
Signed-off-by: Nathan Lynch <nathan_lynch@mentor.com>
Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk>
2015-03-25 19:15:08 +01:00
hint = sigpage_addr ( mm , npages ) ;
addr = get_unmapped_area ( NULL , hint , npages < < PAGE_SHIFT , 0 , 0 ) ;
2013-07-24 00:29:18 +01:00
if ( IS_ERR_VALUE ( addr ) ) {
ret = addr ;
goto up_fail ;
}
2014-09-22 22:08:42 +01:00
vma = _install_special_mapping ( mm , addr , PAGE_SIZE ,
2013-07-24 00:29:18 +01:00
VM_READ | VM_EXEC | VM_MAYREAD | VM_MAYWRITE | VM_MAYEXEC ,
2014-09-22 22:08:42 +01:00
& sigpage_mapping ) ;
if ( IS_ERR ( vma ) ) {
ret = PTR_ERR ( vma ) ;
goto up_fail ;
}
2013-07-24 00:29:18 +01:00
2014-09-22 22:08:42 +01:00
mm - > context . sigpage = addr ;
2013-07-24 00:29:18 +01:00
ARM: 8331/1: VDSO initialization, mapping, and synchronization
Initialize the VDSO page list at boot, install the VDSO mapping at
exec time, and update the data page during timer ticks. This code is
not built if CONFIG_VDSO is not enabled.
Account for the VDSO length when randomizing the offset from the
stack. The [vdso] and [vvar] pages are placed immediately following
the sigpage with separate _install_special_mapping calls.
We want to "penalize" systems lacking the arch timer as little
as possible. Previous versions of this code installed the VDSO
unconditionally and unmodified, making it a measurably slower way for
glibc to invoke the real syscalls on such systems. E.g. calling
gettimeofday via glibc goes from ~560ns to ~630ns on i.MX6Q.
If we can indicate to glibc that the time-related APIs in the VDSO are
not accelerated, glibc can continue to invoke the syscalls directly
instead of dispatching through the VDSO only to fall back to the slow
path.
Thus, if the architected timer is unusable for whatever reason, patch
the VDSO at boot time so that symbol lookups for gettimeofday and
clock_gettime return NULL. (This is similar to what powerpc does and
borrows code from there.) This allows glibc to perform the syscall
directly instead of passing control to the VDSO, which minimizes the
penalty. In my measurements the time taken for a gettimeofday call
via glibc goes from ~560ns to ~580ns (again on i.MX6Q), and this is
solely due to adding a test and branch to glibc's gettimeofday syscall
wrapper.
An alternative to patching the VDSO at boot would be to not install
the VDSO at all when the arch timer isn't usable. Another alternative
is to include a separate "dummy" vdso.so without gettimeofday and
clock_gettime, which would be selected at boot time. Either of these
would get cumbersome if the VDSO were to gain support for an API such
as getcpu which is unrelated to arch timer support.
Signed-off-by: Nathan Lynch <nathan_lynch@mentor.com>
Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk>
2015-03-25 19:15:08 +01:00
/* Unlike the sigpage, failure to install the vdso is unlikely
* to be fatal to the process , so no error check needed
* here .
*/
arm_install_vdso ( mm , addr + PAGE_SIZE ) ;
2013-07-24 00:29:18 +01:00
up_fail :
2020-06-08 21:33:25 -07:00
mmap_write_unlock ( mm ) ;
2013-07-24 00:29:18 +01:00
return ret ;
2010-08-26 23:10:50 -04:00
}
2011-01-11 14:04:36 +01:00
# endif