2008-09-30 13:12:15 +02:00
/*
* Copyright ( C ) 1991 , 1992 Linus Torvalds
* Copyright ( C ) 2000 , 2001 , 2002 Andi Kleen , SuSE Labs
*/
# include <linux/kallsyms.h>
# include <linux/kprobes.h>
# include <linux/uaccess.h>
# include <linux/hardirq.h>
# include <linux/kdebug.h>
# include <linux/module.h>
# include <linux/ptrace.h>
# include <linux/kexec.h>
2009-11-26 08:17:31 +01:00
# include <linux/sysfs.h>
2008-09-30 13:12:15 +02:00
# include <linux/bug.h>
# include <linux/nmi.h>
# include <asm/stacktrace.h>
2009-11-26 08:17:31 +01:00
# define N_EXCEPTION_STACKS_END \
( N_EXCEPTION_STACKS + DEBUG_STKSZ / EXCEPTION_STKSZ - 2 )
2009-07-01 21:02:09 +02:00
static char x86_stack_ids [ ] [ 8 ] = {
2009-11-26 08:17:31 +01:00
[ DEBUG_STACK - 1 ] = " #DB " ,
[ NMI_STACK - 1 ] = " NMI " ,
[ DOUBLEFAULT_STACK - 1 ] = " #DF " ,
[ STACKFAULT_STACK - 1 ] = " #SS " ,
[ MCE_STACK - 1 ] = " #MC " ,
2008-09-30 13:12:15 +02:00
# if DEBUG_STKSZ > EXCEPTION_STKSZ
2009-11-26 08:17:31 +01:00
[ N_EXCEPTION_STACKS . . .
N_EXCEPTION_STACKS_END ] = " #DB[?] "
2008-09-30 13:12:15 +02:00
# endif
2009-11-26 08:17:31 +01:00
} ;
2009-07-01 21:02:09 +02:00
static unsigned long * in_exception_stack ( unsigned cpu , unsigned long stack ,
2009-11-26 08:17:31 +01:00
unsigned * usedp , char * * idp )
2009-07-01 21:02:09 +02:00
{
2008-09-30 13:12:15 +02:00
unsigned k ;
/*
* Iterate over all exception stacks , and figure out whether
* ' stack ' is in one of them :
*/
for ( k = 0 ; k < N_EXCEPTION_STACKS ; k + + ) {
unsigned long end = per_cpu ( orig_ist , cpu ) . ist [ k ] ;
/*
* Is ' stack ' above this exception frame ' s end ?
* If yes then skip to the next frame .
*/
if ( stack > = end )
continue ;
/*
* Is ' stack ' above this exception frame ' s start address ?
* If yes then we found the right frame .
*/
if ( stack > = end - EXCEPTION_STKSZ ) {
/*
* Make sure we only iterate through an exception
* stack once . If it comes up for the second time
* then there ' s something wrong going on - just
* break out and return NULL :
*/
if ( * usedp & ( 1U < < k ) )
break ;
* usedp | = 1U < < k ;
2009-07-01 21:02:09 +02:00
* idp = x86_stack_ids [ k ] ;
2008-09-30 13:12:15 +02:00
return ( unsigned long * ) end ;
}
/*
* If this is a debug stack , and if it has a larger size than
* the usual exception stacks , then ' stack ' might still
* be within the lower portion of the debug stack :
*/
# if DEBUG_STKSZ > EXCEPTION_STKSZ
if ( k = = DEBUG_STACK - 1 & & stack > = end - DEBUG_STKSZ ) {
unsigned j = N_EXCEPTION_STACKS - 1 ;
/*
* Black magic . A large debug stack is composed of
* multiple exception stack entries , which we
* iterate through now . Dont look :
*/
do {
+ + j ;
end - = EXCEPTION_STKSZ ;
2009-07-01 21:02:09 +02:00
x86_stack_ids [ j ] [ 4 ] = ' 1 ' +
( j - N_EXCEPTION_STACKS ) ;
2008-09-30 13:12:15 +02:00
} while ( stack < end - EXCEPTION_STKSZ ) ;
if ( * usedp & ( 1U < < j ) )
break ;
* usedp | = 1U < < j ;
2009-07-01 21:02:09 +02:00
* idp = x86_stack_ids [ j ] ;
2008-09-30 13:12:15 +02:00
return ( unsigned long * ) end ;
}
# endif
}
return NULL ;
}
2009-12-06 05:34:27 +01:00
static inline int
in_irq_stack ( unsigned long * stack , unsigned long * irq_stack ,
unsigned long * irq_stack_end )
{
return ( stack > = irq_stack & & stack < irq_stack_end ) ;
}
2008-09-30 13:12:15 +02:00
/*
* x86 - 64 can have up to three kernel stacks :
* process stack
* interrupt stack
* severe exception ( double fault , nmi , stack fault , debug , mce ) hardware stack
*/
2011-03-18 11:40:06 +09:00
void dump_trace ( struct task_struct * task , struct pt_regs * regs ,
unsigned long * stack , unsigned long bp ,
2008-09-30 13:12:15 +02:00
const struct stacktrace_ops * ops , void * data )
{
const unsigned cpu = get_cpu ( ) ;
2009-01-19 00:38:58 +09:00
unsigned long * irq_stack_end =
( unsigned long * ) per_cpu ( irq_stack_ptr , cpu ) ;
2008-09-30 13:12:15 +02:00
unsigned used = 0 ;
struct thread_info * tinfo ;
2008-12-02 23:50:04 -05:00
int graph = 0 ;
2011-01-24 22:41:11 +01:00
unsigned long dummy ;
2008-09-30 13:12:15 +02:00
if ( ! task )
task = current ;
if ( ! stack ) {
2011-06-30 19:04:56 +02:00
if ( regs )
stack = ( unsigned long * ) regs - > sp ;
2012-01-28 13:52:46 +03:00
else if ( task ! = current )
2008-09-30 13:12:15 +02:00
stack = ( unsigned long * ) task - > thread . sp ;
2011-06-30 19:04:56 +02:00
else
stack = & dummy ;
2008-09-30 13:12:15 +02:00
}
2011-03-18 11:40:06 +09:00
if ( ! bp )
bp = stack_frame ( task , regs ) ;
2008-09-30 13:12:15 +02:00
/*
* Print function call entries in all stacks , starting at the
* current stack address . If the stacks consist of nested
* exceptions
*/
tinfo = task_thread_info ( task ) ;
for ( ; ; ) {
char * id ;
unsigned long * estack_end ;
estack_end = in_exception_stack ( cpu , ( unsigned long ) stack ,
& used , & id ) ;
if ( estack_end ) {
if ( ops - > stack ( data , id ) < 0 )
break ;
2009-12-17 05:40:33 +01:00
bp = ops - > walk_stack ( tinfo , stack , bp , ops ,
data , estack_end , & graph ) ;
2008-09-30 13:12:15 +02:00
ops - > stack ( data , " <EOE> " ) ;
/*
* We link to the next stack via the
* second - to - last pointer ( index - 2 to end ) in the
* exception stack :
*/
stack = ( unsigned long * ) estack_end [ - 2 ] ;
continue ;
}
2009-01-19 00:38:58 +09:00
if ( irq_stack_end ) {
unsigned long * irq_stack ;
irq_stack = irq_stack_end -
( IRQ_STACK_SIZE - 64 ) / sizeof ( * irq_stack ) ;
2008-09-30 13:12:15 +02:00
2009-12-06 05:34:27 +01:00
if ( in_irq_stack ( stack , irq_stack , irq_stack_end ) ) {
2008-09-30 13:12:15 +02:00
if ( ops - > stack ( data , " IRQ " ) < 0 )
break ;
2010-03-03 07:38:37 +01:00
bp = ops - > walk_stack ( tinfo , stack , bp ,
2009-01-19 00:38:58 +09:00
ops , data , irq_stack_end , & graph ) ;
2008-09-30 13:12:15 +02:00
/*
* We link to the next stack ( which would be
* the process stack normally ) the last
* pointer ( index - 1 to end ) in the IRQ stack :
*/
2009-01-19 00:38:58 +09:00
stack = ( unsigned long * ) ( irq_stack_end [ - 1 ] ) ;
irq_stack_end = NULL ;
2008-09-30 13:12:15 +02:00
ops - > stack ( data , " EOI " ) ;
continue ;
}
}
break ;
}
/*
* This handles the process stack :
*/
2010-03-03 07:38:37 +01:00
bp = ops - > walk_stack ( tinfo , stack , bp , ops , data , NULL , & graph ) ;
2008-09-30 13:12:15 +02:00
put_cpu ( ) ;
}
EXPORT_SYMBOL ( dump_trace ) ;
2008-10-23 10:40:06 -04:00
void
2008-09-30 13:12:15 +02:00
show_stack_log_lvl ( struct task_struct * task , struct pt_regs * regs ,
2011-03-18 11:40:06 +09:00
unsigned long * sp , unsigned long bp , char * log_lvl )
2008-09-30 13:12:15 +02:00
{
2009-11-26 08:29:10 +01:00
unsigned long * irq_stack_end ;
unsigned long * irq_stack ;
2008-09-30 13:12:15 +02:00
unsigned long * stack ;
2009-11-26 08:29:10 +01:00
int cpu ;
2008-09-30 13:12:15 +02:00
int i ;
2009-11-26 08:29:10 +01:00
preempt_disable ( ) ;
cpu = smp_processor_id ( ) ;
irq_stack_end = ( unsigned long * ) ( per_cpu ( irq_stack_ptr , cpu ) ) ;
irq_stack = ( unsigned long * ) ( per_cpu ( irq_stack_ptr , cpu ) - IRQ_STACK_SIZE ) ;
2008-09-30 13:12:15 +02:00
/*
2009-11-26 08:29:10 +01:00
* Debugging aid : " show_stack(NULL, NULL); " prints the
* back trace for this cpu :
2008-09-30 13:12:15 +02:00
*/
if ( sp = = NULL ) {
if ( task )
sp = ( unsigned long * ) task - > thread . sp ;
else
sp = ( unsigned long * ) & sp ;
}
stack = sp ;
for ( i = 0 ; i < kstack_depth_to_print ; i + + ) {
2009-01-19 00:38:58 +09:00
if ( stack > = irq_stack & & stack < = irq_stack_end ) {
if ( stack = = irq_stack_end ) {
stack = ( unsigned long * ) ( irq_stack_end [ - 1 ] ) ;
2012-05-21 19:50:07 -07:00
pr_cont ( " <EOI> " ) ;
2008-09-30 13:12:15 +02:00
}
} else {
if ( ( ( long ) stack & ( THREAD_SIZE - 1 ) ) = = 0 )
break ;
}
2008-10-04 23:12:46 +02:00
if ( i & & ( ( i % STACKSLOTS_PER_LINE ) = = 0 ) )
2012-05-21 19:50:07 -07:00
pr_cont ( " \n " ) ;
pr_cont ( " %016lx " , * stack + + ) ;
2008-09-30 13:12:15 +02:00
touch_nmi_watchdog ( ) ;
}
2009-11-26 08:29:10 +01:00
preempt_enable ( ) ;
2012-05-21 19:50:07 -07:00
pr_cont ( " \n " ) ;
2011-03-18 11:40:06 +09:00
show_trace_log_lvl ( task , regs , sp , bp , log_lvl ) ;
2008-09-30 13:12:15 +02:00
}
2012-05-09 08:47:37 +01:00
void show_regs ( struct pt_regs * regs )
2008-09-30 13:12:15 +02:00
{
int i ;
unsigned long sp ;
const int cpu = smp_processor_id ( ) ;
2009-01-19 00:38:58 +09:00
struct task_struct * cur = current ;
2008-09-30 13:12:15 +02:00
sp = regs - > sp ;
printk ( " CPU %d " , cpu ) ;
__show_regs ( regs , 1 ) ;
2012-05-21 19:50:07 -07:00
printk ( KERN_DEFAULT " Process %s (pid: %d, threadinfo %p, task %p) \n " ,
cur - > comm , cur - > pid , task_thread_info ( cur ) , cur ) ;
2008-09-30 13:12:15 +02:00
/*
* When in - kernel , we also print out the stack and code at the
* time of the fault . .
*/
if ( ! user_mode ( regs ) ) {
unsigned int code_prologue = code_bytes * 43 / 64 ;
unsigned int code_len = code_bytes ;
unsigned char c ;
u8 * ip ;
bugs, x86: Fix printk levels for panic, softlockups and stack dumps
rsyslog will display KERN_EMERG messages on a connected
terminal. However, these messages are useless/undecipherable
for a general user.
For example, after a softlockup we get:
Message from syslogd@intel-s3e37-04 at Jan 25 14:18:06 ...
kernel:Stack:
Message from syslogd@intel-s3e37-04 at Jan 25 14:18:06 ...
kernel:Call Trace:
Message from syslogd@intel-s3e37-04 at Jan 25 14:18:06 ...
kernel:Code: ff ff a8 08 75 25 31 d2 48 8d 86 38 e0 ff ff 48 89
d1 0f 01 c8 0f ae f0 48 8b 86 38 e0 ff ff a8 08 75 08 b1 01 4c 89 e0 0f 01 c9 <e8> ea 69 dd ff 4c 29 e8 48 89 c7 e8 0f bc da ff 49 89 c4 49 89
This happens because the printk levels for these messages are
incorrect. Only an informational message should be displayed on
a terminal.
I modified the printk levels for various messages in the kernel
and tested the output by using the drivers/misc/lkdtm.c kernel
modules (ie, softlockups, panics, hard lockups, etc.) and
confirmed that the console output was still the same and that
the output to the terminals was correct.
For example, in the case of a softlockup we now see the much
more informative:
Message from syslogd@intel-s3e37-04 at Jan 25 10:18:06 ...
BUG: soft lockup - CPU4 stuck for 60s!
instead of the above confusing messages.
AFAICT, the messages no longer have to be KERN_EMERG. In the
most important case of a panic we set console_verbose(). As for
the other less severe cases the correct data is output to the
console and /var/log/messages.
Successfully tested by me using the drivers/misc/lkdtm.c module.
Signed-off-by: Prarit Bhargava <prarit@redhat.com>
Cc: dzickus@redhat.com
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Andrew Morton <akpm@linux-foundation.org>
Link: http://lkml.kernel.org/r/1327586134-11926-1-git-send-email-prarit@redhat.com
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2012-01-26 08:55:34 -05:00
printk ( KERN_DEFAULT " Stack: \n " ) ;
2008-09-30 13:12:15 +02:00
show_stack_log_lvl ( NULL , regs , ( unsigned long * ) sp ,
bugs, x86: Fix printk levels for panic, softlockups and stack dumps
rsyslog will display KERN_EMERG messages on a connected
terminal. However, these messages are useless/undecipherable
for a general user.
For example, after a softlockup we get:
Message from syslogd@intel-s3e37-04 at Jan 25 14:18:06 ...
kernel:Stack:
Message from syslogd@intel-s3e37-04 at Jan 25 14:18:06 ...
kernel:Call Trace:
Message from syslogd@intel-s3e37-04 at Jan 25 14:18:06 ...
kernel:Code: ff ff a8 08 75 25 31 d2 48 8d 86 38 e0 ff ff 48 89
d1 0f 01 c8 0f ae f0 48 8b 86 38 e0 ff ff a8 08 75 08 b1 01 4c 89 e0 0f 01 c9 <e8> ea 69 dd ff 4c 29 e8 48 89 c7 e8 0f bc da ff 49 89 c4 49 89
This happens because the printk levels for these messages are
incorrect. Only an informational message should be displayed on
a terminal.
I modified the printk levels for various messages in the kernel
and tested the output by using the drivers/misc/lkdtm.c kernel
modules (ie, softlockups, panics, hard lockups, etc.) and
confirmed that the console output was still the same and that
the output to the terminals was correct.
For example, in the case of a softlockup we now see the much
more informative:
Message from syslogd@intel-s3e37-04 at Jan 25 10:18:06 ...
BUG: soft lockup - CPU4 stuck for 60s!
instead of the above confusing messages.
AFAICT, the messages no longer have to be KERN_EMERG. In the
most important case of a panic we set console_verbose(). As for
the other less severe cases the correct data is output to the
console and /var/log/messages.
Successfully tested by me using the drivers/misc/lkdtm.c module.
Signed-off-by: Prarit Bhargava <prarit@redhat.com>
Cc: dzickus@redhat.com
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Andrew Morton <akpm@linux-foundation.org>
Link: http://lkml.kernel.org/r/1327586134-11926-1-git-send-email-prarit@redhat.com
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2012-01-26 08:55:34 -05:00
0 , KERN_DEFAULT ) ;
2008-09-30 13:12:15 +02:00
bugs, x86: Fix printk levels for panic, softlockups and stack dumps
rsyslog will display KERN_EMERG messages on a connected
terminal. However, these messages are useless/undecipherable
for a general user.
For example, after a softlockup we get:
Message from syslogd@intel-s3e37-04 at Jan 25 14:18:06 ...
kernel:Stack:
Message from syslogd@intel-s3e37-04 at Jan 25 14:18:06 ...
kernel:Call Trace:
Message from syslogd@intel-s3e37-04 at Jan 25 14:18:06 ...
kernel:Code: ff ff a8 08 75 25 31 d2 48 8d 86 38 e0 ff ff 48 89
d1 0f 01 c8 0f ae f0 48 8b 86 38 e0 ff ff a8 08 75 08 b1 01 4c 89 e0 0f 01 c9 <e8> ea 69 dd ff 4c 29 e8 48 89 c7 e8 0f bc da ff 49 89 c4 49 89
This happens because the printk levels for these messages are
incorrect. Only an informational message should be displayed on
a terminal.
I modified the printk levels for various messages in the kernel
and tested the output by using the drivers/misc/lkdtm.c kernel
modules (ie, softlockups, panics, hard lockups, etc.) and
confirmed that the console output was still the same and that
the output to the terminals was correct.
For example, in the case of a softlockup we now see the much
more informative:
Message from syslogd@intel-s3e37-04 at Jan 25 10:18:06 ...
BUG: soft lockup - CPU4 stuck for 60s!
instead of the above confusing messages.
AFAICT, the messages no longer have to be KERN_EMERG. In the
most important case of a panic we set console_verbose(). As for
the other less severe cases the correct data is output to the
console and /var/log/messages.
Successfully tested by me using the drivers/misc/lkdtm.c module.
Signed-off-by: Prarit Bhargava <prarit@redhat.com>
Cc: dzickus@redhat.com
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Andrew Morton <akpm@linux-foundation.org>
Link: http://lkml.kernel.org/r/1327586134-11926-1-git-send-email-prarit@redhat.com
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2012-01-26 08:55:34 -05:00
printk ( KERN_DEFAULT " Code: " ) ;
2008-09-30 13:12:15 +02:00
ip = ( u8 * ) regs - > ip - code_prologue ;
if ( ip < ( u8 * ) PAGE_OFFSET | | probe_kernel_address ( ip , c ) ) {
2008-10-04 23:12:46 +02:00
/* try starting at IP */
2008-09-30 13:12:15 +02:00
ip = ( u8 * ) regs - > ip ;
code_len = code_len - code_prologue + 1 ;
}
for ( i = 0 ; i < code_len ; i + + , ip + + ) {
if ( ip < ( u8 * ) PAGE_OFFSET | |
probe_kernel_address ( ip , c ) ) {
2012-05-21 19:50:07 -07:00
pr_cont ( " Bad RIP value. " ) ;
2008-09-30 13:12:15 +02:00
break ;
}
if ( ip = = ( u8 * ) regs - > ip )
2012-05-21 19:50:07 -07:00
pr_cont ( " <%02x> " , c ) ;
2008-09-30 13:12:15 +02:00
else
2012-05-21 19:50:07 -07:00
pr_cont ( " %02x " , c ) ;
2008-09-30 13:12:15 +02:00
}
}
2012-05-21 19:50:07 -07:00
pr_cont ( " \n " ) ;
2008-09-30 13:12:15 +02:00
}
int is_valid_bugaddr ( unsigned long ip )
{
unsigned short ud2 ;
if ( __copy_from_user ( & ud2 , ( const void __user * ) ip , sizeof ( ud2 ) ) )
return 0 ;
return ud2 = = 0x0b0f ;
}