2005-04-17 02:20:36 +04:00
/**
* @ file nmi_int . c
*
* @ remark Copyright 2002 OProfile authors
* @ remark Read the file COPYING
*
* @ author John Levon < levon @ movementarian . org >
*/
# include <linux/init.h>
# include <linux/notifier.h>
# include <linux/smp.h>
# include <linux/oprofile.h>
# include <linux/sysdev.h>
# include <linux/slab.h>
2006-07-10 19:06:21 +04:00
# include <linux/moduleparam.h>
2007-05-08 11:27:03 +04:00
# include <linux/kdebug.h>
2005-04-17 02:20:36 +04:00
# include <asm/nmi.h>
# include <asm/msr.h>
# include <asm/apic.h>
# include "op_counter.h"
# include "op_x86_model.h"
2006-09-26 12:52:27 +04:00
2005-04-17 02:20:36 +04:00
static struct op_x86_model_spec const * model ;
static struct op_msrs cpu_msrs [ NR_CPUS ] ;
static unsigned long saved_lvtpc [ NR_CPUS ] ;
2006-09-26 12:52:27 +04:00
2005-04-17 02:20:36 +04:00
static int nmi_start ( void ) ;
static void nmi_stop ( void ) ;
/* 0 == registered but off, 1 == registered and on */
static int nmi_enabled = 0 ;
# ifdef CONFIG_PM
2005-04-17 02:25:24 +04:00
static int nmi_suspend ( struct sys_device * dev , pm_message_t state )
2005-04-17 02:20:36 +04:00
{
if ( nmi_enabled = = 1 )
nmi_stop ( ) ;
return 0 ;
}
static int nmi_resume ( struct sys_device * dev )
{
if ( nmi_enabled = = 1 )
nmi_start ( ) ;
return 0 ;
}
static struct sysdev_class oprofile_sysclass = {
set_kset_name ( " oprofile " ) ,
. resume = nmi_resume ,
. suspend = nmi_suspend ,
} ;
static struct sys_device device_oprofile = {
. id = 0 ,
. cls = & oprofile_sysclass ,
} ;
2007-02-17 21:13:42 +03:00
static int __init init_sysfs ( void )
2005-04-17 02:20:36 +04:00
{
int error ;
if ( ! ( error = sysdev_class_register ( & oprofile_sysclass ) ) )
error = sysdev_register ( & device_oprofile ) ;
return error ;
}
2007-02-17 21:13:42 +03:00
static void exit_sysfs ( void )
2005-04-17 02:20:36 +04:00
{
sysdev_unregister ( & device_oprofile ) ;
sysdev_class_unregister ( & oprofile_sysclass ) ;
}
# else
2007-02-17 21:13:42 +03:00
# define init_sysfs() do { } while (0)
# define exit_sysfs() do { } while (0)
2005-04-17 02:20:36 +04:00
# endif /* CONFIG_PM */
2006-09-26 12:52:27 +04:00
static int profile_exceptions_notify ( struct notifier_block * self ,
unsigned long val , void * data )
2005-04-17 02:20:36 +04:00
{
2006-09-26 12:52:27 +04:00
struct die_args * args = ( struct die_args * ) data ;
int ret = NOTIFY_DONE ;
int cpu = smp_processor_id ( ) ;
switch ( val ) {
case DIE_NMI :
if ( model - > check_ctrs ( args - > regs , & cpu_msrs [ cpu ] ) )
ret = NOTIFY_STOP ;
break ;
default :
break ;
}
return ret ;
2005-04-17 02:20:36 +04:00
}
2006-09-26 12:52:27 +04:00
2005-04-17 02:20:36 +04:00
static void nmi_cpu_save_registers ( struct op_msrs * msrs )
{
unsigned int const nr_ctrs = model - > num_counters ;
unsigned int const nr_ctrls = model - > num_controls ;
struct op_msr * counters = msrs - > counters ;
struct op_msr * controls = msrs - > controls ;
unsigned int i ;
for ( i = 0 ; i < nr_ctrs ; + + i ) {
2006-09-26 12:52:26 +04:00
if ( counters [ i ] . addr ) {
rdmsr ( counters [ i ] . addr ,
counters [ i ] . saved . low ,
counters [ i ] . saved . high ) ;
}
2005-04-17 02:20:36 +04:00
}
for ( i = 0 ; i < nr_ctrls ; + + i ) {
2006-09-26 12:52:26 +04:00
if ( controls [ i ] . addr ) {
rdmsr ( controls [ i ] . addr ,
controls [ i ] . saved . low ,
controls [ i ] . saved . high ) ;
}
2005-04-17 02:20:36 +04:00
}
}
static void nmi_save_registers ( void * dummy )
{
int cpu = smp_processor_id ( ) ;
struct op_msrs * msrs = & cpu_msrs [ cpu ] ;
model - > fill_in_addresses ( msrs ) ;
nmi_cpu_save_registers ( msrs ) ;
}
static void free_msrs ( void )
{
int i ;
2006-03-28 13:56:39 +04:00
for_each_possible_cpu ( i ) {
2005-04-17 02:20:36 +04:00
kfree ( cpu_msrs [ i ] . counters ) ;
cpu_msrs [ i ] . counters = NULL ;
kfree ( cpu_msrs [ i ] . controls ) ;
cpu_msrs [ i ] . controls = NULL ;
}
}
static int allocate_msrs ( void )
{
int success = 1 ;
size_t controls_size = sizeof ( struct op_msr ) * model - > num_controls ;
size_t counters_size = sizeof ( struct op_msr ) * model - > num_counters ;
int i ;
2006-03-23 14:01:05 +03:00
for_each_online_cpu ( i ) {
2005-04-17 02:20:36 +04:00
cpu_msrs [ i ] . counters = kmalloc ( counters_size , GFP_KERNEL ) ;
if ( ! cpu_msrs [ i ] . counters ) {
success = 0 ;
break ;
}
cpu_msrs [ i ] . controls = kmalloc ( controls_size , GFP_KERNEL ) ;
if ( ! cpu_msrs [ i ] . controls ) {
success = 0 ;
break ;
}
}
if ( ! success )
free_msrs ( ) ;
return success ;
}
static void nmi_cpu_setup ( void * dummy )
{
int cpu = smp_processor_id ( ) ;
struct op_msrs * msrs = & cpu_msrs [ cpu ] ;
spin_lock ( & oprofilefs_lock ) ;
model - > setup_ctrs ( msrs ) ;
spin_unlock ( & oprofilefs_lock ) ;
saved_lvtpc [ cpu ] = apic_read ( APIC_LVTPC ) ;
apic_write ( APIC_LVTPC , APIC_DM_NMI ) ;
}
2006-09-26 12:52:27 +04:00
static struct notifier_block profile_exceptions_nb = {
. notifier_call = profile_exceptions_notify ,
. next = NULL ,
. priority = 0
} ;
2005-04-17 02:20:36 +04:00
static int nmi_setup ( void )
{
2006-09-26 12:52:27 +04:00
int err = 0 ;
2005-04-17 02:20:36 +04:00
if ( ! allocate_msrs ( ) )
return - ENOMEM ;
2006-09-26 12:52:27 +04:00
if ( ( err = register_die_notifier ( & profile_exceptions_nb ) ) ) {
2005-04-17 02:20:36 +04:00
free_msrs ( ) ;
2006-09-26 12:52:27 +04:00
return err ;
2005-04-17 02:20:36 +04:00
}
2006-09-26 12:52:27 +04:00
2005-04-17 02:20:36 +04:00
/* We need to serialize save and setup for HT because the subset
* of msrs are distinct for save and setup operations
*/
on_each_cpu ( nmi_save_registers , NULL , 0 , 1 ) ;
on_each_cpu ( nmi_cpu_setup , NULL , 0 , 1 ) ;
nmi_enabled = 1 ;
return 0 ;
}
static void nmi_restore_registers ( struct op_msrs * msrs )
{
unsigned int const nr_ctrs = model - > num_counters ;
unsigned int const nr_ctrls = model - > num_controls ;
struct op_msr * counters = msrs - > counters ;
struct op_msr * controls = msrs - > controls ;
unsigned int i ;
for ( i = 0 ; i < nr_ctrls ; + + i ) {
2006-09-26 12:52:26 +04:00
if ( controls [ i ] . addr ) {
wrmsr ( controls [ i ] . addr ,
controls [ i ] . saved . low ,
controls [ i ] . saved . high ) ;
}
2005-04-17 02:20:36 +04:00
}
for ( i = 0 ; i < nr_ctrs ; + + i ) {
2006-09-26 12:52:26 +04:00
if ( counters [ i ] . addr ) {
wrmsr ( counters [ i ] . addr ,
counters [ i ] . saved . low ,
counters [ i ] . saved . high ) ;
}
2005-04-17 02:20:36 +04:00
}
}
static void nmi_cpu_shutdown ( void * dummy )
{
unsigned int v ;
int cpu = smp_processor_id ( ) ;
struct op_msrs * msrs = & cpu_msrs [ cpu ] ;
/* restoring APIC_LVTPC can trigger an apic error because the delivery
* mode and vector nr combination can be illegal . That ' s by design : on
* power on apic lvt contain a zero vector nr which are legal only for
* NMI delivery mode . So inhibit apic err before restoring lvtpc
*/
v = apic_read ( APIC_LVTERR ) ;
apic_write ( APIC_LVTERR , v | APIC_LVT_MASKED ) ;
apic_write ( APIC_LVTPC , saved_lvtpc [ cpu ] ) ;
apic_write ( APIC_LVTERR , v ) ;
nmi_restore_registers ( msrs ) ;
2006-09-26 12:52:26 +04:00
model - > shutdown ( msrs ) ;
2005-04-17 02:20:36 +04:00
}
static void nmi_shutdown ( void )
{
nmi_enabled = 0 ;
on_each_cpu ( nmi_cpu_shutdown , NULL , 0 , 1 ) ;
2006-09-26 12:52:27 +04:00
unregister_die_notifier ( & profile_exceptions_nb ) ;
2005-04-17 02:20:36 +04:00
free_msrs ( ) ;
}
static void nmi_cpu_start ( void * dummy )
{
struct op_msrs const * msrs = & cpu_msrs [ smp_processor_id ( ) ] ;
model - > start ( msrs ) ;
}
static int nmi_start ( void )
{
on_each_cpu ( nmi_cpu_start , NULL , 0 , 1 ) ;
return 0 ;
}
static void nmi_cpu_stop ( void * dummy )
{
struct op_msrs const * msrs = & cpu_msrs [ smp_processor_id ( ) ] ;
model - > stop ( msrs ) ;
}
static void nmi_stop ( void )
{
on_each_cpu ( nmi_cpu_stop , NULL , 0 , 1 ) ;
}
struct op_counter_config counter_config [ OP_MAX_COUNTER ] ;
static int nmi_create_files ( struct super_block * sb , struct dentry * root )
{
unsigned int i ;
for ( i = 0 ; i < model - > num_counters ; + + i ) {
struct dentry * dir ;
2006-06-26 11:24:34 +04:00
char buf [ 4 ] ;
2005-04-17 02:20:36 +04:00
2006-09-26 12:52:26 +04:00
/* quick little hack to _not_ expose a counter if it is not
* available for use . This should protect userspace app .
* NOTE : assumes 1 : 1 mapping here ( that counters are organized
* sequentially in their struct assignment ) .
*/
if ( unlikely ( ! avail_to_resrv_perfctr_nmi_bit ( i ) ) )
continue ;
2006-06-26 11:24:34 +04:00
snprintf ( buf , sizeof ( buf ) , " %d " , i ) ;
2005-04-17 02:20:36 +04:00
dir = oprofilefs_mkdir ( sb , root , buf ) ;
oprofilefs_create_ulong ( sb , dir , " enabled " , & counter_config [ i ] . enabled ) ;
oprofilefs_create_ulong ( sb , dir , " event " , & counter_config [ i ] . event ) ;
oprofilefs_create_ulong ( sb , dir , " count " , & counter_config [ i ] . count ) ;
oprofilefs_create_ulong ( sb , dir , " unit_mask " , & counter_config [ i ] . unit_mask ) ;
oprofilefs_create_ulong ( sb , dir , " kernel " , & counter_config [ i ] . kernel ) ;
oprofilefs_create_ulong ( sb , dir , " user " , & counter_config [ i ] . user ) ;
}
return 0 ;
}
2006-07-10 19:06:21 +04:00
static int p4force ;
module_param ( p4force , int , 0 ) ;
2005-04-17 02:20:36 +04:00
static int __init p4_init ( char * * cpu_type )
{
__u8 cpu_model = boot_cpu_data . x86_model ;
2006-07-10 19:06:21 +04:00
if ( ! p4force & & ( cpu_model > 6 | | cpu_model = = 5 ) )
2005-04-17 02:20:36 +04:00
return 0 ;
# ifndef CONFIG_SMP
* cpu_type = " i386/p4 " ;
model = & op_p4_spec ;
return 1 ;
# else
switch ( smp_num_siblings ) {
case 1 :
* cpu_type = " i386/p4 " ;
model = & op_p4_spec ;
return 1 ;
case 2 :
* cpu_type = " i386/p4-ht " ;
model = & op_p4_ht2_spec ;
return 1 ;
}
# endif
printk ( KERN_INFO " oprofile: P4 HyperThreading detected with > 2 threads \n " ) ;
printk ( KERN_INFO " oprofile: Reverting to timer mode. \n " ) ;
return 0 ;
}
static int __init ppro_init ( char * * cpu_type )
{
__u8 cpu_model = boot_cpu_data . x86_model ;
2006-05-15 20:44:24 +04:00
if ( cpu_model = = 14 )
* cpu_type = " i386/core " ;
2006-09-17 03:35:46 +04:00
else if ( cpu_model = = 15 )
* cpu_type = " i386/core_2 " ;
2006-05-15 20:44:24 +04:00
else if ( cpu_model > 0xd )
2005-04-17 02:20:36 +04:00
return 0 ;
2006-05-15 20:44:24 +04:00
else if ( cpu_model = = 9 ) {
2005-04-17 02:20:36 +04:00
* cpu_type = " i386/p6_mobile " ;
} else if ( cpu_model > 5 ) {
* cpu_type = " i386/piii " ;
} else if ( cpu_model > 2 ) {
* cpu_type = " i386/pii " ;
} else {
* cpu_type = " i386/ppro " ;
}
model = & op_ppro_spec ;
return 1 ;
}
2007-02-17 21:13:42 +03:00
/* in order to get sysfs right */
2005-04-17 02:20:36 +04:00
static int using_nmi ;
2005-09-07 02:17:26 +04:00
int __init op_nmi_init ( struct oprofile_operations * ops )
2005-04-17 02:20:36 +04:00
{
__u8 vendor = boot_cpu_data . x86_vendor ;
__u8 family = boot_cpu_data . x86 ;
char * cpu_type ;
if ( ! cpu_has_apic )
return - ENODEV ;
switch ( vendor ) {
case X86_VENDOR_AMD :
/* Needs to be at least an Athlon (or hammer in 32bit mode) */
switch ( family ) {
default :
return - ENODEV ;
case 6 :
model = & op_athlon_spec ;
cpu_type = " i386/athlon " ;
break ;
case 0xf :
model = & op_athlon_spec ;
/* Actually it could be i386/hammer too, but give
user space an consistent name . */
cpu_type = " x86-64/hammer " ;
break ;
2007-05-02 21:27:06 +04:00
case 0x10 :
model = & op_athlon_spec ;
cpu_type = " x86-64/family10 " ;
break ;
2005-04-17 02:20:36 +04:00
}
break ;
case X86_VENDOR_INTEL :
switch ( family ) {
/* Pentium IV */
case 0xf :
if ( ! p4_init ( & cpu_type ) )
return - ENODEV ;
break ;
/* A P6-class processor */
case 6 :
if ( ! ppro_init ( & cpu_type ) )
return - ENODEV ;
break ;
default :
return - ENODEV ;
}
break ;
default :
return - ENODEV ;
}
2007-02-17 21:13:42 +03:00
init_sysfs ( ) ;
2005-04-17 02:20:36 +04:00
using_nmi = 1 ;
ops - > create_files = nmi_create_files ;
ops - > setup = nmi_setup ;
ops - > shutdown = nmi_shutdown ;
ops - > start = nmi_start ;
ops - > stop = nmi_stop ;
ops - > cpu_type = cpu_type ;
printk ( KERN_INFO " oprofile: using NMI interrupt. \n " ) ;
return 0 ;
}
2005-09-07 02:17:26 +04:00
void op_nmi_exit ( void )
2005-04-17 02:20:36 +04:00
{
if ( using_nmi )
2007-02-17 21:13:42 +03:00
exit_sysfs ( ) ;
2005-04-17 02:20:36 +04:00
}