2010-03-11 19:54:39 +03:00
/*
2011-03-17 16:24:16 -03:00
* Netburst Performance Events ( P4 , old Xeon )
2010-03-11 19:54:39 +03:00
*
* Copyright ( C ) 2010 Parallels , Inc . , Cyrill Gorcunov < gorcunov @ openvz . org >
* Copyright ( C ) 2010 Intel Corporation , Lin Ming < ming . m . lin @ intel . com >
*
* For licencing details see kernel - base / COPYING
*/
# ifdef CONFIG_CPU_SUP_INTEL
# include <asm/perf_event_p4.h>
2010-03-24 12:09:26 +08:00
# define P4_CNTR_LIMIT 3
2010-03-11 19:54:39 +03:00
/*
* array indices : 0 , 1 - HT threads , used with HT enabled cpu
*/
2010-03-24 12:09:26 +08:00
struct p4_event_bind {
unsigned int opcode ; /* Event code and ESCR selector */
unsigned int escr_msr [ 2 ] ; /* ESCR MSR for this event */
2010-08-25 22:23:34 +04:00
unsigned int escr_emask ; /* valid ESCR EventMask bits */
unsigned int shared ; /* event is shared across threads */
2010-05-14 23:08:15 +04:00
char cntr [ 2 ] [ P4_CNTR_LIMIT ] ; /* counter index (offset), -1 on abscence */
2010-03-11 19:54:39 +03:00
} ;
2010-07-05 10:09:29 +08:00
struct p4_pebs_bind {
2010-03-24 12:09:26 +08:00
unsigned int metric_pebs ;
unsigned int metric_vert ;
2010-03-11 19:54:39 +03:00
} ;
2010-07-05 10:09:29 +08:00
/* it sets P4_PEBS_ENABLE_UOP_TAG as well */
# define P4_GEN_PEBS_BIND(name, pebs, vert) \
[ P4_PEBS_METRIC__ # # name ] = { \
. metric_pebs = pebs | P4_PEBS_ENABLE_UOP_TAG , \
. metric_vert = vert , \
2010-03-24 12:09:26 +08:00
}
2010-07-05 10:09:29 +08:00
/*
* note we have P4_PEBS_ENABLE_UOP_TAG always set here
*
* it ' s needed for mapping P4_PEBS_CONFIG_METRIC_MASK bits of
* event configuration to find out which values are to be
* written into MSR_IA32_PEBS_ENABLE and MSR_P4_PEBS_MATRIX_VERT
* resgisters
*/
static struct p4_pebs_bind p4_pebs_bind_map [ ] = {
P4_GEN_PEBS_BIND ( 1 stl_cache_load_miss_retired , 0x0000001 , 0x0000001 ) ,
P4_GEN_PEBS_BIND ( 2 ndl_cache_load_miss_retired , 0x0000002 , 0x0000001 ) ,
P4_GEN_PEBS_BIND ( dtlb_load_miss_retired , 0x0000004 , 0x0000001 ) ,
P4_GEN_PEBS_BIND ( dtlb_store_miss_retired , 0x0000004 , 0x0000002 ) ,
P4_GEN_PEBS_BIND ( dtlb_all_miss_retired , 0x0000004 , 0x0000003 ) ,
P4_GEN_PEBS_BIND ( tagged_mispred_branch , 0x0018000 , 0x0000010 ) ,
P4_GEN_PEBS_BIND ( mob_load_replay_retired , 0x0000200 , 0x0000001 ) ,
P4_GEN_PEBS_BIND ( split_load_retired , 0x0000400 , 0x0000001 ) ,
P4_GEN_PEBS_BIND ( split_store_retired , 0x0000400 , 0x0000002 ) ,
2010-03-24 12:09:26 +08:00
} ;
/*
* Note that we don ' t use CCCR1 here , there is an
* exception for P4_BSQ_ALLOCATION but we just have
* no workaround
*
* consider this binding as resources which particular
* event may borrow , it doesn ' t contain EventMask ,
* Tags and friends - - they are left to a caller
*/
static struct p4_event_bind p4_event_bind_map [ ] = {
[ P4_EVENT_TC_DELIVER_MODE ] = {
. opcode = P4_OPCODE ( P4_EVENT_TC_DELIVER_MODE ) ,
. escr_msr = { MSR_P4_TC_ESCR0 , MSR_P4_TC_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_TC_DELIVER_MODE , DD ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_TC_DELIVER_MODE , DB ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_TC_DELIVER_MODE , DI ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_TC_DELIVER_MODE , BD ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_TC_DELIVER_MODE , BB ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_TC_DELIVER_MODE , BI ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_TC_DELIVER_MODE , ID ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 4 , 5 , - 1 } , { 6 , 7 , - 1 } } ,
} ,
[ P4_EVENT_BPU_FETCH_REQUEST ] = {
. opcode = P4_OPCODE ( P4_EVENT_BPU_FETCH_REQUEST ) ,
. escr_msr = { MSR_P4_BPU_ESCR0 , MSR_P4_BPU_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_BPU_FETCH_REQUEST , TCMISS ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_ITLB_REFERENCE ] = {
. opcode = P4_OPCODE ( P4_EVENT_ITLB_REFERENCE ) ,
. escr_msr = { MSR_P4_ITLB_ESCR0 , MSR_P4_ITLB_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_ITLB_REFERENCE , HIT ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_ITLB_REFERENCE , MISS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_ITLB_REFERENCE , HIT_UK ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_MEMORY_CANCEL ] = {
. opcode = P4_OPCODE ( P4_EVENT_MEMORY_CANCEL ) ,
. escr_msr = { MSR_P4_DAC_ESCR0 , MSR_P4_DAC_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_MEMORY_CANCEL , ST_RB_FULL ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_MEMORY_CANCEL , 64 K_CONF ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_MEMORY_COMPLETE ] = {
. opcode = P4_OPCODE ( P4_EVENT_MEMORY_COMPLETE ) ,
. escr_msr = { MSR_P4_SAAT_ESCR0 , MSR_P4_SAAT_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_MEMORY_COMPLETE , LSC ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_MEMORY_COMPLETE , SSC ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_LOAD_PORT_REPLAY ] = {
. opcode = P4_OPCODE ( P4_EVENT_LOAD_PORT_REPLAY ) ,
. escr_msr = { MSR_P4_SAAT_ESCR0 , MSR_P4_SAAT_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_LOAD_PORT_REPLAY , SPLIT_LD ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_STORE_PORT_REPLAY ] = {
. opcode = P4_OPCODE ( P4_EVENT_STORE_PORT_REPLAY ) ,
. escr_msr = { MSR_P4_SAAT_ESCR0 , MSR_P4_SAAT_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_STORE_PORT_REPLAY , SPLIT_ST ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_MOB_LOAD_REPLAY ] = {
. opcode = P4_OPCODE ( P4_EVENT_MOB_LOAD_REPLAY ) ,
. escr_msr = { MSR_P4_MOB_ESCR0 , MSR_P4_MOB_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_MOB_LOAD_REPLAY , NO_STA ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_MOB_LOAD_REPLAY , NO_STD ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_MOB_LOAD_REPLAY , PARTIAL_DATA ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_MOB_LOAD_REPLAY , UNALGN_ADDR ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_PAGE_WALK_TYPE ] = {
. opcode = P4_OPCODE ( P4_EVENT_PAGE_WALK_TYPE ) ,
. escr_msr = { MSR_P4_PMH_ESCR0 , MSR_P4_PMH_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_PAGE_WALK_TYPE , DTMISS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_PAGE_WALK_TYPE , ITMISS ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_BSQ_CACHE_REFERENCE ] = {
. opcode = P4_OPCODE ( P4_EVENT_BSQ_CACHE_REFERENCE ) ,
. escr_msr = { MSR_P4_BSU_ESCR0 , MSR_P4_BSU_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_2ndL_HITS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_2ndL_HITE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_2ndL_HITM ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_3rdL_HITS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_3rdL_HITE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_3rdL_HITM ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_2ndL_MISS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_3rdL_MISS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , WR_2ndL_MISS ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_IOQ_ALLOCATION ] = {
. opcode = P4_OPCODE ( P4_EVENT_IOQ_ALLOCATION ) ,
. escr_msr = { MSR_P4_FSB_ESCR0 , MSR_P4_FSB_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , DEFAULT ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , ALL_READ ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , ALL_WRITE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , MEM_UC ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , MEM_WC ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , MEM_WT ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , MEM_WP ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , MEM_WB ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , OWN ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , OTHER ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ALLOCATION , PREFETCH ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_IOQ_ACTIVE_ENTRIES ] = { /* shared ESCR */
. opcode = P4_OPCODE ( P4_EVENT_IOQ_ACTIVE_ENTRIES ) ,
. escr_msr = { MSR_P4_FSB_ESCR1 , MSR_P4_FSB_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , DEFAULT ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , ALL_READ ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , ALL_WRITE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , MEM_UC ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , MEM_WC ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , MEM_WT ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , MEM_WP ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , MEM_WB ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , OWN ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , OTHER ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_IOQ_ACTIVE_ENTRIES , PREFETCH ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 2 , - 1 , - 1 } , { 3 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_FSB_DATA_ACTIVITY ] = {
. opcode = P4_OPCODE ( P4_EVENT_FSB_DATA_ACTIVITY ) ,
. escr_msr = { MSR_P4_FSB_ESCR0 , MSR_P4_FSB_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_FSB_DATA_ACTIVITY , DRDY_DRV ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_FSB_DATA_ACTIVITY , DRDY_OWN ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_FSB_DATA_ACTIVITY , DRDY_OTHER ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_FSB_DATA_ACTIVITY , DBSY_DRV ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_FSB_DATA_ACTIVITY , DBSY_OWN ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_FSB_DATA_ACTIVITY , DBSY_OTHER ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_BSQ_ALLOCATION ] = { /* shared ESCR, broken CCCR1 */
. opcode = P4_OPCODE ( P4_EVENT_BSQ_ALLOCATION ) ,
. escr_msr = { MSR_P4_BSU_ESCR0 , MSR_P4_BSU_ESCR0 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , REQ_TYPE0 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , REQ_TYPE1 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , REQ_LEN0 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , REQ_LEN1 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , REQ_IO_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , REQ_LOCK_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , REQ_CACHE_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , REQ_SPLIT_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , REQ_DEM_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , REQ_ORD_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , MEM_TYPE0 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , MEM_TYPE1 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ALLOCATION , MEM_TYPE2 ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 1 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_BSQ_ACTIVE_ENTRIES ] = { /* shared ESCR */
. opcode = P4_OPCODE ( P4_EVENT_BSQ_ACTIVE_ENTRIES ) ,
. escr_msr = { MSR_P4_BSU_ESCR1 , MSR_P4_BSU_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , REQ_TYPE0 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , REQ_TYPE1 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , REQ_LEN0 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , REQ_LEN1 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , REQ_IO_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , REQ_LOCK_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , REQ_CACHE_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , REQ_SPLIT_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , REQ_DEM_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , REQ_ORD_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , MEM_TYPE0 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , MEM_TYPE1 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_ACTIVE_ENTRIES , MEM_TYPE2 ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 2 , - 1 , - 1 } , { 3 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_SSE_INPUT_ASSIST ] = {
. opcode = P4_OPCODE ( P4_EVENT_SSE_INPUT_ASSIST ) ,
. escr_msr = { MSR_P4_FIRM_ESCR0 , MSR_P4_FIRM_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_SSE_INPUT_ASSIST , ALL ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_PACKED_SP_UOP ] = {
. opcode = P4_OPCODE ( P4_EVENT_PACKED_SP_UOP ) ,
. escr_msr = { MSR_P4_FIRM_ESCR0 , MSR_P4_FIRM_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_PACKED_SP_UOP , ALL ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_PACKED_DP_UOP ] = {
. opcode = P4_OPCODE ( P4_EVENT_PACKED_DP_UOP ) ,
. escr_msr = { MSR_P4_FIRM_ESCR0 , MSR_P4_FIRM_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_PACKED_DP_UOP , ALL ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_SCALAR_SP_UOP ] = {
. opcode = P4_OPCODE ( P4_EVENT_SCALAR_SP_UOP ) ,
. escr_msr = { MSR_P4_FIRM_ESCR0 , MSR_P4_FIRM_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_SCALAR_SP_UOP , ALL ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_SCALAR_DP_UOP ] = {
. opcode = P4_OPCODE ( P4_EVENT_SCALAR_DP_UOP ) ,
. escr_msr = { MSR_P4_FIRM_ESCR0 , MSR_P4_FIRM_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_SCALAR_DP_UOP , ALL ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_64BIT_MMX_UOP ] = {
. opcode = P4_OPCODE ( P4_EVENT_64BIT_MMX_UOP ) ,
. escr_msr = { MSR_P4_FIRM_ESCR0 , MSR_P4_FIRM_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_64BIT_MMX_UOP , ALL ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_128BIT_MMX_UOP ] = {
. opcode = P4_OPCODE ( P4_EVENT_128BIT_MMX_UOP ) ,
. escr_msr = { MSR_P4_FIRM_ESCR0 , MSR_P4_FIRM_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_128BIT_MMX_UOP , ALL ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_X87_FP_UOP ] = {
. opcode = P4_OPCODE ( P4_EVENT_X87_FP_UOP ) ,
. escr_msr = { MSR_P4_FIRM_ESCR0 , MSR_P4_FIRM_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_X87_FP_UOP , ALL ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_TC_MISC ] = {
. opcode = P4_OPCODE ( P4_EVENT_TC_MISC ) ,
. escr_msr = { MSR_P4_TC_ESCR0 , MSR_P4_TC_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_TC_MISC , FLUSH ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 4 , 5 , - 1 } , { 6 , 7 , - 1 } } ,
} ,
[ P4_EVENT_GLOBAL_POWER_EVENTS ] = {
. opcode = P4_OPCODE ( P4_EVENT_GLOBAL_POWER_EVENTS ) ,
. escr_msr = { MSR_P4_FSB_ESCR0 , MSR_P4_FSB_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_GLOBAL_POWER_EVENTS , RUNNING ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_TC_MS_XFER ] = {
. opcode = P4_OPCODE ( P4_EVENT_TC_MS_XFER ) ,
. escr_msr = { MSR_P4_MS_ESCR0 , MSR_P4_MS_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_TC_MS_XFER , CISC ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 4 , 5 , - 1 } , { 6 , 7 , - 1 } } ,
} ,
[ P4_EVENT_UOP_QUEUE_WRITES ] = {
. opcode = P4_OPCODE ( P4_EVENT_UOP_QUEUE_WRITES ) ,
. escr_msr = { MSR_P4_MS_ESCR0 , MSR_P4_MS_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_UOP_QUEUE_WRITES , FROM_TC_BUILD ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_UOP_QUEUE_WRITES , FROM_TC_DELIVER ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_UOP_QUEUE_WRITES , FROM_ROM ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 4 , 5 , - 1 } , { 6 , 7 , - 1 } } ,
} ,
[ P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE ] = {
. opcode = P4_OPCODE ( P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE ) ,
. escr_msr = { MSR_P4_TBPU_ESCR0 , MSR_P4_TBPU_ESCR0 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE , CONDITIONAL ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE , CALL ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE , RETURN ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE , INDIRECT ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 4 , 5 , - 1 } , { 6 , 7 , - 1 } } ,
} ,
[ P4_EVENT_RETIRED_BRANCH_TYPE ] = {
. opcode = P4_OPCODE ( P4_EVENT_RETIRED_BRANCH_TYPE ) ,
. escr_msr = { MSR_P4_TBPU_ESCR0 , MSR_P4_TBPU_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_BRANCH_TYPE , CONDITIONAL ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_BRANCH_TYPE , CALL ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_BRANCH_TYPE , RETURN ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_BRANCH_TYPE , INDIRECT ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 4 , 5 , - 1 } , { 6 , 7 , - 1 } } ,
} ,
[ P4_EVENT_RESOURCE_STALL ] = {
. opcode = P4_OPCODE ( P4_EVENT_RESOURCE_STALL ) ,
. escr_msr = { MSR_P4_ALF_ESCR0 , MSR_P4_ALF_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_RESOURCE_STALL , SBFULL ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_WC_BUFFER ] = {
. opcode = P4_OPCODE ( P4_EVENT_WC_BUFFER ) ,
. escr_msr = { MSR_P4_DAC_ESCR0 , MSR_P4_DAC_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_WC_BUFFER , WCB_EVICTS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_WC_BUFFER , WCB_FULL_EVICTS ) ,
. shared = 1 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 8 , 9 , - 1 } , { 10 , 11 , - 1 } } ,
} ,
[ P4_EVENT_B2B_CYCLES ] = {
. opcode = P4_OPCODE ( P4_EVENT_B2B_CYCLES ) ,
. escr_msr = { MSR_P4_FSB_ESCR0 , MSR_P4_FSB_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask = 0 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_BNR ] = {
. opcode = P4_OPCODE ( P4_EVENT_BNR ) ,
. escr_msr = { MSR_P4_FSB_ESCR0 , MSR_P4_FSB_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask = 0 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_SNOOP ] = {
. opcode = P4_OPCODE ( P4_EVENT_SNOOP ) ,
. escr_msr = { MSR_P4_FSB_ESCR0 , MSR_P4_FSB_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask = 0 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_RESPONSE ] = {
. opcode = P4_OPCODE ( P4_EVENT_RESPONSE ) ,
. escr_msr = { MSR_P4_FSB_ESCR0 , MSR_P4_FSB_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask = 0 ,
2010-03-24 12:09:26 +08:00
. cntr = { { 0 , - 1 , - 1 } , { 2 , - 1 , - 1 } } ,
} ,
[ P4_EVENT_FRONT_END_EVENT ] = {
. opcode = P4_OPCODE ( P4_EVENT_FRONT_END_EVENT ) ,
. escr_msr = { MSR_P4_CRU_ESCR2 , MSR_P4_CRU_ESCR3 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_FRONT_END_EVENT , NBOGUS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_FRONT_END_EVENT , BOGUS ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_EXECUTION_EVENT ] = {
. opcode = P4_OPCODE ( P4_EVENT_EXECUTION_EVENT ) ,
. escr_msr = { MSR_P4_CRU_ESCR2 , MSR_P4_CRU_ESCR3 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , NBOGUS0 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , NBOGUS1 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , NBOGUS2 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , NBOGUS3 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , BOGUS0 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , BOGUS1 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , BOGUS2 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , BOGUS3 ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_REPLAY_EVENT ] = {
. opcode = P4_OPCODE ( P4_EVENT_REPLAY_EVENT ) ,
. escr_msr = { MSR_P4_CRU_ESCR2 , MSR_P4_CRU_ESCR3 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_REPLAY_EVENT , NBOGUS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_REPLAY_EVENT , BOGUS ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_INSTR_RETIRED ] = {
. opcode = P4_OPCODE ( P4_EVENT_INSTR_RETIRED ) ,
. escr_msr = { MSR_P4_CRU_ESCR0 , MSR_P4_CRU_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_INSTR_RETIRED , NBOGUSNTAG ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_INSTR_RETIRED , NBOGUSTAG ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_INSTR_RETIRED , BOGUSNTAG ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_INSTR_RETIRED , BOGUSTAG ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_UOPS_RETIRED ] = {
. opcode = P4_OPCODE ( P4_EVENT_UOPS_RETIRED ) ,
. escr_msr = { MSR_P4_CRU_ESCR0 , MSR_P4_CRU_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_UOPS_RETIRED , NBOGUS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_UOPS_RETIRED , BOGUS ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_UOP_TYPE ] = {
. opcode = P4_OPCODE ( P4_EVENT_UOP_TYPE ) ,
. escr_msr = { MSR_P4_RAT_ESCR0 , MSR_P4_RAT_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_UOP_TYPE , TAGLOADS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_UOP_TYPE , TAGSTORES ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_BRANCH_RETIRED ] = {
. opcode = P4_OPCODE ( P4_EVENT_BRANCH_RETIRED ) ,
. escr_msr = { MSR_P4_CRU_ESCR2 , MSR_P4_CRU_ESCR3 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_BRANCH_RETIRED , MMNP ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BRANCH_RETIRED , MMNM ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BRANCH_RETIRED , MMTP ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BRANCH_RETIRED , MMTM ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_MISPRED_BRANCH_RETIRED ] = {
. opcode = P4_OPCODE ( P4_EVENT_MISPRED_BRANCH_RETIRED ) ,
. escr_msr = { MSR_P4_CRU_ESCR0 , MSR_P4_CRU_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
2011-03-28 00:46:11 +04:00
P4_ESCR_EMASK_BIT ( P4_EVENT_MISPRED_BRANCH_RETIRED , NBOGUS ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_X87_ASSIST ] = {
. opcode = P4_OPCODE ( P4_EVENT_X87_ASSIST ) ,
. escr_msr = { MSR_P4_CRU_ESCR2 , MSR_P4_CRU_ESCR3 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_X87_ASSIST , FPSU ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_X87_ASSIST , FPSO ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_X87_ASSIST , POAO ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_X87_ASSIST , POAU ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_X87_ASSIST , PREA ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_MACHINE_CLEAR ] = {
. opcode = P4_OPCODE ( P4_EVENT_MACHINE_CLEAR ) ,
. escr_msr = { MSR_P4_CRU_ESCR2 , MSR_P4_CRU_ESCR3 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_MACHINE_CLEAR , CLEAR ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_MACHINE_CLEAR , MOCLEAR ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_MACHINE_CLEAR , SMCLEAR ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
[ P4_EVENT_INSTR_COMPLETED ] = {
. opcode = P4_OPCODE ( P4_EVENT_INSTR_COMPLETED ) ,
. escr_msr = { MSR_P4_CRU_ESCR0 , MSR_P4_CRU_ESCR1 } ,
2010-08-25 22:23:34 +04:00
. escr_emask =
P4_ESCR_EMASK_BIT ( P4_EVENT_INSTR_COMPLETED , NBOGUS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_INSTR_COMPLETED , BOGUS ) ,
2010-03-24 12:09:26 +08:00
. cntr = { { 12 , 13 , 16 } , { 14 , 15 , 17 } } ,
} ,
} ;
2010-03-11 19:54:39 +03:00
2010-07-05 10:09:29 +08:00
# define P4_GEN_CACHE_EVENT(event, bit, metric) \
2010-03-24 12:09:26 +08:00
p4_config_pack_escr ( P4_ESCR_EVENT ( event ) | \
P4_ESCR_EMASK_BIT ( event , bit ) ) | \
2010-07-05 10:09:29 +08:00
p4_config_pack_cccr ( metric | \
2010-03-24 12:09:26 +08:00
P4_CCCR_ESEL ( P4_OPCODE_ESEL ( P4_OPCODE ( event ) ) ) )
2010-03-18 18:33:12 +08:00
2010-03-29 13:09:53 +02:00
static __initconst const u64 p4_hw_cache_event_ids
2010-03-18 18:33:12 +08:00
[ PERF_COUNT_HW_CACHE_MAX ]
[ PERF_COUNT_HW_CACHE_OP_MAX ]
[ PERF_COUNT_HW_CACHE_RESULT_MAX ] =
{
[ C ( L1D ) ] = {
[ C ( OP_READ ) ] = {
[ C ( RESULT_ACCESS ) ] = 0x0 ,
2010-03-24 12:09:26 +08:00
[ C ( RESULT_MISS ) ] = P4_GEN_CACHE_EVENT ( P4_EVENT_REPLAY_EVENT , NBOGUS ,
2010-07-05 10:09:29 +08:00
P4_PEBS_METRIC__1stl_cache_load_miss_retired ) ,
2010-03-18 18:33:12 +08:00
} ,
} ,
[ C ( LL ) ] = {
[ C ( OP_READ ) ] = {
[ C ( RESULT_ACCESS ) ] = 0x0 ,
2010-03-24 12:09:26 +08:00
[ C ( RESULT_MISS ) ] = P4_GEN_CACHE_EVENT ( P4_EVENT_REPLAY_EVENT , NBOGUS ,
2010-07-05 10:09:29 +08:00
P4_PEBS_METRIC__2ndl_cache_load_miss_retired ) ,
2010-03-18 18:33:12 +08:00
} ,
2010-03-24 12:09:26 +08:00
} ,
2010-03-18 18:33:12 +08:00
[ C ( DTLB ) ] = {
[ C ( OP_READ ) ] = {
[ C ( RESULT_ACCESS ) ] = 0x0 ,
2010-03-24 12:09:26 +08:00
[ C ( RESULT_MISS ) ] = P4_GEN_CACHE_EVENT ( P4_EVENT_REPLAY_EVENT , NBOGUS ,
2010-07-05 10:09:29 +08:00
P4_PEBS_METRIC__dtlb_load_miss_retired ) ,
2010-03-18 18:33:12 +08:00
} ,
[ C ( OP_WRITE ) ] = {
[ C ( RESULT_ACCESS ) ] = 0x0 ,
2010-03-24 12:09:26 +08:00
[ C ( RESULT_MISS ) ] = P4_GEN_CACHE_EVENT ( P4_EVENT_REPLAY_EVENT , NBOGUS ,
2010-07-05 10:09:29 +08:00
P4_PEBS_METRIC__dtlb_store_miss_retired ) ,
2010-03-18 18:33:12 +08:00
} ,
} ,
[ C ( ITLB ) ] = {
[ C ( OP_READ ) ] = {
2010-03-24 12:09:26 +08:00
[ C ( RESULT_ACCESS ) ] = P4_GEN_CACHE_EVENT ( P4_EVENT_ITLB_REFERENCE , HIT ,
2010-07-05 10:09:29 +08:00
P4_PEBS_METRIC__none ) ,
2010-03-24 12:09:26 +08:00
[ C ( RESULT_MISS ) ] = P4_GEN_CACHE_EVENT ( P4_EVENT_ITLB_REFERENCE , MISS ,
2010-07-05 10:09:29 +08:00
P4_PEBS_METRIC__none ) ,
2010-03-18 18:33:12 +08:00
} ,
[ C ( OP_WRITE ) ] = {
[ C ( RESULT_ACCESS ) ] = - 1 ,
[ C ( RESULT_MISS ) ] = - 1 ,
} ,
[ C ( OP_PREFETCH ) ] = {
[ C ( RESULT_ACCESS ) ] = - 1 ,
[ C ( RESULT_MISS ) ] = - 1 ,
} ,
} ,
} ;
2010-03-24 12:09:26 +08:00
static u64 p4_general_events [ PERF_COUNT_HW_MAX ] = {
/* non-halted CPU clocks */
[ PERF_COUNT_HW_CPU_CYCLES ] =
p4_config_pack_escr ( P4_ESCR_EVENT ( P4_EVENT_GLOBAL_POWER_EVENTS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_GLOBAL_POWER_EVENTS , RUNNING ) ) ,
/*
* retired instructions
* in a sake of simplicity we don ' t use the FSB tagging
*/
[ PERF_COUNT_HW_INSTRUCTIONS ] =
p4_config_pack_escr ( P4_ESCR_EVENT ( P4_EVENT_INSTR_RETIRED ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_INSTR_RETIRED , NBOGUSNTAG ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_INSTR_RETIRED , BOGUSNTAG ) ) ,
/* cache hits */
[ PERF_COUNT_HW_CACHE_REFERENCES ] =
p4_config_pack_escr ( P4_ESCR_EVENT ( P4_EVENT_BSQ_CACHE_REFERENCE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_2ndL_HITS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_2ndL_HITE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_2ndL_HITM ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_3rdL_HITS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_3rdL_HITE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_3rdL_HITM ) ) ,
/* cache misses */
[ PERF_COUNT_HW_CACHE_MISSES ] =
p4_config_pack_escr ( P4_ESCR_EVENT ( P4_EVENT_BSQ_CACHE_REFERENCE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_2ndL_MISS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , RD_3rdL_MISS ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_BSQ_CACHE_REFERENCE , WR_2ndL_MISS ) ) ,
/* branch instructions retired */
[ PERF_COUNT_HW_BRANCH_INSTRUCTIONS ] =
p4_config_pack_escr ( P4_ESCR_EVENT ( P4_EVENT_RETIRED_BRANCH_TYPE ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_BRANCH_TYPE , CONDITIONAL ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_BRANCH_TYPE , CALL ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_BRANCH_TYPE , RETURN ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_RETIRED_BRANCH_TYPE , INDIRECT ) ) ,
/* mispredicted branches retired */
[ PERF_COUNT_HW_BRANCH_MISSES ] =
p4_config_pack_escr ( P4_ESCR_EVENT ( P4_EVENT_MISPRED_BRANCH_RETIRED ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_MISPRED_BRANCH_RETIRED , NBOGUS ) ) ,
/* bus ready clocks (cpu is driving #DRDY_DRV\#DRDY_OWN): */
[ PERF_COUNT_HW_BUS_CYCLES ] =
p4_config_pack_escr ( P4_ESCR_EVENT ( P4_EVENT_FSB_DATA_ACTIVITY ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_FSB_DATA_ACTIVITY , DRDY_DRV ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_FSB_DATA_ACTIVITY , DRDY_OWN ) ) |
p4_config_pack_cccr ( P4_CCCR_EDGE | P4_CCCR_COMPARE ) ,
2010-03-11 19:54:39 +03:00
} ;
2010-03-24 12:09:26 +08:00
static struct p4_event_bind * p4_config_get_bind ( u64 config )
{
unsigned int evnt = p4_config_unpack_event ( config ) ;
struct p4_event_bind * bind = NULL ;
if ( evnt < ARRAY_SIZE ( p4_event_bind_map ) )
bind = & p4_event_bind_map [ evnt ] ;
return bind ;
}
2010-03-11 19:54:39 +03:00
static u64 p4_pmu_event_map ( int hw_event )
{
2010-03-24 12:09:26 +08:00
struct p4_event_bind * bind ;
unsigned int esel ;
2010-03-11 19:54:39 +03:00
u64 config ;
2010-03-24 12:09:26 +08:00
config = p4_general_events [ hw_event ] ;
bind = p4_config_get_bind ( config ) ;
esel = P4_OPCODE_ESEL ( bind - > opcode ) ;
config | = p4_config_pack_cccr ( P4_CCCR_ESEL ( esel ) ) ;
2010-03-11 19:54:39 +03:00
return config ;
}
2010-08-25 22:23:34 +04:00
/* check cpu model specifics */
static bool p4_event_match_cpu_model ( unsigned int event_idx )
{
/* INSTR_COMPLETED event only exist for model 3, 4, 6 (Prescott) */
if ( event_idx = = P4_EVENT_INSTR_COMPLETED ) {
if ( boot_cpu_data . x86_model ! = 3 & &
boot_cpu_data . x86_model ! = 4 & &
boot_cpu_data . x86_model ! = 6 )
return false ;
}
/*
* For info
* - IQ_ESCR0 , IQ_ESCR1 only for models 1 and 2
*/
return true ;
}
2010-07-05 10:09:29 +08:00
static int p4_validate_raw_event ( struct perf_event * event )
{
2010-08-25 22:23:34 +04:00
unsigned int v , emask ;
2010-07-05 10:09:29 +08:00
2010-08-25 22:23:34 +04:00
/* User data may have out-of-bound event index */
2010-07-05 10:09:29 +08:00
v = p4_config_unpack_event ( event - > attr . config ) ;
2010-08-25 22:23:34 +04:00
if ( v > = ARRAY_SIZE ( p4_event_bind_map ) )
return - EINVAL ;
/* It may be unsupported: */
if ( ! p4_event_match_cpu_model ( v ) )
2010-07-05 10:09:29 +08:00
return - EINVAL ;
2010-08-25 22:23:34 +04:00
/*
* NOTE : P4_CCCR_THREAD_ANY has not the same meaning as
* in Architectural Performance Monitoring , it means not
* on _which_ logical cpu to count but rather _when_ , ie it
* depends on logical cpu state - - count event if one cpu active ,
* none , both or any , so we just allow user to pass any value
* desired .
*
* In turn we always set Tx_OS / Tx_USR bits bound to logical
* cpu without their propagation to another cpu
*/
/*
2011-03-17 16:24:16 -03:00
* if an event is shared across the logical threads
2010-08-25 22:23:34 +04:00
* the user needs special permissions to be able to use it
*/
2011-01-25 17:32:01 +02:00
if ( p4_ht_active ( ) & & p4_event_bind_map [ v ] . shared ) {
2010-08-25 22:23:34 +04:00
if ( perf_paranoid_cpu ( ) & & ! capable ( CAP_SYS_ADMIN ) )
return - EACCES ;
2010-07-05 10:09:29 +08:00
}
2010-08-25 22:23:34 +04:00
/* ESCR EventMask bits may be invalid */
emask = p4_config_unpack_escr ( event - > attr . config ) & P4_ESCR_EVENTMASK_MASK ;
if ( emask & ~ p4_event_bind_map [ v ] . escr_emask )
return - EINVAL ;
2010-07-05 10:09:29 +08:00
/*
2010-08-25 22:23:34 +04:00
* it may have some invalid PEBS bits
2010-07-05 10:09:29 +08:00
*/
2010-08-25 22:23:34 +04:00
if ( p4_config_pebs_has ( event - > attr . config , P4_PEBS_CONFIG_ENABLE ) )
2010-07-05 10:09:29 +08:00
return - EINVAL ;
2010-08-25 22:23:34 +04:00
2010-07-05 10:09:29 +08:00
v = p4_config_unpack_metric ( event - > attr . config ) ;
2010-08-25 22:23:34 +04:00
if ( v > = ARRAY_SIZE ( p4_pebs_bind_map ) )
2010-07-05 10:09:29 +08:00
return - EINVAL ;
return 0 ;
}
2011-06-23 16:49:18 +04:00
static void p4_hw_watchdog_set_attr ( struct perf_event_attr * wd_attr )
{
/*
* Watchdog ticks are special on Netburst , we use
* that named " non-sleeping " ticks as recommended
* by Intel SDM Vol3b .
*/
WARN_ON_ONCE ( wd_attr - > type ! = PERF_TYPE_HARDWARE | |
wd_attr - > config ! = PERF_COUNT_HW_CPU_CYCLES ) ;
wd_attr - > type = PERF_TYPE_RAW ;
wd_attr - > config =
p4_config_pack_escr ( P4_ESCR_EVENT ( P4_EVENT_EXECUTION_EVENT ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , NBOGUS0 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , NBOGUS1 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , NBOGUS2 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , NBOGUS3 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , BOGUS0 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , BOGUS1 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , BOGUS2 ) |
P4_ESCR_EMASK_BIT ( P4_EVENT_EXECUTION_EVENT , BOGUS3 ) ) |
p4_config_pack_cccr ( P4_CCCR_THRESHOLD ( 15 ) | P4_CCCR_COMPLEMENT |
P4_CCCR_COMPARE ) ;
}
2010-03-30 17:00:06 +02:00
static int p4_hw_config ( struct perf_event * event )
2010-03-11 19:54:39 +03:00
{
2010-05-08 15:25:52 +04:00
int cpu = get_cpu ( ) ;
int rc = 0 ;
2010-03-24 12:09:26 +08:00
u32 escr , cccr ;
2010-03-11 19:54:39 +03:00
/*
* the reason we use cpu that early is that : if we get scheduled
* first time on the same cpu - - we will not need swap thread
* specific flags in config ( and will save some cpu cycles )
*/
2010-03-24 12:09:26 +08:00
cccr = p4_default_cccr_conf ( cpu ) ;
2010-03-30 17:00:06 +02:00
escr = p4_default_escr_conf ( cpu , event - > attr . exclude_kernel ,
event - > attr . exclude_user ) ;
event - > hw . config = p4_config_pack_escr ( escr ) |
p4_config_pack_cccr ( cccr ) ;
2010-03-11 19:54:39 +03:00
2010-03-18 18:33:12 +08:00
if ( p4_ht_active ( ) & & p4_ht_thread ( cpu ) )
2010-03-30 17:00:06 +02:00
event - > hw . config = p4_set_ht_bit ( event - > hw . config ) ;
2010-05-08 15:39:52 +04:00
if ( event - > attr . type = = PERF_TYPE_RAW ) {
2011-01-25 17:32:01 +02:00
struct p4_event_bind * bind ;
unsigned int esel ;
2010-08-25 22:23:34 +04:00
/*
* Clear bits we reserve to be managed by kernel itself
* and never allowed from a user space
*/
event - > attr . config & = P4_CONFIG_MASK ;
2010-07-05 10:09:29 +08:00
rc = p4_validate_raw_event ( event ) ;
if ( rc )
2010-05-08 15:25:54 +04:00
goto out ;
2010-05-08 15:39:52 +04:00
/*
2010-07-05 10:09:29 +08:00
* Note that for RAW events we allow user to use P4_CCCR_RESERVED
* bits since we keep additional info here ( for cache events and etc )
2010-05-08 15:39:52 +04:00
*/
2010-08-25 22:23:34 +04:00
event - > hw . config | = event - > attr . config ;
2011-01-25 17:32:01 +02:00
bind = p4_config_get_bind ( event - > attr . config ) ;
if ( ! bind ) {
rc = - EINVAL ;
goto out ;
}
esel = P4_OPCODE_ESEL ( bind - > opcode ) ;
event - > hw . config | = p4_config_pack_cccr ( P4_CCCR_ESEL ( esel ) ) ;
2010-05-08 15:39:52 +04:00
}
2010-03-18 18:33:12 +08:00
2010-05-08 15:25:52 +04:00
rc = x86_setup_perfctr ( event ) ;
2010-05-08 15:25:54 +04:00
out :
2010-05-08 15:25:52 +04:00
put_cpu ( ) ;
return rc ;
2010-03-11 19:54:39 +03:00
}
2010-05-17 16:13:04 +08:00
static inline int p4_pmu_clear_cccr_ovf ( struct hw_perf_event * hwc )
2010-03-11 19:54:39 +03:00
{
2011-01-07 21:42:06 +03:00
u64 v ;
2010-03-11 19:54:39 +03:00
2011-01-07 21:42:06 +03:00
/* an official way for overflow indication */
2011-02-02 17:40:59 +01:00
rdmsrl ( hwc - > config_base , v ) ;
2011-01-07 21:42:06 +03:00
if ( v & P4_CCCR_OVF ) {
2011-02-02 17:40:59 +01:00
wrmsrl ( hwc - > config_base , v & ~ P4_CCCR_OVF ) ;
2011-01-07 21:42:06 +03:00
return 1 ;
2010-03-11 19:54:39 +03:00
}
2010-05-17 16:13:04 +08:00
2011-02-16 14:08:02 +03:00
/*
* In some circumstances the overflow might issue an NMI but did
* not set P4_CCCR_OVF bit . Because a counter holds a negative value
* we simply check for high bit being set , if it ' s cleared it means
* the counter has reached zero value and continued counting before
* real NMI signal was received :
*/
2011-03-24 23:36:25 +03:00
rdmsrl ( hwc - > event_base , v ) ;
2011-02-16 14:08:02 +03:00
if ( ! ( v & ARCH_P4_UNFLAGGED_BIT ) )
2011-01-07 21:42:06 +03:00
return 1 ;
return 0 ;
2010-03-11 19:54:39 +03:00
}
2010-07-05 10:09:29 +08:00
static void p4_pmu_disable_pebs ( void )
{
/*
* FIXME
*
* It ' s still allowed that two threads setup same cache
* events so we can ' t simply clear metrics until we knew
2011-03-17 16:24:16 -03:00
* no one is depending on us , so we need kind of counter
2010-07-05 10:09:29 +08:00
* for " ReplayEvent " users .
*
* What is more complex - - RAW events , if user ( for some
* reason ) will pass some cache event metric with improper
* event opcode - - it ' s fine from hardware point of view
2011-03-17 16:24:16 -03:00
* but completely nonsense from " meaning " of such action .
2010-07-05 10:09:29 +08:00
*
* So at moment let leave metrics turned on forever - - it ' s
* ok for now but need to be revisited !
*
* ( void ) checking_wrmsrl ( MSR_IA32_PEBS_ENABLE , ( u64 ) 0 ) ;
* ( void ) checking_wrmsrl ( MSR_P4_PEBS_MATRIX_VERT , ( u64 ) 0 ) ;
*/
}
2010-03-11 19:54:39 +03:00
static inline void p4_pmu_disable_event ( struct perf_event * event )
{
struct hw_perf_event * hwc = & event - > hw ;
/*
* If event gets disabled while counter is in overflowed
* state we need to clear P4_CCCR_OVF , otherwise interrupt get
* asserted again and again
*/
2011-02-02 17:40:59 +01:00
( void ) checking_wrmsrl ( hwc - > config_base ,
2010-03-11 19:54:39 +03:00
( u64 ) ( p4_config_unpack_cccr ( hwc - > config ) ) &
2010-03-24 12:09:26 +08:00
~ P4_CCCR_ENABLE & ~ P4_CCCR_OVF & ~ P4_CCCR_RESERVED ) ;
2010-03-11 19:54:39 +03:00
}
static void p4_pmu_disable_all ( void )
{
struct cpu_hw_events * cpuc = & __get_cpu_var ( cpu_hw_events ) ;
int idx ;
2010-03-29 18:36:50 +02:00
for ( idx = 0 ; idx < x86_pmu . num_counters ; idx + + ) {
2010-03-11 19:54:39 +03:00
struct perf_event * event = cpuc - > events [ idx ] ;
if ( ! test_bit ( idx , cpuc - > active_mask ) )
continue ;
p4_pmu_disable_event ( event ) ;
}
2010-07-05 10:09:29 +08:00
p4_pmu_disable_pebs ( ) ;
}
/* configuration must be valid */
static void p4_pmu_enable_pebs ( u64 config )
{
struct p4_pebs_bind * bind ;
unsigned int idx ;
BUILD_BUG_ON ( P4_PEBS_METRIC__max > P4_PEBS_CONFIG_METRIC_MASK ) ;
idx = p4_config_unpack_metric ( config ) ;
if ( idx = = P4_PEBS_METRIC__none )
return ;
bind = & p4_pebs_bind_map [ idx ] ;
( void ) checking_wrmsrl ( MSR_IA32_PEBS_ENABLE , ( u64 ) bind - > metric_pebs ) ;
( void ) checking_wrmsrl ( MSR_P4_PEBS_MATRIX_VERT , ( u64 ) bind - > metric_vert ) ;
2010-03-11 19:54:39 +03:00
}
static void p4_pmu_enable_event ( struct perf_event * event )
{
struct hw_perf_event * hwc = & event - > hw ;
int thread = p4_ht_config_thread ( hwc - > config ) ;
u64 escr_conf = p4_config_unpack_escr ( p4_clear_ht_bit ( hwc - > config ) ) ;
2010-03-24 12:09:26 +08:00
unsigned int idx = p4_config_unpack_event ( hwc - > config ) ;
struct p4_event_bind * bind ;
u64 escr_addr , cccr ;
2010-03-11 19:54:39 +03:00
2010-03-24 12:09:26 +08:00
bind = & p4_event_bind_map [ idx ] ;
escr_addr = ( u64 ) bind - > escr_msr [ thread ] ;
2010-03-11 19:54:39 +03:00
/*
* - we dont support cascaded counters yet
* - and counter 1 is broken ( erratum )
*/
WARN_ON_ONCE ( p4_is_event_cascaded ( hwc - > config ) ) ;
WARN_ON_ONCE ( hwc - > idx = = 1 ) ;
2010-03-24 12:09:26 +08:00
/* we need a real Event value */
escr_conf & = ~ P4_ESCR_EVENT_MASK ;
escr_conf | = P4_ESCR_EVENT ( P4_OPCODE_EVNT ( bind - > opcode ) ) ;
cccr = p4_config_unpack_cccr ( hwc - > config ) ;
/*
2010-07-05 10:09:29 +08:00
* it could be Cache event so we need to write metrics
* into additional MSRs
2010-03-24 12:09:26 +08:00
*/
2010-07-05 10:09:29 +08:00
p4_pmu_enable_pebs ( hwc - > config ) ;
2010-03-24 12:09:26 +08:00
( void ) checking_wrmsrl ( escr_addr , escr_conf ) ;
2011-02-02 17:40:59 +01:00
( void ) checking_wrmsrl ( hwc - > config_base ,
2010-03-24 12:09:26 +08:00
( cccr & ~ P4_CCCR_RESERVED ) | P4_CCCR_ENABLE ) ;
2010-03-11 19:54:39 +03:00
}
2010-03-26 14:08:44 +01:00
static void p4_pmu_enable_all ( int added )
2010-03-11 19:54:39 +03:00
{
struct cpu_hw_events * cpuc = & __get_cpu_var ( cpu_hw_events ) ;
int idx ;
2010-03-29 18:36:50 +02:00
for ( idx = 0 ; idx < x86_pmu . num_counters ; idx + + ) {
2010-03-11 19:54:39 +03:00
struct perf_event * event = cpuc - > events [ idx ] ;
if ( ! test_bit ( idx , cpuc - > active_mask ) )
continue ;
p4_pmu_enable_event ( event ) ;
}
}
static int p4_pmu_handle_irq ( struct pt_regs * regs )
{
struct perf_sample_data data ;
struct cpu_hw_events * cpuc ;
struct perf_event * event ;
struct hw_perf_event * hwc ;
int idx , handled = 0 ;
u64 val ;
2011-04-21 11:03:20 -04:00
perf_sample_data_init ( & data , 0 ) ;
2010-03-11 19:54:39 +03:00
cpuc = & __get_cpu_var ( cpu_hw_events ) ;
2010-03-29 18:36:50 +02:00
for ( idx = 0 ; idx < x86_pmu . num_counters ; idx + + ) {
2010-08-05 19:09:17 +04:00
int overflow ;
2010-03-11 19:54:39 +03:00
2010-09-29 23:01:38 -04:00
if ( ! test_bit ( idx , cpuc - > active_mask ) ) {
/* catch in-flight IRQs */
if ( __test_and_clear_bit ( idx , cpuc - > running ) )
handled + + ;
2010-03-11 19:54:39 +03:00
continue ;
2010-09-29 23:01:38 -04:00
}
2010-03-11 19:54:39 +03:00
event = cpuc - > events [ idx ] ;
hwc = & event - > hw ;
WARN_ON_ONCE ( hwc - > idx ! = idx ) ;
2010-05-17 16:13:04 +08:00
/* it might be unflagged overflow */
2010-08-05 19:09:17 +04:00
overflow = p4_pmu_clear_cccr_ovf ( hwc ) ;
2010-03-11 19:54:39 +03:00
val = x86_perf_event_update ( event ) ;
2010-08-05 19:09:17 +04:00
if ( ! overflow & & ( val & ( 1ULL < < ( x86_pmu . cntval_bits - 1 ) ) ) )
2010-03-11 19:54:39 +03:00
continue ;
2010-08-05 19:09:17 +04:00
handled + = overflow ;
2010-05-17 16:13:04 +08:00
/* event overflow for sure */
data . period = event - > hw . last_period ;
2010-03-11 19:54:39 +03:00
if ( ! x86_perf_event_set_period ( event ) )
continue ;
2011-06-27 14:41:57 +02:00
if ( perf_event_overflow ( event , & data , regs ) )
2011-04-21 11:03:21 -04:00
x86_pmu_stop ( event , 0 ) ;
2010-03-11 19:54:39 +03:00
}
2011-04-27 06:32:33 -04:00
if ( handled )
2010-03-11 19:54:39 +03:00
inc_irq_stat ( apic_perf_irqs ) ;
2011-04-27 06:32:33 -04:00
/*
* When dealing with the unmasking of the LVTPC on P4 perf hw , it has
* been observed that the OVF bit flag has to be cleared first _before_
* the LVTPC can be unmasked .
*
* The reason is the NMI line will continue to be asserted while the OVF
* bit is set . This causes a second NMI to generate if the LVTPC is
* unmasked before the OVF bit is cleared , leading to unknown NMI
* messages .
*/
apic_write ( APIC_LVTPC , APIC_DM_NMI ) ;
2010-03-11 19:54:39 +03:00
2010-09-02 15:07:49 -04:00
return handled ;
2010-03-11 19:54:39 +03:00
}
/*
* swap thread specific fields according to a thread
* we are going to run on
*/
static void p4_pmu_swap_config_ts ( struct hw_perf_event * hwc , int cpu )
{
u32 escr , cccr ;
/*
* we either lucky and continue on same cpu or no HT support
*/
if ( ! p4_should_swap_ts ( hwc - > config , cpu ) )
return ;
/*
* the event is migrated from an another logical
* cpu , so we need to swap thread specific flags
*/
escr = p4_config_unpack_escr ( hwc - > config ) ;
cccr = p4_config_unpack_cccr ( hwc - > config ) ;
if ( p4_ht_thread ( cpu ) ) {
cccr & = ~ P4_CCCR_OVF_PMI_T0 ;
cccr | = P4_CCCR_OVF_PMI_T1 ;
2010-03-24 12:09:26 +08:00
if ( escr & P4_ESCR_T0_OS ) {
escr & = ~ P4_ESCR_T0_OS ;
escr | = P4_ESCR_T1_OS ;
2010-03-11 19:54:39 +03:00
}
2010-03-24 12:09:26 +08:00
if ( escr & P4_ESCR_T0_USR ) {
escr & = ~ P4_ESCR_T0_USR ;
escr | = P4_ESCR_T1_USR ;
2010-03-11 19:54:39 +03:00
}
hwc - > config = p4_config_pack_escr ( escr ) ;
hwc - > config | = p4_config_pack_cccr ( cccr ) ;
hwc - > config | = P4_CONFIG_HT ;
} else {
cccr & = ~ P4_CCCR_OVF_PMI_T1 ;
cccr | = P4_CCCR_OVF_PMI_T0 ;
2010-03-24 12:09:26 +08:00
if ( escr & P4_ESCR_T1_OS ) {
escr & = ~ P4_ESCR_T1_OS ;
escr | = P4_ESCR_T0_OS ;
2010-03-11 19:54:39 +03:00
}
2010-03-24 12:09:26 +08:00
if ( escr & P4_ESCR_T1_USR ) {
escr & = ~ P4_ESCR_T1_USR ;
escr | = P4_ESCR_T0_USR ;
2010-03-11 19:54:39 +03:00
}
hwc - > config = p4_config_pack_escr ( escr ) ;
hwc - > config | = p4_config_pack_cccr ( cccr ) ;
hwc - > config & = ~ P4_CONFIG_HT ;
}
}
2010-05-12 21:42:42 +04:00
/*
* ESCR address hashing is tricky , ESCRs are not sequential
2010-05-19 01:19:17 +04:00
* in memory but all starts from MSR_P4_BSU_ESCR0 ( 0x03a0 ) and
2010-05-12 21:42:42 +04:00
* the metric between any ESCRs is laid in range [ 0xa0 , 0xe1 ]
*
* so we make ~ 70 % filled hashtable
*/
# define P4_ESCR_MSR_BASE 0x000003a0
# define P4_ESCR_MSR_MAX 0x000003e1
# define P4_ESCR_MSR_TABLE_SIZE (P4_ESCR_MSR_MAX - P4_ESCR_MSR_BASE + 1)
# define P4_ESCR_MSR_IDX(msr) (msr - P4_ESCR_MSR_BASE)
# define P4_ESCR_MSR_TABLE_ENTRY(msr) [P4_ESCR_MSR_IDX(msr)] = msr
static const unsigned int p4_escr_table [ P4_ESCR_MSR_TABLE_SIZE ] = {
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_ALF_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_ALF_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_BPU_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_BPU_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_BSU_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_BSU_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_CRU_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_CRU_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_CRU_ESCR2 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_CRU_ESCR3 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_CRU_ESCR4 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_CRU_ESCR5 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_DAC_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_DAC_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_FIRM_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_FIRM_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_FLAME_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_FLAME_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_FSB_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_FSB_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_IQ_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_IQ_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_IS_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_IS_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_ITLB_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_ITLB_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_IX_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_IX_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_MOB_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_MOB_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_MS_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_MS_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_PMH_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_PMH_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_RAT_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_RAT_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_SAAT_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_SAAT_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_SSU_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_SSU_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_TBPU_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_TBPU_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_TC_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_TC_ESCR1 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_U2L_ESCR0 ) ,
P4_ESCR_MSR_TABLE_ENTRY ( MSR_P4_U2L_ESCR1 ) ,
2010-03-11 19:54:39 +03:00
} ;
static int p4_get_escr_idx ( unsigned int addr )
{
2010-05-12 21:42:42 +04:00
unsigned int idx = P4_ESCR_MSR_IDX ( addr ) ;
2010-03-11 19:54:39 +03:00
2010-05-19 01:19:17 +04:00
if ( unlikely ( idx > = P4_ESCR_MSR_TABLE_SIZE | |
! p4_escr_table [ idx ] | |
p4_escr_table [ idx ] ! = addr ) ) {
2010-05-12 21:42:42 +04:00
WARN_ONCE ( 1 , " P4 PMU: Wrong address passed: %x \n " , addr ) ;
return - 1 ;
2010-03-11 19:54:39 +03:00
}
2010-05-12 21:42:42 +04:00
return idx ;
2010-03-11 19:54:39 +03:00
}
2010-03-24 12:09:26 +08:00
static int p4_next_cntr ( int thread , unsigned long * used_mask ,
struct p4_event_bind * bind )
{
2010-05-14 23:08:15 +04:00
int i , j ;
2010-03-24 12:09:26 +08:00
for ( i = 0 ; i < P4_CNTR_LIMIT ; i + + ) {
2010-05-14 23:08:15 +04:00
j = bind - > cntr [ thread ] [ i ] ;
if ( j ! = - 1 & & ! test_bit ( j , used_mask ) )
2010-03-24 12:09:26 +08:00
return j ;
}
return - 1 ;
}
2010-03-11 19:54:39 +03:00
static int p4_pmu_schedule_events ( struct cpu_hw_events * cpuc , int n , int * assign )
{
unsigned long used_mask [ BITS_TO_LONGS ( X86_PMC_IDX_MAX ) ] ;
2010-05-12 21:42:42 +04:00
unsigned long escr_mask [ BITS_TO_LONGS ( P4_ESCR_MSR_TABLE_SIZE ) ] ;
2010-05-19 01:19:18 +04:00
int cpu = smp_processor_id ( ) ;
2010-03-24 12:09:26 +08:00
struct hw_perf_event * hwc ;
struct p4_event_bind * bind ;
unsigned int i , thread , num ;
int cntr_idx , escr_idx ;
2010-03-11 19:54:39 +03:00
bitmap_zero ( used_mask , X86_PMC_IDX_MAX ) ;
2010-05-12 21:42:42 +04:00
bitmap_zero ( escr_mask , P4_ESCR_MSR_TABLE_SIZE ) ;
2010-03-11 19:54:39 +03:00
for ( i = 0 , num = n ; i < n ; i + + , num - - ) {
2010-03-24 12:09:26 +08:00
2010-03-11 19:54:39 +03:00
hwc = & cpuc - > event_list [ i ] - > hw ;
thread = p4_ht_thread ( cpu ) ;
2010-03-24 12:09:26 +08:00
bind = p4_config_get_bind ( hwc - > config ) ;
escr_idx = p4_get_escr_idx ( bind - > escr_msr [ thread ] ) ;
2010-05-12 21:42:42 +04:00
if ( unlikely ( escr_idx = = - 1 ) )
goto done ;
2010-03-11 19:54:39 +03:00
if ( hwc - > idx ! = - 1 & & ! p4_should_swap_ts ( hwc - > config , cpu ) ) {
2010-03-24 12:09:26 +08:00
cntr_idx = hwc - > idx ;
2010-03-11 19:54:39 +03:00
if ( assign )
assign [ i ] = hwc - > idx ;
goto reserve ;
}
2010-03-24 12:09:26 +08:00
cntr_idx = p4_next_cntr ( thread , used_mask , bind ) ;
if ( cntr_idx = = - 1 | | test_bit ( escr_idx , escr_mask ) )
2010-03-11 19:54:39 +03:00
goto done ;
p4_pmu_swap_config_ts ( hwc , cpu ) ;
2010-03-24 12:09:26 +08:00
if ( assign )
assign [ i ] = cntr_idx ;
2010-03-11 19:54:39 +03:00
reserve :
2010-03-24 12:09:26 +08:00
set_bit ( cntr_idx , used_mask ) ;
2010-03-11 19:54:39 +03:00
set_bit ( escr_idx , escr_mask ) ;
}
done :
return num ? - ENOSPC : 0 ;
}
2010-03-29 13:09:53 +02:00
static __initconst const struct x86_pmu p4_pmu = {
2010-03-11 19:54:39 +03:00
. name = " Netburst P4/Xeon " ,
. handle_irq = p4_pmu_handle_irq ,
. disable_all = p4_pmu_disable_all ,
. enable_all = p4_pmu_enable_all ,
. enable = p4_pmu_enable_event ,
. disable = p4_pmu_disable_event ,
. eventsel = MSR_P4_BPU_CCCR0 ,
. perfctr = MSR_P4_BPU_PERFCTR0 ,
. event_map = p4_pmu_event_map ,
2010-03-24 12:09:26 +08:00
. max_events = ARRAY_SIZE ( p4_general_events ) ,
2010-03-11 19:54:39 +03:00
. get_event_constraints = x86_get_event_constraints ,
/*
* IF HT disabled we may need to use all
* ARCH_P4_MAX_CCCR counters simulaneously
* though leave it restricted at moment assuming
* HT is on
*/
2010-03-29 18:36:50 +02:00
. num_counters = ARCH_P4_MAX_CCCR ,
2010-03-11 19:54:39 +03:00
. apic = 1 ,
2011-01-07 21:42:06 +03:00
. cntval_bits = ARCH_P4_CNTRVAL_BITS ,
. cntval_mask = ARCH_P4_CNTRVAL_MASK ,
. max_period = ( 1ULL < < ( ARCH_P4_CNTRVAL_BITS - 1 ) ) - 1 ,
2011-06-23 16:49:18 +04:00
. hw_watchdog_set_attr = p4_hw_watchdog_set_attr ,
2010-03-11 19:54:39 +03:00
. hw_config = p4_hw_config ,
. schedule_events = p4_pmu_schedule_events ,
2010-06-03 01:23:04 +04:00
/*
* This handles erratum N15 in intel doc 249199 - 02 9 ,
* the counter may not be updated correctly on write
* so we need a second write operation to do the trick
* ( the official workaround didn ' t work )
*
* the former idea is taken from OProfile code
*/
. perfctr_second_write = 1 ,
2010-03-11 19:54:39 +03:00
} ;
static __init int p4_pmu_init ( void )
{
unsigned int low , high ;
2011-04-22 10:08:52 -07:00
/* If we get stripped -- indexing fails */
2010-03-11 19:54:39 +03:00
BUILD_BUG_ON ( ARCH_P4_MAX_CCCR > X86_PMC_MAX_GENERIC ) ;
rdmsr ( MSR_IA32_MISC_ENABLE , low , high ) ;
if ( ! ( low & ( 1 < < 7 ) ) ) {
pr_cont ( " unsupported Netburst CPU model %d " ,
boot_cpu_data . x86_model ) ;
return - ENODEV ;
}
2010-03-18 18:33:12 +08:00
memcpy ( hw_cache_event_ids , p4_hw_cache_event_ids ,
2010-03-24 12:09:26 +08:00
sizeof ( hw_cache_event_ids ) ) ;
2010-03-18 18:33:12 +08:00
2010-03-11 19:54:39 +03:00
pr_cont ( " Netburst events, " ) ;
x86_pmu = p4_pmu ;
return 0 ;
}
# endif /* CONFIG_CPU_SUP_INTEL */