2009-06-25 21:32:38 +04:00
# include <linux/module.h>
2010-08-18 17:11:35 +04:00
# include <linux/slab.h>
2010-09-27 17:30:39 +04:00
# include "mce_amd.h"
2009-05-06 19:57:20 +04:00
2010-08-18 17:11:35 +04:00
/* Per-family decode callbacks; allocated and populated by mce_amd_init(). */
static struct amd_decoder_ops * fam_ops ;
2010-09-17 21:11:47 +04:00
/* Mask passed to XEC() by the bank decoders; adjusted per family in mce_amd_init(). */
static u8 xec_mask = 0xf ;
2010-08-31 20:28:08 +04:00
2009-07-24 15:51:42 +04:00
/* While false, amd_filter_mce() drops bank 4 errors whose xec is 0x5. */
static bool report_gart_errors ;
2011-08-24 20:44:22 +04:00
/* Optional callback run by decode_mc4_mce() for xec 0x0/0x8 (DRAM ECC) errors. */
static void ( * nb_bus_decoder ) ( int node_id , struct mce * m ) ;
2009-07-24 15:51:42 +04:00
/*
 * Turn reporting of the bank 4 / xec 0x5 errors on or off.  With the flag
 * cleared, amd_filter_mce() swallows those errors.
 */
void amd_report_gart_errors(bool v)
{
	report_gart_errors = v;
}
EXPORT_SYMBOL_GPL(amd_report_gart_errors);
2011-08-24 20:44:22 +04:00
void amd_register_ecc_decoder ( void ( * f ) ( int , struct mce * ) )
2009-07-24 15:51:42 +04:00
{
nb_bus_decoder = f ;
}
EXPORT_SYMBOL_GPL ( amd_register_ecc_decoder ) ;
2011-08-24 20:44:22 +04:00
void amd_unregister_ecc_decoder ( void ( * f ) ( int , struct mce * ) )
2009-07-24 15:51:42 +04:00
{
if ( nb_bus_decoder ) {
WARN_ON ( nb_bus_decoder ! = f ) ;
nb_bus_decoder = NULL ;
}
}
EXPORT_SYMBOL_GPL ( amd_unregister_ecc_decoder ) ;
2009-05-06 19:57:20 +04:00
/*
* string representation for the different MCA reported error types , see F3x48
* or MSR0000_0411 .
*/
2010-09-06 20:13:39 +04:00
/* transaction type names (4 entries); presumably looked up via TT_MSG() - accessor not defined in this file */
2012-12-23 15:40:45 +04:00
static const char * const tt_msgs [ ] = { " INSN " , " DATA " , " GEN " , " RESV " } ;
2009-05-06 19:57:20 +04:00
2010-09-06 20:13:39 +04:00
/* cache level names (4 entries); presumably looked up via LL_MSG() */
2012-12-23 15:40:45 +04:00
static const char * const ll_msgs [ ] = { " RESV " , " L1 " , " L2 " , " L3/GEN " } ;
2009-05-06 19:57:20 +04:00
2010-09-06 20:13:39 +04:00
/* memory transaction type names (9 entries); presumably looked up via R4_MSG() */
2012-12-23 15:40:45 +04:00
static const char * const rrrr_msgs [ ] = {
2010-09-06 20:13:39 +04:00
" GEN " , " RD " , " WR " , " DRD " , " DWR " , " IRD " , " PRF " , " EV " , " SNP "
2009-05-06 19:57:20 +04:00
} ;
2010-09-06 20:13:39 +04:00
/* participating processor names; non-static and exported for use outside this file */
2011-11-29 22:03:25 +04:00
const char * const pp_msgs [ ] = { " SRC " , " RES " , " OBS " , " GEN " } ;
2009-06-25 21:32:38 +04:00
EXPORT_SYMBOL_GPL ( pp_msgs ) ;
2009-05-06 19:57:20 +04:00
2010-09-06 20:13:39 +04:00
/* request timeout state names (2 entries); presumably looked up via TO_MSG() */
2012-12-23 15:40:45 +04:00
static const char * const to_msgs [ ] = { " no timeout " , " timed out " } ;
2009-05-06 19:57:20 +04:00
2010-09-06 20:13:39 +04:00
/* memory or i/o names (4 entries); presumably looked up via II_MSG() */
2012-12-23 15:40:45 +04:00
static const char * const ii_msgs [ ] = { " MEM " , " RESV " , " IO " , " GEN " } ;
2009-05-06 19:57:20 +04:00
2012-12-19 01:06:11 +04:00
/* internal error type names (4 entries); presumably looked up via UU_MSG() */
2012-12-23 15:40:45 +04:00
static const char * const uu_msgs [ ] = { " RESV " , " RESV " , " HWA " , " RESV " } ;
2012-12-19 01:06:11 +04:00
2012-09-11 20:57:43 +04:00
/*
 * MC1 descriptions used by f15h_mc1_mce().  The table is packed, so the
 * index is derived from xec as follows:
 *   xec 0x0..0xa   -> index xec
 *   xec 0xd        -> index xec - 2
 *   xec 0x10..0x15 -> index xec - 4
 */
static const char * const f15h_mc1_mce_desc [ ] = {
2010-11-08 17:03:35 +03:00
" UC during a demand linefill from L2 " ,
" Parity error during data load from IC " ,
" Parity error for IC valid bit " ,
" Main tag parity error " ,
" Parity error in prediction queue " ,
" PFB data/address parity error " ,
" Parity error in the branch status reg " ,
" PFB promotion address error " ,
" Tag error during probe/victimization " ,
" Parity error for IC probe tag valid bit " ,
" PFB non-cacheable bit parity error " ,
" PFB valid bit parity error " , /* xec = 0xd */
2011-11-21 22:45:34 +04:00
" Microcode Patch Buffer " , /* xec = 0x10 */
2010-11-08 17:03:35 +03:00
/* entries from here on are printed as "Decoder <name> parity error" (xec 0x11..0x15) */
" uop queue " ,
" insn buffer " ,
" predecode buffer " ,
2014-07-14 18:58:19 +04:00
" fetch address FIFO " ,
" dispatch uop queue "
2010-11-08 17:03:35 +03:00
} ;
2012-09-11 20:57:43 +04:00
/*
 * MC2 memory-error descriptions used by f15h_mc2_mce().  Index mapping:
 *   xec 0x4..0xc   -> index xec - 0x4
 *   xec 0x10..0x14 -> index xec - 0x7
 */
static const char * const f15h_mc2_mce_desc [ ] = {
2010-09-21 22:45:10 +04:00
" Fill ECC error on data fills " , /* xec = 0x4 */
" Fill parity error on insn fills " ,
" Prefetcher request FIFO parity error " ,
" PRQ address parity error " ,
" PRQ data parity error " ,
" WCC Tag ECC error " ,
" WCC Data ECC error " ,
" WCB Data parity error " ,
2011-11-23 17:50:44 +04:00
" VB Data ECC or parity error " ,
2010-09-21 22:45:10 +04:00
" L2 Tag ECC error " , /* xec = 0x10 */
" Hard L2 Tag ECC error " ,
" Multiple hits on L2 tag " ,
" XAB parity error " ,
" PRB address parity error "
} ;
2012-09-11 20:57:43 +04:00
/*
 * MC4 descriptions used by decode_mc4_mce().  Index mapping:
 *   xec 0x0..0xe   -> index xec
 *   xec 0x1c..0x1f -> index xec - 13
 * Other xec values are handled without this table.
 */
static const char * const mc4_mce_desc [ ] = {
2011-11-25 00:29:57 +04:00
" DRAM ECC error detected on the NB " ,
" CRC error detected on HT link " ,
" Link-defined sync error packets detected on HT link " ,
" HT Master abort " ,
" HT Target abort " ,
" Invalid GART PTE entry during GART table walk " ,
" Unsupported atomic RMW received from an IO link " ,
" Watchdog timeout due to lack of progress " ,
" DRAM ECC error detected on the NB " ,
" SVM DMA Exclusion Vector error " ,
" HT data error detected on link " ,
" Protocol error (link, L3, probe filter) " ,
" NB internal arrays parity error " ,
" DRAM addr/ctl signals parity error " ,
" IO link transmission error " ,
" L3 data cache ECC error " , /* xec = 0x1c */
" L3 cache tag error " ,
" L3 LRU parity bits error " ,
" ECC Error in the Probe Filter directory "
} ;
2012-09-11 20:57:43 +04:00
/*
 * MC5 descriptions, indexed directly by xec (0x0..0xd) in decode_mc5_mce().
 * Entries 0x0 and 0xc are printed as-is; the others get a " parity error"
 * suffix from the caller's format string.
 */
static const char * const mc5_mce_desc [ ] = {
2010-09-22 17:28:59 +04:00
" CPU Watchdog timer expire " ,
" Wakeup array dest tag " ,
" AG payload array " ,
" EX payload array " ,
" IDRF array " ,
" Retire dispatch queue " ,
" Mapper checkpoint array " ,
" Physical register file EX0 port " ,
" Physical register file EX1 port " ,
" Physical register file AG0 port " ,
" Physical register file AG1 port " ,
" Flag register file " ,
2013-06-06 00:50:03 +04:00
" DE error occurred " ,
" Retire status queue "
2010-09-22 17:28:59 +04:00
} ;
2014-11-04 20:41:08 +03:00
/*
 * MC6 descriptions, indexed directly by xec (0x0..0x5) in decode_mc6_mce(),
 * which appends " parity error" to every entry.
 */
static const char * const mc6_mce_desc [ ] = {
" Hardware Assertion " ,
" Free List " ,
" Physical Register File " ,
" Retire Queue " ,
" Scheduler table " ,
" Status Register File " ,
} ;
2012-09-11 20:57:43 +04:00
/*
 * MC0 decoder installed for family 0x12 and used as the fallback of
 * f10h_mc0_mce().
 *
 * Only memory errors at cache level L1 or L2 are recognized.  Returns true
 * after finishing the log line, false when the signature is not recognized
 * (nothing is printed in that case).  @xec is unused.
 */
static bool f12h_mc0_mce(u16 ec, u8 xec)
{
	u8 level;

	if (!MEM_ERROR(ec))
		return false;

	level = LL(ec);

	if (level == LL_L2) {
		pr_cont(" during L1 linefill from L2. \n ");
		return true;
	}

	if (level == LL_L1) {
		pr_cont(" Data/Tag %s error. \n ", R4_MSG(ec));
		return true;
	}

	return false;
}
2009-07-28 15:50:43 +04:00
2012-09-11 20:57:43 +04:00
/*
 * MC0 decoder installed for family 0x10.
 *
 * Handles the R4_GEN + LL_L1 signature itself and hands everything else to
 * f12h_mc0_mce().  Returns true when the error was decoded.
 */
static bool f10h_mc0_mce(u16 ec, u8 xec)
{
	bool data_scrub = (R4(ec) == R4_GEN) && (LL(ec) == LL_L1);

	if (!data_scrub)
		return f12h_mc0_mce(ec, xec);

	pr_cont(" during data scrub. \n ");
	return true;
}
2012-09-11 20:57:43 +04:00
/*
 * MC0 decoder installed for families 0xf and 0x11.
 *
 * Bus errors are decoded here; every other error type is forwarded to
 * f10h_mc0_mce().  Returns true when the error was decoded.
 */
static bool k8_mc0_mce(u16 ec, u8 xec)
{
	if (!BUS_ERROR(ec))
		return f10h_mc0_mce(ec, xec);

	pr_cont(" during system linefill. \n ");
	return true;
}
2012-12-19 01:06:11 +04:00
/*
 * MC0 decoder installed for families 0x14 and 0x16.
 *
 * Memory errors must be data transactions at cache level L1; bus errors
 * must target MEM or IO at cache level LG.  Returns true when the signature
 * was recognized.  For bus errors the message prefix is emitted before the
 * memory transaction type is checked, so an unrecognized transaction type
 * leaves the prefix in the log and still returns false.  @xec is unused.
 */
static bool cat_mc0_mce(u16 ec, u8 xec)
{
	u8 mem_tx = R4(ec);

	if (MEM_ERROR(ec)) {
		if (!(TT(ec) == TT_DATA && LL(ec) == LL_L1))
			return false;

		switch (mem_tx) {
		case R4_DRD:
			pr_cont(" Data/Tag parity error due to %s. \n ",
				" load/hw prf ");
			return true;

		case R4_DWR:
			pr_cont(" Data/Tag parity error due to %s. \n ",
				" store ");
			return true;

		case R4_EVICT:
			pr_cont(" Copyback parity error on a tag miss. \n ");
			return true;

		case R4_SNOOP:
			pr_cont(" Tag parity error during snoop. \n ");
			return true;

		default:
			return false;
		}
	}

	if (BUS_ERROR(ec)) {
		bool mem_or_io = (II(ec) == II_MEM || II(ec) == II_IO);

		if (!mem_or_io || LL(ec) != LL_LG)
			return false;

		pr_cont(" System read data error on a ");

		switch (mem_tx) {
		case R4_RD:
			pr_cont(" TLB reload. \n ");
			return true;

		case R4_DWR:
			pr_cont(" store. \n ");
			return true;

		case R4_DRD:
			pr_cont(" load. \n ");
			return true;

		default:
			return false;
		}
	}

	return false;
}
2012-09-11 20:57:43 +04:00
/*
 * MC0 decoder installed for family 0x15.
 *
 * Memory errors are keyed on @xec, bus errors are always accepted (a
 * non-zero @xec is reported as an internal error condition), and internal
 * errors are accepted for xec <= 0x1f.  Returns true when the error was
 * decoded and the log line completed.
 */
static bool f15h_mc0_mce(u16 ec, u8 xec)
{
	if (MEM_ERROR(ec)) {
		switch (xec) {
		case 0x0:
			pr_cont(" Data Array access error. \n ");
			return true;

		case 0x1:
			pr_cont(" UC error during a linefill from L2/NB. \n ");
			return true;

		case 0x2:
		case 0x11:
			pr_cont(" STQ access error. \n ");
			return true;

		case 0x3:
			pr_cont(" SCB access error. \n ");
			return true;

		case 0x10:
			pr_cont(" Tag error. \n ");
			return true;

		case 0x12:
			pr_cont(" LDQ access error. \n ");
			return true;

		default:
			return false;
		}
	}

	if (BUS_ERROR(ec)) {
		if (xec)
			pr_cont(" Internal error condition type %d. \n ", xec);
		else
			pr_cont(" System Read Data Error. \n ");

		return true;
	}

	if (INT_ERROR(ec)) {
		if (xec > 0x1f)
			return false;

		pr_cont(" Hardware Assert. \n ");
		return true;
	}

	return false;
}
2012-09-11 20:57:43 +04:00
static void decode_mc0_mce ( struct mce * m )
2010-08-18 17:11:35 +04:00
{
2010-09-22 18:08:37 +04:00
u16 ec = EC ( m - > status ) ;
u8 xec = XEC ( m - > status , xec_mask ) ;
2010-08-18 17:11:35 +04:00
2012-09-11 20:57:43 +04:00
pr_emerg ( HW_ERR " MC0 Error: " ) ;
2010-08-18 17:11:35 +04:00
/* TLB error signatures are the same across families */
if ( TLB_ERROR ( ec ) ) {
2010-09-22 18:08:37 +04:00
if ( TT ( ec ) = = TT_DATA ) {
2010-08-18 17:11:35 +04:00
pr_cont ( " %s TLB %s. \n " , LL_MSG ( ec ) ,
2010-09-17 21:22:34 +04:00
( ( xec = = 2 ) ? " locked miss "
: ( xec ? " multimatch " : " parity " ) ) ) ;
2010-08-18 17:11:35 +04:00
return ;
}
2012-09-11 20:57:43 +04:00
} else if ( fam_ops - > mc0_mce ( ec , xec ) )
2010-09-17 21:22:34 +04:00
;
else
2012-09-11 20:57:43 +04:00
pr_emerg ( HW_ERR " Corrupted MC0 MCE info? \n " ) ;
2009-07-28 15:50:43 +04:00
}
2012-09-11 20:57:43 +04:00
/*
 * MC1 decoder installed for families 0xf, 0x10, 0x11 and 0x12.
 *
 * Only memory errors are recognized: cache level 0x2 is a linefill from L2,
 * cache level 0x1 is decoded further by memory transaction type.  Returns
 * true when the error was decoded.  @xec is unused.
 */
static bool k8_mc1_mce(u16 ec, u8 xec)
{
	u8 level = LL(ec);

	if (!MEM_ERROR(ec))
		return false;

	if (level == 0x2) {
		pr_cont(" during a linefill from L2. \n ");
		return true;
	}

	if (level != 0x1)
		return false;

	switch (R4(ec)) {
	case R4_IRD:
		pr_cont(" Parity error during data load. \n ");
		return true;

	case R4_EVICT:
		pr_cont(" Copyback Parity/Victim error. \n ");
		return true;

	case R4_SNOOP:
		pr_cont(" Tag Snoop error. \n ");
		return true;

	default:
		return false;
	}
}
2012-12-19 01:06:11 +04:00
/*
 * MC1 decoder installed for families 0x14 and 0x16.
 *
 * Accepts only memory errors on instruction transactions.  The memory
 * transaction type is checked first (IRD, SNOOP); @xec (0x0, 0x2) is
 * consulted only when neither matches.  Returns true when the error was
 * decoded.
 */
static bool cat_mc1_mce(u16 ec, u8 xec)
{
	u8 mem_tx = R4(ec);

	if (!MEM_ERROR(ec) || TT(ec) != TT_INSTR)
		return false;

	if (mem_tx == R4_IRD) {
		pr_cont(" Data/tag array parity error for a tag hit. \n ");
		return true;
	}

	if (mem_tx == R4_SNOOP) {
		pr_cont(" Tag error during snoop/victimization. \n ");
		return true;
	}

	switch (xec) {
	case 0x0:
		pr_cont(" Tag parity error from victim castout. \n ");
		return true;

	case 0x2:
		pr_cont(" Microcode patch RAM parity error. \n ");
		return true;

	default:
		return false;
	}
}
2012-09-11 20:57:43 +04:00
/*
 * MC1 decoder installed for family 0x15.
 *
 * Only memory errors are recognized.  f15h_mc1_mce_desc[] is packed, so the
 * table index is @xec minus a per-range offset (0, 2 or 4).  Returns true
 * when @xec falls into a known range and the description was printed.
 */
static bool f15h_mc1_mce(u16 ec, u8 xec)
{
	if (!MEM_ERROR(ec))
		return false;

	switch (xec) {
	case 0x0 ... 0xa:
		pr_cont(" %s. \n ", f15h_mc1_mce_desc[xec]);
		return true;

	case 0xd:
		pr_cont(" %s. \n ", f15h_mc1_mce_desc[xec - 2]);
		return true;

	case 0x10:
		pr_cont(" %s. \n ", f15h_mc1_mce_desc[xec - 4]);
		return true;

	case 0x11 ... 0x15:
		pr_cont(" Decoder %s parity error. \n ",
			f15h_mc1_mce_desc[xec - 4]);
		return true;

	default:
		return false;
	}
}
2012-09-11 20:57:43 +04:00
static void decode_mc1_mce ( struct mce * m )
2010-08-26 21:05:49 +04:00
{
2010-09-22 18:08:37 +04:00
u16 ec = EC ( m - > status ) ;
u8 xec = XEC ( m - > status , xec_mask ) ;
2010-08-26 21:05:49 +04:00
2012-09-11 20:57:43 +04:00
pr_emerg ( HW_ERR " MC1 Error: " ) ;
2010-08-26 21:05:49 +04:00
if ( TLB_ERROR ( ec ) )
pr_cont ( " %s TLB %s. \n " , LL_MSG ( ec ) ,
( xec ? " multimatch " : " parity error " ) ) ;
else if ( BUS_ERROR ( ec ) ) {
2010-10-15 17:27:02 +04:00
bool k8 = ( boot_cpu_data . x86 = = 0xf & & ( m - > status & BIT_64 ( 58 ) ) ) ;
2010-08-26 21:05:49 +04:00
pr_cont ( " during %s. \n " , ( k8 ? " system linefill " : " NB data read " ) ) ;
2014-07-14 18:58:19 +04:00
} else if ( INT_ERROR ( ec ) ) {
if ( xec < = 0x3f )
pr_cont ( " Hardware Assert. \n " ) ;
else
goto wrong_mc1_mce ;
2012-09-11 20:57:43 +04:00
} else if ( fam_ops - > mc1_mce ( ec , xec ) )
2010-08-26 21:05:49 +04:00
;
else
2014-07-14 18:58:19 +04:00
goto wrong_mc1_mce ;
return ;
wrong_mc1_mce :
pr_emerg ( HW_ERR " Corrupted MC1 MCE info? \n " ) ;
2009-07-28 16:06:26 +04:00
}
2012-12-19 01:06:10 +04:00
/*
 * MC2 decoder installed for families 0xf, 0x10, 0x11, 0x12 and 0x14.
 *
 * @xec selects the signature: 0x1 and 0x3 are accepted for any error type,
 * 0x2 only for memory errors, and 0x0 is decoded further by error type
 * (TLB, bus, memory).  Returns true when the error was decoded.
 */
static bool k8_mc2_mce(u16 ec, u8 xec)
{
	u8 mem_tx;

	switch (xec) {
	case 0x1:
		pr_cont(" in the write data buffers. \n ");
		return true;

	case 0x3:
		pr_cont(" in the victim data buffers. \n ");
		return true;

	case 0x2:
		if (!MEM_ERROR(ec))
			return false;

		pr_cont(" : %s error in the L2 cache tags. \n ", R4_MSG(ec));
		return true;

	case 0x0:
		break;

	default:
		return false;
	}

	/* xec == 0x0 from here on: dispatch on the error type. */
	if (TLB_ERROR(ec)) {
		pr_cont(" %s error in a Page Descriptor Cache or Guest TLB. \n ",
			TT_MSG(ec));
		return true;
	}

	if (BUS_ERROR(ec)) {
		pr_cont(" : %s/ECC error in data read from NB: %s. \n ",
			R4_MSG(ec), PP_MSG(ec));
		return true;
	}

	if (!MEM_ERROR(ec))
		return false;

	mem_tx = R4(ec);

	if (mem_tx >= 0x7) {
		pr_cont(" : %s error during data copyback. \n ",
			R4_MSG(ec));
		return true;
	}

	if (mem_tx <= 0x1) {
		pr_cont(" : %s parity/ECC error during data "
			" access from L2. \n ", R4_MSG(ec));
		return true;
	}

	return false;
}
2012-12-19 01:06:10 +04:00
/*
 * MC2 decoder installed for family 0x15.
 *
 * Decodes TLB, bus, memory and internal error signatures keyed on @xec.
 * Returns true only when a description was printed, so the caller's
 * "Corrupted MC2 MCE info?" report is emitted for everything else.
 *
 * Two defects are fixed relative to the previous version:
 *  - a bus error with xec > 2 no longer prints the NB data read message
 *    while also returning false;
 *  - an error code that is none of TLB/BUS/MEM/INT now returns false rather
 *    than true with nothing printed.
 */
static bool f15h_mc2_mce(u16 ec, u8 xec)
{
	bool ret = true;

	if (TLB_ERROR(ec)) {
		if (xec == 0x0)
			pr_cont(" Data parity TLB read error. \n ");
		else if (xec == 0x1)
			pr_cont(" Poison data provided for TLB fill. \n ");
		else
			ret = false;
	} else if (BUS_ERROR(ec)) {
		if (xec > 2)
			ret = false;
		else
			pr_cont(" Error during attempted NB data read. \n ");
	} else if (MEM_ERROR(ec)) {
		switch (xec) {
		case 0x4 ... 0xc:
			/* table is packed: first entry corresponds to xec 0x4 */
			pr_cont(" %s. \n ", f15h_mc2_mce_desc[xec - 0x4]);
			break;

		case 0x10 ... 0x14:
			/* xec 0xd..0xf have no entries, hence the larger offset */
			pr_cont(" %s. \n ", f15h_mc2_mce_desc[xec - 0x7]);
			break;

		default:
			ret = false;
		}
	} else if (INT_ERROR(ec)) {
		if (xec <= 0x3f)
			pr_cont(" Hardware Assert. \n ");
		else
			ret = false;
	} else {
		/* Unknown error type: nothing was printed, let the caller report it. */
		ret = false;
	}

	return ret;
}
2012-12-19 01:06:11 +04:00
/*
 * MC2 decoder installed for family 0x16.
 *
 * Only memory errors are recognized.  @xec selects the message and the
 * memory transaction type (r4) selects the qualifier inserted into it.
 * Returns true when @xec matched a known range and a message was printed,
 * false otherwise.
 */
static bool f16h_mc2_mce ( u16 ec , u8 xec )
{
u8 r4 = R4 ( ec ) ;
if ( ! MEM_ERROR ( ec ) )
return false ;
switch ( xec ) {
case 0x04 . . . 0x05 :
/* buffer prefix character depends on whether r4 is R4_RD */
pr_cont ( " %cBUFF parity error. \n " , ( r4 = = R4_RD ) ? ' I ' : ' O ' ) ;
break ;
case 0x09 . . . 0x0b :
case 0x0d . . . 0x0f :
/* qualifier: R4_GEN -> BankReq, R4_SNOOP -> Prb, anything else -> Fill */
pr_cont ( " ECC error in L2 tag (%s). \n " ,
( ( r4 = = R4_GEN ) ? " BankReq " :
( ( r4 = = R4_SNOOP ) ? " Prb " : " Fill " ) ) ) ;
break ;
case 0x10 . . . 0x19 :
case 0x1b :
/* "Hit" needs both R4_RD and the low two xec bits clear; then GEN -> Attr, EVICT -> Vict, else Fill */
pr_cont ( " ECC error in L2 data array (%s). \n " ,
( ( ( r4 = = R4_RD ) & & ! ( xec & 0x3 ) ) ? " Hit " :
( ( r4 = = R4_GEN ) ? " Attr " :
( ( r4 = = R4_EVICT ) ? " Vict " : " Fill " ) ) ) ) ;
break ;
case 0x1c . . . 0x1d :
case 0x1f :
/* qualifier: R4_RD -> Hit, R4_GEN -> Attr, anything else -> Fill */
pr_cont ( " Parity error in L2 attribute bits (%s). \n " ,
( ( r4 = = R4_RD ) ? " Hit " :
( ( r4 = = R4_GEN ) ? " Attr " : " Fill " ) ) ) ;
break ;
default :
/* unlisted xec values (e.g. 0x1a, 0x1e) are not decoded */
return false ;
}
return true ;
}
2012-12-19 01:06:10 +04:00
static void decode_mc2_mce ( struct mce * m )
{
u16 ec = EC ( m - > status ) ;
u8 xec = XEC ( m - > status , xec_mask ) ;
2010-09-21 22:45:10 +04:00
2012-12-19 01:06:10 +04:00
pr_emerg ( HW_ERR " MC2 Error: " ) ;
if ( ! fam_ops - > mc2_mce ( ec , xec ) )
pr_cont ( HW_ERR " Corrupted MC2 MCE info? \n " ) ;
2010-09-21 22:45:10 +04:00
}
2012-09-11 20:57:43 +04:00
static void decode_mc3_mce ( struct mce * m )
2009-07-28 16:17:30 +04:00
{
2010-09-22 18:08:37 +04:00
u16 ec = EC ( m - > status ) ;
u8 xec = XEC ( m - > status , xec_mask ) ;
2010-08-27 19:03:34 +04:00
2010-09-22 13:53:32 +04:00
if ( boot_cpu_data . x86 > = 0x14 ) {
2012-09-11 20:57:43 +04:00
pr_emerg ( " You shouldn't be seeing MC3 MCE on this cpu family, "
2010-08-27 19:03:34 +04:00
" please report on LKML. \n " ) ;
return ;
}
2009-07-28 16:17:30 +04:00
2012-09-11 20:57:43 +04:00
pr_emerg ( HW_ERR " MC3 Error " ) ;
2009-07-28 16:17:30 +04:00
if ( xec = = 0x0 ) {
2010-09-22 18:08:37 +04:00
u8 r4 = R4 ( ec ) ;
2009-07-28 16:17:30 +04:00
2010-08-27 19:03:34 +04:00
if ( ! BUS_ERROR ( ec ) | | ( r4 ! = R4_DRD & & r4 ! = R4_DWR ) )
2012-09-11 20:57:43 +04:00
goto wrong_mc3_mce ;
2009-07-28 16:17:30 +04:00
2010-09-22 18:08:37 +04:00
pr_cont ( " during %s. \n " , R4_MSG ( ec ) ) ;
2010-08-27 19:03:34 +04:00
} else
2012-09-11 20:57:43 +04:00
goto wrong_mc3_mce ;
2010-08-27 19:03:34 +04:00
2009-07-28 16:17:30 +04:00
return ;
2012-09-11 20:57:43 +04:00
wrong_mc3_mce :
pr_emerg ( HW_ERR " Corrupted MC3 MCE info? \n " ) ;
2009-07-28 16:17:30 +04:00
}
2012-09-11 20:57:43 +04:00
static void decode_mc4_mce ( struct mce * m )
2010-08-31 20:28:08 +04:00
{
2011-11-25 00:29:57 +04:00
struct cpuinfo_x86 * c = & boot_cpu_data ;
int node_id = amd_get_nb_id ( m - > extcpu ) ;
u16 ec = EC ( m - > status ) ;
u8 xec = XEC ( m - > status , 0x1f ) ;
u8 offset = 0 ;
2010-08-31 20:28:08 +04:00
2012-09-11 20:57:43 +04:00
pr_emerg ( HW_ERR " MC4 Error (node %d): " , node_id ) ;
2010-08-31 20:28:08 +04:00
2011-11-25 00:29:57 +04:00
switch ( xec ) {
case 0x0 . . . 0xe :
2010-08-31 20:28:08 +04:00
2011-11-25 00:29:57 +04:00
/* special handling for DRAM ECCs */
if ( xec = = 0x0 | | xec = = 0x8 ) {
/* no ECCs on F11h */
if ( c - > x86 = = 0x11 )
2012-09-11 20:57:43 +04:00
goto wrong_mc4_mce ;
2010-08-31 20:28:08 +04:00
2012-09-11 20:57:43 +04:00
pr_cont ( " %s. \n " , mc4_mce_desc [ xec ] ) ;
2010-08-31 20:28:08 +04:00
2011-11-25 00:29:57 +04:00
if ( nb_bus_decoder )
nb_bus_decoder ( node_id , m ) ;
return ;
}
2010-08-31 20:28:08 +04:00
break ;
case 0xf :
if ( TLB_ERROR ( ec ) )
pr_cont ( " GART Table Walk data error. \n " ) ;
else if ( BUS_ERROR ( ec ) )
pr_cont ( " DMA Exclusion Vector Table Walk error. \n " ) ;
else
2012-09-11 20:57:43 +04:00
goto wrong_mc4_mce ;
2011-11-25 00:29:57 +04:00
return ;
2010-08-31 20:28:08 +04:00
2010-09-22 17:06:24 +04:00
case 0x19 :
2012-12-19 01:06:11 +04:00
if ( boot_cpu_data . x86 = = 0x15 | | boot_cpu_data . x86 = = 0x16 )
2010-09-22 17:06:24 +04:00
pr_cont ( " Compute Unit Data Error. \n " ) ;
else
2012-09-11 20:57:43 +04:00
goto wrong_mc4_mce ;
2011-11-25 00:29:57 +04:00
return ;
2010-09-22 17:06:24 +04:00
2010-08-31 20:28:08 +04:00
case 0x1c . . . 0x1f :
2011-11-25 00:29:57 +04:00
offset = 13 ;
2010-08-31 20:28:08 +04:00
break ;
default :
2012-09-11 20:57:43 +04:00
goto wrong_mc4_mce ;
2011-11-25 00:29:57 +04:00
}
2010-08-31 20:28:08 +04:00
2012-09-11 20:57:43 +04:00
pr_cont ( " %s. \n " , mc4_mce_desc [ xec - offset ] ) ;
2010-08-31 20:28:08 +04:00
return ;
2012-09-11 20:57:43 +04:00
wrong_mc4_mce :
pr_emerg ( HW_ERR " Corrupted MC4 MCE info? \n " ) ;
2009-07-28 12:56:15 +04:00
}
2012-09-11 20:57:43 +04:00
static void decode_mc5_mce ( struct mce * m )
2009-07-28 16:20:46 +04:00
{
2010-09-22 17:28:59 +04:00
struct cpuinfo_x86 * c = & boot_cpu_data ;
2014-07-14 18:58:19 +04:00
u16 ec = EC ( m - > status ) ;
2010-09-22 18:08:37 +04:00
u8 xec = XEC ( m - > status , xec_mask ) ;
2010-09-22 17:28:59 +04:00
if ( c - > x86 = = 0xf | | c - > x86 = = 0x11 )
2012-09-11 20:57:43 +04:00
goto wrong_mc5_mce ;
2010-08-31 20:38:24 +04:00
2012-09-11 20:57:43 +04:00
pr_emerg ( HW_ERR " MC5 Error: " ) ;
2010-09-22 17:28:59 +04:00
2014-07-14 18:58:19 +04:00
if ( INT_ERROR ( ec ) ) {
if ( xec < = 0x1f ) {
pr_cont ( " Hardware Assert. \n " ) ;
return ;
} else
goto wrong_mc5_mce ;
}
2010-09-22 17:28:59 +04:00
if ( xec = = 0x0 | | xec = = 0xc )
2012-09-11 20:57:43 +04:00
pr_cont ( " %s. \n " , mc5_mce_desc [ xec ] ) ;
2013-06-06 00:50:03 +04:00
else if ( xec < = 0xd )
2012-09-11 20:57:43 +04:00
pr_cont ( " %s parity error. \n " , mc5_mce_desc [ xec ] ) ;
2010-09-22 17:28:59 +04:00
else
2012-09-11 20:57:43 +04:00
goto wrong_mc5_mce ;
2010-09-22 17:28:59 +04:00
return ;
2010-08-31 20:38:24 +04:00
2012-09-11 20:57:43 +04:00
wrong_mc5_mce :
pr_emerg ( HW_ERR " Corrupted MC5 MCE info? \n " ) ;
2009-07-28 16:20:46 +04:00
}
2012-09-11 20:57:43 +04:00
static void decode_mc6_mce ( struct mce * m )
2010-09-22 17:37:58 +04:00
{
2010-09-22 18:08:37 +04:00
u8 xec = XEC ( m - > status , xec_mask ) ;
2010-09-22 17:37:58 +04:00
2012-09-11 20:57:43 +04:00
pr_emerg ( HW_ERR " MC6 Error: " ) ;
2010-09-22 17:37:58 +04:00
2014-11-04 20:41:08 +03:00
if ( xec > 0x5 )
2012-09-11 20:57:43 +04:00
goto wrong_mc6_mce ;
2010-09-22 17:37:58 +04:00
2014-11-04 20:41:08 +03:00
pr_cont ( " %s parity error. \n " , mc6_mce_desc [ xec ] ) ;
2010-09-22 17:37:58 +04:00
return ;
2012-09-11 20:57:43 +04:00
wrong_mc6_mce :
pr_emerg ( HW_ERR " Corrupted MC6 MCE info? \n " ) ;
2010-09-22 17:37:58 +04:00
}
2010-09-06 20:13:39 +04:00
/*
 * Log the generic fields of the 16-bit error code @ec.
 *
 * Internal errors print only their type.  All other errors print the cache
 * level followed by fields that depend on the error type:
 *   bus errors:    mem/io, mem-tx, part-proc (with timeout state)
 *   memory errors: tx, mem-tx
 *   anything else: tx
 */
static inline void amd_decode_err_code(u16 ec)
{
	if (INT_ERROR(ec)) {
		pr_emerg(HW_ERR " internal: %s \n ", UU_MSG(ec));
		return;
	}

	pr_emerg(HW_ERR " cache level: %s ", LL_MSG(ec));

	if (BUS_ERROR(ec)) {
		pr_cont(" , mem/io: %s ", II_MSG(ec));
		pr_cont(" , mem-tx: %s ", R4_MSG(ec));
		pr_cont(" , part-proc: %s (%s) ", PP_MSG(ec), TO_MSG(ec));
	} else {
		pr_cont(" , tx: %s ", TT_MSG(ec));

		if (MEM_ERROR(ec))
			pr_cont(" , mem-tx: %s ", R4_MSG(ec));
	}

	pr_cont(" \n ");
}
2010-08-31 20:28:08 +04:00
/*
* Filter out unwanted MCE signatures here .
*/
static bool amd_filter_mce ( struct mce * m )
{
u8 xec = ( m - > status > > 16 ) & 0x1f ;
/*
* NB GART TLB error reporting is disabled by default .
*/
if ( m - > bank = = 4 & & xec = = 0x5 & & ! report_gart_errors )
return true ;
return false ;
}
2012-09-14 22:25:37 +04:00
static const char * decode_error_status ( struct mce * m )
{
if ( m - > status & MCI_STATUS_UC ) {
if ( m - > status & MCI_STATUS_PCC )
return " System Fatal error. " ;
if ( m - > mcgstatus & MCG_STATUS_RIPV )
return " Uncorrected, software restartable error. " ;
return " Uncorrected, software containable error. " ;
}
if ( m - > status & MCI_STATUS_DEFERRED )
return " Deferred error. " ;
return " Corrected error, no action required. " ;
}
2010-09-02 20:33:24 +04:00
int amd_decode_mce ( struct notifier_block * nb , unsigned long val , void * data )
2009-07-24 15:51:42 +04:00
{
2009-10-07 15:20:38 +04:00
struct mce * m = ( struct mce * ) data ;
2012-09-13 17:14:22 +04:00
struct cpuinfo_x86 * c = & cpu_data ( m - > extcpu ) ;
2011-08-24 20:44:22 +04:00
int ecc ;
2009-07-24 15:51:42 +04:00
2010-08-31 20:28:08 +04:00
if ( amd_filter_mce ( m ) )
return NOTIFY_STOP ;
2014-02-17 23:51:52 +04:00
pr_emerg ( HW_ERR " %s \n " , decode_error_status ( m ) ) ;
pr_emerg ( HW_ERR " CPU:%d (%x:%x:%x) MC%d_STATUS[%s|%s|%s|%s|%s " ,
m - > extcpu ,
c - > x86 , c - > x86_model , c - > x86_mask ,
m - > bank ,
( ( m - > status & MCI_STATUS_OVER ) ? " Over " : " - " ) ,
( ( m - > status & MCI_STATUS_UC ) ? " UE " : " CE " ) ,
( ( m - > status & MCI_STATUS_MISCV ) ? " MiscV " : " - " ) ,
( ( m - > status & MCI_STATUS_PCC ) ? " PCC " : " - " ) ,
( ( m - > status & MCI_STATUS_ADDRV ) ? " AddrV " : " - " ) ) ;
if ( c - > x86 = = 0x15 | | c - > x86 = = 0x16 )
pr_cont ( " |%s|%s " ,
( ( m - > status & MCI_STATUS_DEFERRED ) ? " Deferred " : " - " ) ,
( ( m - > status & MCI_STATUS_POISON ) ? " Poison " : " - " ) ) ;
/* do the two bits[14:13] together */
ecc = ( m - > status > > 45 ) & 0x3 ;
if ( ecc )
pr_cont ( " |%sECC " , ( ( ecc = = 2 ) ? " C " : " U " ) ) ;
pr_cont ( " ]: 0x%016llx \n " , m - > status ) ;
if ( m - > status & MCI_STATUS_ADDRV )
2014-11-22 15:41:01 +03:00
pr_emerg ( HW_ERR " MC%d Error Address: 0x%016llx \n " , m - > bank , m - > addr ) ;
2014-02-17 23:51:52 +04:00
if ( ! fam_ops )
goto err_code ;
2009-07-28 15:50:43 +04:00
switch ( m - > bank ) {
case 0 :
2012-09-11 20:57:43 +04:00
decode_mc0_mce ( m ) ;
2009-07-28 15:50:43 +04:00
break ;
2009-07-28 12:56:15 +04:00
2009-07-28 16:06:26 +04:00
case 1 :
2012-09-11 20:57:43 +04:00
decode_mc1_mce ( m ) ;
2009-07-28 16:06:26 +04:00
break ;
2009-07-28 16:14:24 +04:00
case 2 :
2012-12-19 01:06:10 +04:00
decode_mc2_mce ( m ) ;
2009-07-28 16:14:24 +04:00
break ;
2009-07-28 16:17:30 +04:00
case 3 :
2012-09-11 20:57:43 +04:00
decode_mc3_mce ( m ) ;
2009-07-28 16:17:30 +04:00
break ;
2009-07-28 15:50:43 +04:00
case 4 :
2012-09-11 20:57:43 +04:00
decode_mc4_mce ( m ) ;
2009-07-28 15:50:43 +04:00
break ;
2009-07-28 16:20:46 +04:00
case 5 :
2012-09-11 20:57:43 +04:00
decode_mc5_mce ( m ) ;
2009-07-28 16:20:46 +04:00
break ;
2010-09-22 17:37:58 +04:00
case 6 :
2012-09-11 20:57:43 +04:00
decode_mc6_mce ( m ) ;
2010-09-22 17:37:58 +04:00
break ;
2009-07-28 15:50:43 +04:00
default :
break ;
2009-07-27 18:21:14 +04:00
}
2009-07-28 15:50:43 +04:00
2014-02-17 23:51:52 +04:00
err_code :
2009-07-28 15:50:43 +04:00
amd_decode_err_code ( m - > status & 0xffff ) ;
2009-10-07 15:20:38 +04:00
return NOTIFY_STOP ;
2009-07-24 15:51:42 +04:00
}
2010-09-02 20:33:24 +04:00
EXPORT_SYMBOL_GPL ( amd_decode_mce ) ;
2009-10-01 18:14:32 +04:00
2009-10-07 15:20:38 +04:00
/* Notifier block hooking amd_decode_mce() into the MCE decode chain. */
static struct notifier_block amd_mce_dec_nb = {
	.notifier_call	= amd_decode_mce,
};
2009-10-01 18:14:32 +04:00
/*
 * Set up the decoder for the boot CPU's family and register it on the MCE
 * decode chain.
 *
 * Returns -ENODEV on non-AMD CPUs, -ENOMEM when the callback table cannot
 * be allocated, and 0 otherwise.  For an unknown family the callback table
 * is freed and left NULL, but the notifier is still registered so that
 * amd_decode_mce() can do its generic, family-independent decoding.
 */
static int __init mce_amd_init(void)
{
	struct cpuinfo_x86 *c = &boot_cpu_data;

	if (c->x86_vendor != X86_VENDOR_AMD)
		return -ENODEV;

	fam_ops = kzalloc(sizeof(*fam_ops), GFP_KERNEL);
	if (!fam_ops)
		return -ENOMEM;

	switch (c->x86) {
	case 0xf:
	case 0x11:
		fam_ops->mc0_mce = k8_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
		fam_ops->mc2_mce = k8_mc2_mce;
		break;

	case 0x10:
		fam_ops->mc0_mce = f10h_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
		fam_ops->mc2_mce = k8_mc2_mce;
		break;

	case 0x12:
		fam_ops->mc0_mce = f12h_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
		fam_ops->mc2_mce = k8_mc2_mce;
		break;

	case 0x14:
		fam_ops->mc0_mce = cat_mc0_mce;
		fam_ops->mc1_mce = cat_mc1_mce;
		fam_ops->mc2_mce = k8_mc2_mce;
		break;

	case 0x15:
		/* model 0x60 uses a wider extended error code field */
		xec_mask = c->x86_model == 0x60 ? 0x3f : 0x1f;
		fam_ops->mc0_mce = f15h_mc0_mce;
		fam_ops->mc1_mce = f15h_mc1_mce;
		fam_ops->mc2_mce = f15h_mc2_mce;
		break;

	case 0x16:
		xec_mask = 0x1f;
		fam_ops->mc0_mce = cat_mc0_mce;
		fam_ops->mc1_mce = cat_mc1_mce;
		fam_ops->mc2_mce = f16h_mc2_mce;
		break;

	default:
		printk(KERN_WARNING " Huh? What family is it: 0x%x?! \n ", c->x86);
		kfree(fam_ops);
		fam_ops = NULL;
	}

	pr_info(" MCE: In-kernel MCE decoding enabled. \n ");

	mce_register_decode_chain(&amd_mce_dec_nb);

	return 0;
}
early_initcall ( mce_amd_init ) ;
2009-10-02 17:31:48 +04:00
# ifdef MODULE
/*
 * Module teardown: take the decoder off the MCE decode chain first, then
 * free the per-family callback table.
 */
static void __exit mce_amd_exit(void)
{
	mce_unregister_decode_chain(&amd_mce_dec_nb);
	kfree(fam_ops);
}
MODULE_DESCRIPTION ( " AMD MCE decoder " ) ;
MODULE_ALIAS ( " edac-mce-amd " ) ;
MODULE_LICENSE ( " GPL " ) ;
module_exit ( mce_amd_exit ) ;
# endif