2010-05-23 21:44:54 -07:00
* Copyright ( c ) 2006 , 2007 , 2008 , 2009 , 2010 QLogic Corporation .
* All rights reserved .
* Copyright ( c ) 2003 , 2004 , 2005 , 2006 PathScale , Inc . All rights reserved .
* This software is available to you under a choice of one of two
* licenses . You may choose to be licensed under the terms of the GNU
* General Public License ( GPL ) Version 2 , available from the file
* COPYING in the main directory of this source tree , or the
* OpenIB . org BSD license below :
* Redistribution and use in source and binary forms , with or
* without modification , are permitted provided that the following
* conditions are met :
* - Redistributions of source code must retain the above
* copyright notice , this list of conditions and the following
* disclaimer .
* - Redistributions in binary form must reproduce the above
* copyright notice , this list of conditions and the following
* disclaimer in the documentation and / or other materials
* provided with the distribution .
* This file contains all of the code that is specific to the
* QLogic_IB 6120 PCIe chip .
# include <linux/interrupt.h>
# include <linux/pci.h>
# include <linux/delay.h>
# include <rdma/ib_verbs.h>
# include "qib.h"
# include "qib_6120_regs.h"
static void qib_6120_setup_setextled ( struct qib_pportdata * , u32 ) ;
static void sendctrl_6120_mod ( struct qib_pportdata * ppd , u32 op ) ;
static u8 qib_6120_phys_portstate ( u64 ) ;
static u32 qib_6120_iblink_state ( u64 ) ;
* This file contains all the chip - specific register information and
* access functions for the QLogic QLogic_IB PCI - Express chip .
/* KREG_IDX uses machine-generated #defines */
# define KREG_IDX(regname) (QIB_6120_##regname##_OFFS / sizeof(u64))
/* Use defines to tie machine-generated names to lower-case names */
# define kr_extctrl KREG_IDX(EXTCtrl)
# define kr_extstatus KREG_IDX(EXTStatus)
# define kr_gpio_clear KREG_IDX(GPIOClear)
# define kr_gpio_mask KREG_IDX(GPIOMask)
# define kr_gpio_out KREG_IDX(GPIOOut)
# define kr_gpio_status KREG_IDX(GPIOStatus)
# define kr_rcvctrl KREG_IDX(RcvCtrl)
# define kr_sendctrl KREG_IDX(SendCtrl)
# define kr_partitionkey KREG_IDX(RcvPartitionKey)
# define kr_hwdiagctrl KREG_IDX(HwDiagCtrl)
# define kr_ibcstatus KREG_IDX(IBCStatus)
# define kr_ibcctrl KREG_IDX(IBCCtrl)
# define kr_sendbuffererror KREG_IDX(SendBufErr0)
# define kr_rcvbthqp KREG_IDX(RcvBTHQP)
# define kr_counterregbase KREG_IDX(CntrRegBase)
# define kr_palign KREG_IDX(PageAlign)
# define kr_rcvegrbase KREG_IDX(RcvEgrBase)
# define kr_rcvegrcnt KREG_IDX(RcvEgrCnt)
# define kr_rcvhdrcnt KREG_IDX(RcvHdrCnt)
# define kr_rcvhdrentsize KREG_IDX(RcvHdrEntSize)
# define kr_rcvhdrsize KREG_IDX(RcvHdrSize)
# define kr_rcvtidbase KREG_IDX(RcvTIDBase)
# define kr_rcvtidcnt KREG_IDX(RcvTIDCnt)
# define kr_scratch KREG_IDX(Scratch)
# define kr_sendctrl KREG_IDX(SendCtrl)
# define kr_sendpioavailaddr KREG_IDX(SendPIOAvailAddr)
# define kr_sendpiobufbase KREG_IDX(SendPIOBufBase)
# define kr_sendpiobufcnt KREG_IDX(SendPIOBufCnt)
# define kr_sendpiosize KREG_IDX(SendPIOSize)
# define kr_sendregbase KREG_IDX(SendRegBase)
# define kr_userregbase KREG_IDX(UserRegBase)
# define kr_control KREG_IDX(Control)
# define kr_intclear KREG_IDX(IntClear)
# define kr_intmask KREG_IDX(IntMask)
# define kr_intstatus KREG_IDX(IntStatus)
# define kr_errclear KREG_IDX(ErrClear)
# define kr_errmask KREG_IDX(ErrMask)
# define kr_errstatus KREG_IDX(ErrStatus)
# define kr_hwerrclear KREG_IDX(HwErrClear)
# define kr_hwerrmask KREG_IDX(HwErrMask)
# define kr_hwerrstatus KREG_IDX(HwErrStatus)
# define kr_revision KREG_IDX(Revision)
# define kr_portcnt KREG_IDX(PortCnt)
# define kr_serdes_cfg0 KREG_IDX(SerdesCfg0)
# define kr_serdes_cfg1 (kr_serdes_cfg0 + 1)
# define kr_serdes_stat KREG_IDX(SerdesStat)
# define kr_xgxs_cfg KREG_IDX(XGXSCfg)
/* These must only be written via qib_write_kreg_ctxt() */
# define kr_rcvhdraddr KREG_IDX(RcvHdrAddr0)
# define kr_rcvhdrtailaddr KREG_IDX(RcvHdrTailAddr0)
# define CREG_IDX(regname) ((QIB_6120_##regname##_OFFS - \
QIB_6120_LBIntCnt_OFFS ) / sizeof ( u64 ) )
# define cr_badformat CREG_IDX(RxBadFormatCnt)
# define cr_erricrc CREG_IDX(RxICRCErrCnt)
# define cr_errlink CREG_IDX(RxLinkProblemCnt)
# define cr_errlpcrc CREG_IDX(RxLPCRCErrCnt)
# define cr_errpkey CREG_IDX(RxPKeyMismatchCnt)
# define cr_rcvflowctrl_err CREG_IDX(RxFlowCtrlErrCnt)
# define cr_err_rlen CREG_IDX(RxLenErrCnt)
# define cr_errslen CREG_IDX(TxLenErrCnt)
# define cr_errtidfull CREG_IDX(RxTIDFullErrCnt)
# define cr_errtidvalid CREG_IDX(RxTIDValidErrCnt)
# define cr_errvcrc CREG_IDX(RxVCRCErrCnt)
# define cr_ibstatuschange CREG_IDX(IBStatusChangeCnt)
# define cr_lbint CREG_IDX(LBIntCnt)
# define cr_invalidrlen CREG_IDX(RxMaxMinLenErrCnt)
# define cr_invalidslen CREG_IDX(TxMaxMinLenErrCnt)
# define cr_lbflowstall CREG_IDX(LBFlowStallCnt)
# define cr_pktrcv CREG_IDX(RxDataPktCnt)
# define cr_pktrcvflowctrl CREG_IDX(RxFlowPktCnt)
# define cr_pktsend CREG_IDX(TxDataPktCnt)
# define cr_pktsendflow CREG_IDX(TxFlowPktCnt)
# define cr_portovfl CREG_IDX(RxP0HdrEgrOvflCnt)
# define cr_rcvebp CREG_IDX(RxEBPCnt)
# define cr_rcvovfl CREG_IDX(RxBufOvflCnt)
# define cr_senddropped CREG_IDX(TxDroppedPktCnt)
# define cr_sendstall CREG_IDX(TxFlowStallCnt)
# define cr_sendunderrun CREG_IDX(TxUnderrunCnt)
# define cr_wordrcv CREG_IDX(RxDwordCnt)
# define cr_wordsend CREG_IDX(TxDwordCnt)
# define cr_txunsupvl CREG_IDX(TxUnsupVLErrCnt)
# define cr_rxdroppkt CREG_IDX(RxDroppedPktCnt)
# define cr_iblinkerrrecov CREG_IDX(IBLinkErrRecoveryCnt)
# define cr_iblinkdown CREG_IDX(IBLinkDownedCnt)
# define cr_ibsymbolerr CREG_IDX(IBSymbolErrCnt)
/*
 * Field helpers built on the machine-generated QIB_6120_<reg>_<field>_RMASK
 * and QIB_6120_<reg>_<field>_LSB constants.  The names are formed with the
 * preprocessor paste operator, so <reg> and <field> must be passed as bare
 * identifiers.
 */

/* Right-justified (unshifted) mask of a register field, as a u64 */
#define SYM_RMASK(regname, fldname) ((u64)              \
	QIB_6120_##regname##_##fldname##_RMASK)

/* In-place mask of a register field: its RMASK shifted up to its LSB */
#define SYM_MASK(regname, fldname) ((u64)               \
	QIB_6120_##regname##_##fldname##_RMASK <<       \
	 QIB_6120_##regname##_##fldname##_LSB)

/* Bit position of the least-significant bit of a register field */
#define SYM_LSB(regname, fldname) (QIB_6120_##regname##_##fldname##_LSB)

/* Extract a field from a register value, right-justified, as a u64 */
#define SYM_FIELD(value, regname, fldname) ((u64) \
	(((value) >> SYM_LSB(regname, fldname)) & \
	 SYM_RMASK(regname, fldname)))

/* Shorthand: in-place mask of field <fldname>Mask in ErrMask / HwErrMask */
#define ERR_MASK(fldname) SYM_MASK(ErrMask, fldname##Mask)
#define HWE_MASK(fldname) SYM_MASK(HwErrMask, fldname##Mask)
/* link training states, from IBC */
# define IB_6120_LT_STATE_DISABLED 0x00
# define IB_6120_LT_STATE_LINKUP 0x01
# define IB_6120_LT_STATE_POLLACTIVE 0x02
# define IB_6120_LT_STATE_POLLQUIET 0x03
# define IB_6120_LT_STATE_SLEEPDELAY 0x04
# define IB_6120_LT_STATE_SLEEPQUIET 0x05
# define IB_6120_LT_STATE_CFGDEBOUNCE 0x08
# define IB_6120_LT_STATE_CFGRCVFCFG 0x09
# define IB_6120_LT_STATE_CFGWAITRMT 0x0a
# define IB_6120_LT_STATE_CFGIDLE 0x0b
# define IB_6120_LT_STATE_RECOVERIDLE 0x0f
/* link state machine states from IBC */
# define IB_6120_L_STATE_DOWN 0x0
# define IB_6120_L_STATE_INIT 0x1
# define IB_6120_L_STATE_ARM 0x2
# define IB_6120_L_STATE_ACTIVE 0x3
# define IB_6120_L_STATE_ACT_DEFER 0x4
static const u8 qib_6120_physportstate [ 0x20 ] = {
} ;
/*
 * Per-device state private to the 6120 chip code: register shadows,
 * locks, counter bookkeeping and scratch message buffers.
 */
struct qib_chip_specific {
	u64 __iomem *cregbase;	/* base used by the *_6120_creg accessors */
	u64 *cntrs;
	u64 *portcntrs;
	void *dummy_hdrq;   /* used after ctxt close */
	dma_addr_t dummy_hdrq_phys;
	spinlock_t kernel_tid_lock; /* no back to back kernel TID writes */
	spinlock_t user_tid_lock; /* no back to back user TID writes */
	spinlock_t rcvmod_lock; /* protect rcvctrl shadow changes */
	spinlock_t gpio_lock; /* RMW of shadows/regs for ExtCtrl and GPIO */
	u64 hwerrmask;	/* value written to kr_hwerrmask by the handlers */
	u64 errormask;	/* value written to kr_errmask by the handlers */
	u64 gpio_out; /* shadow of kr_gpio_out, for rmw ops */
	u64 gpio_mask; /* shadow the gpio mask register */
	u64 extctrl; /* shadow the gpio output enable, etc... */
	/*
	 * these 5 fields are used to establish deltas for IB symbol
	 * errors and linkrecovery errors.  They can be reported on
	 * some chips during link negotiation prior to INIT, and with
	 * DDR when faking DDR negotiations with non-IBTA switches.
	 * The chip counters are adjusted at driver unload if there is
	 * a non-zero delta.
	 */
	u64 ibdeltainprog;
	u64 ibsymdelta;
	u64 ibsymsnap;
	u64 iblnkerrdelta;
	u64 iblnkerrsnap;
	u64 ibcctrl; /* shadow for kr_ibcctrl */
	u32 lastlinkrecov; /* link recovery issue */
	int irq;
	u32 cntrnamelen;
	u32 portcntrnamelen;
	u32 ncntrs;
	u32 nportcntrs;
	/* used with gpio interrupts to implement IB counters */
	u32 rxfc_unsupvl_errs;
	u32 overrun_thresh_errs;
	/*
	 * these count only cases where _successive_ LocalLinkIntegrity
	 * errors were seen in the receive headers of IB standard packets
	 */
	u32 lli_errs;
	u32 lli_counter;
	u64 lli_thresh;
	u64 sword; /* total dwords sent (sample result) */
	u64 rword; /* total dwords received (sample result) */
	u64 spkts; /* total packets sent (sample result) */
	u64 rpkts; /* total packets received (sample result) */
	u64 xmit_wait; /* # of ticks no data sent (sample result) */
	struct timer_list pma_timer;
	char emsgbuf[128];	/* message buffer for the error handlers */
	char bitsmsgbuf[64];	/* scratch for formatted sub-messages */
	u8 pma_sample_status;
};
/* ibcctrl bits */
/* cycle through TS1/TS2 till OK */
/* wait for TS1, then go on */
# define QLOGIC_IB_IBCC_LINKCMD_DOWN 1 /* move to 0x11 */
# define QLOGIC_IB_IBCC_LINKCMD_ARMED 2 /* move to 0x21 */
# define QLOGIC_IB_IBCC_LINKCMD_ACTIVE 3 /* move to 0x31 */
/*
 * We could have a single register get/put routine, that takes a group type,
 * but this is somewhat clearer and cleaner.  It also gives us some error
 * checking.  64 bit register reads should always work, but are inefficient
 * on opteron (the northbridge always generates 2 separate HT 32 bit reads),
 * so we use kreg32 wherever possible.  User register and counter register
 * reads are always 32 bit reads, so only one form of those routines.
 */
* qib_read_ureg32 - read 32 - bit virtualized per - context register
* @ dd : device
* @ regno : register number
* @ ctxt : context number
* Return the contents of a register that is virtualized to be per context .
* Returns - 1 on errors ( not distinguishable from valid contents at
* runtime ; we may add a separate error variable at some point ) .
static inline u32 qib_read_ureg32 ( const struct qib_devdata * dd ,
enum qib_ureg regno , int ctxt )
if ( ! dd - > kregbase | | ! ( dd - > flags & QIB_PRESENT ) )
return 0 ;
if ( dd - > userbase )
return readl ( regno + ( u64 __iomem * )
( ( char __iomem * ) dd - > userbase +
dd - > ureg_align * ctxt ) ) ;
return readl ( regno + ( u64 __iomem * )
( dd - > uregbase +
( char __iomem * ) dd - > kregbase +
dd - > ureg_align * ctxt ) ) ;
* qib_write_ureg - write 32 - bit virtualized per - context register
* @ dd : device
* @ regno : register number
* @ value : value
* @ ctxt : context
* Write the contents of a register that is virtualized to be per context .
static inline void qib_write_ureg ( const struct qib_devdata * dd ,
enum qib_ureg regno , u64 value , int ctxt )
u64 __iomem * ubase ;
if ( dd - > userbase )
ubase = ( u64 __iomem * )
( ( char __iomem * ) dd - > userbase +
dd - > ureg_align * ctxt ) ;
ubase = ( u64 __iomem * )
( dd - > uregbase +
( char __iomem * ) dd - > kregbase +
dd - > ureg_align * ctxt ) ;
if ( dd - > kregbase & & ( dd - > flags & QIB_PRESENT ) )
writeq ( value , & ubase [ regno ] ) ;
static inline u32 qib_read_kreg32 ( const struct qib_devdata * dd ,
const u16 regno )
if ( ! dd - > kregbase | | ! ( dd - > flags & QIB_PRESENT ) )
return - 1 ;
return readl ( ( u32 __iomem * ) & dd - > kregbase [ regno ] ) ;
static inline u64 qib_read_kreg64 ( const struct qib_devdata * dd ,
const u16 regno )
if ( ! dd - > kregbase | | ! ( dd - > flags & QIB_PRESENT ) )
return - 1 ;
return readq ( & dd - > kregbase [ regno ] ) ;
/**
 * qib_write_kreg - 64-bit write of a kernel register
 * @dd: device
 * @regno: index of the register within dd->kregbase
 * @value: value to write
 *
 * The write is silently dropped when the chip registers are not mapped or
 * the device is not flagged QIB_PRESENT.
 */
static inline void qib_write_kreg(const struct qib_devdata *dd,
				  const u16 regno, u64 value)
{
	if (dd->kregbase && (dd->flags & QIB_PRESENT))
		writeq(value, &dd->kregbase[regno]);
}
* qib_write_kreg_ctxt - write a device ' s per - ctxt 64 - bit kernel register
* @ dd : the qlogic_ib device
* @ regno : the register number to write
* @ ctxt : the context containing the register
* @ value : the value to write
static inline void qib_write_kreg_ctxt ( const struct qib_devdata * dd ,
const u16 regno , unsigned ctxt ,
u64 value )
qib_write_kreg ( dd , regno + ctxt , value ) ;
/**
 * write_6120_creg - 64-bit write of a chip counter register
 * @dd: device
 * @regno: index of the counter within dd->cspec->cregbase
 * @value: value to write
 *
 * The write is silently dropped when the counter registers are not mapped
 * or the device is not flagged QIB_PRESENT.
 */
static inline void write_6120_creg(const struct qib_devdata *dd,
				   u16 regno, u64 value)
{
	if (dd->cspec->cregbase && (dd->flags & QIB_PRESENT))
		writeq(value, &dd->cspec->cregbase[regno]);
}
/**
 * read_6120_creg - 64-bit read of a chip counter register
 * @dd: device
 * @regno: index of the counter within dd->cspec->cregbase
 *
 * Returns 0 when the counter registers are not mapped or the device is not
 * flagged QIB_PRESENT; otherwise the readq() result.
 */
static inline u64 read_6120_creg(const struct qib_devdata *dd, u16 regno)
{
	if (!dd->cspec->cregbase || !(dd->flags & QIB_PRESENT))
		return 0;
	return readq(&dd->cspec->cregbase[regno]);
}
/**
 * read_6120_creg32 - 32-bit read of a chip counter register
 * @dd: device
 * @regno: index of the counter within dd->cspec->cregbase
 *
 * Returns 0 when the counter registers are not mapped or the device is not
 * flagged QIB_PRESENT; otherwise the readl() result taken at the address
 * of counter slot @regno.
 */
static inline u32 read_6120_creg32(const struct qib_devdata *dd, u16 regno)
{
	if (!dd->cspec->cregbase || !(dd->flags & QIB_PRESENT))
		return 0;
	return readl(&dd->cspec->cregbase[regno]);
}
/* kr_control bits */
/* kr_intstatus, kr_intclear, kr_intmask bits */
# define QLOGIC_IB_I_RCVURG_MASK ((1U << 5) - 1)
# define QLOGIC_IB_I_RCVAVAIL_MASK ((1U << 5) - 1)
# define QLOGIC_IB_C_FREEZEMODE 0x00000002
# define QLOGIC_IB_C_LINKENABLE 0x00000004
# define QLOGIC_IB_I_ERROR 0x0000000080000000ULL
# define QLOGIC_IB_I_SPIOSENT 0x0000000040000000ULL
# define QLOGIC_IB_I_SPIOBUFAVAIL 0x0000000020000000ULL
# define QLOGIC_IB_I_GPIO 0x0000000010000000ULL
/* kr_hwerrclear, kr_hwerrmask, kr_hwerrstatus, bits */
# define QLOGIC_IB_HWE_PCIEPOISONEDTLP 0x0000000010000000ULL
# define QLOGIC_IB_HWE_PCIECPLTIMEOUT 0x0000000020000000ULL
# define QLOGIC_IB_HWE_PCIEBUSPARITYXTLH 0x0000000040000000ULL
# define QLOGIC_IB_HWE_PCIEBUSPARITYXADM 0x0000000080000000ULL
# define QLOGIC_IB_HWE_PCIEBUSPARITYRADM 0x0000000100000000ULL
# define QLOGIC_IB_HWE_COREPLL_FBSLIP 0x0080000000000000ULL
# define QLOGIC_IB_HWE_COREPLL_RFSLIP 0x0100000000000000ULL
# define QLOGIC_IB_HWE_PCIE1PLLFAILED 0x0400000000000000ULL
# define QLOGIC_IB_HWE_PCIE0PLLFAILED 0x0800000000000000ULL
# define QLOGIC_IB_HWE_SERDESPLLFAILED 0x1000000000000000ULL
/* kr_extstatus bits */
# define QLOGIC_IB_EXTS_MEMBIST_ENDTEST 0x0000000000004000
# define QLOGIC_IB_EXTS_MEMBIST_FOUND 0x0000000000008000
/* kr_xgxsconfig bits */
# define _QIB_GPIO_SDA_NUM 1
# define _QIB_GPIO_SCL_NUM 0
/* Bits in GPIO for the added IB link interrupts */
# define GPIO_RXUVL_BIT 3
# define GPIO_OVRUN_BIT 4
# define GPIO_LLI_BIT 5
# define GPIO_ERRINTR_MASK 0x38
# define QLOGIC_IB_RT_BUFSIZE_MASK 0xe0000000ULL
( ( ( ( tid ) & QLOGIC_IB_RT_BUFSIZE_MASK ) > > 29 ) + 11 - 1 )
# define QLOGIC_IB_RT_IS_VALID(tid) \
( ( ( tid ) & QLOGIC_IB_RT_BUFSIZE_MASK ) & & \
# define QLOGIC_IB_RT_ADDR_MASK 0x1FFFFFFFULL /* 29 bits valid */
# define IBA6120_R_PKEY_DIS_SHIFT 30
# define PBC_6120_VL15_SEND_CTRL (1ULL << 31) /* pbc; VL15; link_buf only */
/*
 * Mask with a single bit set inside a register field: bit number 'bit'
 * counted from the field's least-significant bit (SYM_LSB).
 */
#define SYM_MASK_BIT(regname, fldname, bit) ((u64) \
	((1ULL << (SYM_LSB(regname, fldname) + (bit)))))
SYM_MASK_BIT ( HwErrMask , TXEMemParityErrMask , 0 )
SYM_MASK_BIT ( HwErrMask , TXEMemParityErrMask , 1 )
SYM_MASK_BIT ( HwErrMask , TXEMemParityErrMask , 2 )
SYM_MASK_BIT ( HwErrMask , RXEMemParityErrMask , 0 )
SYM_MASK_BIT ( HwErrMask , RXEMemParityErrMask , 1 )
SYM_MASK_BIT ( HwErrMask , RXEMemParityErrMask , 2 )
SYM_MASK_BIT ( HwErrMask , RXEMemParityErrMask , 3 )
SYM_MASK_BIT ( HwErrMask , RXEMemParityErrMask , 4 )
SYM_MASK_BIT ( HwErrMask , RXEMemParityErrMask , 5 )
SYM_MASK_BIT ( HwErrMask , RXEMemParityErrMask , 6 )
/* 6120 specific hardware errors... */
static const struct qib_hwerror_msgs qib_6120_hwerror_msgs [ ] = {
/* generic hardware errors */
" TXE PIOBUF Memory Parity " ) ,
" TXE PIOPBC Memory Parity " ) ,
" TXE PIOLAUNCHFIFO Memory Parity " ) ,
" RXE RCVBUF Memory Parity " ) ,
" RXE LOOKUPQ Memory Parity " ) ,
" RXE EAGERTID Memory Parity " ) ,
" RXE EXPTID Memory Parity " ) ,
" RXE FLAGBUF Memory Parity " ) ,
" RXE DATAINFO Memory Parity " ) ,
" RXE HDRINFO Memory Parity " ) ,
/* chip-specific hardware errors */
" PCIe Poisoned TLP " ) ,
" PCIe completion timeout " ) ,
	/*
	 * In practice, it's unlikely that we'll see PCIe PLL, or bus
	 * parity or memory parity error failures, because most likely we
	 * won't be able to talk to the core of the chip.  Nonetheless, we
	 * might see them, if they are in parts of the PCIe core that aren't
	 * essential.
	 */
" PCIePLL1 " ) ,
" PCIePLL0 " ) ,
" PCIe XTLH core parity " ) ,
" PCIe ADM TX core parity " ) ,
" PCIe ADM RX core parity " ) ,
" SerDes PLL " ) ,
} ;
/* variables for sanity checking interrupt and errors */
( HWE_MASK ( RXEMemParityErr ) | \
HWE_MASK ( TXEMemParityErr ) | \
HWE_MASK ( PowerOnBISTFailed ) | \
HWE_MASK ( IBCBusToSPCParityErr ) | \
HWE_MASK ( IBCBusFromSPCParityErr ) )
# define IB_E_BITSEXTANT \
( ERR_MASK ( RcvFormatErr ) | ERR_MASK ( RcvVCRCErr ) | \
ERR_MASK ( RcvICRCErr ) | ERR_MASK ( RcvMinPktLenErr ) | \
ERR_MASK ( RcvMaxPktLenErr ) | ERR_MASK ( RcvLongPktLenErr ) | \
ERR_MASK ( RcvShortPktLenErr ) | ERR_MASK ( RcvUnexpectedCharErr ) | \
ERR_MASK ( RcvUnsupportedVLErr ) | ERR_MASK ( RcvEBPErr ) | \
ERR_MASK ( RcvIBFlowErr ) | ERR_MASK ( RcvBadVersionErr ) | \
ERR_MASK ( RcvEgrFullErr ) | ERR_MASK ( RcvHdrFullErr ) | \
ERR_MASK ( RcvBadTidErr ) | ERR_MASK ( RcvHdrLenErr ) | \
ERR_MASK ( RcvHdrErr ) | ERR_MASK ( RcvIBLostLinkErr ) | \
ERR_MASK ( SendMinPktLenErr ) | ERR_MASK ( SendMaxPktLenErr ) | \
ERR_MASK ( SendUnderRunErr ) | ERR_MASK ( SendPktLenErr ) | \
ERR_MASK ( SendDroppedSmpPktErr ) | \
ERR_MASK ( SendDroppedDataPktErr ) | \
ERR_MASK ( SendPioArmLaunchErr ) | \
ERR_MASK ( SendUnexpectedPktNumErr ) | \
ERR_MASK ( SendUnsupportedVLErr ) | ERR_MASK ( IBStatusChanged ) | \
ERR_MASK ( InvalidAddrErr ) | ERR_MASK ( ResetNegated ) | \
ERR_MASK ( HardwareErr ) )
# define QLOGIC_IB_E_PKTERRS ( \
ERR_MASK ( SendPktLenErr ) | \
ERR_MASK ( SendDroppedDataPktErr ) | \
ERR_MASK ( RcvVCRCErr ) | \
ERR_MASK ( RcvICRCErr ) | \
ERR_MASK ( RcvShortPktLenErr ) | \
ERR_MASK ( RcvEBPErr ) )
/* These are all rcv-related errors which we want to count for stats */
# define E_SUM_PKTERRS \
( ERR_MASK ( RcvHdrLenErr ) | ERR_MASK ( RcvBadTidErr ) | \
ERR_MASK ( RcvBadVersionErr ) | ERR_MASK ( RcvHdrErr ) | \
ERR_MASK ( RcvLongPktLenErr ) | ERR_MASK ( RcvShortPktLenErr ) | \
ERR_MASK ( RcvMaxPktLenErr ) | ERR_MASK ( RcvMinPktLenErr ) | \
ERR_MASK ( RcvFormatErr ) | ERR_MASK ( RcvUnsupportedVLErr ) | \
ERR_MASK ( RcvUnexpectedCharErr ) | ERR_MASK ( RcvEBPErr ) )
/* These are all send-related errors which we want to count for stats */
# define E_SUM_ERRS \
( ERR_MASK ( SendPioArmLaunchErr ) | \
ERR_MASK ( SendUnexpectedPktNumErr ) | \
ERR_MASK ( SendDroppedDataPktErr ) | \
ERR_MASK ( SendDroppedSmpPktErr ) | \
ERR_MASK ( SendMaxPktLenErr ) | ERR_MASK ( SendUnsupportedVLErr ) | \
ERR_MASK ( SendMinPktLenErr ) | ERR_MASK ( SendPktLenErr ) | \
ERR_MASK ( InvalidAddrErr ) )
* this is similar to E_SUM_ERRS , but can ' t ignore armlaunch , don ' t ignore
* errors not related to freeze and cancelling buffers . Can ' t ignore
* armlaunch because could get more while still cleaning up , and need
* to cancel those as they happen .
( ERR_MASK ( SendDroppedDataPktErr ) | \
ERR_MASK ( SendDroppedSmpPktErr ) | \
ERR_MASK ( SendMaxPktLenErr ) | ERR_MASK ( SendMinPktLenErr ) | \
ERR_MASK ( SendPktLenErr ) )
* these are errors that can occur when the link changes state while
* a packet is being sent or received . This doesn ' t cover things
* like EBP or VCRC that can be the result of a sending having the
* link change state , so we receive a " known bad " packet .
( ERR_MASK ( SendDroppedDataPktErr ) | \
ERR_MASK ( SendDroppedSmpPktErr ) | \
ERR_MASK ( SendMinPktLenErr ) | ERR_MASK ( SendPktLenErr ) | \
ERR_MASK ( RcvShortPktLenErr ) | ERR_MASK ( RcvMinPktLenErr ) | \
ERR_MASK ( RcvUnexpectedCharErr ) )
static void qib_6120_put_tid_2 ( struct qib_devdata * , u64 __iomem * ,
u32 , unsigned long ) ;
* On platforms using this chip , and not having ordered WC stores , we
* can get TXE parity errors due to speculative reads to the PIO buffers ,
* and this , due to a chip issue can result in ( many ) false parity error
* reports . So it ' s a debug print on those , and an info print on systems
* where the speculative reads don ' t occur .
static void qib_6120_txe_recover ( struct qib_devdata * dd )
if ( ! qib_unordered_wc ( ) )
qib_devinfo ( dd - > pcidev ,
" Recovering from TXE PIO parity error \n " ) ;
/*
 * Enable or disable the chip's delivery of interrupts.
 *
 * @dd: device
 * @enable: non-zero unmasks every interrupt source, zero masks them all
 *
 * Enabling is refused (no register is touched) while QIB_BADINTR is set
 * in dd->flags.
 */
static void qib_6120_set_intr_state(struct qib_devdata *dd, u32 enable)
{
	if (enable) {
		if (dd->flags & QIB_BADINTR)
			return;
		qib_write_kreg(dd, kr_intmask, ~0ULL);
		/* force re-interrupt of any pending interrupts. */
		qib_write_kreg(dd, kr_intclear, 0ULL);
	} else {
		qib_write_kreg(dd, kr_intmask, 0ULL);
	}
}
* Try to cleanup as much as possible for anything that might have gone
* wrong while in freeze mode , such as pio buffers being written by user
* processes ( causing armlaunch ) , send errors due to going into freeze mode ,
* etc . , and try to avoid causing extra interrupts while doing so .
* Forcibly update the in - memory pioavail register copies after cleanup
* because the chip won ' t do it while in freeze mode ( the register values
* themselves are kept correct ) .
* Make sure that we don ' t lose any important interrupts by using the chip
* feature that says that writing 0 to a bit in * clear that is set in
* * status will cause an interrupt to be generated again ( if allowed by
* the * mask value ) .
* This is in chip - specific code because of all of the register accesses ,
* even though the details are similar on most chips
static void qib_6120_clear_freeze ( struct qib_devdata * dd )
/* disable error interrupts, to avoid confusion */
qib_write_kreg ( dd , kr_errmask , 0ULL ) ;
/* also disable interrupts; errormask is sometimes overwriten */
qib_6120_set_intr_state ( dd , 0 ) ;
qib_cancel_sends ( dd - > pport ) ;
/* clear the freeze, and be sure chip saw it */
qib_write_kreg ( dd , kr_control , dd - > control ) ;
qib_read_kreg32 ( dd , kr_scratch ) ;
/* force in-memory update now we are out of freeze */
qib_force_pio_avail_update ( dd ) ;
* force new interrupt if any hwerr , error or interrupt bits are
* still set , and clear " safe " send packet errors related to freeze
* and cancelling sends . Re - enable error interrupts before possible
* force of re - interrupt on pending interrupts .
qib_write_kreg ( dd , kr_hwerrclear , 0ULL ) ;
qib_write_kreg ( dd , kr_errclear , E_SPKT_ERRS_IGNORE ) ;
qib_write_kreg ( dd , kr_errmask , dd - > cspec - > errormask ) ;
qib_6120_set_intr_state ( dd , 1 ) ;
* qib_handle_6120_hwerrors - display hardware errors .
* @ dd : the qlogic_ib device
* @ msg : the output buffer
* @ msgl : the size of the output buffer
* Use same msg buffer as regular errors to avoid excessive stack
* use . Most hardware errors are catastrophic , but for right now ,
* we ' ll print them and continue . Reuse the same message buffer as
* handle_6120_errors ( ) to avoid excessive stack usage .
static void qib_handle_6120_hwerrors ( struct qib_devdata * dd , char * msg ,
size_t msgl )
u64 hwerrs ;
u32 bits , ctrl ;
int isfatal = 0 ;
char * bitsmsg ;
int log_idx ;
hwerrs = qib_read_kreg64 ( dd , kr_hwerrstatus ) ;
if ( ! hwerrs )
return ;
if ( hwerrs = = ~ 0ULL ) {
qib_dev_err ( dd , " Read of hardware error status failed "
" (all bits set); ignoring \n " ) ;
return ;
qib_stats . sps_hwerrs + + ;
/* Always clear the error status register, except MEMBISTFAIL,
* regardless of whether we continue or stop using the chip .
* We want that set so we know it failed , even across driver reload .
* We ' ll still ignore it in the hwerrmask . We do this partly for
* diagnostics , but also for support */
qib_write_kreg ( dd , kr_hwerrclear ,
hwerrs & ~ HWE_MASK ( PowerOnBISTFailed ) ) ;
hwerrs & = dd - > cspec - > hwerrmask ;
/* We log some errors to EEPROM, check if we have any of those. */
for ( log_idx = 0 ; log_idx < QIB_EEP_LOG_CNT ; + + log_idx )
if ( hwerrs & dd - > eep_st_masks [ log_idx ] . hwerrs_to_log )
qib_inc_eeprom_err ( dd , log_idx , 1 ) ;
* Make sure we get this much out , unless told to be quiet ,
* or it ' s occurred within the last 5 seconds .
qib_devinfo ( dd - > pcidev , " Hardware error: hwerr=0x%llx "
" (cleared) \n " , ( unsigned long long ) hwerrs ) ;
if ( hwerrs & ~ IB_HWE_BITSEXTANT )
qib_dev_err ( dd , " hwerror interrupt with unknown errors "
" %llx set \n " , ( unsigned long long )
( hwerrs & ~ IB_HWE_BITSEXTANT ) ) ;
ctrl = qib_read_kreg32 ( dd , kr_control ) ;
if ( ( ctrl & QLOGIC_IB_C_FREEZEMODE ) & & ! dd - > diag_client ) {
* Parity errors in send memory are recoverable ,
* just cancel the send ( if indicated in * sendbuffererror ) ,
* count the occurrence , unfreeze ( if no other handled
* hardware error bits are set ) , and continue . They can
* occur if a processor speculative read is done to the PIO
* buffer while we are sending a packet , for example .
if ( hwerrs & TXE_PIO_PARITY ) {
qib_6120_txe_recover ( dd ) ;
hwerrs & = ~ TXE_PIO_PARITY ;
if ( ! hwerrs ) {
static u32 freeze_cnt ;
freeze_cnt + + ;
qib_6120_clear_freeze ( dd ) ;
} else
isfatal = 1 ;
* msg = ' \0 ' ;
if ( hwerrs & HWE_MASK ( PowerOnBISTFailed ) ) {
isfatal = 1 ;
strlcat ( msg , " [Memory BIST test failed, InfiniPath hardware "
" unusable] " , msgl ) ;
/* ignore from now on, so disable until driver reloaded */
dd - > cspec - > hwerrmask & = ~ HWE_MASK ( PowerOnBISTFailed ) ;
qib_write_kreg ( dd , kr_hwerrmask , dd - > cspec - > hwerrmask ) ;
qib_format_hwerrors ( hwerrs , qib_6120_hwerror_msgs ,
ARRAY_SIZE ( qib_6120_hwerror_msgs ) , msg , msgl ) ;
bitsmsg = dd - > cspec - > bitsmsgbuf ;
bits = ( u32 ) ( ( hwerrs > >
snprintf ( bitsmsg , sizeof dd - > cspec - > bitsmsgbuf ,
" [PCIe Mem Parity Errs %x] " , bits ) ;
strlcat ( msg , bitsmsg , msgl ) ;
if ( hwerrs & _QIB_PLL_FAIL ) {
isfatal = 1 ;
snprintf ( bitsmsg , sizeof dd - > cspec - > bitsmsgbuf ,
" [PLL failed (%llx), InfiniPath hardware unusable] " ,
( unsigned long long ) hwerrs & _QIB_PLL_FAIL ) ;
strlcat ( msg , bitsmsg , msgl ) ;
/* ignore from now on, so disable until driver reloaded */
dd - > cspec - > hwerrmask & = ~ ( hwerrs & _QIB_PLL_FAIL ) ;
qib_write_kreg ( dd , kr_hwerrmask , dd - > cspec - > hwerrmask ) ;
* If it occurs , it is left masked since the external
* interface is unused
dd - > cspec - > hwerrmask & = ~ QLOGIC_IB_HWE_SERDESPLLFAILED ;
qib_write_kreg ( dd , kr_hwerrmask , dd - > cspec - > hwerrmask ) ;
if ( hwerrs )
* if any set that we aren ' t ignoring ; only
* make the complaint once , in case it ' s stuck
* or recurring , and we get here multiple
* times .
qib_dev_err ( dd , " %s hardware error \n " , msg ) ;
* msg = 0 ; /* recovered from all of them */
if ( isfatal & & ! dd - > diag_client ) {
qib_dev_err ( dd , " Fatal Hardware Error, no longer "
" usable, SN %.16s \n " , dd - > serial ) ;
* for / sys status file and user programs to print ; if no
* trailing brace is copied , we ' ll know it was truncated .
if ( dd - > freezemsg )
snprintf ( dd - > freezemsg , dd - > freezelen ,
" {%s} " , msg ) ;
qib_disable_after_error ( dd ) ;
* Decode the error status into strings , deciding whether to always
* print * it or not depending on " normal packet errors " vs everything
* else . Return 1 if " real " errors , otherwise 0 if only packet
* errors , so caller can decide what to print with the string .
static int qib_decode_6120_err ( struct qib_devdata * dd , char * buf , size_t blen ,
u64 err )
int iserr = 1 ;
* buf = ' \0 ' ;
if ( err & QLOGIC_IB_E_PKTERRS ) {
if ( ! ( err & ~ QLOGIC_IB_E_PKTERRS ) )
iserr = 0 ;
if ( ( err & ERR_MASK ( RcvICRCErr ) ) & &
! ( err & ( ERR_MASK ( RcvVCRCErr ) | ERR_MASK ( RcvEBPErr ) ) ) )
strlcat ( buf , " CRC " , blen ) ;
if ( ! iserr )
goto done ;
if ( err & ERR_MASK ( RcvHdrLenErr ) )
strlcat ( buf , " rhdrlen " , blen ) ;
if ( err & ERR_MASK ( RcvBadTidErr ) )
strlcat ( buf , " rbadtid " , blen ) ;
if ( err & ERR_MASK ( RcvBadVersionErr ) )
strlcat ( buf , " rbadversion " , blen ) ;
if ( err & ERR_MASK ( RcvHdrErr ) )
strlcat ( buf , " rhdr " , blen ) ;
if ( err & ERR_MASK ( RcvLongPktLenErr ) )
strlcat ( buf , " rlongpktlen " , blen ) ;
if ( err & ERR_MASK ( RcvMaxPktLenErr ) )
strlcat ( buf , " rmaxpktlen " , blen ) ;
if ( err & ERR_MASK ( RcvMinPktLenErr ) )
strlcat ( buf , " rminpktlen " , blen ) ;
if ( err & ERR_MASK ( SendMinPktLenErr ) )
strlcat ( buf , " sminpktlen " , blen ) ;
if ( err & ERR_MASK ( RcvFormatErr ) )
strlcat ( buf , " rformaterr " , blen ) ;
if ( err & ERR_MASK ( RcvUnsupportedVLErr ) )
strlcat ( buf , " runsupvl " , blen ) ;
if ( err & ERR_MASK ( RcvUnexpectedCharErr ) )
strlcat ( buf , " runexpchar " , blen ) ;
if ( err & ERR_MASK ( RcvIBFlowErr ) )
strlcat ( buf , " ribflow " , blen ) ;
if ( err & ERR_MASK ( SendUnderRunErr ) )
strlcat ( buf , " sunderrun " , blen ) ;
if ( err & ERR_MASK ( SendPioArmLaunchErr ) )
strlcat ( buf , " spioarmlaunch " , blen ) ;
if ( err & ERR_MASK ( SendUnexpectedPktNumErr ) )
strlcat ( buf , " sunexperrpktnum " , blen ) ;
if ( err & ERR_MASK ( SendDroppedSmpPktErr ) )
strlcat ( buf , " sdroppedsmppkt " , blen ) ;
if ( err & ERR_MASK ( SendMaxPktLenErr ) )
strlcat ( buf , " smaxpktlen " , blen ) ;
if ( err & ERR_MASK ( SendUnsupportedVLErr ) )
strlcat ( buf , " sunsupVL " , blen ) ;
if ( err & ERR_MASK ( InvalidAddrErr ) )
strlcat ( buf , " invalidaddr " , blen ) ;
if ( err & ERR_MASK ( RcvEgrFullErr ) )
strlcat ( buf , " rcvegrfull " , blen ) ;
if ( err & ERR_MASK ( RcvHdrFullErr ) )
strlcat ( buf , " rcvhdrfull " , blen ) ;
if ( err & ERR_MASK ( IBStatusChanged ) )
strlcat ( buf , " ibcstatuschg " , blen ) ;
if ( err & ERR_MASK ( RcvIBLostLinkErr ) )
strlcat ( buf , " riblostlink " , blen ) ;
if ( err & ERR_MASK ( HardwareErr ) )
strlcat ( buf , " hardware " , blen ) ;
if ( err & ERR_MASK ( ResetNegated ) )
strlcat ( buf , " reset " , blen ) ;
done :
return iserr ;
* Called when we might have an error that is specific to a particular
* PIO buffer , and may need to cancel that buffer , so it can be re - used .
static void qib_disarm_6120_senderrbufs ( struct qib_pportdata * ppd )
unsigned long sbuf [ 2 ] ;
struct qib_devdata * dd = ppd - > dd ;
* It ' s possible that sendbuffererror could have bits set ; might
* have already done this as a result of hardware error handling .
sbuf [ 0 ] = qib_read_kreg64 ( dd , kr_sendbuffererror ) ;
sbuf [ 1 ] = qib_read_kreg64 ( dd , kr_sendbuffererror + 1 ) ;
if ( sbuf [ 0 ] | | sbuf [ 1 ] )
qib_disarm_piobufs_set ( dd , sbuf ,
dd - > piobcnt2k + dd - > piobcnt4k ) ;
/*
 * Compare the chip's link-error-recovery counter against the snapshot in
 * dd->cspec->lastlinkrecov.
 *
 * @dd: device
 * @ibcs: IBC status value, decoded with qib_6120_iblink_state()
 *
 * Returns 1 when the counter matches the snapshot.  When it differs, the
 * snapshot is zeroed, the link is requested down via qib_set_linkstate()
 * and 0 is returned.  Whenever the decoded link state is IB_PORT_ACTIVE
 * the snapshot is refreshed from the counter.
 */
static int chk_6120_linkrecovery(struct qib_devdata *dd, u64 ibcs)
{
	int ret = 1;
	u32 ibstate = qib_6120_iblink_state(ibcs);
	u32 linkrecov = read_6120_creg32(dd, cr_iblinkerrrecov);

	if (linkrecov != dd->cspec->lastlinkrecov) {
		/* and no more until active again */
		dd->cspec->lastlinkrecov = 0;
		qib_set_linkstate(dd->pport, QIB_IB_LINKDOWN);
		ret = 0;
	}
	if (ibstate == IB_PORT_ACTIVE)
		dd->cspec->lastlinkrecov =
			read_6120_creg32(dd, cr_iblinkerrrecov);
	return ret;
}
/*
 * Process the chip's error status bits.
 * dd: the device; errs: error bits (the caller in this file passes the
 * value it read from kr_errstatus).
 * Bits not enabled in cspec->errormask are dropped, the rest are cleared
 * in the chip through kr_errclear and then decoded, counted and
 * dispatched.  Uses cspec->emsgbuf as the message buffer.
 */
static void handle_6120_errors ( struct qib_devdata * dd , u64 errs )
char * msg ;
u64 ignore_this_time = 0 ;
u64 iserr = 0 ;
int log_idx ;
struct qib_pportdata * ppd = dd - > pport ;
u64 mask ;
/* don't report errors that are masked */
errs & = dd - > cspec - > errormask ;
msg = dd - > cspec - > emsgbuf ;
/* do these first, they are most important */
if ( errs & ERR_MASK ( HardwareErr ) )
qib_handle_6120_hwerrors ( dd , msg , sizeof dd - > cspec - > emsgbuf ) ;
/* bump the EEPROM error-log counter for every log slot whose mask matches */
for ( log_idx = 0 ; log_idx < QIB_EEP_LOG_CNT ; + + log_idx )
if ( errs & dd - > eep_st_masks [ log_idx ] . errs_to_log )
qib_inc_eeprom_err ( dd , log_idx , 1 ) ;
/* complain about any bit outside the set this driver knows about */
if ( errs & ~ IB_E_BITSEXTANT )
qib_dev_err ( dd , " error interrupt with unknown errors "
" %llx set \n " ,
( unsigned long long ) ( errs & ~ IB_E_BITSEXTANT ) ) ;
if ( errs & E_SUM_ERRS ) {
qib_disarm_6120_senderrbufs ( ppd ) ;
if ( ( errs & E_SUM_LINK_PKTERRS ) & &
! ( ppd - > lflags & QIBL_LINKACTIVE ) ) {
* This can happen when trying to bring the link
* up , but the IB link changes state at the " wrong "
* time . The IB logic then complains that the packet
* isn ' t valid . We don ' t want to confuse people , so
* we just don ' t print them , except at debug
ignore_this_time = errs & E_SUM_LINK_PKTERRS ;
} else if ( ( errs & E_SUM_LINK_PKTERRS ) & &
! ( ppd - > lflags & QIBL_LINKACTIVE ) ) {
* This can happen when SMA is trying to bring the link
* up , but the IB link changes state at the " wrong " time .
* The IB logic then complains that the packet isn ' t
* valid . We don ' t want to confuse people , so we just
* don ' t print them , except at debug
ignore_this_time = errs & E_SUM_LINK_PKTERRS ;
/* acknowledge everything seen, including the bits about to be ignored */
qib_write_kreg ( dd , kr_errclear , errs ) ;
errs & = ~ ignore_this_time ;
if ( ! errs )
goto done ;
* The ones we mask off are handled specially below
* or above .
mask = ERR_MASK ( IBStatusChanged ) | ERR_MASK ( RcvEgrFullErr ) |
ERR_MASK ( RcvHdrFullErr ) | ERR_MASK ( HardwareErr ) ;
qib_decode_6120_err ( dd , msg , sizeof dd - > cspec - > emsgbuf , errs & ~ mask ) ;
if ( errs & E_SUM_PKTERRS )
qib_stats . sps_rcverrs + + ;
if ( errs & E_SUM_ERRS )
qib_stats . sps_txerrs + + ;
/* only bits outside the packet-error groups make the message worth printing */
iserr = errs & ~ ( E_SUM_PKTERRS | QLOGIC_IB_E_PKTERRS ) ;
if ( errs & ERR_MASK ( IBStatusChanged ) ) {
u64 ibcs = qib_read_kreg64 ( dd , kr_ibcstatus ) ;
u32 ibstate = qib_6120_iblink_state ( ibcs ) ;
int handle = 1 ;
if ( ibstate ! = IB_PORT_INIT & & dd - > cspec - > lastlinkrecov )
handle = chk_6120_linkrecovery ( dd , ibcs ) ;
* Since going into a recovery state causes the link state
* to go down and since recovery is transitory , it is better
* if we " miss " ever seeing the link training state go into
* recovery ( i . e . , ignore this transition for link state
* special handling purposes ) without updating lastibcstat .
/*
 * NOTE(review): the right-hand operand of the comparison below is not
 * present in this copy of the file; per the comment above it is
 * presumably the link-error-recovery physical state -- confirm.
 */
if ( handle & & qib_6120_phys_portstate ( ibcs ) = =
handle = 0 ;
if ( handle )
qib_handle_e_ibstatuschanged ( ppd , ibcs ) ;
if ( errs & ERR_MASK ( ResetNegated ) ) {
qib_dev_err ( dd , " Got reset, requires re-init "
" (unload and reload driver) \n " ) ;
dd - > flags & = ~ QIB_INITTED ; /* needs re-init */
/* mark as having had error */
* dd - > devstatusp | = QIB_STATUS_HWERROR ;
* dd - > pport - > statusp & = ~ QIB_STATUS_IB_CONF ;
if ( * msg & & iserr )
qib_dev_porterr ( dd , ppd - > port , " %s error \n " , msg ) ;
/* wake anyone waiting for a link-state flag that is now set */
if ( ppd - > state_wanted & ppd - > lflags )
wake_up_interruptible ( & ppd - > state_wait ) ;
* If there were hdrq or egrfull errors , wake up any processes
* waiting in poll . We used to try to check which contexts had
* the overflow , but given the cost of that and the chip reads
* to support it , it ' s better to just wake everybody up if we
* get an overflow ; waiters can poll again if it ' s not them .
if ( errs & ( ERR_MASK ( RcvEgrFullErr ) | ERR_MASK ( RcvHdrFullErr ) ) ) {
qib_handle_urcv ( dd , ~ 0U ) ;
/*
 * NOTE(review): no "else" is visible between the two counter updates
 * below, so both would be bumped on an egr-full error -- confirm
 * whether sps_hdrfull was meant to be the alternative branch.
 */
if ( errs & ERR_MASK ( RcvEgrFullErr ) )
qib_stats . sps_buffull + + ;
qib_stats . sps_hdrfull + + ;
done :
return ;
* qib_6120_init_hwerrors - enable hardware errors
* @ dd : the qlogic_ib device
* now that we have finished initializing everything that might reasonably
* cause a hardware error , and cleared those errors bits as they occur ,
* we can enable hardware errors in the mask ( potentially enabling
* freeze mode ) , and enable hardware errors as errors ( along with
* everything else ) in errormask
/*
 * Program the hardware-error and error masks after initialization:
 * checks the MemBIST-done bit in kr_extstatus, writes cspec->hwerrmask to
 * kr_hwerrmask, clears pending errors and interrupts, enables all error
 * bits and caches what the chip accepted in cspec->errormask, then
 * writes kr_rcvbthqp.
 */
static void qib_6120_init_hwerrors ( struct qib_devdata * dd )
u64 val ;
u64 extsval ;
extsval = qib_read_kreg64 ( dd , kr_extstatus ) ;
if ( ! ( extsval & QLOGIC_IB_EXTS_MEMBIST_ENDTEST ) )
qib_dev_err ( dd , " MemBIST did not complete! \n " ) ;
/* init so all hwerrors interrupt, and enter freeze, adjust below */
val = ~ 0ULL ;
/*
 * NOTE(review): the statement guarded by the minrev test, and the
 * statement belonging to the "speculative read" comment, are not
 * present in this copy of the file -- confirm against the full source.
 */
if ( dd - > minrev < 2 ) {
* Avoid problem with internal interface bus parity
* checking . Fixed in Rev2 .
/* avoid some intel cpu's speculative read freeze mode issue */
dd - > cspec - > hwerrmask = val ;
/* clear every pending hardware error except PowerOnBISTFailed */
qib_write_kreg ( dd , kr_hwerrclear , ~ HWE_MASK ( PowerOnBISTFailed ) ) ;
qib_write_kreg ( dd , kr_hwerrmask , dd - > cspec - > hwerrmask ) ;
/* clear all */
qib_write_kreg ( dd , kr_errclear , ~ 0ULL ) ;
/* enable errors that are masked, at least this first time. */
qib_write_kreg ( dd , kr_errmask , ~ 0ULL ) ;
/* read back so the shadow holds only the bits the chip implements */
dd - > cspec - > errormask = qib_read_kreg64 ( dd , kr_errmask ) ;
/* clear any interrupts up to this point (ints still not enabled) */
qib_write_kreg ( dd , kr_intclear , ~ 0ULL ) ;
/* NOTE(review): the value expression below ends on a dangling '|'; its last operand is missing here. */
qib_write_kreg ( dd , kr_rcvbthqp ,
dd - > qpn_mask < < ( QIB_6120_RcvBTHQP_BTHQP_Mask_LSB - 1 ) |
* Disable and enable the armlaunch error . Used for PIO bandwidth testing
* on chips that are count - based , rather than trigger - based . There is no
* reference counting , but that ' s also fine , given the intended use .
* Only chip - specific because it ' s all register accesses
static void qib_set_6120_armlaunch ( struct qib_devdata * dd , u32 enable )
if ( enable ) {
qib_write_kreg ( dd , kr_errclear ,
ERR_MASK ( SendPioArmLaunchErr ) ) ;
dd - > cspec - > errormask | = ERR_MASK ( SendPioArmLaunchErr ) ;
} else
dd - > cspec - > errormask & = ~ ERR_MASK ( SendPioArmLaunchErr ) ;
qib_write_kreg ( dd , kr_errmask , dd - > cspec - > errormask ) ;
* Formerly took parameter < which > in pre - shifted ,
* pre - merged form with LinkCmd and LinkInitCmd
* together , and assuming the zero was NOP .
static void qib_set_ib_6120_lstate ( struct qib_pportdata * ppd , u16 linkcmd ,
u16 linitcmd )
u64 mod_wd ;
struct qib_devdata * dd = ppd - > dd ;
unsigned long flags ;
* If we are told to disable , note that so link - recovery
* code does not attempt to bring us back up .
spin_lock_irqsave ( & ppd - > lflags_lock , flags ) ;
ppd - > lflags | = QIBL_IB_LINK_DISABLED ;
spin_unlock_irqrestore ( & ppd - > lflags_lock , flags ) ;
} else if ( linitcmd | | linkcmd = = QLOGIC_IB_IBCC_LINKCMD_DOWN ) {
* Any other linkinitcmd will lead to LINKDOWN and then
* to INIT ( if all is well ) , so clear flag to let
* link - recovery code attempt to bring us back up .
spin_lock_irqsave ( & ppd - > lflags_lock , flags ) ;
ppd - > lflags & = ~ QIBL_IB_LINK_DISABLED ;
spin_unlock_irqrestore ( & ppd - > lflags_lock , flags ) ;
mod_wd = ( linkcmd < < QLOGIC_IB_IBCC_LINKCMD_SHIFT ) |
qib_write_kreg ( dd , kr_ibcctrl , dd - > cspec - > ibcctrl | mod_wd ) ;
/* write to chip to prevent back-to-back writes of control reg */
qib_write_kreg ( dd , kr_scratch , 0 ) ;
* qib_6120_bringup_serdes - bring up the serdes
* @ dd : the qlogic_ib device
static int qib_6120_bringup_serdes ( struct qib_pportdata * ppd )
struct qib_devdata * dd = ppd - > dd ;
u64 val , config1 , prev_val , hwstat , ibc ;
/* Put IBC in reset, sends disabled */
dd - > control & = ~ QLOGIC_IB_C_LINKENABLE ;
qib_write_kreg ( dd , kr_control , 0ULL ) ;
dd - > cspec - > ibdeltainprog = 1 ;
dd - > cspec - > ibsymsnap = read_6120_creg32 ( dd , cr_ibsymbolerr ) ;
dd - > cspec - > iblnkerrsnap = read_6120_creg32 ( dd , cr_iblinkerrrecov ) ;
/* flowcontrolwatermark is in units of KBytes */
ibc = 0x5ULL < < SYM_LSB ( IBCCtrl , FlowCtrlWaterMark ) ;
* How often flowctrl sent . More or less in usecs ; balance against
* watermark value , so that in theory senders always get a flow
* control update in time to not let the IB link go idle .
ibc | = 0x3ULL < < SYM_LSB ( IBCCtrl , FlowCtrlPeriod ) ;
/* max error tolerance */
dd - > cspec - > lli_thresh = 0xf ;
ibc | = ( u64 ) dd - > cspec - > lli_thresh < < SYM_LSB ( IBCCtrl , PhyerrThreshold ) ;
/* use "real" buffer space for */
ibc | = 4ULL < < SYM_LSB ( IBCCtrl , CreditScale ) ;
/* IB credit flow control. */
ibc | = 0xfULL < < SYM_LSB ( IBCCtrl , OverrunThreshold ) ;
* set initial max size pkt IBC will send , including ICRC ; it ' s the
* PIO buffer size in dwords , less 1 ; also see qib_set_mtu ( )
ibc | = ( ( u64 ) ( ppd - > ibmaxlen > > 2 ) + 1 ) < < SYM_LSB ( IBCCtrl , MaxPktLen ) ;
dd - > cspec - > ibcctrl = ibc ; /* without linkcmd or linkinitcmd! */
/* initially come up waiting for TS1, without sending anything. */
val = dd - > cspec - > ibcctrl | ( QLOGIC_IB_IBCC_LINKINITCMD_DISABLE < <
qib_write_kreg ( dd , kr_ibcctrl , val ) ;
val = qib_read_kreg64 ( dd , kr_serdes_cfg0 ) ;
config1 = qib_read_kreg64 ( dd , kr_serdes_cfg1 ) ;
* Force reset on , also set rxdetect enable . Must do before reading
* serdesstatus at least for simulation , or some of the bits in
* serdes status will come back as undefined and cause simulation
* failures
val | = SYM_MASK ( SerdesCfg0 , ResetPLL ) |
SYM_MASK ( SerdesCfg0 , RxDetEnX ) |
( SYM_MASK ( SerdesCfg0 , L1PwrDnA ) |
SYM_MASK ( SerdesCfg0 , L1PwrDnB ) |
SYM_MASK ( SerdesCfg0 , L1PwrDnC ) |
SYM_MASK ( SerdesCfg0 , L1PwrDnD ) ) ;
qib_write_kreg ( dd , kr_serdes_cfg0 , val ) ;
/* be sure chip saw it */
qib_read_kreg64 ( dd , kr_scratch ) ;
udelay ( 5 ) ; /* need pll reset set at least for a bit */
* after PLL is reset , set the per - lane Resets and TxIdle and
* clear the PLL reset and rxdetect ( to get falling edge ) .
* Leave L1PWR bits set ( permanently )
val & = ~ ( SYM_MASK ( SerdesCfg0 , RxDetEnX ) |
SYM_MASK ( SerdesCfg0 , ResetPLL ) |
( SYM_MASK ( SerdesCfg0 , L1PwrDnA ) |
SYM_MASK ( SerdesCfg0 , L1PwrDnB ) |
SYM_MASK ( SerdesCfg0 , L1PwrDnC ) |
SYM_MASK ( SerdesCfg0 , L1PwrDnD ) ) ) ;
val | = ( SYM_MASK ( SerdesCfg0 , ResetA ) |
SYM_MASK ( SerdesCfg0 , ResetB ) |
SYM_MASK ( SerdesCfg0 , ResetC ) |
SYM_MASK ( SerdesCfg0 , ResetD ) ) |
SYM_MASK ( SerdesCfg0 , TxIdeEnX ) ;
qib_write_kreg ( dd , kr_serdes_cfg0 , val ) ;
/* be sure chip saw it */
( void ) qib_read_kreg64 ( dd , kr_scratch ) ;
/* need PLL reset clear for at least 11 usec before lane
* resets cleared ; give it a few more to be sure */
udelay ( 15 ) ;
val & = ~ ( ( SYM_MASK ( SerdesCfg0 , ResetA ) |
SYM_MASK ( SerdesCfg0 , ResetB ) |
SYM_MASK ( SerdesCfg0 , ResetC ) |
SYM_MASK ( SerdesCfg0 , ResetD ) ) |
SYM_MASK ( SerdesCfg0 , TxIdeEnX ) ) ;
qib_write_kreg ( dd , kr_serdes_cfg0 , val ) ;
/* be sure chip saw it */
( void ) qib_read_kreg64 ( dd , kr_scratch ) ;
val = qib_read_kreg64 ( dd , kr_xgxs_cfg ) ;
prev_val = val ;
if ( SYM_FIELD ( val , XGXSCfg , polarity_inv ) ! = ppd - > rx_pol_inv ) {
/* need to compensate for Tx inversion in partner */
val & = ~ SYM_MASK ( XGXSCfg , polarity_inv ) ;
val | = ( u64 ) ppd - > rx_pol_inv < < SYM_LSB ( XGXSCfg , polarity_inv ) ;
if ( val ! = prev_val )
qib_write_kreg ( dd , kr_xgxs_cfg , val ) ;
val = qib_read_kreg64 ( dd , kr_serdes_cfg0 ) ;
/* clear current and de-emphasis bits */
config1 & = ~ 0x0ffffffff00ULL ;
/* set current to 20ma */
config1 | = 0x00000000000ULL ;
/* set de-emphasis to -5.68dB */
config1 | = 0x0cccc000000ULL ;
qib_write_kreg ( dd , kr_serdes_cfg1 , config1 ) ;
/* base and port guid same for single port */
ppd - > guid = dd - > base_guid ;
* the process of setting and un - resetting the serdes normally
* causes a serdes PLL error , so check for that and clear it
* here . Also clearr hwerr bit in errstatus , but not others .
hwstat = qib_read_kreg64 ( dd , kr_hwerrstatus ) ;
if ( hwstat ) {
/* should just have PLL, clear all set, in an case */
2010-06-17 23:14:04 +00:00
qib_write_kreg ( dd , kr_hwerrclear , hwstat ) ;
2010-05-23 21:44:54 -07:00
qib_write_kreg ( dd , kr_errclear , ERR_MASK ( HardwareErr ) ) ;
dd - > control | = QLOGIC_IB_C_LINKENABLE ;
dd - > control & = ~ QLOGIC_IB_C_FREEZEMODE ;
qib_write_kreg ( dd , kr_control , dd - > control ) ;
return 0 ;
* qib_6120_quiet_serdes - set serdes to txidle
* @ ppd : physical port of the qlogic_ib device
* Called when driver is being unloaded
static void qib_6120_quiet_serdes ( struct qib_pportdata * ppd )
struct qib_devdata * dd = ppd - > dd ;
u64 val ;
qib_set_ib_6120_lstate ( ppd , 0 , QLOGIC_IB_IBCC_LINKINITCMD_DISABLE ) ;
/* disable IBC */
dd - > control & = ~ QLOGIC_IB_C_LINKENABLE ;
qib_write_kreg ( dd , kr_control ,
dd - > control | QLOGIC_IB_C_FREEZEMODE ) ;
if ( dd - > cspec - > ibsymdelta | | dd - > cspec - > iblnkerrdelta | |
dd - > cspec - > ibdeltainprog ) {
u64 diagc ;
/* enable counter writes */
diagc = qib_read_kreg64 ( dd , kr_hwdiagctrl ) ;
qib_write_kreg ( dd , kr_hwdiagctrl ,
diagc | SYM_MASK ( HwDiagCtrl , CounterWrEnable ) ) ;
if ( dd - > cspec - > ibsymdelta | | dd - > cspec - > ibdeltainprog ) {
val = read_6120_creg32 ( dd , cr_ibsymbolerr ) ;
if ( dd - > cspec - > ibdeltainprog )
val - = val - dd - > cspec - > ibsymsnap ;
val - = dd - > cspec - > ibsymdelta ;
write_6120_creg ( dd , cr_ibsymbolerr , val ) ;
if ( dd - > cspec - > iblnkerrdelta | | dd - > cspec - > ibdeltainprog ) {
val = read_6120_creg32 ( dd , cr_iblinkerrrecov ) ;
if ( dd - > cspec - > ibdeltainprog )
val - = val - dd - > cspec - > iblnkerrsnap ;
val - = dd - > cspec - > iblnkerrdelta ;
write_6120_creg ( dd , cr_iblinkerrrecov , val ) ;
/* and disable counter writes */
qib_write_kreg ( dd , kr_hwdiagctrl , diagc ) ;
val = qib_read_kreg64 ( dd , kr_serdes_cfg0 ) ;
val | = SYM_MASK ( SerdesCfg0 , TxIdeEnX ) ;
qib_write_kreg ( dd , kr_serdes_cfg0 , val ) ;
* qib_6120_setup_setextled - set the state of the two external LEDs
* @ dd : the qlogic_ib device
* @ on : whether the link is up or not
* The exact combo of LEDs if on is true is determined by looking
* at the ibcstatus .
* These LEDs indicate the physical and logical state of IB link .
* For this chip ( at least with recommended board pinouts ) , LED1
* is Yellow ( logical state ) and LED2 is Green ( physical state ) ,
* Note : We try to match the Mellanox HCA LED behavior as best
* we can . Green indicates physical link state is OK ( something is
* plugged in , and we can train ) .
* Amber indicates the link is logically up ( ACTIVE ) .
* Mellanox further blinks the amber LED to indicate data packet
* activity , but we have no hardware support for that , so it would
* require waking up every 10 - 20 msecs and checking the counters
* on the chip , and then turning the LED off if appropriate . That ' s
* visible overhead , so not something we will do .
/*
 * Drive the two external port LEDs through the LEDPriPortGreenOn and
 * LEDPriPortYellowOn bits of kr_extctrl (shadowed in cspec->extctrl,
 * updated under cspec->gpio_lock).
 * ppd: the port; on: nonzero to derive the LED state from kr_ibcstatus,
 * zero for both states 0.  A nonzero ppd->led_override takes precedence.
 */
static void qib_6120_setup_setextled ( struct qib_pportdata * ppd , u32 on )
u64 extctl , val , lst , ltst ;
unsigned long flags ;
struct qib_devdata * dd = ppd - > dd ;
* The diags use the LED to indicate diag info , so we leave
* the external LED alone when the diags are running .
if ( dd - > diag_client )
return ;
/* Allow override of LED display for, e.g. Locating system in rack */
/*
 * NOTE(review): both conditional expressions in the override branch are
 * cut off after '?' in this copy of the file -- the selected values are
 * not visible here.
 */
if ( ppd - > led_override ) {
ltst = ( ppd - > led_override & QIB_LED_PHYS ) ?
lst = ( ppd - > led_override & QIB_LED_LOG ) ?
} else if ( on ) {
val = qib_read_kreg64 ( dd , kr_ibcstatus ) ;
ltst = qib_6120_phys_portstate ( val ) ;
lst = qib_6120_iblink_state ( val ) ;
} else {
ltst = 0 ;
lst = 0 ;
spin_lock_irqsave ( & dd - > cspec - > gpio_lock , flags ) ;
/* start from the shadow with both LED bits cleared */
extctl = dd - > cspec - > extctrl & ~ ( SYM_MASK ( EXTCtrl , LEDPriPortGreenOn ) |
SYM_MASK ( EXTCtrl , LEDPriPortYellowOn ) ) ;
/*
 * NOTE(review): ltst is computed above but never tested in the visible
 * text, so the yellow bit looks unconditional here -- presumably a guard
 * on ltst is missing; confirm against the full source.
 */
extctl | = SYM_MASK ( EXTCtrl , LEDPriPortYellowOn ) ;
if ( lst = = IB_PORT_ACTIVE )
extctl | = SYM_MASK ( EXTCtrl , LEDPriPortGreenOn ) ;
dd - > cspec - > extctrl = extctl ;
qib_write_kreg ( dd , kr_extctrl , extctl ) ;
spin_unlock_irqrestore ( & dd - > cspec - > gpio_lock , flags ) ;
static void qib_6120_free_irq ( struct qib_devdata * dd )
if ( dd - > cspec - > irq ) {
free_irq ( dd - > cspec - > irq , dd ) ;
dd - > cspec - > irq = 0 ;
qib_nomsi ( dd ) ;
* qib_6120_setup_cleanup - clean up any per - chip chip - specific stuff
* @ dd : the qlogic_ib device
* This is called during driver unload .
static void qib_6120_setup_cleanup ( struct qib_devdata * dd )
qib_6120_free_irq ( dd ) ;
kfree ( dd - > cspec - > cntrs ) ;
kfree ( dd - > cspec - > portcntrs ) ;
if ( dd - > cspec - > dummy_hdrq ) {
dma_free_coherent ( & dd - > pcidev - > dev ,
ALIGN ( dd - > rcvhdrcnt *
dd - > rcvhdrentsize *
sizeof ( u32 ) , PAGE_SIZE ) ,
dd - > cspec - > dummy_hdrq ,
dd - > cspec - > dummy_hdrq_phys ) ;
dd - > cspec - > dummy_hdrq = NULL ;
/*
 * Enable or disable the "PIO buffer available" interrupt.
 *
 * @dd: the device
 * @needint: nonzero to set PIOIntBufAvail in SendCtrl, zero to clear it
 *
 * The sendctrl shadow and the chip register are updated together under
 * sendctrl_lock; the write is followed by a write to the scratch
 * register.
 */
static void qib_wantpiobuf_6120_intr(struct qib_devdata *dd, u32 needint)
{
	unsigned long flags;

	spin_lock_irqsave(&dd->sendctrl_lock, flags);
	/*
	 * The two updates are alternatives: without the "else" the bit
	 * would be cleared again right after being set and the interrupt
	 * could never be requested.
	 */
	if (needint)
		dd->sendctrl |= SYM_MASK(SendCtrl, PIOIntBufAvail);
	else
		dd->sendctrl &= ~SYM_MASK(SendCtrl, PIOIntBufAvail);
	qib_write_kreg(dd, kr_sendctrl, dd->sendctrl);
	qib_write_kreg(dd, kr_scratch, 0ULL);
	spin_unlock_irqrestore(&dd->sendctrl_lock, flags);
}
* handle errors and unusual events first , separate function
* to improve cache hits for fast path interrupt handling
static noinline void unlikely_6120_intr ( struct qib_devdata * dd , u64 istat )
if ( unlikely ( istat & ~ QLOGIC_IB_I_BITSEXTANT ) )
qib_dev_err ( dd , " interrupt with unknown interrupts %Lx set \n " ,
if ( istat & QLOGIC_IB_I_ERROR ) {
u64 estat = 0 ;
qib_stats . sps_errints + + ;
estat = qib_read_kreg64 ( dd , kr_errstatus ) ;
if ( ! estat )
qib_devinfo ( dd - > pcidev , " error interrupt (%Lx), "
" but no error bits set! \n " , istat ) ;
handle_6120_errors ( dd , estat ) ;
if ( istat & QLOGIC_IB_I_GPIO ) {
u32 gpiostatus ;
u32 to_clear = 0 ;
* GPIO_3 . .5 on IBA6120 Rev2 chips indicate
* errors that we need to count .
gpiostatus = qib_read_kreg32 ( dd , kr_gpio_status ) ;
/* First the error-counter case. */
if ( gpiostatus & GPIO_ERRINTR_MASK ) {
/* want to clear the bits we see asserted. */
to_clear | = ( gpiostatus & GPIO_ERRINTR_MASK ) ;
* Count appropriately , clear bits out of our copy ,
* as they have been " handled " .
if ( gpiostatus & ( 1 < < GPIO_RXUVL_BIT ) )
dd - > cspec - > rxfc_unsupvl_errs + + ;
if ( gpiostatus & ( 1 < < GPIO_OVRUN_BIT ) )
dd - > cspec - > overrun_thresh_errs + + ;
if ( gpiostatus & ( 1 < < GPIO_LLI_BIT ) )
dd - > cspec - > lli_errs + + ;
gpiostatus & = ~ GPIO_ERRINTR_MASK ;
if ( gpiostatus ) {
* Some unexpected bits remain . If they could have
* caused the interrupt , complain and clear .
* To avoid repetition of this condition , also clear
* the mask . It is almost certainly due to error .
const u32 mask = qib_read_kreg32 ( dd , kr_gpio_mask ) ;
* Also check that the chip reflects our shadow ,
* and report issues , If they caused the interrupt .
* we will suppress by refreshing from the shadow .
if ( mask & gpiostatus ) {
to_clear | = ( gpiostatus & mask ) ;
dd - > cspec - > gpio_mask & = ~ ( gpiostatus & mask ) ;
qib_write_kreg ( dd , kr_gpio_mask ,
dd - > cspec - > gpio_mask ) ;
if ( to_clear )
qib_write_kreg ( dd , kr_gpio_clear , ( u64 ) to_clear ) ;
/*
 * Interrupt handler for the 6120; registered with request_irq() by
 * qib_setup_6120_interrupt() with the qib_devdata as cookie.
 * Reads kr_intstatus, routes unusual bits to unlikely_6120_intr(),
 * acknowledges the bits via kr_intclear, runs qib_kreceive() for the
 * kernel contexts, forwards remaining context bits to qib_handle_urcv()
 * and finally handles PIO-buffer-available.
 */
static irqreturn_t qib_6120intr ( int irq , void * data )
struct qib_devdata * dd = data ;
irqreturn_t ret ;
u32 istat , ctxtrbits , rmask , crcs = 0 ;
unsigned i ;
if ( ( dd - > flags & ( QIB_PRESENT | QIB_BADINTR ) ) ! = QIB_PRESENT ) {
* This return value is not great , but we do not want the
* interrupt core code to remove our interrupt handler
* because we don ' t appear to be handling an interrupt
* during a chip reset .
/* NOTE(review): no assignment to ret is visible on this path before the goto -- confirm against the full source. */
goto bail ;
istat = qib_read_kreg32 ( dd , kr_intstatus ) ;
if ( unlikely ( ! istat ) ) {
ret = IRQ_NONE ; /* not our interrupt, or already handled */
goto bail ;
/* an all-ones status read is treated as a bad interrupt status */
if ( unlikely ( istat = = - 1 ) ) {
qib_bad_intrstatus ( dd ) ;
/* don't know if it was our interrupt or not */
ret = IRQ_NONE ;
goto bail ;
qib_stats . sps_ints + + ;
/* saturating counter: stop incrementing at (u32)-1 */
if ( dd - > int_counter ! = ( u32 ) - 1 )
dd - > int_counter + + ;
/* NOTE(review): the condition below is cut off after '|' in this copy of the file. */
if ( unlikely ( istat & ( ~ QLOGIC_IB_I_BITSEXTANT |
unlikely_6120_intr ( dd , istat ) ;
* Clear the interrupt bits we found set , relatively early , so we
* " know " know the chip will have seen this by the time we process
* the queue , and will re - interrupt if necessary . The processor
* itself won ' t take the interrupt again until we return .
qib_write_kreg ( dd , kr_intclear , istat ) ;
* Handle kernel receive queues before checking for pio buffers
* available since receives can overflow ; piobuf waiters can afford
* a few extra cycles , since they were waiting anyway .
/* NOTE(review): the masks applied to istat and the second half of rmask are truncated in this copy of the file. */
ctxtrbits = istat &
if ( ctxtrbits ) {
rmask = ( 1U < < QLOGIC_IB_I_RCVAVAIL_SHIFT ) |
/* walk the kernel contexts, shifting the per-context mask each step */
for ( i = 0 ; i < dd - > first_user_ctxt ; i + + ) {
if ( ctxtrbits & rmask ) {
ctxtrbits & = ~ rmask ;
crcs + = qib_kreceive ( dd - > rcd [ i ] ,
& dd - > cspec - > lli_counter ,
NULL ) ;
rmask < < = 1 ;
if ( crcs ) {
u32 cntr = dd - > cspec - > lli_counter ;
cntr + = crcs ;
if ( cntr ) {
if ( cntr > dd - > cspec - > lli_thresh ) {
dd - > cspec - > lli_counter = 0 ;
dd - > cspec - > lli_errs + + ;
} else
/*
 * NOTE(review): cntr already contains the old lli_counter plus crcs, so
 * adding it to lli_counter counts the old value twice -- confirm
 * whether a plain assignment was intended.
 */
dd - > cspec - > lli_counter + = cntr ;
/* whatever context bits are left belong to user contexts */
if ( ctxtrbits ) {
ctxtrbits =
( ctxtrbits > > QLOGIC_IB_I_RCVAVAIL_SHIFT ) |
( ctxtrbits > > QLOGIC_IB_I_RCVURG_SHIFT ) ;
qib_handle_urcv ( dd , ctxtrbits ) ;
if ( ( istat & QLOGIC_IB_I_SPIOBUFAVAIL ) & & ( dd - > flags & QIB_INITTED ) )
qib_ib_piobufavail ( dd ) ;
/* NOTE(review): no assignment to ret is visible on the normal completion path either -- confirm. */
bail :
return ret ;
* Set up our chip - specific interrupt handler
* The interrupt type has already been setup , so
* we just need to do the registration and error checking .
static void qib_setup_6120_interrupt ( struct qib_devdata * dd )
* If the chip supports added error indication via GPIO pins ,
* enable interrupts on those bits so the interrupt routine
* can count the events . Also set flag so interrupt routine
* can know they are expected .
if ( SYM_FIELD ( dd - > revision , Revision_R ,
ChipRevMinor ) > 1 ) {
/* Rev2+ reports extra errors via internal GPIO pins */
dd - > cspec - > gpio_mask | = GPIO_ERRINTR_MASK ;
qib_write_kreg ( dd , kr_gpio_mask , dd - > cspec - > gpio_mask ) ;
if ( ! dd - > cspec - > irq )
qib_dev_err ( dd , " irq is 0, BIOS error? Interrupts won't "
" work \n " ) ;
else {
int ret ;
ret = request_irq ( dd - > cspec - > irq , qib_6120intr , 0 ,
QIB_DRV_NAME , dd ) ;
if ( ret )
qib_dev_err ( dd , " Couldn't setup interrupt "
" (irq=%d): %d \n " , dd - > cspec - > irq ,
ret ) ;
* pe_boardname - fill in the board name
* @ dd : the qlogic_ib device
* info is based on the board revision register
static void pe_boardname ( struct qib_devdata * dd )
char * n ;
u32 boardid , namelen ;
boardid = SYM_FIELD ( dd - > revision , Revision ,
BoardID ) ;
switch ( boardid ) {
case 2 :
n = " InfiniPath_QLE7140 " ;
break ;
default :
qib_dev_err ( dd , " Unknown 6120 board with ID %u \n " , boardid ) ;
n = " Unknown_InfiniPath_6120 " ;
break ;
namelen = strlen ( n ) + 1 ;
dd - > boardname = kmalloc ( namelen , GFP_KERNEL ) ;
if ( ! dd - > boardname )
qib_dev_err ( dd , " Failed allocation for board name: %s \n " , n ) ;
snprintf ( dd - > boardname , namelen , " %s " , n ) ;
if ( dd - > majrev ! = 4 | | ! dd - > minrev | | dd - > minrev > 2 )
qib_dev_err ( dd , " Unsupported InfiniPath hardware revision "
" %u.%u! \n " , dd - > majrev , dd - > minrev ) ;
snprintf ( dd - > boardversion , sizeof ( dd - > boardversion ) ,
" ChipABI %u.%u, %s, InfiniPath%u %u.%u, SW Compat %u \n " ,
QIB_CHIP_VERS_MAJ , QIB_CHIP_VERS_MIN , dd - > boardname ,
( unsigned ) SYM_FIELD ( dd - > revision , Revision_R , Arch ) ,
dd - > majrev , dd - > minrev ,
( unsigned ) SYM_FIELD ( dd - > revision , Revision_R , SW ) ) ;
* This routine sleeps , so it can only be called from user context , not
* from interrupt context . If we need interrupt context , we can split
* it into two routines .
/*
 * Reset the chip and wait for it to come back.
 * Saves PCIe command state, disables interrupts, clears QIB_INITTED and
 * QIB_PRESENT, writes the reset bit to kr_control and then polls
 * kr_revision up to five times with growing sleeps.  When the revision
 * register reads back as dd->revision the device is marked present and
 * the result of qib_reinit_intr() becomes the return value; otherwise 0
 * is returned.  A nonzero result triggers PCIe and error-mask re-setup.
 */
static int qib_6120_setup_reset ( struct qib_devdata * dd )
u64 val ;
int i ;
int ret ;
u16 cmdval ;
u8 int_line , clinesz ;
/* remember PCIe settings so they can be re-applied after the reset */
qib_pcie_getcmd ( dd , & cmdval , & int_line , & clinesz ) ;
/* Use ERROR so it shows up in logs, etc. */
qib_dev_err ( dd , " Resetting InfiniPath unit %u \n " , dd - > unit ) ;
/* no interrupts till re-initted */
qib_6120_set_intr_state ( dd , 0 ) ;
/* forget any counter deltas/snapshots taken before the reset */
dd - > cspec - > ibdeltainprog = 0 ;
dd - > cspec - > ibsymdelta = 0 ;
dd - > cspec - > iblnkerrdelta = 0 ;
* Keep chip from being accessed until we are ready . Use
* writeq ( ) directly , to allow the write even though QIB_PRESENT
* isnt ' set .
dd - > flags & = ~ ( QIB_INITTED | QIB_PRESENT ) ;
dd - > int_counter = 0 ; /* so we check interrupts work again */
val = dd - > control | QLOGIC_IB_C_RESET ;
writeq ( val , & dd - > kregbase [ kr_control ] ) ;
mb ( ) ; /* prevent compiler re-ordering around actual reset */
for ( i = 1 ; i < = 5 ; i + + ) {
* Allow MBIST , etc . to complete ; longer on each retry .
* We sometimes get machine checks from bus timeout if no
* response , so for now , make it * really * long .
msleep ( 1000 + ( 1 + i ) * 2000 ) ;
qib_pcie_reenable ( dd , cmdval , int_line , clinesz ) ;
* Use readq directly , so we don ' t need to mark it as PRESENT
* until we get a successful indication that all is well .
val = readq ( & dd - > kregbase [ kr_revision ] ) ;
if ( val = = dd - > revision ) {
dd - > flags | = QIB_PRESENT ; /* it's back */
ret = qib_reinit_intr ( dd ) ;
goto bail ;
ret = 0 ; /* failed */
bail :
/* NOTE(review): nonzero ret is treated as success here, so qib_reinit_intr() presumably returns nonzero when it succeeds -- confirm. */
if ( ret ) {
if ( qib_pcie_params ( dd , dd - > lbus_width , NULL , NULL ) )
qib_dev_err ( dd , " Reset failed to setup PCIe or "
" interrupts; continuing anyway \n " ) ;
/* clear the reset error, init error/hwerror mask */
qib_6120_init_hwerrors ( dd ) ;
/* for Rev2 error interrupts; nop for rev 1 */
qib_write_kreg ( dd , kr_gpio_mask , dd - > cspec - > gpio_mask ) ;
/*
 * NOTE(review): qib_6120_init_hwerrors() is called a second time here
 * with the same comment as above; it looks redundant -- confirm whether
 * the repeat is intentional before removing it.
 */
/* clear the reset error, init error/hwerror mask */
qib_6120_init_hwerrors ( dd ) ;
return ret ;
* qib_6120_put_tid - write a TID in chip
* @ dd : the qlogic_ib device
* @ tidptr : pointer to the expected TID ( in chip ) to update
* @ tidtype : RCVHQ_RCV_TYPE_EAGER ( 1 ) for eager , RCVHQ_RCV_TYPE_EXPECTED ( 0 )
* for expected
* @ pa : physical address of in memory buffer ; tidinvalid if freeing
* This exists as a separate routine to allow for special locking etc .
* It ' s used for both the full cleanup on exit , as well as the normal
* setup and teardown .
static void qib_6120_put_tid ( struct qib_devdata * dd , u64 __iomem * tidptr ,
u32 type , unsigned long pa )
u32 __iomem * tidp32 = ( u32 __iomem * ) tidptr ;
unsigned long flags ;
int tidx ;
spinlock_t * tidlockp ; /* select appropriate spinlock */
if ( ! dd - > kregbase )
return ;
if ( pa ! = dd - > tidinvalid ) {
if ( pa & ( ( 1U < < 11 ) - 1 ) ) {
qib_dev_err ( dd , " Physaddr %lx not 2KB aligned! \n " ,
pa ) ;
return ;
pa > > = 11 ;
if ( pa & ~ QLOGIC_IB_RT_ADDR_MASK ) {
qib_dev_err ( dd , " Physical page address 0x%lx "
" larger than supported \n " , pa ) ;
return ;
if ( type = = RCVHQ_RCV_TYPE_EAGER )
pa | = dd - > tidtemplate ;
else /* for now, always full 4KB page */
pa | = 2 < < 29 ;
* Avoid chip issue by writing the scratch register
* before and after the TID , and with an io write barrier .
* We use a spinlock around the writes , so they can ' t intermix
* with other TID ( eager or expected ) writes ( the chip problem
* is triggered by back to back TID writes ) . Unfortunately , this
* call can be done from interrupt level for the ctxt 0 eager TIDs ,
* so we have to use irqsave locks .
* Assumes tidptr always > egrtidbase
* if type = = RCVHQ_RCV_TYPE_EAGER .
tidx = tidptr - dd - > egrtidbase ;
tidlockp = ( type = = RCVHQ_RCV_TYPE_EAGER & & tidx < dd - > rcvhdrcnt )
? & dd - > cspec - > kernel_tid_lock : & dd - > cspec - > user_tid_lock ;
spin_lock_irqsave ( tidlockp , flags ) ;
qib_write_kreg ( dd , kr_scratch , 0xfeeddeaf ) ;
writel ( pa , tidp32 ) ;
qib_write_kreg ( dd , kr_scratch , 0xdeadbeef ) ;
mmiowb ( ) ;
spin_unlock_irqrestore ( tidlockp , flags ) ;
* qib_6120_put_tid_2 - write a TID in chip , Revision 2 or higher
* @ dd : the qlogic_ib device
* @ tidptr : pointer to the expected TID ( in chip ) to update
* @ tidtype : RCVHQ_RCV_TYPE_EAGER ( 1 ) for eager , RCVHQ_RCV_TYPE_EXPECTED ( 0 )
* for expected
* @ pa : physical address of in memory buffer ; tidinvalid if freeing
* This exists as a separate routine to allow for selection of the
* appropriate " flavor " . The static calls in cleanup just use the
* revision - agnostic form , as they are not performance critical .
static void qib_6120_put_tid_2 ( struct qib_devdata * dd , u64 __iomem * tidptr ,
u32 type , unsigned long pa )
u32 __iomem * tidp32 = ( u32 __iomem * ) tidptr ;
u32 tidx ;
if ( ! dd - > kregbase )
return ;
if ( pa ! = dd - > tidinvalid ) {
if ( pa & ( ( 1U < < 11 ) - 1 ) ) {
qib_dev_err ( dd , " Physaddr %lx not 2KB aligned! \n " ,
pa ) ;
return ;
pa > > = 11 ;
if ( pa & ~ QLOGIC_IB_RT_ADDR_MASK ) {
qib_dev_err ( dd , " Physical page address 0x%lx "
" larger than supported \n " , pa ) ;
return ;
if ( type = = RCVHQ_RCV_TYPE_EAGER )
pa | = dd - > tidtemplate ;
else /* for now, always full 4KB page */
pa | = 2 < < 29 ;
tidx = tidptr - dd - > egrtidbase ;
writel ( pa , tidp32 ) ;
mmiowb ( ) ;
* qib_6120_clear_tids - clear all TID entries for a context , expected and eager
* @ dd : the qlogic_ib device
* @ ctxt : the context
* clear all TID entries for a context , expected and eager .
* Used from qib_close ( ) . On this chip , TIDs are only 32 bits ,
* not 64 , but they are still on 64 bit boundaries , so tidbase
* is declared as u64 * for the pointer math , even though we write 32 bits
static void qib_6120_clear_tids ( struct qib_devdata * dd ,
struct qib_ctxtdata * rcd )
u64 __iomem * tidbase ;
unsigned long tidinv ;
u32 ctxt ;
int i ;
if ( ! dd - > kregbase | | ! rcd )
return ;
ctxt = rcd - > ctxt ;
tidinv = dd - > tidinvalid ;
tidbase = ( u64 __iomem * )
( ( char __iomem * ) ( dd - > kregbase ) +
dd - > rcvtidbase +
ctxt * dd - > rcvtidcnt * sizeof ( * tidbase ) ) ;
for ( i = 0 ; i < dd - > rcvtidcnt ; i + + )
/* use func pointer because could be one of two funcs */
dd - > f_put_tid ( dd , & tidbase [ i ] , RCVHQ_RCV_TYPE_EXPECTED ,
tidinv ) ;
tidbase = ( u64 __iomem * )
( ( char __iomem * ) ( dd - > kregbase ) +
dd - > rcvegrbase +
rcd - > rcvegr_tid_base * sizeof ( * tidbase ) ) ;
for ( i = 0 ; i < rcd - > rcvegrcnt ; i + + )
/* use func pointer because could be one of two funcs */
dd - > f_put_tid ( dd , & tidbase [ i ] , RCVHQ_RCV_TYPE_EAGER ,
tidinv ) ;
* qib_6120_tidtemplate - setup constants for TID updates
* @ dd : the qlogic_ib device
* We setup stuff that we use a lot , to avoid calculating each time
static void qib_6120_tidtemplate ( struct qib_devdata * dd )
u32 egrsize = dd - > rcvegrbufsize ;
* For now , we always allocate 4 KB buffers ( at init ) so we can
* receive max size packets . We may want a module parameter to
* specify 2 KB or 4 KB and / or make be per ctxt instead of per device
* for those who want to reduce memory footprint . Note that the
* rcvhdrentsize size must be large enough to hold the largest
* IB header ( currently 96 bytes ) that we expect to handle ( plus of
* course the 2 dwords of RHF ) .
if ( egrsize = = 2048 )
dd - > tidtemplate = 1U < < 29 ;
else if ( egrsize = = 4096 )
dd - > tidtemplate = 2U < < 29 ;
dd - > tidinvalid = 0 ;
/*
 * Weak default that returns 0.  Being weak, another definition of
 * qib_unordered_wc() elsewhere in the build replaces this one.
 */
int __attribute__((weak)) qib_unordered_wc(void)
{
	return 0;
}
* qib_6120_get_base_info - set chip - specific flags for user code
* @ rcd : the qlogic_ib ctxt
* @ kbase : qib_base_info pointer
* We set the PCIE flag because the lower bandwidth on PCIe vs
* HyperTransport can affect some user packet algorithms .
/*
 * Add the chip-specific runtime flags to kinfo->spi_runtime_flags:
 * QIB_RUNTIME_FORCE_WC_ORDER when qib_unordered_wc() returns nonzero, and
 * QIB_RUNTIME_PCIE always.  rcd is not used in the visible text.
 * Always returns 0.
 */
static int qib_6120_get_base_info ( struct qib_ctxtdata * rcd ,
struct qib_base_info * kinfo )
if ( qib_unordered_wc ( ) )
kinfo - > spi_runtime_flags | = QIB_RUNTIME_FORCE_WC_ORDER ;
/* NOTE(review): the flag expression below ends on a dangling '|'; the remaining flag(s) are missing from this copy of the file. */
kinfo - > spi_runtime_flags | = QIB_RUNTIME_PCIE |
return 0 ;
/*
 * Return the message header that follows the receive header flags:
 * it starts sizeof(u64) bytes (two 32-bit words) past @rhf_addr.
 * @dd is not used.
 */
static struct qib_message_header *
qib_6120_get_msgheader(struct qib_devdata *dd, __le32 *rhf_addr)
{
	__le32 *hdr = rhf_addr + sizeof(u64) / sizeof(u32);

	return (struct qib_message_header *)hdr;
}
static void qib_6120_config_ctxts ( struct qib_devdata * dd )
dd - > ctxtcnt = qib_read_kreg32 ( dd , kr_portcnt ) ;
if ( qib_n_krcv_queues > 1 ) {
dd - > first_user_ctxt = qib_n_krcv_queues * dd - > num_pports ;
if ( dd - > first_user_ctxt > dd - > ctxtcnt )
dd - > first_user_ctxt = dd - > ctxtcnt ;
dd - > qpn_mask = dd - > first_user_ctxt < = 2 ? 2 : 6 ;
} else
dd - > first_user_ctxt = dd - > num_pports ;
dd - > n_krcv_queues = dd - > first_user_ctxt ;
/*
 * Publish a new receive header queue head for @rcd's context and, when
 * @updegr is nonzero, a new eager index head (@egrhd) as well.
 * @npkts is part of the shared interface but is not used by this chip.
 *
 * The stray revision timestamps that had been pasted into the middle of
 * the parameter list have been removed.
 */
static void qib_update_6120_usrhead(struct qib_ctxtdata *rcd, u64 hd,
				    u32 updegr, u32 egrhd, u32 npkts)
{
	qib_write_ureg(rcd->dd, ur_rcvhdrhead, hd, rcd->ctxt);
	if (updegr)
		qib_write_ureg(rcd->dd, ur_rcvegrindexhead, egrhd, rcd->ctxt);
}
static u32 qib_6120_hdrqempty ( struct qib_ctxtdata * rcd )
u32 head , tail ;
head = qib_read_ureg32 ( rcd - > dd , ur_rcvhdrhead , rcd - > ctxt ) ;
if ( rcd - > rcvhdrtail_kvaddr )
tail = qib_get_rcvhdrtail ( rcd ) ;
tail = qib_read_ureg32 ( rcd - > dd , ur_rcvhdrtail , rcd - > ctxt ) ;
return head = = tail ;
/*
 * alloc_dummy_hdrq() obtains one DMA-coherent buffer sized like context
 * 0's receive header queue (dd->rcd[0]->rcvhdrq_size) and records it in
 * dd->cspec->dummy_hdrq, with its bus address in dummy_hdrq_phys.  If the
 * allocation fails it logs a message and leaves dummy_hdrq_phys at 0.
 *
 * NOTE(review): the last argument of dma_alloc_coherent() (the gfp flags)
 * and the closing braces are missing from this copy.  The only visible
 * caller, rcvctrl_6120_mod(), calls this with rcvmod_lock held and
 * interrupts disabled, so the flags must not permit sleeping; confirm
 * against the authoritative source.
 */
* Used when we close any ctxt , for DMA already in flight
* at close . Can ' t be done until we know hdrq size , so not
* early in chip init .
static void alloc_dummy_hdrq ( struct qib_devdata * dd )
dd - > cspec - > dummy_hdrq = dma_alloc_coherent ( & dd - > pcidev - > dev ,
dd - > rcd [ 0 ] - > rcvhdrq_size ,
& dd - > cspec - > dummy_hdrq_phys ,
if ( ! dd - > cspec - > dummy_hdrq ) {
qib_devinfo ( dd - > pcidev , " Couldn't allocate dummy hdrq \n " ) ;
/* fallback to just 0'ing */
dd - > cspec - > dummy_hdrq_phys = 0UL ;
/*
 * rcvctrl_6120_mod() edits the shadow dd->rcvctrl and writes it to
 * kr_rcvctrl, all under dd->cspec->rcvmod_lock with interrupts disabled.
 * @op is a bit-mask of QIB_RCVCTRL_* requests; @ctxt selects one context,
 * or every context when negative.
 *
 * NOTE(review): this copy has lost braces, lone "else" lines and several
 * "if (op & ...)" guards.  As written, each set/clear pair below would
 * cancel out, so do not build from this text; restore the guards from
 * the authoritative source.
 */
* Modify the RCVCTRL register in chip - specific way . This
* is a function because bit positions and ( future ) register
* location is chip - specific , but the needed operations are
* generic . < op > is a bit - mask because we often want to
* do multiple modifications .
static void rcvctrl_6120_mod ( struct qib_pportdata * ppd , unsigned int op ,
int ctxt )
struct qib_devdata * dd = ppd - > dd ;
u64 mask , val ;
unsigned long flags ;
spin_lock_irqsave ( & dd - > cspec - > rcvmod_lock , flags ) ;
/* NOTE(review): tail-update enable/disable; the two op guards are missing. */
dd - > rcvctrl | = ( 1ULL < < QLOGIC_IB_R_TAILUPD_SHIFT ) ;
dd - > rcvctrl & = ~ ( 1ULL < < QLOGIC_IB_R_TAILUPD_SHIFT ) ;
/* NOTE(review): PKEY_DIS bit clear/set; the two op guards are missing. */
dd - > rcvctrl & = ~ ( 1ULL < < IBA6120_R_PKEY_DIS_SHIFT ) ;
dd - > rcvctrl | = ( 1ULL < < IBA6120_R_PKEY_DIS_SHIFT ) ;
/* Negative ctxt: mask covers all ctxtcnt contexts (an "else" is missing below). */
if ( ctxt < 0 )
mask = ( 1ULL < < dd - > ctxtcnt ) - 1 ;
mask = ( 1ULL < < ctxt ) ;
if ( op & QIB_RCVCTRL_CTXT_ENB ) {
/* always done for specific ctxt */
dd - > rcvctrl | = ( mask < < SYM_LSB ( RcvCtrl , PortEnable ) ) ;
/* Tail updates are turned on unless the device runs with QIB_NODMA_RTAIL. */
if ( ! ( dd - > flags & QIB_NODMA_RTAIL ) )
dd - > rcvctrl | = 1ULL < < QLOGIC_IB_R_TAILUPD_SHIFT ;
/* Write these registers before the context is enabled. */
qib_write_kreg_ctxt ( dd , kr_rcvhdrtailaddr , ctxt ,
dd - > rcd [ ctxt ] - > rcvhdrqtailaddr_phys ) ;
qib_write_kreg_ctxt ( dd , kr_rcvhdraddr , ctxt ,
dd - > rcd [ ctxt ] - > rcvhdrq_phys ) ;
/* The dummy header queue is allocated lazily, the first time context 0 is enabled. */
if ( ctxt = = 0 & & ! dd - > cspec - > dummy_hdrq )
alloc_dummy_hdrq ( dd ) ;
/* NOTE(review): presumably the context-disable and interrupt-available
 * enable/disable cases; their op guards are missing. */
dd - > rcvctrl & = ~ ( mask < < SYM_LSB ( RcvCtrl , PortEnable ) ) ;
dd - > rcvctrl | = ( mask < < QLOGIC_IB_R_INTRAVAIL_SHIFT ) ;
dd - > rcvctrl & = ~ ( mask < < QLOGIC_IB_R_INTRAVAIL_SHIFT ) ;
/* Push the updated shadow to the chip. */
qib_write_kreg ( dd , kr_rcvctrl , dd - > rcvctrl ) ;
if ( ( op & QIB_RCVCTRL_INTRAVAIL_ENB ) & & dd - > rhdrhead_intr_off ) {
/* arm rcv interrupt */
val = qib_read_ureg32 ( dd , ur_rcvhdrhead , ctxt ) |
dd - > rhdrhead_intr_off ;
qib_write_ureg ( dd , ur_rcvhdrhead , val , ctxt ) ;
if ( op & QIB_RCVCTRL_CTXT_ENB ) {
* Init the context registers also ; if we were
* disabled , tail and head should both be zero
* already from the enable , but since we don ' t
* know , we have to do it explictly .
/* Heads are set to the current tails, so the queues start out empty. */
val = qib_read_ureg32 ( dd , ur_rcvegrindextail , ctxt ) ;
qib_write_ureg ( dd , ur_rcvegrindexhead , val , ctxt ) ;
val = qib_read_ureg32 ( dd , ur_rcvhdrtail , ctxt ) ;
dd - > rcd [ ctxt ] - > head = val ;
/* If kctxt, interrupt on next receive. */
if ( ctxt < dd - > first_user_ctxt )
val | = dd - > rhdrhead_intr_off ;
qib_write_ureg ( dd , ur_rcvhdrhead , val , ctxt ) ;
if ( op & QIB_RCVCTRL_CTXT_DIS ) {
* Be paranoid , and never write 0 ' s to these , just use an
* unused page . Of course ,
* rcvhdraddr points to a large chunk of memory , so this
* could still trash things , but at least it won ' t trash
* page 0 , and by disabling the ctxt , it should stop " soon " ,
* even if a packet or two is in already in flight after we
* disabled the ctxt . Only 6120 has this issue .
/* One context, or all cfgctxts contexts, are pointed at the dummy queue. */
if ( ctxt > = 0 ) {
qib_write_kreg_ctxt ( dd , kr_rcvhdrtailaddr , ctxt ,
dd - > cspec - > dummy_hdrq_phys ) ;
qib_write_kreg_ctxt ( dd , kr_rcvhdraddr , ctxt ,
dd - > cspec - > dummy_hdrq_phys ) ;
} else {
unsigned i ;
for ( i = 0 ; i < dd - > cfgctxts ; i + + ) {
qib_write_kreg_ctxt ( dd , kr_rcvhdrtailaddr ,
i , dd - > cspec - > dummy_hdrq_phys ) ;
qib_write_kreg_ctxt ( dd , kr_rcvhdraddr ,
i , dd - > cspec - > dummy_hdrq_phys ) ;
spin_unlock_irqrestore ( & dd - > cspec - > rcvmod_lock , flags ) ;
/*
 * sendctrl_6120_mod() updates the shadow dd->sendctrl and the chip's
 * kr_sendctrl register under dd->sendctrl_lock.  Every sendctrl write is
 * followed by a write to kr_scratch, per the "no back-back sendctrl
 * writes" rule stated below.  @op is a bit-mask of QIB_SENDCTRL_* requests.
 *
 * NOTE(review): this copy has lost braces, lone "else" lines and several
 * "if (op & ...)" guards: the statements before each visible "else if",
 * the disarm-all loop, the abort/disarm section and the final restore.
 * Do not build from this text.
 */
* Modify the SENDCTRL register in chip - specific way . This
* is a function there may be multiple such registers with
* slightly different layouts . Only operations actually used
* are implemented yet .
* Chip requires no back - back sendctrl writes , so write
* scratch register after writing sendctrl
static void sendctrl_6120_mod ( struct qib_pportdata * ppd , u32 op )
struct qib_devdata * dd = ppd - > dd ;
u64 tmp_dd_sendctrl ;
unsigned long flags ;
spin_lock_irqsave ( & dd - > sendctrl_lock , flags ) ;
/* First the ones that are "sticky", saved in shadow */
/* NOTE(review): the guard for this clear-everything assignment is missing. */
dd - > sendctrl = 0 ;
/* NOTE(review): the "if" that this PIOEnable clear pairs with is missing. */
dd - > sendctrl & = ~ SYM_MASK ( SendCtrl , PIOEnable ) ;
else if ( op & QIB_SENDCTRL_SEND_ENB )
dd - > sendctrl | = SYM_MASK ( SendCtrl , PIOEnable ) ;
/* NOTE(review): the "if" that this PIOBufAvailUpd clear pairs with is missing. */
dd - > sendctrl & = ~ SYM_MASK ( SendCtrl , PIOBufAvailUpd ) ;
else if ( op & QIB_SENDCTRL_AVAIL_ENB )
dd - > sendctrl | = SYM_MASK ( SendCtrl , PIOBufAvailUpd ) ;
/* NOTE(review): the guard opening this disarm-every-buffer section is missing. */
u32 i , last ;
tmp_dd_sendctrl = dd - > sendctrl ;
* disarm any that are not yet launched , disabling sends
* and updates until done .
last = dd - > piobcnt2k + dd - > piobcnt4k ;
tmp_dd_sendctrl & =
~ ( SYM_MASK ( SendCtrl , PIOEnable ) |
SYM_MASK ( SendCtrl , PIOBufAvailUpd ) ) ;
/* One Disarm write per PIO buffer (2k and 4k), each followed by a scratch write. */
for ( i = 0 ; i < last ; i + + ) {
qib_write_kreg ( dd , kr_sendctrl , tmp_dd_sendctrl |
SYM_MASK ( SendCtrl , Disarm ) | i ) ;
qib_write_kreg ( dd , kr_scratch , 0 ) ;
/* NOTE(review): the guards selecting Abort, single-buffer Disarm and the
 * temporary PIOBufAvailUpd clear are missing below. */
tmp_dd_sendctrl = dd - > sendctrl ;
tmp_dd_sendctrl | = SYM_MASK ( SendCtrl , Abort ) ;
tmp_dd_sendctrl | = SYM_MASK ( SendCtrl , Disarm ) |
( ( op & QIB_6120_SendCtrl_DisarmPIOBuf_RMASK ) < <
SYM_LSB ( SendCtrl , DisarmPIOBuf ) ) ;
tmp_dd_sendctrl & = ~ SYM_MASK ( SendCtrl , PIOBufAvailUpd ) ;
qib_write_kreg ( dd , kr_sendctrl , tmp_dd_sendctrl ) ;
qib_write_kreg ( dd , kr_scratch , 0 ) ;
/* Write the unmodified shadow value back to the chip. */
qib_write_kreg ( dd , kr_sendctrl , dd - > sendctrl ) ;
qib_write_kreg ( dd , kr_scratch , 0 ) ;
spin_unlock_irqrestore ( & dd - > sendctrl_lock , flags ) ;
/* The flush runs after the lock is dropped. */
if ( op & QIB_SENDCTRL_FLUSH ) {
u32 v ;
* ensure writes have hit chip , then do a few
* more reads , to allow DMA of pioavail registers
* to occur , so in - memory copy is in sync with
* the chip . Not always safe to sleep .
v = qib_read_kreg32 ( dd , kr_scratch ) ;
qib_write_kreg ( dd , kr_scratch , v ) ;
v = qib_read_kreg32 ( dd , kr_scratch ) ;
qib_write_kreg ( dd , kr_scratch , v ) ;
qib_read_kreg32 ( dd , kr_scratch ) ;
/*
 * qib_portcntr_6120() maps a QIBPORTCNTR_* selector (@reg) to a chip
 * counter register through the xlator table and returns its value, or
 * returns a software-maintained value for selectors the chip does not
 * implement (marked 0xffff in the table).  Returns 0 for a selector
 * beyond the end of the table.
 *
 * NOTE(review): the header below documents "@dd" and "@creg", but the
 * parameters are ppd and reg.  This copy has also lost braces, lone
 * "else" lines, at least one "else if" guard and, apparently, some
 * xlator entries (e.g. nothing maps QIBPORTCNTR_KHDROVFL or
 * QIBPORTCNTR_PSSTAT, which are tested below).
 */
* qib_portcntr_6120 - read a per - port counter
* @ dd : the qlogic_ib device
* @ creg : the counter to snapshot
static u64 qib_portcntr_6120 ( struct qib_pportdata * ppd , u32 reg )
u64 ret = 0ULL ;
struct qib_devdata * dd = ppd - > dd ;
u16 creg ;
/* 0xffff for unimplemented or synthesized counters */
static const u16 xlator [ ] = {
[ QIBPORTCNTR_PKTSEND ] = cr_pktsend ,
[ QIBPORTCNTR_WORDSEND ] = cr_wordsend ,
[ QIBPORTCNTR_SENDSTALL ] = cr_sendstall ,
[ QIBPORTCNTR_PKTRCV ] = cr_pktrcv ,
[ QIBPORTCNTR_RCVEBP ] = cr_rcvebp ,
[ QIBPORTCNTR_RCVOVFL ] = cr_rcvovfl ,
[ QIBPORTCNTR_WORDRCV ] = cr_wordrcv ,
[ QIBPORTCNTR_RXDROPPKT ] = cr_rxdroppkt ,
[ QIBPORTCNTR_ERRICRC ] = cr_erricrc ,
[ QIBPORTCNTR_ERRVCRC ] = cr_errvcrc ,
[ QIBPORTCNTR_ERRLPCRC ] = cr_errlpcrc ,
[ QIBPORTCNTR_BADFORMAT ] = cr_badformat ,
[ QIBPORTCNTR_ERR_RLEN ] = cr_err_rlen ,
[ QIBPORTCNTR_IBSYMBOLERR ] = cr_ibsymbolerr ,
[ QIBPORTCNTR_INVALIDRLEN ] = cr_invalidrlen ,
[ QIBPORTCNTR_UNSUPVL ] = cr_txunsupvl ,
[ QIBPORTCNTR_ERRLINK ] = cr_errlink ,
[ QIBPORTCNTR_IBLINKDOWN ] = cr_iblinkdown ,
[ QIBPORTCNTR_IBLINKERRRECOV ] = cr_iblinkerrrecov ,
[ QIBPORTCNTR_LLI ] = 0xffff ,
[ QIBPORTCNTR_ERRPKEY ] = cr_errpkey ,
} ;
/* Selectors past the table are reported and read as 0. */
if ( reg > = ARRAY_SIZE ( xlator ) ) {
qib_devinfo ( ppd - > dd - > pcidev ,
" Unimplemented portcounter %u \n " , reg ) ;
goto done ;
creg = xlator [ reg ] ;
/* handle counters requests not implemented as chip counters */
if ( reg = = QIBPORTCNTR_LLI )
ret = dd - > cspec - > lli_errs ;
/* NOTE(review): an "else if" guard for the next assignment is missing. */
ret = dd - > cspec - > overrun_thresh_errs ;
else if ( reg = = QIBPORTCNTR_KHDROVFL ) {
int i ;
/* sum over all kernel contexts */
for ( i = 0 ; i < dd - > first_user_ctxt ; i + + )
ret + = read_6120_creg32 ( dd , cr_portovfl + i ) ;
} else if ( reg = = QIBPORTCNTR_PSSTAT )
ret = dd - > cspec - > pma_sample_status ;
/* Synthesized counters are complete at this point. */
if ( creg = = 0xffff )
goto done ;
* only fast incrementing counters are 64 bit ; use 32 bit reads to
* avoid two independent reads when on opteron
if ( creg = = cr_wordsend | | creg = = cr_wordrcv | |
creg = = cr_pktsend | | creg = = cr_pktrcv )
ret = read_6120_creg ( dd , creg ) ;
/* NOTE(review): an "else" is missing before the 32-bit read below. */
ret = read_6120_creg32 ( dd , creg ) ;
/*
 * Symbol-error and link-error-recovery counts are adjusted: while
 * ibdeltainprog is set the result is pinned to the saved snapshot, and
 * the accumulated delta is always subtracted.
 */
if ( creg = = cr_ibsymbolerr ) {
if ( dd - > cspec - > ibdeltainprog )
ret - = ret - dd - > cspec - > ibsymsnap ;
ret - = dd - > cspec - > ibsymdelta ;
} else if ( creg = = cr_iblinkerrrecov ) {
if ( dd - > cspec - > ibdeltainprog )
ret - = ret - dd - > cspec - > iblnkerrsnap ;
ret - = dd - > cspec - > iblnkerrdelta ;
if ( reg = = QIBPORTCNTR_RXDROPPKT ) /* add special cased count */
ret + = dd - > cspec - > rxfc_unsupvl_errs ;
done :
return ret ;
/*
 * Device counter names (not port-specific), one line per stat,
 * single string.  Used by utilities like ipathstats to print the stats
 * in a way which works for different versions of drivers, without changing
 * the utility.  Names need to be 12 chars or less (w/o newline), for proper
 * display by utility.
 * Non-error counters are first.
 * Start of "error" counters is indicated by a leading "E " on the first
 * "error" counter, and doesn't count in label length.
 * The EgrOvfl list needs to be last so we truncate them at the configured
 * context count for the device.
 * cntr6120indices contains the corresponding register indices.
 *
 * Each literal is exactly "<name>\n" with no padding: the 12-character
 * limit and the "Ctxt0EgrOvfl" match in init_6120_cntrnames() both depend
 * on the text immediately following the previous newline.
 */
static const char cntr6120names[] =
	"Interrupts\n"
	"HostBusStall\n"
	"E RxTIDFull\n"
	"RxTIDInvalid\n"
	"Ctxt0EgrOvfl\n"
	"Ctxt1EgrOvfl\n"
	"Ctxt2EgrOvfl\n"
	"Ctxt3EgrOvfl\n"
	"Ctxt4EgrOvfl\n";
/*
 * Chip counter register indices for the device counters, in the same
 * order as the names in cntr6120names; qib_read_6120cntrs() reads entry i
 * with read_6120_creg32().  The last five entries are cr_portovfl plus a
 * small offset (0..4), matching the Ctxt0..Ctxt4 EgrOvfl names.
 */
static const size_t cntr6120indices [ ] = {
cr_lbint ,
cr_lbflowstall ,
cr_errtidfull ,
cr_errtidvalid ,
cr_portovfl + 0 ,
cr_portovfl + 1 ,
cr_portovfl + 2 ,
cr_portovfl + 3 ,
cr_portovfl + 4 ,
} ;
/*
 * Same as cntr6120names and cntr6120indices, but for port-specific counters.
 * portcntr6120indices is somewhat complicated by some registers needing
 * adjustments of various kinds, and those are ORed with _PORT_VIRT_FLAG.
 *
 * One "<name>\n" per counter with no padding; the leading "E " marks the
 * first error counter.  The order must match portcntr6120indices.
 */
static const char portcntr6120names[] =
	"TxPkt\n"
	"TxFlowPkt\n"
	"TxWords\n"
	"RxPkt\n"
	"RxFlowPkt\n"
	"RxWords\n"
	"TxFlowStall\n"
	"E IBStatusChng\n"
	"IBLinkDown\n"
	"IBLnkRecov\n"
	"IBRxLinkErr\n"
	"IBSymbolErr\n"
	"RxLLIErr\n"
	"RxBadFormat\n"
	"RxBadLen\n"
	"RxBufOvrfl\n"
	"RxEBP\n"
	"RxFlowCtlErr\n"
	"RxICRCerr\n"
	"RxLPCRCerr\n"
	"RxVCRCerr\n"
	"RxInvalLen\n"
	"RxInvalPKey\n"
	"RxPktDropped\n"
	"TxBadLength\n"
	"TxDropped\n"
	"TxInvalLen\n"
	"TxUnderrun\n"
	"TxUnsupVL\n";
# define _PORT_VIRT_FLAG 0x8000 /* "virtual", need adjustments */
static const size_t portcntr6120indices [ ] = {
cr_pktsendflow ,
cr_pktrcvflowctrl ,
cr_ibstatuschange ,
cr_rcvflowctrl_err ,
cr_invalidslen ,
cr_senddropped ,
cr_errslen ,
cr_sendunderrun ,
cr_txunsupvl ,
} ;
/* do all the setup to make the counter reads efficient later */
static void init_6120_cntrnames ( struct qib_devdata * dd )
int i , j = 0 ;
char * s ;
for ( i = 0 , s = ( char * ) cntr6120names ; s & & j < = dd - > cfgctxts ;
i + + ) {
/* we always have at least one counter before the egrovfl */
if ( ! j & & ! strncmp ( " Ctxt0EgrOvfl " , s + 1 , 12 ) )
j = 1 ;
s = strchr ( s + 1 , ' \n ' ) ;
if ( s & & j )
j + + ;
dd - > cspec - > ncntrs = i ;
if ( ! s )
/* full list; size is without terminating null */
dd - > cspec - > cntrnamelen = sizeof ( cntr6120names ) - 1 ;
dd - > cspec - > cntrnamelen = 1 + s - cntr6120names ;
dd - > cspec - > cntrs = kmalloc ( dd - > cspec - > ncntrs
* sizeof ( u64 ) , GFP_KERNEL ) ;
if ( ! dd - > cspec - > cntrs )
qib_dev_err ( dd , " Failed allocation for counters \n " ) ;
for ( i = 0 , s = ( char * ) portcntr6120names ; s ; i + + )
s = strchr ( s + 1 , ' \n ' ) ;
dd - > cspec - > nportcntrs = i - 1 ;
dd - > cspec - > portcntrnamelen = sizeof ( portcntr6120names ) - 1 ;
dd - > cspec - > portcntrs = kmalloc ( dd - > cspec - > nportcntrs
* sizeof ( u64 ) , GFP_KERNEL ) ;
if ( ! dd - > cspec - > portcntrs )
qib_dev_err ( dd , " Failed allocation for portcounters \n " ) ;
/*
 * Return either the device counter names or a fresh snapshot of the
 * device counters.
 *
 * @dd: the qlogic_ib device
 * @pos: caller's read offset; at or past the end of the data yields 0
 * @namep: when non-NULL, names are requested and *namep is set to the
 *	name string
 * @cntrp: when @namep is NULL, *cntrp is set to the filled counter buffer
 *
 * Returns the number of bytes available (name-string length, or counter
 * count times sizeof(u64)), or 0 when everything has already been read or
 * the counter buffer was never allocated.
 */
static u32 qib_read_6120cntrs(struct qib_devdata *dd, loff_t pos, char **namep,
			      u64 **cntrp)
{
	u32 ret;

	if (namep) {
		ret = dd->cspec->cntrnamelen;
		if (pos >= ret)
			ret = 0; /* final read after getting everything */
		*namep = (char *)cntr6120names;
	} else {
		u64 *cntr = dd->cspec->cntrs;
		int i;

		ret = dd->cspec->ncntrs * sizeof(u64);
		if (!cntr || pos >= ret) {
			/* everything read, or couldn't get memory */
			ret = 0;
			goto done;
		}
		/*
		 * A second "pos >= ret" test used to follow here; it could
		 * never be true after the check above and has been dropped.
		 */
		*cntrp = cntr;
		for (i = 0; i < dd->cspec->ncntrs; i++)
			*cntr++ = read_6120_creg32(dd, cntr6120indices[i]);
	}
done:
	return ret;
}
/*
 * Return either the per-port counter names or a fresh snapshot of the
 * counters for one port.
 *
 * @dd: the qlogic_ib device
 * @pos: caller's read offset; at or past the end of the data yields 0
 * @port: index into dd->pport
 * @namep: when non-NULL, names are requested and *namep is set to the
 *	name string
 * @cntrp: when @namep is NULL, *cntrp is set to the filled counter buffer
 *
 * Returns the number of bytes available, or 0 when everything has already
 * been read or the counter buffer was never allocated.
 */
static u32 qib_read_6120portcntrs(struct qib_devdata *dd, loff_t pos, u32 port,
				  char **namep, u64 **cntrp)
{
	u32 ret;

	if (namep) {
		ret = dd->cspec->portcntrnamelen;
		if (pos >= ret)
			ret = 0; /* final read after getting everything */
		*namep = (char *)portcntr6120names;
	} else {
		u64 *cntr = dd->cspec->portcntrs;
		struct qib_pportdata *ppd = &dd->pport[port];
		int i;

		ret = dd->cspec->nportcntrs * sizeof(u64);
		if (!cntr || pos >= ret) {
			/* everything read, or couldn't get memory */
			ret = 0;
			goto done;
		}
		*cntrp = cntr;
		for (i = 0; i < dd->cspec->nportcntrs; i++) {
			if (portcntr6120indices[i] & _PORT_VIRT_FLAG)
				/* virtual: strip the flag, let the helper adjust */
				*cntr++ = qib_portcntr_6120(ppd,
					portcntr6120indices[i] &
					~_PORT_VIRT_FLAG);
			else
				/* plain chip counter register */
				*cntr++ = read_6120_creg32(dd,
					portcntr6120indices[i]);
		}
	}
done:
	return ret;
}
/*
 * qib_chk_6120_errormask() compares the chip's kr_errmask with the shadow
 * dd->cspec->errormask and, when they differ, rewrites the register from
 * the shadow and logs the old and new values.  It does nothing until a
 * shadow mask exists and the device is flagged QIB_INITTED.  "fixed" is a
 * function-static count of how many times a repair was needed.
 *
 * NOTE(review): the condition guarding the three clear-register writes is
 * truncated after "||" (its second operand and the block's braces are
 * missing from this copy); ctrl is read but only used in the log message
 * as far as the visible text shows.
 */
static void qib_chk_6120_errormask ( struct qib_devdata * dd )
static u32 fixed ;
u32 ctrl ;
unsigned long errormask ;
unsigned long hwerrs ;
if ( ! dd - > cspec - > errormask | | ! ( dd - > flags & QIB_INITTED ) )
return ;
errormask = qib_read_kreg64 ( dd , kr_errmask ) ;
/* Register already matches the shadow: nothing to repair. */
if ( errormask = = dd - > cspec - > errormask )
return ;
fixed + + ;
hwerrs = qib_read_kreg64 ( dd , kr_hwerrstatus ) ;
ctrl = qib_read_kreg32 ( dd , kr_control ) ;
qib_write_kreg ( dd , kr_errmask ,
dd - > cspec - > errormask ) ;
/* NOTE(review): condition truncated after "||". */
if ( ( hwerrs & dd - > cspec - > hwerrmask ) | |
qib_write_kreg ( dd , kr_hwerrclear , 0ULL ) ;
qib_write_kreg ( dd , kr_errclear , 0ULL ) ;
/* force re-interrupt of pending events, just in case */
qib_write_kreg ( dd , kr_intclear , 0ULL ) ;
qib_devinfo ( dd - > pcidev ,
" errormask fixed(%u) %lx->%lx, ctrl %x hwerr %lx \n " ,
fixed , errormask , ( unsigned long ) dd - > cspec - > errormask ,
ctrl , hwerrs ) ;
* qib_get_faststats - get word counters from chip before they overflow
* @ opaque - contains a pointer to the qlogic_ib device qib_devdata
* This needs more work ; in particular , decision on whether we really
* need traffic_wds done the way it is
* called from add_timer
static void qib_get_6120_faststats ( unsigned long opaque )
struct qib_devdata * dd = ( struct qib_devdata * ) opaque ;
struct qib_pportdata * ppd = dd - > pport ;
unsigned long flags ;
u64 traffic_wds ;
* don ' t access the chip while running diags , or memory diags can
* fail
if ( ! ( dd - > flags & QIB_INITTED ) | | dd - > diag_client )
/* but re-arm the timer, for diags case; won't hurt other */
goto done ;
* We now try to maintain an activity timer , based on traffic
* exceeding a threshold , so we need to check the word - counts
* even if they are 64 - bit .
traffic_wds = qib_portcntr_6120 ( ppd , cr_wordsend ) +
qib_portcntr_6120 ( ppd , cr_wordrcv ) ;
spin_lock_irqsave ( & dd - > eep_st_lock , flags ) ;
traffic_wds - = dd - > traffic_wds ;
dd - > traffic_wds + = traffic_wds ;
if ( traffic_wds > = QIB_TRAFFIC_ACTIVE_THRESHOLD )
atomic_add ( 5 , & dd - > active_time ) ; /* S/B #define */
spin_unlock_irqrestore ( & dd - > eep_st_lock , flags ) ;
qib_chk_6120_errormask ( dd ) ;
done :
mod_timer ( & dd - > stats_timer , jiffies + HZ * ACTIVITY_TIMER ) ;
/*
 * These chips have no alternative interrupt mechanism to fall back to,
 * so the request is always declined by returning 0.  @dd is not used.
 */
static int qib_6120_nointr_fallback(struct qib_devdata *dd)
{
	return 0;
}
* reset the XGXS ( between serdes and IBC ) . Slightly less intrusive
* than resetting the IBC or external link state , and useful in some
* cases to cause some retraining . To do this right , we reset IBC
* as well .
static void qib_6120_xgxs_reset ( struct qib_pportdata * ppd )
u64 val , prev_val ;
struct qib_devdata * dd = ppd - > dd ;
prev_val = qib_read_kreg64 ( dd , kr_xgxs_cfg ) ;
val = prev_val | QLOGIC_IB_XGXS_RESET ;
prev_val & = ~ QLOGIC_IB_XGXS_RESET ; /* be sure */
qib_write_kreg ( dd , kr_control ,
dd - > control & ~ QLOGIC_IB_C_LINKENABLE ) ;
qib_write_kreg ( dd , kr_xgxs_cfg , val ) ;
qib_read_kreg32 ( dd , kr_scratch ) ;
qib_write_kreg ( dd , kr_xgxs_cfg , prev_val ) ;
qib_write_kreg ( dd , kr_control , dd - > control ) ;
/*
 * qib_6120_get_ib_cfg() returns the current value of the IB link setting
 * selected by @which, taken either from fields of @ppd or from fields of
 * the shadow IBCCtrl value (dd->cspec->ibcctrl).  An unrecognized selector
 * yields -EINVAL.
 *
 * NOTE(review): the "case" labels for the first seven assignments and for
 * "ret = 250" are missing from this copy, as are the closing braces, and
 * the LINKDEFAULT ternary is truncated after '?'.  The selector names
 * cannot be determined from the visible text.
 */
static int qib_6120_get_ib_cfg ( struct qib_pportdata * ppd , int which )
int ret ;
switch ( which ) {
/* NOTE(review): case label missing for each of the next seven entries. */
ret = ppd - > link_width_active ;
break ;
ret = ppd - > link_speed_active ;
break ;
ret = ppd - > link_width_enabled ;
break ;
ret = ppd - > link_speed_enabled ;
break ;
ret = ppd - > vls_operational ;
break ;
ret = 0 ;
break ;
ret = 0 ;
break ;
case QIB_IB_CFG_OVERRUN_THRESH : /* IB overrun threshold */
ret = SYM_FIELD ( ppd - > dd - > cspec - > ibcctrl , IBCCtrl ,
OverrunThreshold ) ;
break ;
case QIB_IB_CFG_PHYERR_THRESH : /* IB PHY error threshold */
ret = SYM_FIELD ( ppd - > dd - > cspec - > ibcctrl , IBCCtrl ,
PhyerrThreshold ) ;
break ;
case QIB_IB_CFG_LINKDEFAULT : /* IB link default (sleep/poll) */
/* will only take effect when the link state changes */
/* NOTE(review): both result operands of this ternary are missing. */
ret = ( ppd - > dd - > cspec - > ibcctrl &
SYM_MASK ( IBCCtrl , LinkDownDefaultState ) ) ?
break ;
case QIB_IB_CFG_HRTBT : /* Get Heartbeat off/enable/auto */
ret = 0 ; /* no heartbeat on this chip */
break ;
/* NOTE(review): case label missing for the entry below. */
ret = 250 ; /* 1 usec. */
break ;
default :
ret = - EINVAL ;
break ;
return ret ;
/*
 * qib_6120_set_ib_cfg() applies the IB link setting selected by @which.
 * Width/speed selections are stored in @ppd.  Threshold, link-default and
 * MTU selections edit the shadow dd->cspec->ibcctrl and write it to
 * kr_ibcctrl followed by a kr_scratch write.  PKEYS packs the four 16-bit
 * ppd->pkeys[] into kr_partitionkey.  LSTATE splits @val into a link
 * command (upper 16 bits) and a link-init command (lower 16 bits) and
 * hands them to qib_set_ib_6120_lstate().  Returns 0, or -EINVAL for an
 * unsupported selector or bad command.
 *
 * NOTE(review): this copy has lost braces, several "case" labels (the two
 * at the top, all inner labels of both LSTATE switches, and the one ahead
 * of the final "ret = -EINVAL"), and all but one of the lcmd/licmd
 * assignments.  Do not build from this text.
 */
* We assume range checking is already done , if needed .
static int qib_6120_set_ib_cfg ( struct qib_pportdata * ppd , int which , u32 val )
struct qib_devdata * dd = ppd - > dd ;
int ret = 0 ;
u64 val64 ;
u16 lcmd , licmd ;
switch ( which ) {
/* NOTE(review): case labels missing for the next two entries. */
ppd - > link_width_enabled = val ;
break ;
ppd - > link_speed_enabled = val ;
break ;
case QIB_IB_CFG_OVERRUN_THRESH : /* IB overrun threshold */
val64 = SYM_FIELD ( dd - > cspec - > ibcctrl , IBCCtrl ,
OverrunThreshold ) ;
/* The register is only rewritten when the threshold actually changes. */
if ( val64 ! = val ) {
dd - > cspec - > ibcctrl & =
~ SYM_MASK ( IBCCtrl , OverrunThreshold ) ;
dd - > cspec - > ibcctrl | = ( u64 ) val < <
SYM_LSB ( IBCCtrl , OverrunThreshold ) ;
qib_write_kreg ( dd , kr_ibcctrl , dd - > cspec - > ibcctrl ) ;
qib_write_kreg ( dd , kr_scratch , 0 ) ;
break ;
case QIB_IB_CFG_PHYERR_THRESH : /* IB PHY error threshold */
val64 = SYM_FIELD ( dd - > cspec - > ibcctrl , IBCCtrl ,
PhyerrThreshold ) ;
if ( val64 ! = val ) {
dd - > cspec - > ibcctrl & =
~ SYM_MASK ( IBCCtrl , PhyerrThreshold ) ;
dd - > cspec - > ibcctrl | = ( u64 ) val < <
SYM_LSB ( IBCCtrl , PhyerrThreshold ) ;
qib_write_kreg ( dd , kr_ibcctrl , dd - > cspec - > ibcctrl ) ;
qib_write_kreg ( dd , kr_scratch , 0 ) ;
break ;
case QIB_IB_CFG_PKEYS : /* update pkeys */
val64 = ( u64 ) ppd - > pkeys [ 0 ] | ( ( u64 ) ppd - > pkeys [ 1 ] < < 16 ) |
( ( u64 ) ppd - > pkeys [ 2 ] < < 32 ) |
( ( u64 ) ppd - > pkeys [ 3 ] < < 48 ) ;
qib_write_kreg ( dd , kr_partitionkey , val64 ) ;
break ;
case QIB_IB_CFG_LINKDEFAULT : /* IB link default (sleep/poll) */
/* will only take effect when the link state changes */
if ( val = = IB_LINKINITCMD_POLL )
dd - > cspec - > ibcctrl & =
~ SYM_MASK ( IBCCtrl , LinkDownDefaultState ) ;
else /* SLEEP */
dd - > cspec - > ibcctrl | =
SYM_MASK ( IBCCtrl , LinkDownDefaultState ) ;
qib_write_kreg ( dd , kr_ibcctrl , dd - > cspec - > ibcctrl ) ;
qib_write_kreg ( dd , kr_scratch , 0 ) ;
break ;
case QIB_IB_CFG_MTU : /* update the MTU in IBC */
* Update our housekeeping variables , and set IBC max
* size , same as init code ; max IBC is max we allow in
* buffer , less the qword pbc , plus 1 for ICRC , in dwords
* Set even if it ' s unchanged , print debug message only
* on changes .
/* The incoming val is ignored here; it is recomputed from ppd->ibmaxlen. */
val = ( ppd - > ibmaxlen > > 2 ) + 1 ;
dd - > cspec - > ibcctrl & = ~ SYM_MASK ( IBCCtrl , MaxPktLen ) ;
dd - > cspec - > ibcctrl | = ( u64 ) val < <
SYM_LSB ( IBCCtrl , MaxPktLen ) ;
qib_write_kreg ( dd , kr_ibcctrl , dd - > cspec - > ibcctrl ) ;
qib_write_kreg ( dd , kr_scratch , 0 ) ;
break ;
case QIB_IB_CFG_LSTATE : /* set the IB link state */
/* NOTE(review): inner case labels and lcmd assignments are missing. */
switch ( val & 0xffff0000 ) {
/* On one of the link commands, symbol/link-error counters are snapshotted
 * once and ibdeltainprog is set. */
if ( ! dd - > cspec - > ibdeltainprog ) {
dd - > cspec - > ibdeltainprog = 1 ;
dd - > cspec - > ibsymsnap =
read_6120_creg32 ( dd , cr_ibsymbolerr ) ;
dd - > cspec - > iblnkerrsnap =
read_6120_creg32 ( dd , cr_iblinkerrrecov ) ;
break ;
break ;
break ;
default :
ret = - EINVAL ;
qib_dev_err ( dd , " bad linkcmd req 0x%x \n " , val > > 16 ) ;
goto bail ;
/* NOTE(review): inner case labels and most licmd assignments are missing. */
switch ( val & 0xffff ) {
licmd = 0 ;
break ;
break ;
break ;
break ;
default :
ret = - EINVAL ;
qib_dev_err ( dd , " bad linkinitcmd req 0x%x \n " ,
val & 0xffff ) ;
goto bail ;
qib_set_ib_6120_lstate ( ppd , lcmd , licmd ) ;
goto bail ;
/* NOTE(review): case label missing for the entry below. */
ret = - EINVAL ;
break ;
default :
ret = - EINVAL ;
bail :
return ret ;
static int qib_6120_set_loopback ( struct qib_pportdata * ppd , const char * what )
int ret = 0 ;
if ( ! strncmp ( what , " ibc " , 3 ) ) {
ppd - > dd - > cspec - > ibcctrl | = SYM_MASK ( IBCCtrl , Loopback ) ;
qib_devinfo ( ppd - > dd - > pcidev , " Enabling IB%u:%u IBC loopback \n " ,
ppd - > dd - > unit , ppd - > port ) ;
} else if ( ! strncmp ( what , " off " , 3 ) ) {
ppd - > dd - > cspec - > ibcctrl & = ~ SYM_MASK ( IBCCtrl , Loopback ) ;
qib_devinfo ( ppd - > dd - > pcidev , " Disabling IB%u:%u IBC loopback "
" (normal) \n " , ppd - > dd - > unit , ppd - > port ) ;
} else
ret = - EINVAL ;
if ( ! ret ) {
qib_write_kreg ( ppd - > dd , kr_ibcctrl , ppd - > dd - > cspec - > ibcctrl ) ;
qib_write_kreg ( ppd - > dd , kr_scratch , 0 ) ;
return ret ;
static void pma_6120_timer ( unsigned long data )
struct qib_pportdata * ppd = ( struct qib_pportdata * ) data ;
struct qib_chip_specific * cs = ppd - > dd - > cspec ;
struct qib_ibport * ibp = & ppd - > ibport_data ;
unsigned long flags ;
spin_lock_irqsave ( & ibp - > lock , flags ) ;
if ( cs - > pma_sample_status = = IB_PMA_SAMPLE_STATUS_STARTED ) {
cs - > pma_sample_status = IB_PMA_SAMPLE_STATUS_RUNNING ;
qib_snapshot_counters ( ppd , & cs - > sword , & cs - > rword ,
& cs - > spkts , & cs - > rpkts , & cs - > xmit_wait ) ;
mod_timer ( & cs - > pma_timer ,
jiffies + usecs_to_jiffies ( ibp - > pma_sample_interval ) ) ;
} else if ( cs - > pma_sample_status = = IB_PMA_SAMPLE_STATUS_RUNNING ) {
u64 ta , tb , tc , td , te ;
cs - > pma_sample_status = IB_PMA_SAMPLE_STATUS_DONE ;
qib_snapshot_counters ( ppd , & ta , & tb , & tc , & td , & te ) ;
cs - > sword = ta - cs - > sword ;
cs - > rword = tb - cs - > rword ;
cs - > spkts = tc - cs - > spkts ;
cs - > rpkts = td - cs - > rpkts ;
cs - > xmit_wait = te - cs - > xmit_wait ;
spin_unlock_irqrestore ( & ibp - > lock , flags ) ;
* Note that the caller has the ibp - > lock held .
static void qib_set_cntr_6120_sample ( struct qib_pportdata * ppd , u32 intv ,
u32 start )
struct qib_chip_specific * cs = ppd - > dd - > cspec ;
if ( start & & intv ) {
cs - > pma_sample_status = IB_PMA_SAMPLE_STATUS_STARTED ;
mod_timer ( & cs - > pma_timer , jiffies + usecs_to_jiffies ( start ) ) ;
} else if ( intv ) {
cs - > pma_sample_status = IB_PMA_SAMPLE_STATUS_RUNNING ;
qib_snapshot_counters ( ppd , & cs - > sword , & cs - > rword ,
& cs - > spkts , & cs - > rpkts , & cs - > xmit_wait ) ;
mod_timer ( & cs - > pma_timer , jiffies + usecs_to_jiffies ( intv ) ) ;
} else {
cs - > pma_sample_status = IB_PMA_SAMPLE_STATUS_DONE ;
cs - > sword = 0 ;
cs - > rword = 0 ;
cs - > spkts = 0 ;
cs - > rpkts = 0 ;
cs - > xmit_wait = 0 ;
/*
 * Translate the LinkState field of an IBCStatus value (@ibcs) into an
 * IB_PORT_* state.  ACTIVE and ACT_DEFER both map to IB_PORT_ACTIVE;
 * DOWN and any unrecognized value map to IB_PORT_DOWN.
 */
static u32 qib_6120_iblink_state(u64 ibcs)
{
	switch ((u32)SYM_FIELD(ibcs, IBCStatus, LinkState)) {
	case IB_6120_L_STATE_INIT:
		return IB_PORT_INIT;
	case IB_6120_L_STATE_ARM:
		return IB_PORT_ARMED;
	case IB_6120_L_STATE_ACTIVE:
	case IB_6120_L_STATE_ACT_DEFER:
		return IB_PORT_ACTIVE;
	case IB_6120_L_STATE_DOWN:
	default:
		return IB_PORT_DOWN;
	}
}
/*
 * Returns the IBTA port state, rather than the IBC link training state:
 * the LinkTrainingState field of @ibcs is used as an index into the
 * qib_6120_physportstate translation table.
 */
static u8 qib_6120_phys_portstate(u64 ibcs)
{
	u8 training_state = (u8)SYM_FIELD(ibcs, IBCStatus, LinkTrainingState);

	return qib_6120_physportstate[training_state];
}
/*
 * Chip-specific handling of a link up/down transition.
 *
 * Clears QIBL_IB_FORCE_NOTIFY under lflags_lock.  On link down it zeroes
 * the LLI counter and, unless a delta is already in progress, snapshots
 * the symbol-error and link-error-recovery counters.  On link up it folds
 * whatever those counters gained since the snapshot into the running
 * deltas.  Finally it updates the external LEDs.  @ibcs is not used.
 * Always returns 0.
 */
static int qib_6120_ib_updown(struct qib_pportdata *ppd, int ibup, u64 ibcs)
{
	struct qib_devdata *dd = ppd->dd;
	struct qib_chip_specific *cs = dd->cspec;
	unsigned long flags;

	spin_lock_irqsave(&ppd->lflags_lock, flags);
	ppd->lflags &= ~QIBL_IB_FORCE_NOTIFY;
	spin_unlock_irqrestore(&ppd->lflags_lock, flags);

	if (!ibup) {
		cs->lli_counter = 0;
		if (!cs->ibdeltainprog) {
			cs->ibdeltainprog = 1;
			cs->ibsymsnap = read_6120_creg32(dd, cr_ibsymbolerr);
			cs->iblnkerrsnap =
				read_6120_creg32(dd, cr_iblinkerrrecov);
		}
		qib_hol_down(ppd);
	} else {
		if (cs->ibdeltainprog) {
			cs->ibdeltainprog = 0;
			cs->ibsymdelta +=
				read_6120_creg32(dd, cr_ibsymbolerr) -
				cs->ibsymsnap;
			cs->iblnkerrdelta +=
				read_6120_creg32(dd, cr_iblinkerrrecov) -
				cs->iblnkerrsnap;
		}
		qib_hol_init(ppd);
	}

	qib_6120_setup_setextled(ppd, ibup);

	return 0;
}
/* Does read/modify/write to appropriate registers to
* set output and direction bits selected by mask .
* these are in their canonical postions ( e . g . lsb of
* dir will end up in D48 of extctrl on existing chips ) .
* returns contents of GP Inputs .
static int gpio_6120_mod ( struct qib_devdata * dd , u32 out , u32 dir , u32 mask )
u64 read_val , new_out ;
unsigned long flags ;
if ( mask ) {
/* some bits being written, lock access to GPIO */
dir & = mask ;
out & = mask ;
spin_lock_irqsave ( & dd - > cspec - > gpio_lock , flags ) ;
dd - > cspec - > extctrl & = ~ ( ( u64 ) mask < < SYM_LSB ( EXTCtrl , GPIOOe ) ) ;
dd - > cspec - > extctrl | = ( ( u64 ) dir < < SYM_LSB ( EXTCtrl , GPIOOe ) ) ;
new_out = ( dd - > cspec - > gpio_out & ~ mask ) | out ;
qib_write_kreg ( dd , kr_extctrl , dd - > cspec - > extctrl ) ;
qib_write_kreg ( dd , kr_gpio_out , new_out ) ;
dd - > cspec - > gpio_out = new_out ;
spin_unlock_irqrestore ( & dd - > cspec - > gpio_lock , flags ) ;
* It is unlikely that a read at this time would get valid
* data on a pin whose direction line was set in the same
* call to this function . We include the read here because
* that allows us to potentially combine a change on one pin with
* a read on another , and because the old code did something like
* this .
read_val = qib_read_kreg64 ( dd , kr_extstatus ) ;
return SYM_FIELD ( read_val , EXTStatus , GPIOIn ) ;
/*
 * get_6120_chip_params() reads the chip's capability registers into the
 * shadow fields of @dd (register bases, TID counts, PIO buffer sizes and
 * counts) and derives the PIO buffer base pointers, the 4k buffer
 * alignment and the number of pioavail registers from them.
 *
 * NOTE(review): braces and comment delimiters are missing from this copy,
 * and so is the statement controlled by "if ( mtu = = - 1 )".  As written,
 * ibmtu would only be assigned when the MTU lookup failed, which cannot be
 * the intent; restore the fallback assignment from the authoritative source.
 */
* Read fundamental info we need to use the chip . These are
* the registers that describe chip capabilities , and are
* saved in shadow registers .
static void get_6120_chip_params ( struct qib_devdata * dd )
u64 val ;
u32 piobufs ;
int mtu ;
dd - > uregbase = qib_read_kreg32 ( dd , kr_userregbase ) ;
dd - > rcvtidcnt = qib_read_kreg32 ( dd , kr_rcvtidcnt ) ;
dd - > rcvtidbase = qib_read_kreg32 ( dd , kr_rcvtidbase ) ;
dd - > rcvegrbase = qib_read_kreg32 ( dd , kr_rcvegrbase ) ;
dd - > palign = qib_read_kreg32 ( dd , kr_palign ) ;
/* One 64-bit register carries both PIO bases: 2k in the low half, 4k in the high half. */
dd - > piobufbase = qib_read_kreg64 ( dd , kr_sendpiobufbase ) ;
dd - > pio2k_bufbase = dd - > piobufbase & 0xffffffff ;
/* NOTE(review): rcvhdrcnt is loaded from kr_rcvegrcnt -- confirm this is intended. */
dd - > rcvhdrcnt = qib_read_kreg32 ( dd , kr_rcvegrcnt ) ;
/* Sizes are packed the same way: 2k size in the low 32 bits, 4k size in the high 32. */
val = qib_read_kreg64 ( dd , kr_sendpiosize ) ;
dd - > piosize2k = val & ~ 0U ;
dd - > piosize4k = val > > 32 ;
mtu = ib_mtu_enum_to_int ( qib_ibmtu ) ;
/* NOTE(review): the statement guarded by this test is missing. */
if ( mtu = = - 1 )
dd - > pport - > ibmtu = ( u32 ) mtu ;
/* Buffer counts: 2k count in the low 32 bits, 4k count in the high 32. */
val = qib_read_kreg64 ( dd , kr_sendpiobufcnt ) ;
dd - > piobcnt2k = val & ~ 0U ;
dd - > piobcnt4k = val > > 32 ;
/* these may be adjusted in init_chip_wc_pat() */
dd - > pio2kbase = ( u32 __iomem * )
( ( ( char __iomem * ) dd - > kregbase ) + dd - > pio2k_bufbase ) ;
if ( dd - > piobcnt4k ) {
dd - > pio4kbase = ( u32 __iomem * )
( ( ( char __iomem * ) dd - > kregbase ) +
( dd - > piobufbase > > 32 ) ) ;
* 4 K buffers take 2 pages ; we use roundup just to be
* paranoid ; we calculate it once here , rather than on
* ever buf allocate
dd - > align4k = ALIGN ( dd - > piosize4k , dd - > palign ) ;
piobufs = dd - > piobcnt4k + dd - > piobcnt2k ;
/* Buffer count rounded up to whole registers, at 32 buffers per 64-bit register. */
dd - > pioavregs = ALIGN ( piobufs , sizeof ( u64 ) * BITS_PER_BYTE / 2 ) /
( sizeof ( u64 ) * BITS_PER_BYTE / 2 ) ;
* The chip base addresses in cspec and cpspec have to be set
* after possible init_chip_wc_pat ( ) , rather than in
* get_6120_chip_params ( ) , so split out as separate function
static void set_6120_baseaddrs ( struct qib_devdata * dd )
u32 cregbase ;
cregbase = qib_read_kreg32 ( dd , kr_counterregbase ) ;
dd - > cspec - > cregbase = ( u64 __iomem * )
( ( char __iomem * ) dd - > kregbase + cregbase ) ;
dd - > egrtidbase = ( u64 __iomem * )
( ( char __iomem * ) dd - > kregbase + dd - > rcvegrbase ) ;
* Write the final few registers that depend on some of the
* init setup . Done late in init , just before bringing up
* the serdes .
static int qib_late_6120_initreg ( struct qib_devdata * dd )
int ret = 0 ;
u64 val ;
qib_write_kreg ( dd , kr_rcvhdrentsize , dd - > rcvhdrentsize ) ;
qib_write_kreg ( dd , kr_rcvhdrsize , dd - > rcvhdrsize ) ;
qib_write_kreg ( dd , kr_rcvhdrcnt , dd - > rcvhdrcnt ) ;
qib_write_kreg ( dd , kr_sendpioavailaddr , dd - > pioavailregs_phys ) ;
val = qib_read_kreg64 ( dd , kr_sendpioavailaddr ) ;
if ( val ! = dd - > pioavailregs_phys ) {
qib_dev_err ( dd , " Catastrophic software error, "
" SendPIOAvailAddr written as %lx, "
" read back as %llx \n " ,
( unsigned long ) dd - > pioavailregs_phys ,
( unsigned long long ) val ) ;
ret = - EINVAL ;
return ret ;
static int init_6120_variables ( struct qib_devdata * dd )
int ret = 0 ;
struct qib_pportdata * ppd ;
u32 sbufs ;
ppd = ( struct qib_pportdata * ) ( dd + 1 ) ;
dd - > pport = ppd ;
dd - > num_pports = 1 ;
dd - > cspec = ( struct qib_chip_specific * ) ( ppd + dd - > num_pports ) ;
ppd - > cpspec = NULL ; /* not used in this chip */
spin_lock_init ( & dd - > cspec - > kernel_tid_lock ) ;
spin_lock_init ( & dd - > cspec - > user_tid_lock ) ;
spin_lock_init ( & dd - > cspec - > rcvmod_lock ) ;
spin_lock_init ( & dd - > cspec - > gpio_lock ) ;
/* we haven't yet set QIB_PRESENT, so use read directly */
dd - > revision = readq ( & dd - > kregbase [ kr_revision ] ) ;
if ( ( dd - > revision & 0xffffffffU ) = = 0xffffffffU ) {
qib_dev_err ( dd , " Revision register read failure, "
" giving up initialization \n " ) ;
ret = - ENODEV ;
goto bail ;
dd - > flags | = QIB_PRESENT ; /* now register routines work */
dd - > majrev = ( u8 ) SYM_FIELD ( dd - > revision , Revision_R ,
ChipRevMajor ) ;
dd - > minrev = ( u8 ) SYM_FIELD ( dd - > revision , Revision_R ,
ChipRevMinor ) ;
get_6120_chip_params ( dd ) ;
pe_boardname ( dd ) ; /* fill in boardname */
* GPIO bits for TWSI data and clock ,
* used for serial EEPROM .
dd - > gpio_sda_num = _QIB_GPIO_SDA_NUM ;
dd - > gpio_scl_num = _QIB_GPIO_SCL_NUM ;
dd - > twsi_eeprom_dev = QIB_TWSI_NO_DEV ;
if ( qib_unordered_wc ( ) )
dd - > flags | = QIB_PIO_FLUSH_WC ;
* EEPROM error log 0 is TXE Parity errors . 1 is RXE Parity .
* 2 is Some Misc , 3 is reserved for future .
dd - > eep_st_masks [ 0 ] . hwerrs_to_log = HWE_MASK ( TXEMemParityErr ) ;
/* Ignore errors in PIO/PBC on systems with unordered write-combining */
if ( qib_unordered_wc ( ) )
dd - > eep_st_masks [ 0 ] . hwerrs_to_log & = ~ TXE_PIO_PARITY ;
dd - > eep_st_masks [ 1 ] . hwerrs_to_log = HWE_MASK ( RXEMemParityErr ) ;
dd - > eep_st_masks [ 2 ] . errs_to_log = ERR_MASK ( ResetNegated ) ;
qib_init_pportdata ( ppd , dd , 0 , 1 ) ;
ppd - > link_width_supported = IB_WIDTH_1X | IB_WIDTH_4X ;
ppd - > link_speed_supported = QIB_IB_SDR ;
ppd - > link_width_enabled = IB_WIDTH_4X ;
ppd - > link_speed_enabled = ppd - > link_speed_supported ;
/* these can't change for this chip, so set once */
ppd - > link_width_active = ppd - > link_width_enabled ;
ppd - > link_speed_active = ppd - > link_speed_enabled ;
ppd - > vls_supported = IB_VL_VL0 ;
ppd - > vls_operational = ppd - > vls_supported ;
dd - > rcvhdrentsize = QIB_RCVHDR_ENTSIZE ;
dd - > rcvhdrsize = QIB_DFLT_RCVHDRSIZE ;
dd - > rhf_offset = 0 ;
/* we always allocate at least 2048 bytes for eager buffers */
ret = ib_mtu_enum_to_int ( qib_ibmtu ) ;
dd - > rcvegrbufsize = ret ! = - 1 ? max ( ret , 2048 ) : QIB_DEFAULT_MTU ;
qib_6120_tidtemplate ( dd ) ;
* We can request a receive interrupt for 1 or
* more packets from current offset . For now , we set this
* up for a single packet .
dd - > rhdrhead_intr_off = 1ULL < < 32 ;
/* setup the stats timer; the add_timer is done at end of init */
init_timer ( & dd - > stats_timer ) ;
dd - > stats_timer . function = qib_get_6120_faststats ;
dd - > stats_timer . data = ( unsigned long ) dd ;
init_timer ( & dd - > cspec - > pma_timer ) ;
dd - > cspec - > pma_timer . function = pma_6120_timer ;
dd - > cspec - > pma_timer . data = ( unsigned long ) ppd ;
dd - > ureg_align = qib_read_kreg32 ( dd , kr_palign ) ;
dd - > piosize2kmax_dwords = dd - > piosize2k > > 2 ;
qib_6120_config_ctxts ( dd ) ;
qib_set_ctxtcnt ( dd ) ;
if ( qib_wc_pat ) {
ret = init_chip_wc_pat ( dd , 0 ) ;
if ( ret )
goto bail ;
set_6120_baseaddrs ( dd ) ; /* set chip access pointers now */
ret = 0 ;
if ( qib_mini_init )
goto bail ;
qib_num_cfg_vls = 1 ; /* if any 6120's, only one VL */
ret = qib_create_ctxts ( dd ) ;
init_6120_cntrnames ( dd ) ;
/* use all of 4KB buffers for the kernel, otherwise 16 */
sbufs = dd - > piobcnt4k ? dd - > piobcnt4k : 16 ;
dd - > lastctxt_piobuf = dd - > piobcnt2k + dd - > piobcnt4k - sbufs ;
dd - > pbufsctxt = dd - > lastctxt_piobuf /
( dd - > cfgctxts - dd - > first_user_ctxt ) ;
if ( ret )
goto bail ;
bail :
return ret ;
* For this chip , we want to use the same buffer every time
* when we are trying to bring the link up ( they are always VL15
* packets ) . At that link state the packet should always go out immediately
* ( or at least be discarded at the tx interface if the link is down ) .
* If it doesn ' t , and the buffer isn ' t available , that means some other
* sender has gotten ahead of us , and is preventing our packet from going
* out . In that case , we flush all packets , and try again . If that still
* fails , we fail the request , and hope things work the next time around .
* We don ' t need very complicated heuristics on whether the packet had
* time to go out or not , since even at SDR 1 X , it goes out in very short
* time periods , covered by the chip reads done here and as part of the
* flush .
static u32 __iomem * get_6120_link_buf ( struct qib_pportdata * ppd , u32 * bnum )
u32 __iomem * buf ;
u32 lbuf = ppd - > dd - > piobcnt2k + ppd - > dd - > piobcnt4k - 1 ;
* always blip to get avail list updated , since it ' s almost
* always needed , and is fairly cheap .
sendctrl_6120_mod ( ppd - > dd - > pport , QIB_SENDCTRL_AVAIL_BLIP ) ;
qib_read_kreg64 ( ppd - > dd , kr_scratch ) ; /* extra chip flush */
buf = qib_getsendbuf_range ( ppd - > dd , bnum , lbuf , lbuf ) ;
if ( buf )
goto done ;
sendctrl_6120_mod ( ppd , QIB_SENDCTRL_DISARM_ALL | QIB_SENDCTRL_FLUSH |
ppd - > dd - > upd_pio_shadow = 1 ; /* update our idea of what's busy */
qib_read_kreg64 ( ppd - > dd , kr_scratch ) ; /* extra chip flush */
buf = qib_getsendbuf_range ( ppd - > dd , bnum , lbuf , lbuf ) ;
done :
return buf ;
/*
 * qib_6120_getsendbuf - pick a PIO send buffer for a packet
 * @ppd: the port the packet is sent on
 * @pbc: the PBC word for the packet; the low bits (QIB_PBC_LENGTH_MASK)
 *	give the length and the upper 32 bits carry the control flags
 * @pbufnum: where the chosen buffer number is stored
 *
 * Packets flagged PBC_6120_VL15_SEND_CTRL that are sent while the link
 * is neither active nor autonegotiating go through the dedicated
 * link-bringup buffer.  Everything else searches the normal range,
 * starting at the first 4K buffer when the packet is too large for a
 * 2K buffer and at buffer 0 otherwise.
 *
 * Returns what get_6120_link_buf() or qib_getsendbuf_range() returned.
 */
static u32 __iomem *qib_6120_getsendbuf(struct qib_pportdata *ppd, u64 pbc,
					u32 *pbufnum)
{
	struct qib_devdata *dd = ppd->dd;
	u32 plen = pbc & QIB_PBC_LENGTH_MASK;
	u32 first, last;

	if (((pbc >> 32) & PBC_6120_VL15_SEND_CTRL) &&
	    !(ppd->lflags & (QIBL_IB_AUTONEG_INPROG | QIBL_LINKACTIVE)))
		return get_6120_link_buf(ppd, pbufnum);

	/* the 4K buffers are numbered after the 2K ones */
	if ((plen + 1) > dd->piosize2kmax_dwords)
		first = dd->piobcnt2k;
	else
		first = 0;

	/* try 4k if all 2k busy, so same last for both sizes */
	last = dd->piobcnt2k + dd->piobcnt4k - 1;

	return qib_getsendbuf_range(dd, pbufnum, first, last);
}
/* SDMA register setup stub for this chip: always fails with -ENODEV. */
static int init_sdma_6120_regs(struct qib_pportdata *ppd)
{
	return -ENODEV;
}
/* SDMA head-pointer stub for this chip: always reports 0. */
static u16 qib_sdma_6120_gethead(struct qib_pportdata *ppd)
{
	return 0;
}
/* SDMA busy-check stub for this chip: always reports not busy (0). */
static int qib_sdma_6120_busy(struct qib_pportdata *ppd)
{
	return 0;
}
/* SDMA tail-update stub for this chip: intentionally does nothing. */
static void qib_sdma_update_6120_tail(struct qib_pportdata *ppd, u16 tail)
{
}
/* SDMA send-control stub for this chip: intentionally does nothing. */
static void qib_6120_sdma_sendctrl(struct qib_pportdata *ppd, unsigned op)
{
}
/* SDMA descriptor-count stub for this chip: intentionally does nothing. */
static void qib_sdma_set_6120_desc_cnt(struct qib_pportdata *ppd, unsigned cnt)
{
}
* the pbc doesn ' t need a VL15 indicator , but we need it for link_buf .
* The chip ignores the bit if set .
static u32 qib_6120_setpbc_control ( struct qib_pportdata * ppd , u32 plen ,
u8 srate , u8 vl )
return vl = = 15 ? PBC_6120_VL15_SEND_CTRL : 0 ;
/* VL15 buffer init hook for this chip: intentionally does nothing. */
static void qib_6120_initvl15_bufs(struct qib_devdata *dd)
{
}
static void qib_6120_init_ctxt ( struct qib_ctxtdata * rcd )
rcd - > rcvegrcnt = rcd - > dd - > rcvhdrcnt ;
rcd - > rcvegr_tid_base = rcd - > ctxt * rcd - > rcvegrcnt ;
/* TX-check change hook for this chip: intentionally does nothing. */
static void qib_6120_txchk_change(struct qib_devdata *dd, u32 start,
				  u32 len, u32 avail,
				  struct qib_ctxtdata *rcd)
{
}
/* Write @val to the chip's scratch register (kr_scratch). */
static void writescratch(struct qib_devdata *dd, u32 val)
{
	qib_write_kreg(dd, kr_scratch, val);
}
/* Temperature-sensor read stub for this chip: always fails with -ENXIO. */
static int qib_6120_tempsense_rd(struct qib_devdata *dd, int regnum)
{
	return -ENXIO;
}
/*
 * Dummy function, as 6120 boards never disable EEPROM Write.
 * Always returns 1, whatever @wen is.
 */
static int qib_6120_eeprom_wen(struct qib_devdata *dd, int wen)
{
	return 1;
}
* qib_init_iba6120_funcs - set up the chip - specific function pointers
* @ pdev : pci_dev of the qlogic_ib device
* @ ent : pci_device_id matching this chip
* This is global , and is called directly at init to set up the
* chip - specific function pointers for later use .
* It also allocates / partially - inits the qib_devdata struct for
* this device .
struct qib_devdata * qib_init_iba6120_funcs ( struct pci_dev * pdev ,
const struct pci_device_id * ent )
struct qib_devdata * dd ;
int ret ;
dd = qib_alloc_devdata ( pdev , sizeof ( struct qib_pportdata ) +
sizeof ( struct qib_chip_specific ) ) ;
if ( IS_ERR ( dd ) )
goto bail ;
dd - > f_bringup_serdes = qib_6120_bringup_serdes ;
dd - > f_cleanup = qib_6120_setup_cleanup ;
dd - > f_clear_tids = qib_6120_clear_tids ;
dd - > f_free_irq = qib_6120_free_irq ;
dd - > f_get_base_info = qib_6120_get_base_info ;
dd - > f_get_msgheader = qib_6120_get_msgheader ;
dd - > f_getsendbuf = qib_6120_getsendbuf ;
dd - > f_gpio_mod = gpio_6120_mod ;
dd - > f_eeprom_wen = qib_6120_eeprom_wen ;
dd - > f_hdrqempty = qib_6120_hdrqempty ;
dd - > f_ib_updown = qib_6120_ib_updown ;
dd - > f_init_ctxt = qib_6120_init_ctxt ;
dd - > f_initvl15_bufs = qib_6120_initvl15_bufs ;
dd - > f_intr_fallback = qib_6120_nointr_fallback ;
dd - > f_late_initreg = qib_late_6120_initreg ;
dd - > f_setpbc_control = qib_6120_setpbc_control ;
dd - > f_portcntr = qib_portcntr_6120 ;
dd - > f_put_tid = ( dd - > minrev > = 2 ) ?
qib_6120_put_tid_2 :
qib_6120_put_tid ;
dd - > f_quiet_serdes = qib_6120_quiet_serdes ;
dd - > f_rcvctrl = rcvctrl_6120_mod ;
dd - > f_read_cntrs = qib_read_6120cntrs ;
dd - > f_read_portcntrs = qib_read_6120portcntrs ;
dd - > f_reset = qib_6120_setup_reset ;
dd - > f_init_sdma_regs = init_sdma_6120_regs ;
dd - > f_sdma_busy = qib_sdma_6120_busy ;
dd - > f_sdma_gethead = qib_sdma_6120_gethead ;
dd - > f_sdma_sendctrl = qib_6120_sdma_sendctrl ;
dd - > f_sdma_set_desc_cnt = qib_sdma_set_6120_desc_cnt ;
dd - > f_sdma_update_tail = qib_sdma_update_6120_tail ;
dd - > f_sendctrl = sendctrl_6120_mod ;
dd - > f_set_armlaunch = qib_set_6120_armlaunch ;
dd - > f_set_cntr_sample = qib_set_cntr_6120_sample ;
dd - > f_iblink_state = qib_6120_iblink_state ;
dd - > f_ibphys_portstate = qib_6120_phys_portstate ;
dd - > f_get_ib_cfg = qib_6120_get_ib_cfg ;
dd - > f_set_ib_cfg = qib_6120_set_ib_cfg ;
dd - > f_set_ib_loopback = qib_6120_set_loopback ;
dd - > f_set_intr_state = qib_6120_set_intr_state ;
dd - > f_setextled = qib_6120_setup_setextled ;
dd - > f_txchk_change = qib_6120_txchk_change ;
dd - > f_update_usrhead = qib_update_6120_usrhead ;
dd - > f_wantpiobuf_intr = qib_wantpiobuf_6120_intr ;
dd - > f_xgxs_reset = qib_6120_xgxs_reset ;
dd - > f_writescratch = writescratch ;
dd - > f_tempsense_rd = qib_6120_tempsense_rd ;
* Do remaining pcie setup and save pcie values in dd .
* Any error printing is already done by the init code .
* On return , we have the chip mapped and accessible ,
* but chip registers are not set up until start of
* init_6120_variables .
ret = qib_pcie_ddinit ( dd , pdev , ent ) ;
if ( ret < 0 )
goto bail_free ;
/* initialize chip-specific variables */
ret = init_6120_variables ( dd ) ;
if ( ret )
goto bail_cleanup ;
if ( qib_mini_init )
goto bail ;
if ( qib_pcie_params ( dd , 8 , NULL , NULL ) )
qib_dev_err ( dd , " Failed to setup PCIe or interrupts; "
" continuing anyway \n " ) ;
dd - > cspec - > irq = pdev - > irq ; /* save IRQ */
/* clear diagctrl register, in case diags were running and crashed */
qib_write_kreg ( dd , kr_hwdiagctrl , 0 ) ;
if ( qib_read_kreg64 ( dd , kr_hwerrstatus ) &
qib_write_kreg ( dd , kr_hwerrclear ,
/* setup interrupt handler (interrupt type handled above) */
qib_setup_6120_interrupt ( dd ) ;
/* Note that qpn_mask is set by qib_6120_config_ctxts() first */
qib_6120_init_hwerrors ( dd ) ;
goto bail ;
bail_cleanup :
qib_pcie_ddcleanup ( dd ) ;
bail_free :
qib_free_devdata ( dd ) ;
dd = ERR_PTR ( ret ) ;
bail :
return dd ;