2015-04-20 17:09:27 -04:00
/*
* Copyright 2013 Advanced Micro Devices , Inc .
*
* Permission is hereby granted , free of charge , to any person obtaining a
* copy of this software and associated documentation files ( the " Software " ) ,
* to deal in the Software without restriction , including without limitation
* the rights to use , copy , modify , merge , publish , distribute , sublicense ,
* and / or sell copies of the Software , and to permit persons to whom the
* Software is furnished to do so , subject to the following conditions :
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software .
*
* THE SOFTWARE IS PROVIDED " AS IS " , WITHOUT WARRANTY OF ANY KIND , EXPRESS OR
* IMPLIED , INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY ,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT . IN NO EVENT SHALL
* THE COPYRIGHT HOLDER ( S ) OR AUTHOR ( S ) BE LIABLE FOR ANY CLAIM , DAMAGES OR
* OTHER LIABILITY , WHETHER IN AN ACTION OF CONTRACT , TORT OR OTHERWISE ,
* ARISING FROM , OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
* OTHER DEALINGS IN THE SOFTWARE .
*
* Authors : Alex Deucher
*/
2019-06-10 00:07:57 +02:00
2015-04-20 17:09:27 -04:00
# include <linux/firmware.h>
2019-06-10 00:07:57 +02:00
# include <linux/module.h>
2015-04-20 17:09:27 -04:00
# include "amdgpu.h"
# include "amdgpu_ucode.h"
# include "amdgpu_trace.h"
# include "cikd.h"
# include "cik.h"
# include "bif/bif_4_1_d.h"
# include "bif/bif_4_1_sh_mask.h"
# include "gca/gfx_7_2_d.h"
2015-05-08 14:46:49 +08:00
# include "gca/gfx_7_2_enum.h"
# include "gca/gfx_7_2_sh_mask.h"
2015-04-20 17:09:27 -04:00
# include "gmc/gmc_7_1_d.h"
# include "gmc/gmc_7_1_sh_mask.h"
# include "oss/oss_2_0_d.h"
# include "oss/oss_2_0_sh_mask.h"
static const u32 sdma_offsets [ SDMA_MAX_INSTANCE ] =
{
SDMA0_REGISTER_OFFSET ,
SDMA1_REGISTER_OFFSET
} ;
static void cik_sdma_set_ring_funcs ( struct amdgpu_device * adev ) ;
static void cik_sdma_set_irq_funcs ( struct amdgpu_device * adev ) ;
static void cik_sdma_set_buffer_funcs ( struct amdgpu_device * adev ) ;
static void cik_sdma_set_vm_pte_funcs ( struct amdgpu_device * adev ) ;
2016-08-30 08:59:42 +08:00
static int cik_sdma_soft_reset ( void * handle ) ;
2015-04-20 17:09:27 -04:00
2018-07-02 14:32:28 -05:00
MODULE_FIRMWARE ( " amdgpu/bonaire_sdma.bin " ) ;
MODULE_FIRMWARE ( " amdgpu/bonaire_sdma1.bin " ) ;
MODULE_FIRMWARE ( " amdgpu/hawaii_sdma.bin " ) ;
MODULE_FIRMWARE ( " amdgpu/hawaii_sdma1.bin " ) ;
MODULE_FIRMWARE ( " amdgpu/kaveri_sdma.bin " ) ;
MODULE_FIRMWARE ( " amdgpu/kaveri_sdma1.bin " ) ;
MODULE_FIRMWARE ( " amdgpu/kabini_sdma.bin " ) ;
MODULE_FIRMWARE ( " amdgpu/kabini_sdma1.bin " ) ;
MODULE_FIRMWARE ( " amdgpu/mullins_sdma.bin " ) ;
MODULE_FIRMWARE ( " amdgpu/mullins_sdma1.bin " ) ;
2015-04-20 17:09:27 -04:00
u32 amdgpu_cik_gpu_check_soft_reset ( struct amdgpu_device * adev ) ;
2016-05-30 16:07:40 +08:00
static void cik_sdma_free_microcode ( struct amdgpu_device * adev )
{
int i ;
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
release_firmware ( adev - > sdma . instance [ i ] . fw ) ;
adev - > sdma . instance [ i ] . fw = NULL ;
}
}
2015-04-20 17:09:27 -04:00
/*
* sDMA - System DMA
* Starting with CIK , the GPU has new asynchronous
* DMA engines . These engines are used for compute
* and gfx . There are two DMA engines ( SDMA0 , SDMA1 )
* and each one supports 1 ring buffer used for gfx
* and 2 queues used for compute .
*
* The programming model is very similar to the CP
* ( ring buffer , IBs , etc . ) , but sDMA has it ' s own
* packet format that is different from the PM4 format
* used by the CP . sDMA supports copying data , writing
* embedded data , solid fills , and a number of other
* things . It also has support for tiling / detiling of
* buffers .
*/
/**
* cik_sdma_init_microcode - load ucode images from disk
*
* @ adev : amdgpu_device pointer
*
* Use the firmware interface to load the ucode images into
* the driver ( not loaded into hw ) .
* Returns 0 on success , error on failure .
*/
static int cik_sdma_init_microcode ( struct amdgpu_device * adev )
{
const char * chip_name ;
char fw_name [ 30 ] ;
2015-10-08 16:30:37 -04:00
int err = 0 , i ;
2015-04-20 17:09:27 -04:00
DRM_DEBUG ( " \n " ) ;
switch ( adev - > asic_type ) {
case CHIP_BONAIRE :
chip_name = " bonaire " ;
break ;
case CHIP_HAWAII :
chip_name = " hawaii " ;
break ;
case CHIP_KAVERI :
chip_name = " kaveri " ;
break ;
case CHIP_KABINI :
chip_name = " kabini " ;
break ;
case CHIP_MULLINS :
chip_name = " mullins " ;
break ;
default : BUG ( ) ;
}
2015-10-08 16:30:37 -04:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
2015-04-20 17:09:27 -04:00
if ( i = = 0 )
2018-07-02 14:32:28 -05:00
snprintf ( fw_name , sizeof ( fw_name ) , " amdgpu/%s_sdma.bin " , chip_name ) ;
2015-04-20 17:09:27 -04:00
else
2018-07-02 14:32:28 -05:00
snprintf ( fw_name , sizeof ( fw_name ) , " amdgpu/%s_sdma1.bin " , chip_name ) ;
2015-10-08 16:30:37 -04:00
err = request_firmware ( & adev - > sdma . instance [ i ] . fw , fw_name , adev - > dev ) ;
2015-04-20 17:09:27 -04:00
if ( err )
goto out ;
2015-10-08 16:30:37 -04:00
err = amdgpu_ucode_validate ( adev - > sdma . instance [ i ] . fw ) ;
2015-04-20 17:09:27 -04:00
}
out :
if ( err ) {
2017-02-28 04:55:52 -08:00
pr_err ( " cik_sdma: Failed to load firmware \" %s \" \n " , fw_name ) ;
2015-10-08 16:30:37 -04:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
release_firmware ( adev - > sdma . instance [ i ] . fw ) ;
adev - > sdma . instance [ i ] . fw = NULL ;
2015-04-20 17:09:27 -04:00
}
}
return err ;
}
/**
* cik_sdma_ring_get_rptr - get the current read pointer
*
* @ ring : amdgpu ring pointer
*
* Get the current rptr from the hardware ( CIK + ) .
*/
2016-03-12 09:32:30 +08:00
static uint64_t cik_sdma_ring_get_rptr ( struct amdgpu_ring * ring )
2015-04-20 17:09:27 -04:00
{
u32 rptr ;
rptr = ring - > adev - > wb . wb [ ring - > rptr_offs ] ;
return ( rptr & 0x3fffc ) > > 2 ;
}
/**
* cik_sdma_ring_get_wptr - get the current write pointer
*
* @ ring : amdgpu ring pointer
*
* Get the current wptr from the hardware ( CIK + ) .
*/
2016-03-12 09:32:30 +08:00
static uint64_t cik_sdma_ring_get_wptr ( struct amdgpu_ring * ring )
2015-04-20 17:09:27 -04:00
{
struct amdgpu_device * adev = ring - > adev ;
2018-06-25 12:24:10 -05:00
return ( RREG32 ( mmSDMA0_GFX_RB_WPTR + sdma_offsets [ ring - > me ] ) & 0x3fffc ) > > 2 ;
2015-04-20 17:09:27 -04:00
}
/**
* cik_sdma_ring_set_wptr - commit the write pointer
*
* @ ring : amdgpu ring pointer
*
* Write the wptr back to the hardware ( CIK + ) .
*/
static void cik_sdma_ring_set_wptr ( struct amdgpu_ring * ring )
{
struct amdgpu_device * adev = ring - > adev ;
2018-06-25 12:24:10 -05:00
WREG32 ( mmSDMA0_GFX_RB_WPTR + sdma_offsets [ ring - > me ] ,
2016-03-12 09:32:30 +08:00
( lower_32_bits ( ring - > wptr ) < < 2 ) & 0x3fffc ) ;
2015-04-20 17:09:27 -04:00
}
2015-09-01 13:13:54 +08:00
static void cik_sdma_ring_insert_nop ( struct amdgpu_ring * ring , uint32_t count )
{
2018-11-01 13:42:42 +08:00
struct amdgpu_sdma_instance * sdma = amdgpu_sdma_get_instance_from_ring ( ring ) ;
2015-09-01 13:13:54 +08:00
int i ;
for ( i = 0 ; i < count ; i + + )
if ( sdma & & sdma - > burst_nop & & ( i = = 0 ) )
2016-10-05 16:09:32 +02:00
amdgpu_ring_write ( ring , ring - > funcs - > nop |
2015-09-01 13:13:54 +08:00
SDMA_NOP_COUNT ( count - 1 ) ) ;
else
2016-10-05 16:09:32 +02:00
amdgpu_ring_write ( ring , ring - > funcs - > nop ) ;
2015-09-01 13:13:54 +08:00
}
2015-04-20 17:09:27 -04:00
/**
* cik_sdma_ring_emit_ib - Schedule an IB on the DMA engine
*
* @ ring : amdgpu ring pointer
* @ ib : IB object to schedule
*
* Schedule an IB in the DMA ring ( CIK ) .
*/
static void cik_sdma_ring_emit_ib ( struct amdgpu_ring * ring ,
2018-10-24 13:37:37 +08:00
struct amdgpu_job * job ,
2016-05-06 17:50:03 +02:00
struct amdgpu_ib * ib ,
2019-01-18 18:13:36 +08:00
uint32_t flags )
2015-04-20 17:09:27 -04:00
{
2018-10-24 13:37:37 +08:00
unsigned vmid = AMDGPU_JOB_GET_VMID ( job ) ;
2017-12-18 17:08:25 +01:00
u32 extra_bits = vmid & 0xf ;
2015-04-20 17:09:27 -04:00
/* IB packet must end on a 8 DW boundary */
2019-10-24 19:30:13 -04:00
cik_sdma_ring_insert_nop ( ring , ( 4 - lower_32_bits ( ring - > wptr ) ) & 7 ) ;
2015-09-01 13:13:54 +08:00
2015-04-20 17:09:27 -04:00
amdgpu_ring_write ( ring , SDMA_PACKET ( SDMA_OPCODE_INDIRECT_BUFFER , 0 , extra_bits ) ) ;
amdgpu_ring_write ( ring , ib - > gpu_addr & 0xffffffe0 ) ; /* base must be 32 byte aligned */
amdgpu_ring_write ( ring , upper_32_bits ( ib - > gpu_addr ) & 0xffffffff ) ;
amdgpu_ring_write ( ring , ib - > length_dw ) ;
}
/**
2015-05-11 14:10:34 +02:00
* cik_sdma_ring_emit_hdp_flush - emit an hdp flush on the DMA ring
2015-04-20 17:09:27 -04:00
*
* @ ring : amdgpu ring pointer
*
* Emit an hdp flush packet on the requested DMA ring .
*/
2015-05-11 14:10:34 +02:00
static void cik_sdma_ring_emit_hdp_flush ( struct amdgpu_ring * ring )
2015-04-20 17:09:27 -04:00
{
u32 extra_bits = ( SDMA_POLL_REG_MEM_EXTRA_OP ( 1 ) |
SDMA_POLL_REG_MEM_EXTRA_FUNC ( 3 ) ) ; /* == */
u32 ref_and_mask ;
2018-06-25 12:24:10 -05:00
if ( ring - > me = = 0 )
2015-04-20 17:09:27 -04:00
ref_and_mask = GPU_HDP_FLUSH_DONE__SDMA0_MASK ;
else
ref_and_mask = GPU_HDP_FLUSH_DONE__SDMA1_MASK ;
amdgpu_ring_write ( ring , SDMA_PACKET ( SDMA_OPCODE_POLL_REG_MEM , 0 , extra_bits ) ) ;
amdgpu_ring_write ( ring , mmGPU_HDP_FLUSH_DONE < < 2 ) ;
amdgpu_ring_write ( ring , mmGPU_HDP_FLUSH_REQ < < 2 ) ;
amdgpu_ring_write ( ring , ref_and_mask ) ; /* reference */
amdgpu_ring_write ( ring , ref_and_mask ) ; /* mask */
amdgpu_ring_write ( ring , ( 0xfff < < 16 ) | 10 ) ; /* retry count, poll interval */
}
/**
* cik_sdma_ring_emit_fence - emit a fence on the DMA ring
*
* @ ring : amdgpu ring pointer
* @ fence : amdgpu fence object
*
* Add a DMA fence packet to the ring to write
* the fence seq number and DMA trap packet to generate
* an interrupt if needed ( CIK ) .
*/
static void cik_sdma_ring_emit_fence ( struct amdgpu_ring * ring , u64 addr , u64 seq ,
2015-06-01 14:35:03 +08:00
unsigned flags )
2015-04-20 17:09:27 -04:00
{
2015-06-01 14:35:03 +08:00
bool write64bit = flags & AMDGPU_FENCE_FLAG_64BIT ;
2015-04-20 17:09:27 -04:00
/* write the fence */
amdgpu_ring_write ( ring , SDMA_PACKET ( SDMA_OPCODE_FENCE , 0 , 0 ) ) ;
amdgpu_ring_write ( ring , lower_32_bits ( addr ) ) ;
amdgpu_ring_write ( ring , upper_32_bits ( addr ) ) ;
amdgpu_ring_write ( ring , lower_32_bits ( seq ) ) ;
/* optionally write high bits as well */
if ( write64bit ) {
addr + = 4 ;
amdgpu_ring_write ( ring , SDMA_PACKET ( SDMA_OPCODE_FENCE , 0 , 0 ) ) ;
amdgpu_ring_write ( ring , lower_32_bits ( addr ) ) ;
amdgpu_ring_write ( ring , upper_32_bits ( addr ) ) ;
amdgpu_ring_write ( ring , upper_32_bits ( seq ) ) ;
}
/* generate an interrupt */
amdgpu_ring_write ( ring , SDMA_PACKET ( SDMA_OPCODE_TRAP , 0 , 0 ) ) ;
}
/**
* cik_sdma_gfx_stop - stop the gfx async dma engines
*
* @ adev : amdgpu_device pointer
*
* Stop the gfx async dma ring buffers ( CIK ) .
*/
static void cik_sdma_gfx_stop ( struct amdgpu_device * adev )
{
2015-10-08 16:30:37 -04:00
struct amdgpu_ring * sdma0 = & adev - > sdma . instance [ 0 ] . ring ;
struct amdgpu_ring * sdma1 = & adev - > sdma . instance [ 1 ] . ring ;
2015-04-20 17:09:27 -04:00
u32 rb_cntl ;
int i ;
if ( ( adev - > mman . buffer_funcs_ring = = sdma0 ) | |
( adev - > mman . buffer_funcs_ring = = sdma1 ) )
2018-03-01 11:01:52 +01:00
amdgpu_ttm_set_buffer_funcs_status ( adev , false ) ;
2015-04-20 17:09:27 -04:00
2015-10-08 16:30:37 -04:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
2015-04-20 17:09:27 -04:00
rb_cntl = RREG32 ( mmSDMA0_GFX_RB_CNTL + sdma_offsets [ i ] ) ;
rb_cntl & = ~ SDMA0_GFX_RB_CNTL__RB_ENABLE_MASK ;
WREG32 ( mmSDMA0_GFX_RB_CNTL + sdma_offsets [ i ] , rb_cntl ) ;
WREG32 ( mmSDMA0_GFX_IB_CNTL + sdma_offsets [ i ] , 0 ) ;
}
}
/**
* cik_sdma_rlc_stop - stop the compute async dma engines
*
* @ adev : amdgpu_device pointer
*
* Stop the compute async dma queues ( CIK ) .
*/
static void cik_sdma_rlc_stop ( struct amdgpu_device * adev )
{
/* XXX todo */
}
2016-06-15 16:33:15 -04:00
/**
* cik_ctx_switch_enable - stop the async dma engines context switch
*
* @ adev : amdgpu_device pointer
* @ enable : enable / disable the DMA MEs context switch .
*
* Halt or unhalt the async dma engines context switch ( VI ) .
*/
static void cik_ctx_switch_enable ( struct amdgpu_device * adev , bool enable )
{
2016-07-15 18:37:05 -04:00
u32 f32_cntl , phase_quantum = 0 ;
2016-06-15 16:33:15 -04:00
int i ;
2016-07-15 18:37:05 -04:00
if ( amdgpu_sdma_phase_quantum ) {
unsigned value = amdgpu_sdma_phase_quantum ;
unsigned unit = 0 ;
while ( value > ( SDMA0_PHASE0_QUANTUM__VALUE_MASK > >
SDMA0_PHASE0_QUANTUM__VALUE__SHIFT ) ) {
value = ( value + 1 ) > > 1 ;
unit + + ;
}
if ( unit > ( SDMA0_PHASE0_QUANTUM__UNIT_MASK > >
SDMA0_PHASE0_QUANTUM__UNIT__SHIFT ) ) {
value = ( SDMA0_PHASE0_QUANTUM__VALUE_MASK > >
SDMA0_PHASE0_QUANTUM__VALUE__SHIFT ) ;
unit = ( SDMA0_PHASE0_QUANTUM__UNIT_MASK > >
SDMA0_PHASE0_QUANTUM__UNIT__SHIFT ) ;
WARN_ONCE ( 1 ,
" clamping sdma_phase_quantum to %uK clock cycles \n " ,
value < < unit ) ;
}
phase_quantum =
value < < SDMA0_PHASE0_QUANTUM__VALUE__SHIFT |
unit < < SDMA0_PHASE0_QUANTUM__UNIT__SHIFT ;
}
2016-06-15 16:33:15 -04:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
f32_cntl = RREG32 ( mmSDMA0_CNTL + sdma_offsets [ i ] ) ;
if ( enable ) {
f32_cntl = REG_SET_FIELD ( f32_cntl , SDMA0_CNTL ,
AUTO_CTXSW_ENABLE , 1 ) ;
2016-07-15 18:37:05 -04:00
if ( amdgpu_sdma_phase_quantum ) {
WREG32 ( mmSDMA0_PHASE0_QUANTUM + sdma_offsets [ i ] ,
phase_quantum ) ;
WREG32 ( mmSDMA0_PHASE1_QUANTUM + sdma_offsets [ i ] ,
phase_quantum ) ;
}
2016-06-15 16:33:15 -04:00
} else {
f32_cntl = REG_SET_FIELD ( f32_cntl , SDMA0_CNTL ,
AUTO_CTXSW_ENABLE , 0 ) ;
}
WREG32 ( mmSDMA0_CNTL + sdma_offsets [ i ] , f32_cntl ) ;
}
}
2015-04-20 17:09:27 -04:00
/**
* cik_sdma_enable - stop the async dma engines
*
* @ adev : amdgpu_device pointer
* @ enable : enable / disable the DMA MEs .
*
* Halt or unhalt the async dma engines ( CIK ) .
*/
static void cik_sdma_enable ( struct amdgpu_device * adev , bool enable )
{
u32 me_cntl ;
int i ;
2016-07-12 10:17:53 +10:00
if ( ! enable ) {
2015-04-20 17:09:27 -04:00
cik_sdma_gfx_stop ( adev ) ;
cik_sdma_rlc_stop ( adev ) ;
}
2015-10-08 16:30:37 -04:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
2015-04-20 17:09:27 -04:00
me_cntl = RREG32 ( mmSDMA0_F32_CNTL + sdma_offsets [ i ] ) ;
if ( enable )
me_cntl & = ~ SDMA0_F32_CNTL__HALT_MASK ;
else
me_cntl | = SDMA0_F32_CNTL__HALT_MASK ;
WREG32 ( mmSDMA0_F32_CNTL + sdma_offsets [ i ] , me_cntl ) ;
}
}
/**
* cik_sdma_gfx_resume - setup and start the async dma engines
*
* @ adev : amdgpu_device pointer
*
* Set up the gfx DMA ring buffers and enable them ( CIK ) .
* Returns 0 for success , error for failure .
*/
static int cik_sdma_gfx_resume ( struct amdgpu_device * adev )
{
struct amdgpu_ring * ring ;
u32 rb_cntl , ib_cntl ;
u32 rb_bufsz ;
u32 wb_offset ;
int i , j , r ;
2015-10-08 16:30:37 -04:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
ring = & adev - > sdma . instance [ i ] . ring ;
2015-04-20 17:09:27 -04:00
wb_offset = ( ring - > rptr_offs * 4 ) ;
mutex_lock ( & adev - > srbm_mutex ) ;
for ( j = 0 ; j < 16 ; j + + ) {
cik_srbm_select ( adev , 0 , 0 , 0 , j ) ;
/* SDMA GFX */
WREG32 ( mmSDMA0_GFX_VIRTUAL_ADDR + sdma_offsets [ i ] , 0 ) ;
WREG32 ( mmSDMA0_GFX_APE1_CNTL + sdma_offsets [ i ] , 0 ) ;
/* XXX SDMA RLC - todo */
}
cik_srbm_select ( adev , 0 , 0 , 0 , 0 ) ;
mutex_unlock ( & adev - > srbm_mutex ) ;
2016-02-12 03:05:24 -05:00
WREG32 ( mmSDMA0_TILING_CONFIG + sdma_offsets [ i ] ,
adev - > gfx . config . gb_addr_config & 0x70 ) ;
2015-04-20 17:09:27 -04:00
WREG32 ( mmSDMA0_SEM_INCOMPLETE_TIMER_CNTL + sdma_offsets [ i ] , 0 ) ;
WREG32 ( mmSDMA0_SEM_WAIT_FAIL_TIMER_CNTL + sdma_offsets [ i ] , 0 ) ;
/* Set ring buffer size in dwords */
rb_bufsz = order_base_2 ( ring - > ring_size / 4 ) ;
rb_cntl = rb_bufsz < < 1 ;
# ifdef __BIG_ENDIAN
2015-06-09 09:58:23 -04:00
rb_cntl | = SDMA0_GFX_RB_CNTL__RB_SWAP_ENABLE_MASK |
SDMA0_GFX_RB_CNTL__RPTR_WRITEBACK_SWAP_ENABLE_MASK ;
2015-04-20 17:09:27 -04:00
# endif
WREG32 ( mmSDMA0_GFX_RB_CNTL + sdma_offsets [ i ] , rb_cntl ) ;
/* Initialize the ring buffer's read and write pointers */
WREG32 ( mmSDMA0_GFX_RB_RPTR + sdma_offsets [ i ] , 0 ) ;
WREG32 ( mmSDMA0_GFX_RB_WPTR + sdma_offsets [ i ] , 0 ) ;
2016-05-25 16:55:50 +08:00
WREG32 ( mmSDMA0_GFX_IB_RPTR + sdma_offsets [ i ] , 0 ) ;
WREG32 ( mmSDMA0_GFX_IB_OFFSET + sdma_offsets [ i ] , 0 ) ;
2015-04-20 17:09:27 -04:00
/* set the wb address whether it's enabled or not */
WREG32 ( mmSDMA0_GFX_RB_RPTR_ADDR_HI + sdma_offsets [ i ] ,
upper_32_bits ( adev - > wb . gpu_addr + wb_offset ) & 0xFFFFFFFF ) ;
WREG32 ( mmSDMA0_GFX_RB_RPTR_ADDR_LO + sdma_offsets [ i ] ,
( ( adev - > wb . gpu_addr + wb_offset ) & 0xFFFFFFFC ) ) ;
rb_cntl | = SDMA0_GFX_RB_CNTL__RPTR_WRITEBACK_ENABLE_MASK ;
WREG32 ( mmSDMA0_GFX_RB_BASE + sdma_offsets [ i ] , ring - > gpu_addr > > 8 ) ;
WREG32 ( mmSDMA0_GFX_RB_BASE_HI + sdma_offsets [ i ] , ring - > gpu_addr > > 40 ) ;
ring - > wptr = 0 ;
2016-03-12 09:32:30 +08:00
WREG32 ( mmSDMA0_GFX_RB_WPTR + sdma_offsets [ i ] , lower_32_bits ( ring - > wptr ) < < 2 ) ;
2015-04-20 17:09:27 -04:00
/* enable DMA RB */
WREG32 ( mmSDMA0_GFX_RB_CNTL + sdma_offsets [ i ] ,
rb_cntl | SDMA0_GFX_RB_CNTL__RB_ENABLE_MASK ) ;
ib_cntl = SDMA0_GFX_IB_CNTL__IB_ENABLE_MASK ;
# ifdef __BIG_ENDIAN
ib_cntl | = SDMA0_GFX_IB_CNTL__IB_SWAP_ENABLE_MASK ;
# endif
/* enable DMA IBs */
WREG32 ( mmSDMA0_GFX_IB_CNTL + sdma_offsets [ i ] , ib_cntl ) ;
2018-10-19 16:22:48 -04:00
ring - > sched . ready = true ;
2016-05-25 16:57:14 +08:00
}
cik_sdma_enable ( adev , true ) ;
2015-04-20 17:09:27 -04:00
2016-05-25 16:57:14 +08:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
ring = & adev - > sdma . instance [ i ] . ring ;
2018-10-19 16:22:48 -04:00
r = amdgpu_ring_test_helper ( ring ) ;
if ( r )
2015-04-20 17:09:27 -04:00
return r ;
if ( adev - > mman . buffer_funcs_ring = = ring )
2018-03-01 11:01:52 +01:00
amdgpu_ttm_set_buffer_funcs_status ( adev , true ) ;
2015-04-20 17:09:27 -04:00
}
return 0 ;
}
/**
* cik_sdma_rlc_resume - setup and start the async dma engines
*
* @ adev : amdgpu_device pointer
*
* Set up the compute DMA queues and enable them ( CIK ) .
* Returns 0 for success , error for failure .
*/
static int cik_sdma_rlc_resume ( struct amdgpu_device * adev )
{
/* XXX todo */
return 0 ;
}
/**
* cik_sdma_load_microcode - load the sDMA ME ucode
*
* @ adev : amdgpu_device pointer
*
* Loads the sDMA0 / 1 ucode .
* Returns 0 for success , - EINVAL if the ucode is not available .
*/
static int cik_sdma_load_microcode ( struct amdgpu_device * adev )
{
const struct sdma_firmware_header_v1_0 * hdr ;
const __le32 * fw_data ;
u32 fw_size ;
int i , j ;
/* halt the MEs */
cik_sdma_enable ( adev , false ) ;
2015-10-08 16:30:37 -04:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
if ( ! adev - > sdma . instance [ i ] . fw )
return - EINVAL ;
hdr = ( const struct sdma_firmware_header_v1_0 * ) adev - > sdma . instance [ i ] . fw - > data ;
2015-04-20 17:09:27 -04:00
amdgpu_ucode_print_sdma_hdr ( & hdr - > header ) ;
fw_size = le32_to_cpu ( hdr - > header . ucode_size_bytes ) / 4 ;
2015-10-08 16:30:37 -04:00
adev - > sdma . instance [ i ] . fw_version = le32_to_cpu ( hdr - > header . ucode_version ) ;
adev - > sdma . instance [ i ] . feature_version = le32_to_cpu ( hdr - > ucode_feature_version ) ;
if ( adev - > sdma . instance [ i ] . feature_version > = 20 )
adev - > sdma . instance [ i ] . burst_nop = true ;
2015-04-20 17:09:27 -04:00
fw_data = ( const __le32 * )
2015-10-08 16:30:37 -04:00
( adev - > sdma . instance [ i ] . fw - > data + le32_to_cpu ( hdr - > header . ucode_array_offset_bytes ) ) ;
2015-04-20 17:09:27 -04:00
WREG32 ( mmSDMA0_UCODE_ADDR + sdma_offsets [ i ] , 0 ) ;
for ( j = 0 ; j < fw_size ; j + + )
WREG32 ( mmSDMA0_UCODE_DATA + sdma_offsets [ i ] , le32_to_cpup ( fw_data + + ) ) ;
2015-10-08 16:30:37 -04:00
WREG32 ( mmSDMA0_UCODE_ADDR + sdma_offsets [ i ] , adev - > sdma . instance [ i ] . fw_version ) ;
2015-04-20 17:09:27 -04:00
}
return 0 ;
}
/**
* cik_sdma_start - setup and start the async dma engines
*
* @ adev : amdgpu_device pointer
*
* Set up the DMA engines and enable them ( CIK ) .
* Returns 0 for success , error for failure .
*/
static int cik_sdma_start ( struct amdgpu_device * adev )
{
int r ;
r = cik_sdma_load_microcode ( adev ) ;
if ( r )
return r ;
2016-05-25 16:57:14 +08:00
/* halt the engine before programing */
cik_sdma_enable ( adev , false ) ;
2016-06-15 16:33:15 -04:00
/* enable sdma ring preemption */
cik_ctx_switch_enable ( adev , true ) ;
2015-04-20 17:09:27 -04:00
/* start the gfx rings and rlc compute queues */
r = cik_sdma_gfx_resume ( adev ) ;
if ( r )
return r ;
r = cik_sdma_rlc_resume ( adev ) ;
if ( r )
return r ;
return 0 ;
}
/**
* cik_sdma_ring_test_ring - simple async dma engine test
*
* @ ring : amdgpu_ring structure holding ring information
*
* Test the DMA engine by writing using it to write an
* value to memory . ( CIK ) .
* Returns 0 for success , error for failure .
*/
static int cik_sdma_ring_test_ring ( struct amdgpu_ring * ring )
{
struct amdgpu_device * adev = ring - > adev ;
unsigned i ;
unsigned index ;
int r ;
u32 tmp ;
u64 gpu_addr ;
2017-12-14 16:03:43 -05:00
r = amdgpu_device_wb_get ( adev , & index ) ;
2018-10-29 10:48:31 +01:00
if ( r )
2015-04-20 17:09:27 -04:00
return r ;
gpu_addr = adev - > wb . gpu_addr + ( index * 4 ) ;
tmp = 0xCAFEDEAD ;
adev - > wb . wb [ index ] = cpu_to_le32 ( tmp ) ;
2016-01-21 11:28:53 +01:00
r = amdgpu_ring_alloc ( ring , 5 ) ;
2018-10-29 10:48:31 +01:00
if ( r )
goto error_free_wb ;
2015-04-20 17:09:27 -04:00
amdgpu_ring_write ( ring , SDMA_PACKET ( SDMA_OPCODE_WRITE , SDMA_WRITE_SUB_OPCODE_LINEAR , 0 ) ) ;
amdgpu_ring_write ( ring , lower_32_bits ( gpu_addr ) ) ;
amdgpu_ring_write ( ring , upper_32_bits ( gpu_addr ) ) ;
amdgpu_ring_write ( ring , 1 ) ; /* number of DWs to follow */
amdgpu_ring_write ( ring , 0xDEADBEEF ) ;
2016-01-21 11:28:53 +01:00
amdgpu_ring_commit ( ring ) ;
2015-04-20 17:09:27 -04:00
for ( i = 0 ; i < adev - > usec_timeout ; i + + ) {
tmp = le32_to_cpu ( adev - > wb . wb [ index ] ) ;
if ( tmp = = 0xDEADBEEF )
break ;
2019-06-10 00:07:49 +02:00
udelay ( 1 ) ;
2015-04-20 17:09:27 -04:00
}
2018-10-29 10:48:31 +01:00
if ( i > = adev - > usec_timeout )
r = - ETIMEDOUT ;
2015-04-20 17:09:27 -04:00
2018-10-29 10:48:31 +01:00
error_free_wb :
amdgpu_device_wb_free ( adev , index ) ;
2015-04-20 17:09:27 -04:00
return r ;
}
/**
* cik_sdma_ring_test_ib - test an IB on the DMA engine
*
* @ ring : amdgpu_ring structure holding ring information
*
* Test a simple IB in the DMA ring ( CIK ) .
* Returns 0 on success , error on failure .
*/
2016-07-05 21:07:17 +02:00
static int cik_sdma_ring_test_ib ( struct amdgpu_ring * ring , long timeout )
2015-04-20 17:09:27 -04:00
{
struct amdgpu_device * adev = ring - > adev ;
struct amdgpu_ib ib ;
2016-10-25 13:00:45 +01:00
struct dma_fence * f = NULL ;
2015-04-20 17:09:27 -04:00
unsigned index ;
u32 tmp = 0 ;
u64 gpu_addr ;
2016-07-05 21:07:17 +02:00
long r ;
2015-04-20 17:09:27 -04:00
2017-12-14 16:03:43 -05:00
r = amdgpu_device_wb_get ( adev , & index ) ;
2018-10-29 16:12:42 +01:00
if ( r )
2015-04-20 17:09:27 -04:00
return r ;
gpu_addr = adev - > wb . gpu_addr + ( index * 4 ) ;
tmp = 0xCAFEDEAD ;
adev - > wb . wb [ index ] = cpu_to_le32 ( tmp ) ;
2015-08-18 18:23:16 +02:00
memset ( & ib , 0 , sizeof ( ib ) ) ;
2020-03-26 08:38:29 +08:00
r = amdgpu_ib_get ( adev , NULL , 256 ,
AMDGPU_IB_POOL_DIRECT , & ib ) ;
2018-10-29 16:12:42 +01:00
if ( r )
2015-06-01 15:33:20 +08:00
goto err0 ;
2015-04-20 17:09:27 -04:00
2016-07-05 15:53:07 +02:00
ib . ptr [ 0 ] = SDMA_PACKET ( SDMA_OPCODE_WRITE ,
SDMA_WRITE_SUB_OPCODE_LINEAR , 0 ) ;
2015-04-20 17:09:27 -04:00
ib . ptr [ 1 ] = lower_32_bits ( gpu_addr ) ;
ib . ptr [ 2 ] = upper_32_bits ( gpu_addr ) ;
ib . ptr [ 3 ] = 1 ;
ib . ptr [ 4 ] = 0xDEADBEEF ;
ib . length_dw = 5 ;
2017-01-23 16:30:38 +08:00
r = amdgpu_ib_schedule ( ring , 1 , & ib , NULL , & f ) ;
2015-06-01 15:33:20 +08:00
if ( r )
goto err1 ;
2015-04-20 17:09:27 -04:00
2016-10-25 13:00:45 +01:00
r = dma_fence_wait_timeout ( f , false , timeout ) ;
2016-07-05 21:07:17 +02:00
if ( r = = 0 ) {
r = - ETIMEDOUT ;
goto err1 ;
} else if ( r < 0 ) {
2015-06-01 15:33:20 +08:00
goto err1 ;
2015-04-20 17:09:27 -04:00
}
2016-07-05 15:53:07 +02:00
tmp = le32_to_cpu ( adev - > wb . wb [ index ] ) ;
2018-10-29 16:12:42 +01:00
if ( tmp = = 0xDEADBEEF )
2016-07-05 21:07:17 +02:00
r = 0 ;
2018-10-29 16:12:42 +01:00
else
2015-04-20 17:09:27 -04:00
r = - EINVAL ;
2015-06-01 15:33:20 +08:00
err1 :
2016-03-17 10:47:07 +08:00
amdgpu_ib_free ( adev , & ib , NULL ) ;
2016-10-25 13:00:45 +01:00
dma_fence_put ( f ) ;
2015-06-01 15:33:20 +08:00
err0 :
2017-12-14 16:03:43 -05:00
amdgpu_device_wb_free ( adev , index ) ;
2015-04-20 17:09:27 -04:00
return r ;
}
/**
* cik_sdma_vm_copy_pages - update PTEs by copying them from the GART
*
* @ ib : indirect buffer to fill with commands
* @ pe : addr of the page entry
* @ src : src addr to copy from
* @ count : number of page entries to update
*
* Update PTEs by copying them from the GART using sDMA ( CIK ) .
*/
static void cik_sdma_vm_copy_pte ( struct amdgpu_ib * ib ,
uint64_t pe , uint64_t src ,
unsigned count )
{
2016-08-12 12:59:59 +02:00
unsigned bytes = count * 8 ;
ib - > ptr [ ib - > length_dw + + ] = SDMA_PACKET ( SDMA_OPCODE_COPY ,
SDMA_WRITE_SUB_OPCODE_LINEAR , 0 ) ;
ib - > ptr [ ib - > length_dw + + ] = bytes ;
ib - > ptr [ ib - > length_dw + + ] = 0 ; /* src/dst endian swap */
ib - > ptr [ ib - > length_dw + + ] = lower_32_bits ( src ) ;
ib - > ptr [ ib - > length_dw + + ] = upper_32_bits ( src ) ;
ib - > ptr [ ib - > length_dw + + ] = lower_32_bits ( pe ) ;
ib - > ptr [ ib - > length_dw + + ] = upper_32_bits ( pe ) ;
2015-04-20 17:09:27 -04:00
}
/**
* cik_sdma_vm_write_pages - update PTEs by writing them manually
*
* @ ib : indirect buffer to fill with commands
* @ pe : addr of the page entry
2016-08-12 11:33:30 +02:00
* @ value : dst addr to write into pe
2015-04-20 17:09:27 -04:00
* @ count : number of page entries to update
* @ incr : increase next addr by incr bytes
*
* Update PTEs by writing them manually using sDMA ( CIK ) .
*/
2016-08-12 11:33:30 +02:00
static void cik_sdma_vm_write_pte ( struct amdgpu_ib * ib , uint64_t pe ,
uint64_t value , unsigned count ,
uint32_t incr )
2015-04-20 17:09:27 -04:00
{
2016-08-12 11:33:30 +02:00
unsigned ndw = count * 2 ;
ib - > ptr [ ib - > length_dw + + ] = SDMA_PACKET ( SDMA_OPCODE_WRITE ,
SDMA_WRITE_SUB_OPCODE_LINEAR , 0 ) ;
ib - > ptr [ ib - > length_dw + + ] = lower_32_bits ( pe ) ;
ib - > ptr [ ib - > length_dw + + ] = upper_32_bits ( pe ) ;
ib - > ptr [ ib - > length_dw + + ] = ndw ;
for ( ; ndw > 0 ; ndw - = 2 ) {
ib - > ptr [ ib - > length_dw + + ] = lower_32_bits ( value ) ;
ib - > ptr [ ib - > length_dw + + ] = upper_32_bits ( value ) ;
value + = incr ;
2015-04-20 17:09:27 -04:00
}
}
/**
* cik_sdma_vm_set_pages - update the page tables using sDMA
*
* @ ib : indirect buffer to fill with commands
* @ pe : addr of the page entry
* @ addr : dst addr to write into pe
* @ count : number of page entries to update
* @ incr : increase next addr by incr bytes
* @ flags : access flags
*
* Update the page tables using sDMA ( CIK ) .
*/
2016-08-12 12:59:59 +02:00
static void cik_sdma_vm_set_pte_pde ( struct amdgpu_ib * ib , uint64_t pe ,
2015-04-20 17:09:27 -04:00
uint64_t addr , unsigned count ,
2016-09-21 16:19:19 +08:00
uint32_t incr , uint64_t flags )
2015-04-20 17:09:27 -04:00
{
2016-08-12 12:59:59 +02:00
/* for physically contiguous pages (vram) */
ib - > ptr [ ib - > length_dw + + ] = SDMA_PACKET ( SDMA_OPCODE_GENERATE_PTE_PDE , 0 , 0 ) ;
ib - > ptr [ ib - > length_dw + + ] = lower_32_bits ( pe ) ; /* dst addr */
ib - > ptr [ ib - > length_dw + + ] = upper_32_bits ( pe ) ;
2017-03-28 16:52:07 +08:00
ib - > ptr [ ib - > length_dw + + ] = lower_32_bits ( flags ) ; /* mask */
ib - > ptr [ ib - > length_dw + + ] = upper_32_bits ( flags ) ;
2016-08-12 12:59:59 +02:00
ib - > ptr [ ib - > length_dw + + ] = lower_32_bits ( addr ) ; /* value */
ib - > ptr [ ib - > length_dw + + ] = upper_32_bits ( addr ) ;
ib - > ptr [ ib - > length_dw + + ] = incr ; /* increment size */
ib - > ptr [ ib - > length_dw + + ] = 0 ;
ib - > ptr [ ib - > length_dw + + ] = count ; /* number of entries */
2015-04-20 17:09:27 -04:00
}
/**
* cik_sdma_vm_pad_ib - pad the IB to the required number of dw
*
* @ ib : indirect buffer to fill with padding
*
*/
2016-01-31 12:20:55 +01:00
static void cik_sdma_ring_pad_ib ( struct amdgpu_ring * ring , struct amdgpu_ib * ib )
2015-04-20 17:09:27 -04:00
{
2018-11-01 13:42:42 +08:00
struct amdgpu_sdma_instance * sdma = amdgpu_sdma_get_instance_from_ring ( ring ) ;
2015-09-01 13:13:54 +08:00
u32 pad_count ;
int i ;
2019-10-24 19:30:13 -04:00
pad_count = ( - ib - > length_dw ) & 7 ;
2015-09-01 13:13:54 +08:00
for ( i = 0 ; i < pad_count ; i + + )
if ( sdma & & sdma - > burst_nop & & ( i = = 0 ) )
ib - > ptr [ ib - > length_dw + + ] =
SDMA_PACKET ( SDMA_OPCODE_NOP , 0 , 0 ) |
SDMA_NOP_COUNT ( pad_count - 1 ) ;
else
ib - > ptr [ ib - > length_dw + + ] =
SDMA_PACKET ( SDMA_OPCODE_NOP , 0 , 0 ) ;
2015-04-20 17:09:27 -04:00
}
/**
2016-03-08 14:11:00 +01:00
* cik_sdma_ring_emit_pipeline_sync - sync the pipeline
2015-04-20 17:09:27 -04:00
*
* @ ring : amdgpu_ring pointer
*
2016-03-08 14:11:00 +01:00
* Make sure all previous operations are completed ( CIK ) .
2015-04-20 17:09:27 -04:00
*/
2016-03-08 14:11:00 +01:00
static void cik_sdma_ring_emit_pipeline_sync ( struct amdgpu_ring * ring )
2015-04-20 17:09:27 -04:00
{
2016-03-02 11:30:31 +08:00
uint32_t seq = ring - > fence_drv . sync_seq ;
uint64_t addr = ring - > fence_drv . gpu_addr ;
/* wait for idle */
amdgpu_ring_write ( ring , SDMA_PACKET ( SDMA_OPCODE_POLL_REG_MEM , 0 ,
SDMA_POLL_REG_MEM_EXTRA_OP ( 0 ) |
SDMA_POLL_REG_MEM_EXTRA_FUNC ( 3 ) | /* equal */
SDMA_POLL_REG_MEM_EXTRA_M ) ) ;
amdgpu_ring_write ( ring , addr & 0xfffffffc ) ;
amdgpu_ring_write ( ring , upper_32_bits ( addr ) & 0xffffffff ) ;
amdgpu_ring_write ( ring , seq ) ; /* reference */
2018-03-27 15:53:52 -05:00
amdgpu_ring_write ( ring , 0xffffffff ) ; /* mask */
2016-03-02 11:30:31 +08:00
amdgpu_ring_write ( ring , ( 0xfff < < 16 ) | 4 ) ; /* retry count, poll interval */
2016-03-08 14:11:00 +01:00
}
2016-03-02 11:30:31 +08:00
2015-04-20 17:09:27 -04:00
/**
* cik_sdma_ring_emit_vm_flush - cik vm flush using sDMA
*
* @ ring : amdgpu_ring pointer
* @ vm : amdgpu_vm pointer
*
* Update the page table base and flush the VM TLB
* using sDMA ( CIK ) .
*/
static void cik_sdma_ring_emit_vm_flush ( struct amdgpu_ring * ring ,
2018-02-04 10:32:35 +01:00
unsigned vmid , uint64_t pd_addr )
2015-04-20 17:09:27 -04:00
{
u32 extra_bits = ( SDMA_POLL_REG_MEM_EXTRA_OP ( 0 ) |
SDMA_POLL_REG_MEM_EXTRA_FUNC ( 0 ) ) ; /* always */
2018-02-04 10:32:35 +01:00
amdgpu_gmc_emit_flush_gpu_tlb ( ring , vmid , pd_addr ) ;
2015-04-20 17:09:27 -04:00
amdgpu_ring_write ( ring , SDMA_PACKET ( SDMA_OPCODE_POLL_REG_MEM , 0 , extra_bits ) ) ;
amdgpu_ring_write ( ring , mmVM_INVALIDATE_REQUEST < < 2 ) ;
amdgpu_ring_write ( ring , 0 ) ;
amdgpu_ring_write ( ring , 0 ) ; /* reference */
amdgpu_ring_write ( ring , 0 ) ; /* mask */
amdgpu_ring_write ( ring , ( 0xfff < < 16 ) | 10 ) ; /* retry count, poll interval */
}
2018-01-12 16:33:15 +01:00
static void cik_sdma_ring_emit_wreg ( struct amdgpu_ring * ring ,
uint32_t reg , uint32_t val )
{
amdgpu_ring_write ( ring , SDMA_PACKET ( SDMA_OPCODE_SRBM_WRITE , 0 , 0xf000 ) ) ;
amdgpu_ring_write ( ring , reg ) ;
amdgpu_ring_write ( ring , val ) ;
}
2015-04-20 17:09:27 -04:00
static void cik_enable_sdma_mgcg ( struct amdgpu_device * adev ,
bool enable )
{
u32 orig , data ;
2016-02-05 10:56:22 -05:00
if ( enable & & ( adev - > cg_flags & AMD_CG_SUPPORT_SDMA_MGCG ) ) {
2015-04-20 17:09:27 -04:00
WREG32 ( mmSDMA0_CLK_CTRL + SDMA0_REGISTER_OFFSET , 0x00000100 ) ;
WREG32 ( mmSDMA0_CLK_CTRL + SDMA1_REGISTER_OFFSET , 0x00000100 ) ;
} else {
orig = data = RREG32 ( mmSDMA0_CLK_CTRL + SDMA0_REGISTER_OFFSET ) ;
data | = 0xff000000 ;
if ( data ! = orig )
WREG32 ( mmSDMA0_CLK_CTRL + SDMA0_REGISTER_OFFSET , data ) ;
orig = data = RREG32 ( mmSDMA0_CLK_CTRL + SDMA1_REGISTER_OFFSET ) ;
data | = 0xff000000 ;
if ( data ! = orig )
WREG32 ( mmSDMA0_CLK_CTRL + SDMA1_REGISTER_OFFSET , data ) ;
}
}
static void cik_enable_sdma_mgls ( struct amdgpu_device * adev ,
bool enable )
{
u32 orig , data ;
2016-02-05 10:56:22 -05:00
if ( enable & & ( adev - > cg_flags & AMD_CG_SUPPORT_SDMA_LS ) ) {
2015-04-20 17:09:27 -04:00
orig = data = RREG32 ( mmSDMA0_POWER_CNTL + SDMA0_REGISTER_OFFSET ) ;
data | = 0x100 ;
if ( orig ! = data )
WREG32 ( mmSDMA0_POWER_CNTL + SDMA0_REGISTER_OFFSET , data ) ;
orig = data = RREG32 ( mmSDMA0_POWER_CNTL + SDMA1_REGISTER_OFFSET ) ;
data | = 0x100 ;
if ( orig ! = data )
WREG32 ( mmSDMA0_POWER_CNTL + SDMA1_REGISTER_OFFSET , data ) ;
} else {
orig = data = RREG32 ( mmSDMA0_POWER_CNTL + SDMA0_REGISTER_OFFSET ) ;
data & = ~ 0x100 ;
if ( orig ! = data )
WREG32 ( mmSDMA0_POWER_CNTL + SDMA0_REGISTER_OFFSET , data ) ;
orig = data = RREG32 ( mmSDMA0_POWER_CNTL + SDMA1_REGISTER_OFFSET ) ;
data & = ~ 0x100 ;
if ( orig ! = data )
WREG32 ( mmSDMA0_POWER_CNTL + SDMA1_REGISTER_OFFSET , data ) ;
}
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_early_init ( void * handle )
2015-04-20 17:09:27 -04:00
{
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2015-10-08 16:30:37 -04:00
adev - > sdma . num_instances = SDMA_MAX_INSTANCE ;
2015-04-20 17:09:27 -04:00
cik_sdma_set_ring_funcs ( adev ) ;
cik_sdma_set_irq_funcs ( adev ) ;
cik_sdma_set_buffer_funcs ( adev ) ;
cik_sdma_set_vm_pte_funcs ( adev ) ;
return 0 ;
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_sw_init ( void * handle )
2015-04-20 17:09:27 -04:00
{
struct amdgpu_ring * ring ;
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2015-10-08 16:30:37 -04:00
int r , i ;
2015-04-20 17:09:27 -04:00
r = cik_sdma_init_microcode ( adev ) ;
if ( r ) {
DRM_ERROR ( " Failed to load sdma firmware! \n " ) ;
return r ;
}
/* SDMA trap event */
2018-09-17 15:29:28 +02:00
r = amdgpu_irq_add_id ( adev , AMDGPU_IRQ_CLIENTID_LEGACY , 224 ,
2016-03-29 18:28:50 -04:00
& adev - > sdma . trap_irq ) ;
2015-04-20 17:09:27 -04:00
if ( r )
return r ;
/* SDMA Privileged inst */
2018-09-17 15:29:28 +02:00
r = amdgpu_irq_add_id ( adev , AMDGPU_IRQ_CLIENTID_LEGACY , 241 ,
2016-03-29 18:28:50 -04:00
& adev - > sdma . illegal_inst_irq ) ;
2015-04-20 17:09:27 -04:00
if ( r )
return r ;
/* SDMA Privileged inst */
2018-09-17 15:29:28 +02:00
r = amdgpu_irq_add_id ( adev , AMDGPU_IRQ_CLIENTID_LEGACY , 247 ,
2016-03-29 18:28:50 -04:00
& adev - > sdma . illegal_inst_irq ) ;
2015-04-20 17:09:27 -04:00
if ( r )
return r ;
2015-10-08 16:30:37 -04:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
ring = & adev - > sdma . instance [ i ] . ring ;
ring - > ring_obj = NULL ;
sprintf ( ring - > name , " sdma%d " , i ) ;
2016-04-13 10:30:13 +02:00
r = amdgpu_ring_init ( adev , ring , 1024 ,
2015-10-08 16:30:37 -04:00
& adev - > sdma . trap_irq ,
( i = = 0 ) ?
2019-03-28 17:29:10 +08:00
AMDGPU_SDMA_IRQ_INSTANCE0 :
2020-04-01 11:46:57 +02:00
AMDGPU_SDMA_IRQ_INSTANCE1 ,
AMDGPU_RING_PRIO_DEFAULT ) ;
2015-10-08 16:30:37 -04:00
if ( r )
return r ;
}
2015-04-20 17:09:27 -04:00
return r ;
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_sw_fini ( void * handle )
2015-04-20 17:09:27 -04:00
{
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2015-10-08 16:30:37 -04:00
int i ;
2015-05-22 14:39:35 -04:00
2015-10-08 16:30:37 -04:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + )
amdgpu_ring_fini ( & adev - > sdma . instance [ i ] . ring ) ;
2015-04-20 17:09:27 -04:00
2016-05-30 16:07:40 +08:00
cik_sdma_free_microcode ( adev ) ;
2015-04-20 17:09:27 -04:00
return 0 ;
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_hw_init ( void * handle )
2015-04-20 17:09:27 -04:00
{
int r ;
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2015-04-20 17:09:27 -04:00
r = cik_sdma_start ( adev ) ;
if ( r )
return r ;
return r ;
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_hw_fini ( void * handle )
2015-04-20 17:09:27 -04:00
{
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2016-06-15 16:33:15 -04:00
cik_ctx_switch_enable ( adev , false ) ;
2015-04-20 17:09:27 -04:00
cik_sdma_enable ( adev , false ) ;
return 0 ;
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_suspend ( void * handle )
2015-04-20 17:09:27 -04:00
{
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2015-04-20 17:09:27 -04:00
return cik_sdma_hw_fini ( adev ) ;
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_resume ( void * handle )
2015-04-20 17:09:27 -04:00
{
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2015-04-20 17:09:27 -04:00
2016-08-30 08:59:42 +08:00
cik_sdma_soft_reset ( handle ) ;
2015-04-20 17:09:27 -04:00
return cik_sdma_hw_init ( adev ) ;
}
2015-05-22 14:39:35 -04:00
static bool cik_sdma_is_idle ( void * handle )
2015-04-20 17:09:27 -04:00
{
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2015-04-20 17:09:27 -04:00
u32 tmp = RREG32 ( mmSRBM_STATUS2 ) ;
if ( tmp & ( SRBM_STATUS2__SDMA_BUSY_MASK |
SRBM_STATUS2__SDMA1_BUSY_MASK ) )
return false ;
return true ;
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_wait_for_idle ( void * handle )
2015-04-20 17:09:27 -04:00
{
unsigned i ;
u32 tmp ;
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2015-04-20 17:09:27 -04:00
for ( i = 0 ; i < adev - > usec_timeout ; i + + ) {
tmp = RREG32 ( mmSRBM_STATUS2 ) & ( SRBM_STATUS2__SDMA_BUSY_MASK |
SRBM_STATUS2__SDMA1_BUSY_MASK ) ;
if ( ! tmp )
return 0 ;
udelay ( 1 ) ;
}
return - ETIMEDOUT ;
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_soft_reset ( void * handle )
2015-04-20 17:09:27 -04:00
{
u32 srbm_soft_reset = 0 ;
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2015-04-20 17:09:27 -04:00
u32 tmp = RREG32 ( mmSRBM_STATUS2 ) ;
if ( tmp & SRBM_STATUS2__SDMA_BUSY_MASK ) {
/* sdma0 */
tmp = RREG32 ( mmSDMA0_F32_CNTL + SDMA0_REGISTER_OFFSET ) ;
tmp | = SDMA0_F32_CNTL__HALT_MASK ;
WREG32 ( mmSDMA0_F32_CNTL + SDMA0_REGISTER_OFFSET , tmp ) ;
srbm_soft_reset | = SRBM_SOFT_RESET__SOFT_RESET_SDMA_MASK ;
}
if ( tmp & SRBM_STATUS2__SDMA1_BUSY_MASK ) {
/* sdma1 */
tmp = RREG32 ( mmSDMA0_F32_CNTL + SDMA1_REGISTER_OFFSET ) ;
tmp | = SDMA0_F32_CNTL__HALT_MASK ;
WREG32 ( mmSDMA0_F32_CNTL + SDMA1_REGISTER_OFFSET , tmp ) ;
srbm_soft_reset | = SRBM_SOFT_RESET__SOFT_RESET_SDMA1_MASK ;
}
if ( srbm_soft_reset ) {
tmp = RREG32 ( mmSRBM_SOFT_RESET ) ;
tmp | = srbm_soft_reset ;
dev_info ( adev - > dev , " SRBM_SOFT_RESET=0x%08X \n " , tmp ) ;
WREG32 ( mmSRBM_SOFT_RESET , tmp ) ;
tmp = RREG32 ( mmSRBM_SOFT_RESET ) ;
udelay ( 50 ) ;
tmp & = ~ srbm_soft_reset ;
WREG32 ( mmSRBM_SOFT_RESET , tmp ) ;
tmp = RREG32 ( mmSRBM_SOFT_RESET ) ;
/* Wait a little for things to settle down */
udelay ( 50 ) ;
}
return 0 ;
}
static int cik_sdma_set_trap_irq_state ( struct amdgpu_device * adev ,
struct amdgpu_irq_src * src ,
unsigned type ,
enum amdgpu_interrupt_state state )
{
u32 sdma_cntl ;
switch ( type ) {
2019-03-28 17:29:10 +08:00
case AMDGPU_SDMA_IRQ_INSTANCE0 :
2015-04-20 17:09:27 -04:00
switch ( state ) {
case AMDGPU_IRQ_STATE_DISABLE :
sdma_cntl = RREG32 ( mmSDMA0_CNTL + SDMA0_REGISTER_OFFSET ) ;
sdma_cntl & = ~ SDMA0_CNTL__TRAP_ENABLE_MASK ;
WREG32 ( mmSDMA0_CNTL + SDMA0_REGISTER_OFFSET , sdma_cntl ) ;
break ;
case AMDGPU_IRQ_STATE_ENABLE :
sdma_cntl = RREG32 ( mmSDMA0_CNTL + SDMA0_REGISTER_OFFSET ) ;
sdma_cntl | = SDMA0_CNTL__TRAP_ENABLE_MASK ;
WREG32 ( mmSDMA0_CNTL + SDMA0_REGISTER_OFFSET , sdma_cntl ) ;
break ;
default :
break ;
}
break ;
2019-03-28 17:29:10 +08:00
case AMDGPU_SDMA_IRQ_INSTANCE1 :
2015-04-20 17:09:27 -04:00
switch ( state ) {
case AMDGPU_IRQ_STATE_DISABLE :
sdma_cntl = RREG32 ( mmSDMA0_CNTL + SDMA1_REGISTER_OFFSET ) ;
sdma_cntl & = ~ SDMA0_CNTL__TRAP_ENABLE_MASK ;
WREG32 ( mmSDMA0_CNTL + SDMA1_REGISTER_OFFSET , sdma_cntl ) ;
break ;
case AMDGPU_IRQ_STATE_ENABLE :
sdma_cntl = RREG32 ( mmSDMA0_CNTL + SDMA1_REGISTER_OFFSET ) ;
sdma_cntl | = SDMA0_CNTL__TRAP_ENABLE_MASK ;
WREG32 ( mmSDMA0_CNTL + SDMA1_REGISTER_OFFSET , sdma_cntl ) ;
break ;
default :
break ;
}
break ;
default :
break ;
}
return 0 ;
}
static int cik_sdma_process_trap_irq ( struct amdgpu_device * adev ,
struct amdgpu_irq_src * source ,
struct amdgpu_iv_entry * entry )
{
u8 instance_id , queue_id ;
instance_id = ( entry - > ring_id & 0x3 ) > > 0 ;
queue_id = ( entry - > ring_id & 0xc ) > > 2 ;
DRM_DEBUG ( " IH: SDMA trap \n " ) ;
switch ( instance_id ) {
case 0 :
switch ( queue_id ) {
case 0 :
2015-10-08 16:30:37 -04:00
amdgpu_fence_process ( & adev - > sdma . instance [ 0 ] . ring ) ;
2015-04-20 17:09:27 -04:00
break ;
case 1 :
/* XXX compute */
break ;
case 2 :
/* XXX compute */
break ;
}
break ;
case 1 :
switch ( queue_id ) {
case 0 :
2015-10-08 16:30:37 -04:00
amdgpu_fence_process ( & adev - > sdma . instance [ 1 ] . ring ) ;
2015-04-20 17:09:27 -04:00
break ;
case 1 :
/* XXX compute */
break ;
case 2 :
/* XXX compute */
break ;
}
break ;
}
return 0 ;
}
static int cik_sdma_process_illegal_inst_irq ( struct amdgpu_device * adev ,
struct amdgpu_irq_src * source ,
struct amdgpu_iv_entry * entry )
{
2018-10-16 13:08:21 +02:00
u8 instance_id ;
2015-04-20 17:09:27 -04:00
DRM_ERROR ( " Illegal instruction in SDMA command stream \n " ) ;
2018-10-16 13:08:21 +02:00
instance_id = ( entry - > ring_id & 0x3 ) > > 0 ;
drm_sched_fault ( & adev - > sdma . instance [ instance_id ] . ring . sched ) ;
2015-04-20 17:09:27 -04:00
return 0 ;
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_set_clockgating_state ( void * handle ,
enum amd_clockgating_state state )
2015-04-20 17:09:27 -04:00
{
bool gate = false ;
2015-05-22 14:39:35 -04:00
struct amdgpu_device * adev = ( struct amdgpu_device * ) handle ;
2015-04-20 17:09:27 -04:00
2015-05-22 14:39:35 -04:00
if ( state = = AMD_CG_STATE_GATE )
2015-04-20 17:09:27 -04:00
gate = true ;
cik_enable_sdma_mgcg ( adev , gate ) ;
cik_enable_sdma_mgls ( adev , gate ) ;
return 0 ;
}
2015-05-22 14:39:35 -04:00
static int cik_sdma_set_powergating_state ( void * handle ,
enum amd_powergating_state state )
2015-04-20 17:09:27 -04:00
{
return 0 ;
}
2016-10-13 17:41:13 -04:00
static const struct amd_ip_funcs cik_sdma_ip_funcs = {
2016-05-04 14:28:35 -04:00
. name = " cik_sdma " ,
2015-04-20 17:09:27 -04:00
. early_init = cik_sdma_early_init ,
. late_init = NULL ,
. sw_init = cik_sdma_sw_init ,
. sw_fini = cik_sdma_sw_fini ,
. hw_init = cik_sdma_hw_init ,
. hw_fini = cik_sdma_hw_fini ,
. suspend = cik_sdma_suspend ,
. resume = cik_sdma_resume ,
. is_idle = cik_sdma_is_idle ,
. wait_for_idle = cik_sdma_wait_for_idle ,
. soft_reset = cik_sdma_soft_reset ,
. set_clockgating_state = cik_sdma_set_clockgating_state ,
. set_powergating_state = cik_sdma_set_powergating_state ,
} ;
static const struct amdgpu_ring_funcs cik_sdma_ring_funcs = {
2016-10-05 15:36:39 +02:00
. type = AMDGPU_RING_TYPE_SDMA ,
2016-10-05 16:09:32 +02:00
. align_mask = 0xf ,
. nop = SDMA_PACKET ( SDMA_OPCODE_NOP , 0 , 0 ) ,
2016-03-12 09:32:30 +08:00
. support_64bit_ptrs = false ,
2015-04-20 17:09:27 -04:00
. get_rptr = cik_sdma_ring_get_rptr ,
. get_wptr = cik_sdma_ring_get_wptr ,
. set_wptr = cik_sdma_ring_set_wptr ,
2016-10-05 14:29:38 +02:00
. emit_frame_size =
6 + /* cik_sdma_ring_emit_hdp_flush */
2018-01-19 15:19:16 +01:00
3 + /* hdp invalidate */
2016-10-05 14:29:38 +02:00
6 + /* cik_sdma_ring_emit_pipeline_sync */
2018-01-12 17:08:22 +01:00
CIK_FLUSH_GPU_TLB_NUM_WREG * 3 + 6 + /* cik_sdma_ring_emit_vm_flush */
2016-10-05 14:29:38 +02:00
9 + 9 + 9 , /* cik_sdma_ring_emit_fence x3 for user fence, vm fence */
. emit_ib_size = 7 + 4 , /* cik_sdma_ring_emit_ib */
2015-04-20 17:09:27 -04:00
. emit_ib = cik_sdma_ring_emit_ib ,
. emit_fence = cik_sdma_ring_emit_fence ,
2016-03-08 14:11:00 +01:00
. emit_pipeline_sync = cik_sdma_ring_emit_pipeline_sync ,
2015-04-20 17:09:27 -04:00
. emit_vm_flush = cik_sdma_ring_emit_vm_flush ,
2015-05-11 14:10:34 +02:00
. emit_hdp_flush = cik_sdma_ring_emit_hdp_flush ,
2015-04-20 17:09:27 -04:00
. test_ring = cik_sdma_ring_test_ring ,
. test_ib = cik_sdma_ring_test_ib ,
2015-09-01 13:13:54 +08:00
. insert_nop = cik_sdma_ring_insert_nop ,
2016-01-31 12:20:55 +01:00
. pad_ib = cik_sdma_ring_pad_ib ,
2018-01-12 16:33:15 +01:00
. emit_wreg = cik_sdma_ring_emit_wreg ,
2015-04-20 17:09:27 -04:00
} ;
static void cik_sdma_set_ring_funcs ( struct amdgpu_device * adev )
{
2015-10-08 16:30:37 -04:00
int i ;
2018-06-25 12:24:10 -05:00
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
2015-10-08 16:30:37 -04:00
adev - > sdma . instance [ i ] . ring . funcs = & cik_sdma_ring_funcs ;
2018-06-25 12:24:10 -05:00
adev - > sdma . instance [ i ] . ring . me = i ;
}
2015-04-20 17:09:27 -04:00
}
static const struct amdgpu_irq_src_funcs cik_sdma_trap_irq_funcs = {
. set = cik_sdma_set_trap_irq_state ,
. process = cik_sdma_process_trap_irq ,
} ;
static const struct amdgpu_irq_src_funcs cik_sdma_illegal_inst_irq_funcs = {
. process = cik_sdma_process_illegal_inst_irq ,
} ;
static void cik_sdma_set_irq_funcs ( struct amdgpu_device * adev )
{
2015-10-08 16:30:37 -04:00
adev - > sdma . trap_irq . num_types = AMDGPU_SDMA_IRQ_LAST ;
adev - > sdma . trap_irq . funcs = & cik_sdma_trap_irq_funcs ;
adev - > sdma . illegal_inst_irq . funcs = & cik_sdma_illegal_inst_irq_funcs ;
2015-04-20 17:09:27 -04:00
}
/**
* cik_sdma_emit_copy_buffer - copy buffer using the sDMA engine
*
* @ ring : amdgpu_ring structure holding ring information
* @ src_offset : src GPU address
* @ dst_offset : dst GPU address
* @ byte_count : number of bytes to xfer
*
* Copy GPU buffers using the DMA engine ( CIK ) .
* Used by the amdgpu ttm implementation to move pages if
* registered as the asic copy callback .
*/
2015-08-25 17:23:45 +08:00
static void cik_sdma_emit_copy_buffer ( struct amdgpu_ib * ib ,
2015-04-20 17:09:27 -04:00
uint64_t src_offset ,
uint64_t dst_offset ,
2019-10-15 15:37:48 +08:00
uint32_t byte_count ,
bool tmz )
2015-04-20 17:09:27 -04:00
{
2015-08-25 17:23:45 +08:00
ib - > ptr [ ib - > length_dw + + ] = SDMA_PACKET ( SDMA_OPCODE_COPY , SDMA_COPY_SUB_OPCODE_LINEAR , 0 ) ;
ib - > ptr [ ib - > length_dw + + ] = byte_count ;
ib - > ptr [ ib - > length_dw + + ] = 0 ; /* src/dst endian swap */
ib - > ptr [ ib - > length_dw + + ] = lower_32_bits ( src_offset ) ;
ib - > ptr [ ib - > length_dw + + ] = upper_32_bits ( src_offset ) ;
ib - > ptr [ ib - > length_dw + + ] = lower_32_bits ( dst_offset ) ;
ib - > ptr [ ib - > length_dw + + ] = upper_32_bits ( dst_offset ) ;
2015-04-20 17:09:27 -04:00
}
/**
* cik_sdma_emit_fill_buffer - fill buffer using the sDMA engine
*
* @ ring : amdgpu_ring structure holding ring information
* @ src_data : value to write to buffer
* @ dst_offset : dst GPU address
* @ byte_count : number of bytes to xfer
*
* Fill GPU buffers using the DMA engine ( CIK ) .
*/
2015-08-27 13:46:09 +08:00
static void cik_sdma_emit_fill_buffer ( struct amdgpu_ib * ib ,
2015-04-20 17:09:27 -04:00
uint32_t src_data ,
uint64_t dst_offset ,
uint32_t byte_count )
{
2015-08-27 13:46:09 +08:00
ib - > ptr [ ib - > length_dw + + ] = SDMA_PACKET ( SDMA_OPCODE_CONSTANT_FILL , 0 , 0 ) ;
ib - > ptr [ ib - > length_dw + + ] = lower_32_bits ( dst_offset ) ;
ib - > ptr [ ib - > length_dw + + ] = upper_32_bits ( dst_offset ) ;
ib - > ptr [ ib - > length_dw + + ] = src_data ;
ib - > ptr [ ib - > length_dw + + ] = byte_count ;
2015-04-20 17:09:27 -04:00
}
static const struct amdgpu_buffer_funcs cik_sdma_buffer_funcs = {
. copy_max_bytes = 0x1fffff ,
. copy_num_dw = 7 ,
. emit_copy_buffer = cik_sdma_emit_copy_buffer ,
. fill_max_bytes = 0x1fffff ,
. fill_num_dw = 5 ,
. emit_fill_buffer = cik_sdma_emit_fill_buffer ,
} ;
static void cik_sdma_set_buffer_funcs ( struct amdgpu_device * adev )
{
2018-09-17 15:41:45 +02:00
adev - > mman . buffer_funcs = & cik_sdma_buffer_funcs ;
adev - > mman . buffer_funcs_ring = & adev - > sdma . instance [ 0 ] . ring ;
2015-04-20 17:09:27 -04:00
}
static const struct amdgpu_vm_pte_funcs cik_sdma_vm_pte_funcs = {
2017-09-19 12:58:15 -04:00
. copy_pte_num_dw = 7 ,
2015-04-20 17:09:27 -04:00
. copy_pte = cik_sdma_vm_copy_pte ,
2017-09-19 12:58:15 -04:00
2015-04-20 17:09:27 -04:00
. write_pte = cik_sdma_vm_write_pte ,
. set_pte_pde = cik_sdma_vm_set_pte_pde ,
} ;
static void cik_sdma_set_vm_pte_funcs ( struct amdgpu_device * adev )
{
2016-02-08 17:37:38 +01:00
unsigned i ;
2018-09-17 15:41:45 +02:00
adev - > vm_manager . vm_pte_funcs = & cik_sdma_vm_pte_funcs ;
for ( i = 0 ; i < adev - > sdma . num_instances ; i + + ) {
2019-12-06 16:55:49 +01:00
adev - > vm_manager . vm_pte_scheds [ i ] =
& adev - > sdma . instance [ i ] . ring . sched ;
2015-04-20 17:09:27 -04:00
}
2019-12-06 16:55:49 +01:00
adev - > vm_manager . vm_pte_num_scheds = adev - > sdma . num_instances ;
2015-04-20 17:09:27 -04:00
}
2016-10-13 17:41:13 -04:00
const struct amdgpu_ip_block_version cik_sdma_ip_block =
{
. type = AMD_IP_BLOCK_TYPE_SDMA ,
. major = 2 ,
. minor = 0 ,
. rev = 0 ,
. funcs = & cik_sdma_ip_funcs ,
} ;