On 10/9/2024 9:15 AM, jiadong.zhu@xxxxxxx wrote: > From: Jiadong Zhu <Jiadong.Zhu@xxxxxxx> > > Implement sdma queue reset callback via SMU interface. > > v2: Leverage inst_stop/start functions in reset sequence. > Use GET_INST for physical SDMA instance. > Disable apu for sdma reset. > > Signed-off-by: Jiadong Zhu <Jiadong.Zhu@xxxxxxx> > --- > drivers/gpu/drm/amd/amdgpu/sdma_v4_4_2.c | 97 +++++++++++++++++++----- > 1 file changed, 79 insertions(+), 18 deletions(-) > > diff --git a/drivers/gpu/drm/amd/amdgpu/sdma_v4_4_2.c b/drivers/gpu/drm/amd/amdgpu/sdma_v4_4_2.c > index c77889040760..3cb16af9b78e 100644 > --- a/drivers/gpu/drm/amd/amdgpu/sdma_v4_4_2.c > +++ b/drivers/gpu/drm/amd/amdgpu/sdma_v4_4_2.c > @@ -667,11 +667,12 @@ static uint32_t sdma_v4_4_2_rb_cntl(struct amdgpu_ring *ring, uint32_t rb_cntl) > * > * @adev: amdgpu_device pointer > * @i: instance to resume > + * @restore: used to restore wptr when restart > * > * Set up the gfx DMA ring buffers and enable them. > * Returns 0 for success, error for failure. 
> */ > -static void sdma_v4_4_2_gfx_resume(struct amdgpu_device *adev, unsigned int i) > +static void sdma_v4_4_2_gfx_resume(struct amdgpu_device *adev, unsigned int i, bool restore) > { > struct amdgpu_ring *ring = &adev->sdma.instance[i].ring; > u32 rb_cntl, ib_cntl, wptr_poll_cntl; > @@ -698,16 +699,24 @@ static void sdma_v4_4_2_gfx_resume(struct amdgpu_device *adev, unsigned int i) > WREG32_SDMA(i, regSDMA_GFX_RB_BASE, ring->gpu_addr >> 8); > WREG32_SDMA(i, regSDMA_GFX_RB_BASE_HI, ring->gpu_addr >> 40); > > - ring->wptr = 0; > + if (!restore) > + ring->wptr = 0; > > /* before programing wptr to a less value, need set minor_ptr_update first */ > WREG32_SDMA(i, regSDMA_GFX_MINOR_PTR_UPDATE, 1); > > /* Initialize the ring buffer's read and write pointers */ > - WREG32_SDMA(i, regSDMA_GFX_RB_RPTR, 0); > - WREG32_SDMA(i, regSDMA_GFX_RB_RPTR_HI, 0); > - WREG32_SDMA(i, regSDMA_GFX_RB_WPTR, 0); > - WREG32_SDMA(i, regSDMA_GFX_RB_WPTR_HI, 0); > + if (restore) { > + WREG32_SDMA(i, regSDMA_GFX_RB_RPTR, lower_32_bits(ring->wptr << 2)); > + WREG32_SDMA(i, regSDMA_GFX_RB_RPTR_HI, upper_32_bits(ring->wptr << 2)); > + WREG32_SDMA(i, regSDMA_GFX_RB_WPTR, lower_32_bits(ring->wptr << 2)); > + WREG32_SDMA(i, regSDMA_GFX_RB_WPTR_HI, upper_32_bits(ring->wptr << 2)); > + } else { > + WREG32_SDMA(i, regSDMA_GFX_RB_RPTR, 0); > + WREG32_SDMA(i, regSDMA_GFX_RB_RPTR_HI, 0); > + WREG32_SDMA(i, regSDMA_GFX_RB_WPTR, 0); > + WREG32_SDMA(i, regSDMA_GFX_RB_WPTR_HI, 0); > + } > > doorbell = RREG32_SDMA(i, regSDMA_GFX_DOORBELL); > doorbell_offset = RREG32_SDMA(i, regSDMA_GFX_DOORBELL_OFFSET); > @@ -759,7 +768,7 @@ static void sdma_v4_4_2_gfx_resume(struct amdgpu_device *adev, unsigned int i) > * Set up the page DMA ring buffers and enable them. > * Returns 0 for success, error for failure. 
> */ > -static void sdma_v4_4_2_page_resume(struct amdgpu_device *adev, unsigned int i) > +static void sdma_v4_4_2_page_resume(struct amdgpu_device *adev, unsigned int i, bool restore) > { > struct amdgpu_ring *ring = &adev->sdma.instance[i].page; > u32 rb_cntl, ib_cntl, wptr_poll_cntl; > @@ -775,10 +784,17 @@ static void sdma_v4_4_2_page_resume(struct amdgpu_device *adev, unsigned int i) > WREG32_SDMA(i, regSDMA_PAGE_RB_CNTL, rb_cntl); > > /* Initialize the ring buffer's read and write pointers */ > - WREG32_SDMA(i, regSDMA_PAGE_RB_RPTR, 0); > - WREG32_SDMA(i, regSDMA_PAGE_RB_RPTR_HI, 0); > - WREG32_SDMA(i, regSDMA_PAGE_RB_WPTR, 0); > - WREG32_SDMA(i, regSDMA_PAGE_RB_WPTR_HI, 0); > + if (restore) { > + WREG32_SDMA(i, regSDMA_GFX_RB_RPTR, lower_32_bits(ring->wptr << 2)); > + WREG32_SDMA(i, regSDMA_GFX_RB_RPTR_HI, upper_32_bits(ring->wptr << 2)); > + WREG32_SDMA(i, regSDMA_GFX_RB_WPTR, lower_32_bits(ring->wptr << 2)); > + WREG32_SDMA(i, regSDMA_GFX_RB_WPTR_HI, upper_32_bits(ring->wptr << 2)); > + } else { > + WREG32_SDMA(i, regSDMA_PAGE_RB_RPTR, 0); > + WREG32_SDMA(i, regSDMA_PAGE_RB_RPTR_HI, 0); > + WREG32_SDMA(i, regSDMA_PAGE_RB_WPTR, 0); > + WREG32_SDMA(i, regSDMA_PAGE_RB_WPTR_HI, 0); > + } > > /* set the wb address whether it's enabled or not */ > WREG32_SDMA(i, regSDMA_PAGE_RB_RPTR_ADDR_HI, > @@ -792,7 +808,8 @@ static void sdma_v4_4_2_page_resume(struct amdgpu_device *adev, unsigned int i) > WREG32_SDMA(i, regSDMA_PAGE_RB_BASE, ring->gpu_addr >> 8); > WREG32_SDMA(i, regSDMA_PAGE_RB_BASE_HI, ring->gpu_addr >> 40); > > - ring->wptr = 0; > + if (!restore) > + ring->wptr = 0; > > /* before programing wptr to a less value, need set minor_ptr_update first */ > WREG32_SDMA(i, regSDMA_PAGE_MINOR_PTR_UPDATE, 1); > @@ -916,7 +933,7 @@ static int sdma_v4_4_2_inst_load_microcode(struct amdgpu_device *adev, > * Returns 0 for success, error for failure. 
> */ > static int sdma_v4_4_2_inst_start(struct amdgpu_device *adev, > - uint32_t inst_mask) > + uint32_t inst_mask, bool restore) > { > struct amdgpu_ring *ring; > uint32_t tmp_mask; > @@ -927,7 +944,7 @@ static int sdma_v4_4_2_inst_start(struct amdgpu_device *adev, > sdma_v4_4_2_inst_enable(adev, false, inst_mask); > } else { > /* bypass sdma microcode loading on Gopher */ > - if (adev->firmware.load_type != AMDGPU_FW_LOAD_PSP && > + if (!restore && adev->firmware.load_type != AMDGPU_FW_LOAD_PSP && > adev->sdma.instance[0].fw) { > r = sdma_v4_4_2_inst_load_microcode(adev, inst_mask); > if (r) > @@ -946,9 +963,9 @@ static int sdma_v4_4_2_inst_start(struct amdgpu_device *adev, > uint32_t temp; > > WREG32_SDMA(i, regSDMA_SEM_WAIT_FAIL_TIMER_CNTL, 0); > - sdma_v4_4_2_gfx_resume(adev, i); > + sdma_v4_4_2_gfx_resume(adev, i, restore); > if (adev->sdma.has_page_queue) > - sdma_v4_4_2_page_resume(adev, i); > + sdma_v4_4_2_page_resume(adev, i, restore); > > /* set utc l1 enable flag always to 1 */ > temp = RREG32_SDMA(i, regSDMA_CNTL); > @@ -1390,6 +1407,7 @@ static int sdma_v4_4_2_sw_init(void *handle) > ring = &adev->sdma.instance[i].ring; > ring->ring_obj = NULL; > ring->use_doorbell = true; > + ring->me = i; Appears like an unrelated change. 
This is already done in sdma_v4_4_2_set_ring_funcs() > aid_id = adev->sdma.instance[i].aid_id; > > DRM_DEBUG("SDMA %d use_doorbell being set to: [%s]\n", i, > @@ -1477,7 +1495,7 @@ static int sdma_v4_4_2_hw_init(void *handle) > if (!amdgpu_sriov_vf(adev)) > sdma_v4_4_2_inst_init_golden_registers(adev, inst_mask); > > - r = sdma_v4_4_2_inst_start(adev, inst_mask); > + r = sdma_v4_4_2_inst_start(adev, inst_mask, false); > > return r; > } > @@ -1566,6 +1584,48 @@ static int sdma_v4_4_2_soft_reset(void *handle) > return 0; > } > > +static int sdma_v4_4_2_reset_queue(struct amdgpu_ring *ring, unsigned int vmid) > +{ > + struct amdgpu_device *adev = ring->adev; > + int i, r; > + u32 preempt, inst_mask; > + > + if ((adev->flags & AMD_IS_APU) || amdgpu_sriov_vf(adev)) > + return -EINVAL; > + > + /* stop queue */ > + inst_mask = 1 << ring->me; > + sdma_v4_4_2_inst_gfx_stop(adev, inst_mask); > + if (adev->sdma.has_page_queue) > + sdma_v4_4_2_inst_page_stop(adev, inst_mask); > + > + /* soft reset SDMA_GFX_PREEMPT.IB_PREEMPT = 0*/ > + preempt = RREG32_SDMA(ring->me, regSDMA_GFX_PREEMPT); > + preempt = REG_SET_FIELD(preempt, SDMA_GFX_PREEMPT, IB_PREEMPT, 0); > + WREG32_SDMA(ring->me, regSDMA_GFX_PREEMPT, preempt); > + > + r = amdgpu_dpm_reset_sdma(adev, 1 << GET_INST(SDMA0, ring->me)); > + if (r) { > + dev_err(adev->dev, "amdgpu_dpm_reset_sdma failed(%d).\n", r); If this is here, then it is better to avoid another print in the smu callback. You may rephrase it as "SDMA %d reset failed". > + return r; > + } > + > + udelay(50); > + > + for (i = 0; i < adev->usec_timeout; i++) { > + if (!REG_GET_FIELD(RREG32_SDMA(ring->me, regSDMA_F32_CNTL), SDMA_F32_CNTL, HALT)) > + break; > + udelay(1); > + } > + > + if (i == adev->usec_timeout) { > + dev_err(adev->dev, "waiting for unhalt failed.\n"); Better to add more context - ex: "timed out waiting for SDMA %d unhalt after reset". 
Thanks, Lijo > + return -ETIMEDOUT; > + } > + > + return sdma_v4_4_2_inst_start(adev, inst_mask, true); > +} > + > static int sdma_v4_4_2_set_trap_irq_state(struct amdgpu_device *adev, > struct amdgpu_irq_src *source, > unsigned type, > @@ -1948,6 +2008,7 @@ static const struct amdgpu_ring_funcs sdma_v4_4_2_ring_funcs = { > .emit_wreg = sdma_v4_4_2_ring_emit_wreg, > .emit_reg_wait = sdma_v4_4_2_ring_emit_reg_wait, > .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper, > + .reset = sdma_v4_4_2_reset_queue, > }; > > static const struct amdgpu_ring_funcs sdma_v4_4_2_page_ring_funcs = { > @@ -2160,7 +2221,7 @@ static int sdma_v4_4_2_xcp_resume(void *handle, uint32_t inst_mask) > if (!amdgpu_sriov_vf(adev)) > sdma_v4_4_2_inst_init_golden_registers(adev, inst_mask); > > - r = sdma_v4_4_2_inst_start(adev, inst_mask); > + r = sdma_v4_4_2_inst_start(adev, inst_mask, false); > > return r; > }