Re: [PATCH v1 3/3] drm/amdgpu: add cp queue registers for gfx9 ipdump

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Wed, May 29, 2024 at 5:50 AM Sunil Khatri <sunil.khatri@xxxxxxx> wrote:
>
> Add gfx9 support of CP queue registers for all queues
> to be used by devcoredump.
>
> Signed-off-by: Sunil Khatri <sunil.khatri@xxxxxxx>
> ---
>  drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c | 110 +++++++++++++++++++++++++-
>  1 file changed, 108 insertions(+), 2 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c b/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c
> index f3d281de2a34..f1a7b60e73ce 100644
> --- a/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c
> +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c
> @@ -237,6 +237,47 @@ static const struct amdgpu_hwip_reg_entry gc_reg_list_9[] = {
>         SOC15_REG_ENTRY_STR(GC, 0, mmGRBM_STATUS_SE3)
>  };
>
> +static const struct amdgpu_hwip_reg_entry gc_cp_reg_list_9[] = {
> +       /* compute queue registers */
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_VMID),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_ACTIVE),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PERSISTENT_STATE),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PIPE_PRIORITY),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_QUEUE_PRIORITY),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_QUANTUM),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PQ_BASE),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PQ_BASE_HI),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PQ_RPTR),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PQ_WPTR_POLL_ADDR),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PQ_WPTR_POLL_ADDR_HI),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PQ_DOORBELL_CONTROL),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PQ_CONTROL),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_IB_BASE_ADDR),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_IB_BASE_ADDR_HI),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_IB_RPTR),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_IB_CONTROL),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_DEQUEUE_REQUEST),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_EOP_BASE_ADDR),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_EOP_BASE_ADDR_HI),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_EOP_CONTROL),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_EOP_RPTR),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_EOP_WPTR),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_EOP_EVENTS),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_CTX_SAVE_BASE_ADDR_LO),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_CTX_SAVE_BASE_ADDR_HI),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_CTX_SAVE_CONTROL),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_CNTL_STACK_OFFSET),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_CNTL_STACK_SIZE),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_WG_STATE_OFFSET),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_CTX_SAVE_SIZE),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_GDS_RESOURCE_STATE),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_ERROR),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_EOP_WPTR_MEM),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PQ_WPTR_LO),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_PQ_WPTR_HI),
> +       SOC15_REG_ENTRY_STR(GC, 0, mmCP_HQD_GFX_STATUS),
> +};
> +
>  enum ta_ras_gfx_subblock {
>         /*CPC*/
>         TA_RAS_BLOCK__GFX_CPC_INDEX_START = 0,
> @@ -2086,6 +2127,7 @@ static void gfx_v9_0_alloc_ip_dump(struct amdgpu_device *adev)
>  {
>         uint32_t reg_count = ARRAY_SIZE(gc_reg_list_9);
>         uint32_t *ptr;
> +       uint32_t inst;
>
>         ptr = kcalloc(reg_count, sizeof(uint32_t), GFP_KERNEL);
>         if (ptr == NULL) {
> @@ -2094,6 +2136,19 @@ static void gfx_v9_0_alloc_ip_dump(struct amdgpu_device *adev)
>         } else {
>                 adev->gfx.ip_dump_core = ptr;
>         }
> +
> +       /* Allocate memory for compute queue registers for all the instances */
> +       reg_count = ARRAY_SIZE(gc_cp_reg_list_9);
> +       inst = adev->gfx.mec.num_mec * adev->gfx.mec.num_pipe_per_mec *
> +               adev->gfx.mec.num_queue_per_pipe;
> +
> +       ptr = kcalloc(reg_count * inst, sizeof(uint32_t), GFP_KERNEL);
> +       if (ptr == NULL) {
> +               DRM_ERROR("Failed to allocate memory for GFX CP IP Dump\n");
> +               adev->gfx.ip_dump_cp_queues = NULL;
> +       } else {
> +               adev->gfx.ip_dump_cp_queues = ptr;

As a follow on patch, you may want to rename this to
ip_dump_compute_queues since these are compute queue registers.
Other than that, the series is:
Reviewed-by: Alex Deucher <alexander.deucher@xxxxxxx>

> +       }
>  }
>
>  static int gfx_v9_0_sw_init(void *handle)
> @@ -2311,6 +2366,7 @@ static int gfx_v9_0_sw_fini(void *handle)
>         gfx_v9_0_free_microcode(adev);
>
>         kfree(adev->gfx.ip_dump_core);
> +       kfree(adev->gfx.ip_dump_cp_queues);
>
>         return 0;
>  }
> @@ -6949,7 +7005,7 @@ static void gfx_v9_0_emit_wave_limit(struct amdgpu_ring *ring, bool enable)
>  static void gfx_v9_ip_print(void *handle, struct drm_printer *p)
>  {
>         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
> -       uint32_t i;
> +       uint32_t i, j, k, reg, index = 0;
>         uint32_t reg_count = ARRAY_SIZE(gc_reg_list_9);
>
>         if (!adev->gfx.ip_dump_core)
> @@ -6960,12 +7016,36 @@ static void gfx_v9_ip_print(void *handle, struct drm_printer *p)
>                            gc_reg_list_9[i].reg_name,
>                            adev->gfx.ip_dump_core[i]);
>
> +       /* print compute queue registers for all instances */
> +       if (!adev->gfx.ip_dump_cp_queues)
> +               return;
> +
> +       reg_count = ARRAY_SIZE(gc_cp_reg_list_9);
> +       drm_printf(p, "\nnum_mec: %d num_pipe: %d num_queue: %d\n",
> +                  adev->gfx.mec.num_mec,
> +                  adev->gfx.mec.num_pipe_per_mec,
> +                  adev->gfx.mec.num_queue_per_pipe);
> +
> +       for (i = 0; i < adev->gfx.mec.num_mec; i++) {
> +               for (j = 0; j < adev->gfx.mec.num_pipe_per_mec; j++) {
> +                       for (k = 0; k < adev->gfx.mec.num_queue_per_pipe; k++) {
> +                               drm_printf(p, "\nmec %d, pipe %d, queue %d\n", i, j, k);
> +                               for (reg = 0; reg < reg_count; reg++) {
> +                                       drm_printf(p, "%-50s \t 0x%08x\n",
> +                                                  gc_cp_reg_list_9[reg].reg_name,
> +                                                  adev->gfx.ip_dump_cp_queues[index + reg]);
> +                               }
> +                               index += reg_count;
> +                       }
> +               }
> +       }
> +
>  }
>
>  static void gfx_v9_ip_dump(void *handle)
>  {
>         struct amdgpu_device *adev = (struct amdgpu_device *)handle;
> -       uint32_t i;
> +       uint32_t i, j, k, reg, index = 0;
>         uint32_t reg_count = ARRAY_SIZE(gc_reg_list_9);
>
>         if (!adev->gfx.ip_dump_core)
> @@ -6976,6 +7056,32 @@ static void gfx_v9_ip_dump(void *handle)
>                 adev->gfx.ip_dump_core[i] = RREG32(SOC15_REG_ENTRY_OFFSET(gc_reg_list_9[i]));
>         amdgpu_gfx_off_ctrl(adev, true);
>
> +       /* dump compute queue registers for all instances */
> +       if (!adev->gfx.ip_dump_cp_queues)
> +               return;
> +
> +       reg_count = ARRAY_SIZE(gc_cp_reg_list_9);
> +       amdgpu_gfx_off_ctrl(adev, false);
> +       mutex_lock(&adev->srbm_mutex);
> +       for (i = 0; i < adev->gfx.mec.num_mec; i++) {
> +               for (j = 0; j < adev->gfx.mec.num_pipe_per_mec; j++) {
> +                       for (k = 0; k < adev->gfx.mec.num_queue_per_pipe; k++) {
> +                               /* ME0 is for GFX so start from 1 for CP */
> +                               soc15_grbm_select(adev, 1 + i, j, k, 0, 0);
> +
> +                               for (reg = 0; reg < reg_count; reg++) {
> +                                       adev->gfx.ip_dump_cp_queues[index + reg] =
> +                                               RREG32(SOC15_REG_ENTRY_OFFSET(
> +                                                       gc_cp_reg_list_9[reg]));
> +                               }
> +                               index += reg_count;
> +                       }
> +               }
> +       }
> +       soc15_grbm_select(adev, 0, 0, 0, 0, 0);
> +       mutex_unlock(&adev->srbm_mutex);
> +       amdgpu_gfx_off_ctrl(adev, true);
> +
>  }
>
>  static const struct amd_ip_funcs gfx_v9_0_ip_funcs = {
> --
> 2.34.1
>




[Index of Archives]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]

  Powered by Linux