On Thu, Nov 21, 2024 at 8:33 AM Shashank Sharma <shashank.sharma@xxxxxxx> wrote: > > From: Arunpravin Paneer Selvam <Arunpravin.PaneerSelvam@xxxxxxx> > > - Add a field in struct amdgpu_mqd_prop for userqueue > secure sem fence address since now we have a generic > file for mes_userqueue.c > - Add secure sem fence address mqd support to gfx12 into > their corresponding init functions. > - Enable secure semaphore IRQ handling > > Signed-off-by: Arunpravin Paneer Selvam <Arunpravin.PaneerSelvam@xxxxxxx> > Signed-off-by: Somalapuram Amaranath <Amaranath.Somalapuram@xxxxxxx> > Signed-off-by: Shashank Sharma <shashank.sharma@xxxxxxx> > --- > drivers/gpu/drm/amd/amdgpu/amdgpu.h | 1 + > drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c | 2 ++ > drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c | 27 +++++++++++----------- > drivers/gpu/drm/amd/amdgpu/mes_userqueue.c | 11 +-------- > drivers/gpu/drm/amd/include/v12_structs.h | 4 ++-- > 5 files changed, 20 insertions(+), 25 deletions(-) > > diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu.h b/drivers/gpu/drm/amd/amdgpu/amdgpu.h > index 2c889cc2a59e..9c4df966fa8a 100644 > --- a/drivers/gpu/drm/amd/amdgpu/amdgpu.h > +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu.h > @@ -829,6 +829,7 @@ struct amdgpu_mqd_prop { > uint64_t shadow_addr; > uint64_t gds_bkup_addr; > uint64_t csa_addr; > + uint64_t fenceaddress; I'd prefer fence_address here for readability. With that and the other comments on the earlier patches addressed, the series is: Reviewed-by: Alex Deucher <alexander.deucher@xxxxxxx> > }; > > struct amdgpu_mqd { > diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c b/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > index 0e5732795891..fc2e82eb0d64 100644 > --- a/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c > @@ -4058,6 +4058,8 @@ static int gfx_v11_0_gfx_mqd_init(struct amdgpu_device *adev, void *m, > mqd->gds_bkup_base_hi = upper_32_bits(prop->gds_bkup_addr); > mqd->fw_work_area_base_lo = prop->csa_addr & 0xFFFFFFFC; > mqd->fw_work_area_base_hi = upper_32_bits(prop->csa_addr); > + mqd->fenceaddress_lo = lower_32_bits(prop->fenceaddress); > + mqd->fenceaddress_hi = upper_32_bits(prop->fenceaddress); > > return 0; > } > diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c b/drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c > index b151a75cf88c..ff74f7d389e9 100644 > --- a/drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c > +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c > @@ -47,6 +47,7 @@ > #include "nbif_v6_3_1.h" > #include "mes_v12_0.h" > #include "mes_userqueue.h" > +#include "amdgpu_userq_fence.h" > > #define GFX12_NUM_GFX_RINGS 1 > #define GFX12_MEC_HPD_SIZE 2048 > @@ -2972,6 +2973,8 @@ static int gfx_v12_0_gfx_mqd_init(struct amdgpu_device *adev, void *m, > mqd->shadow_base_hi = upper_32_bits(prop->shadow_addr); > mqd->fw_work_area_base_lo = prop->csa_addr & 0xFFFFFFFC; > mqd->fw_work_area_base_hi = upper_32_bits(prop->csa_addr); > + mqd->fenceaddress_lo = lower_32_bits(prop->fenceaddress); > + mqd->fenceaddress_hi = upper_32_bits(prop->fenceaddress); > > return 0; > } > @@ -4817,25 +4820,23 @@ static int gfx_v12_0_eop_irq(struct amdgpu_device *adev, > struct amdgpu_irq_src *source, > struct amdgpu_iv_entry *entry) > { > - int i; > + u32 doorbell_offset = entry->src_data[0]; > u8 me_id, pipe_id, queue_id; > struct amdgpu_ring *ring; > - uint32_t mes_queue_id = entry->src_data[0]; > + int i; > > DRM_DEBUG("IH: CP EOP\n"); > > - if (adev->enable_mes && (mes_queue_id & AMDGPU_FENCE_MES_QUEUE_FLAG)) { > - struct amdgpu_mes_queue *queue; > + if (adev->enable_mes && doorbell_offset) { > + struct amdgpu_userq_fence_driver *fence_drv = NULL; > + struct xarray *xa = &adev->userq_xa; > + unsigned long flags; > > - mes_queue_id &= AMDGPU_FENCE_MES_QUEUE_ID_MASK; > - > - spin_lock(&adev->mes.queue_id_lock); > - queue = idr_find(&adev->mes.queue_id_idr, mes_queue_id); > - if (queue) { > - DRM_DEBUG("process mes queue id = %d\n", mes_queue_id); > - amdgpu_fence_process(queue->ring); > - } > - spin_unlock(&adev->mes.queue_id_lock); > + xa_lock_irqsave(xa, flags); > + fence_drv = xa_load(xa, doorbell_offset); > + if (fence_drv) > + amdgpu_userq_fence_driver_process(fence_drv); > + xa_unlock_irqrestore(xa, flags); > } else { > me_id = (entry->ring_id & 0x0c) >> 2; > pipe_id = (entry->ring_id & 0x03) >> 0; > diff --git a/drivers/gpu/drm/amd/amdgpu/mes_userqueue.c b/drivers/gpu/drm/amd/amdgpu/mes_userqueue.c > index fe50c85fb2ff..93eb26f072df 100644 > --- a/drivers/gpu/drm/amd/amdgpu/mes_userqueue.c > +++ b/drivers/gpu/drm/amd/amdgpu/mes_userqueue.c > @@ -183,14 +183,6 @@ static int mes_userq_create_ctx_space(struct amdgpu_userq_mgr *uq_mgr, > return 0; > } > > -static void mes_userq_set_fence_space(struct amdgpu_usermode_queue *queue) > -{ > - struct v11_gfx_mqd *mqd = queue->mqd.cpu_ptr; > - > - mqd->fenceaddress_lo = lower_32_bits(queue->fence_drv->gpu_addr); > - mqd->fenceaddress_hi = upper_32_bits(queue->fence_drv->gpu_addr); > -} > - > static int mes_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr, > struct drm_amdgpu_userq_in *args_in, > struct amdgpu_usermode_queue *queue) > @@ -229,6 +221,7 @@ static int mes_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr, > userq_props->mqd_gpu_addr = queue->mqd.gpu_addr; > userq_props->use_doorbell = true; > userq_props->doorbell_index = queue->doorbell_index; > + userq_props->fenceaddress = queue->fence_drv->gpu_addr; > > if (queue->queue_type == AMDGPU_HW_IP_COMPUTE) { > struct drm_amdgpu_userq_mqd_compute_gfx11 *compute_mqd; > @@ -305,8 +298,6 @@ static int mes_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr, > goto free_mqd; > } > > - mes_userq_set_fence_space(queue); > - > /* FW expects WPTR BOs to be mapped into GART */ > r = mes_userq_create_wptr_mapping(uq_mgr, queue, userq_props->wptr_gpu_addr); > if (r) { > diff --git a/drivers/gpu/drm/amd/include/v12_structs.h b/drivers/gpu/drm/amd/include/v12_structs.h > index 5eabab611b02..bbb6ebdc6238 100644 > --- a/drivers/gpu/drm/amd/include/v12_structs.h > +++ b/drivers/gpu/drm/amd/include/v12_structs.h > @@ -535,8 +535,8 @@ struct v12_gfx_mqd { > uint32_t reserved_507; // offset: 507 (0x1FB) > uint32_t reserved_508; // offset: 508 (0x1FC) > uint32_t reserved_509; // offset: 509 (0x1FD) > - uint32_t reserved_510; // offset: 510 (0x1FE) > - uint32_t reserved_511; // offset: 511 (0x1FF) > + uint32_t fenceaddress_lo; // offset: 510 (0x1FE) > + uint32_t fenceaddress_hi; // offset: 511 (0x1FF) > }; > > struct v12_sdma_mqd { > -- > 2.46.2 >