[PATCH] drm/amdgpu: add high priority compute support for gfx9

andresx7@xxxxxxxxx (Andres Rodriguez) · Wed, 3 Jan 2018 22:01:37 -0500

On 2018-01-03 06:29 PM, Alex Deucher wrote:
> On Tue, Jan 2, 2018 at 3:49 PM, Andres Rodriguez <andresx7 at gmail.com> wrote:
>> We follow the same approach as gfx8. The only changes are register
>> access macros.
>>
>> Tested on vega10. The execution latency results fall within the expected
>> ranges from the polaris10 data.
>>
>> Signed-off-by: Andres Rodriguez <andresx7 at gmail.com>
> 
> Reviewed-by: Alex Deucher <alexander.deucher at amd.com>

Thanks, and a happy new year to you :)
> 
> Do you want to send a patch to bump the driver version so you know
> when this is available?
> 

That would be perfect. I'll send it out in the morning.

Regards,
Andres

> Alex
> 
>> ---
>>   drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c | 100 ++++++++++++++++++++++++++++++++++
>>   1 file changed, 100 insertions(+)
>>
>> diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c b/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c
>> index 9f7be230734c..80af928b153e 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c
>> @@ -3734,6 +3734,105 @@ static u64 gfx_v9_0_ring_get_wptr_compute(struct amdgpu_ring *ring)
>>          return wptr;
>>   }
>>
>> +static void gfx_v9_0_ring_set_pipe_percent(struct amdgpu_ring *ring,
>> +                                          bool acquire)
>> +{
>> +       struct amdgpu_device *adev = ring->adev;
>> +       int pipe_num, tmp, reg;
>> +       int pipe_percent = acquire ? SPI_WCL_PIPE_PERCENT_GFX__VALUE_MASK : 0x1;
>> +
>> +       pipe_num = ring->me * adev->gfx.mec.num_pipe_per_mec + ring->pipe;
>> +
>> +       /* first me only has 2 entries, GFX and HP3D */
>> +       if (ring->me > 0)
>> +               pipe_num -= 2;
>> +
>> +       reg = SOC15_REG_OFFSET(GC, 0, mmSPI_WCL_PIPE_PERCENT_GFX) + pipe_num;
>> +       tmp = RREG32(reg);
>> +       tmp = REG_SET_FIELD(tmp, SPI_WCL_PIPE_PERCENT_GFX, VALUE, pipe_percent);
>> +       WREG32(reg, tmp);
>> +}
>> +
>> +static void gfx_v9_0_pipe_reserve_resources(struct amdgpu_device *adev,
>> +                                           struct amdgpu_ring *ring,
>> +                                           bool acquire)
>> +{
>> +       int i, pipe;
>> +       bool reserve;
>> +       struct amdgpu_ring *iring;
>> +
>> +       mutex_lock(&adev->gfx.pipe_reserve_mutex);
>> +       pipe = amdgpu_gfx_queue_to_bit(adev, ring->me, ring->pipe, 0);
>> +       if (acquire)
>> +               set_bit(pipe, adev->gfx.pipe_reserve_bitmap);
>> +       else
>> +               clear_bit(pipe, adev->gfx.pipe_reserve_bitmap);
>> +
>> +       if (!bitmap_weight(adev->gfx.pipe_reserve_bitmap, AMDGPU_MAX_COMPUTE_QUEUES)) {
>> +               /* Clear all reservations - everyone reacquires all resources */
>> +               for (i = 0; i < adev->gfx.num_gfx_rings; ++i)
>> +                       gfx_v9_0_ring_set_pipe_percent(&adev->gfx.gfx_ring[i],
>> +                                                      true);
>> +
>> +               for (i = 0; i < adev->gfx.num_compute_rings; ++i)
>> +                       gfx_v9_0_ring_set_pipe_percent(&adev->gfx.compute_ring[i],
>> +                                                      true);
>> +       } else {
>> +               /* Lower all pipes without a current reservation */
>> +               for (i = 0; i < adev->gfx.num_gfx_rings; ++i) {
>> +                       iring = &adev->gfx.gfx_ring[i];
>> +                       pipe = amdgpu_gfx_queue_to_bit(adev,
>> +                                                      iring->me,
>> +                                                      iring->pipe,
>> +                                                      0);
>> +                       reserve = test_bit(pipe, adev->gfx.pipe_reserve_bitmap);
>> +                       gfx_v9_0_ring_set_pipe_percent(iring, reserve);
>> +               }
>> +
>> +               for (i = 0; i < adev->gfx.num_compute_rings; ++i) {
>> +                       iring = &adev->gfx.compute_ring[i];
>> +                       pipe = amdgpu_gfx_queue_to_bit(adev,
>> +                                                      iring->me,
>> +                                                      iring->pipe,
>> +                                                      0);
>> +                       reserve = test_bit(pipe, adev->gfx.pipe_reserve_bitmap);
>> +                       gfx_v9_0_ring_set_pipe_percent(iring, reserve);
>> +               }
>> +       }
>> +
>> +       mutex_unlock(&adev->gfx.pipe_reserve_mutex);
>> +}
>> +
>> +static void gfx_v9_0_hqd_set_priority(struct amdgpu_device *adev,
>> +                                     struct amdgpu_ring *ring,
>> +                                     bool acquire)
>> +{
>> +       uint32_t pipe_priority = acquire ? 0x2 : 0x0;
>> +       uint32_t queue_priority = acquire ? 0xf : 0x0;
>> +
>> +       mutex_lock(&adev->srbm_mutex);
>> +       soc15_grbm_select(adev, ring->me, ring->pipe, ring->queue, 0);
>> +
>> +       WREG32_SOC15(GC, 0, mmCP_HQD_PIPE_PRIORITY, pipe_priority);
>> +       WREG32_SOC15(GC, 0, mmCP_HQD_QUEUE_PRIORITY, queue_priority);
>> +
>> +       soc15_grbm_select(adev, 0, 0, 0, 0);
>> +       mutex_unlock(&adev->srbm_mutex);
>> +}
>> +
>> +static void gfx_v9_0_ring_set_priority_compute(struct amdgpu_ring *ring,
>> +                                              enum drm_sched_priority priority)
>> +{
>> +       struct amdgpu_device *adev = ring->adev;
>> +       bool acquire = priority == DRM_SCHED_PRIORITY_HIGH_HW;
>> +
>> +       if (ring->funcs->type != AMDGPU_RING_TYPE_COMPUTE)
>> +               return;
>> +
>> +       gfx_v9_0_hqd_set_priority(adev, ring, acquire);
>> +       gfx_v9_0_pipe_reserve_resources(adev, ring, acquire);
>> +}
>> +
>>   static void gfx_v9_0_ring_set_wptr_compute(struct amdgpu_ring *ring)
>>   {
>>          struct amdgpu_device *adev = ring->adev;
>> @@ -4260,6 +4359,7 @@ static const struct amdgpu_ring_funcs gfx_v9_0_ring_funcs_compute = {
>>          .test_ib = gfx_v9_0_ring_test_ib,
>>          .insert_nop = amdgpu_ring_insert_nop,
>>          .pad_ib = amdgpu_ring_generic_pad_ib,
>> +       .set_priority = gfx_v9_0_ring_set_priority_compute,
>>   };
>>
>>   static const struct amdgpu_ring_funcs gfx_v9_0_ring_funcs_kiq = {
>> --
>> 2.14.1
>>
>> _______________________________________________
>> amd-gfx mailing list
>> amd-gfx at lists.freedesktop.org
>> https://lists.freedesktop.org/mailman/listinfo/amd-gfx