[PATCH 1/2] drm/amdgpu/gfx9: allocate queues horizontally across pipes

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



Patch 1/2 is Reviewed-by: Tom St Denis <tom.stdenis at amd.com> and patch 2/2 is
Acked-by: Tom St Denis <tom.stdenis at amd.com>.

Cheers,
Tom

On 05/06/17 11:06 AM, Alex Deucher wrote:
> Pipes provide better concurrency than queues, therefore we want to make
> sure that apps use queues from different pipes whenever possible.
> 
> Optimize for the trivial case where an app will consume rings in order,
> therefore we don't want adjacent rings to belong to the same pipe.
> 
> gfx9 was missed when these patches were rebased.
> 
> Signed-off-by: Alex Deucher <alexander.deucher at amd.com>
> ---
>   drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c | 115 +++++++++++++++-------------------
>   1 file changed, 52 insertions(+), 63 deletions(-)
> 
> diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c b/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c
> index 9502353..0c48f6c 100644
> --- a/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c
> +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c
> @@ -1483,9 +1483,44 @@ static int gfx_v9_0_ngg_en(struct amdgpu_device *adev)
>   	return 0;
>   }
>   
> +static int gfx_v9_0_compute_ring_init(struct amdgpu_device *adev, int ring_id,
> +				      int mec, int pipe, int queue)
> +{
> +	int r;
> +	unsigned irq_type;
> +	struct amdgpu_ring *ring = &adev->gfx.compute_ring[ring_id];
> +
> +	ring = &adev->gfx.compute_ring[ring_id];
> +
> +	/* mec0 is me1 */
> +	ring->me = mec + 1;
> +	ring->pipe = pipe;
> +	ring->queue = queue;
> +
> +	ring->ring_obj = NULL;
> +	ring->use_doorbell = true;
> +	ring->doorbell_index = AMDGPU_DOORBELL_MEC_RING0 + ring_id;
> +	ring->eop_gpu_addr = adev->gfx.mec.hpd_eop_gpu_addr
> +				+ (ring_id * GFX9_MEC_HPD_SIZE);
> +	sprintf(ring->name, "comp_%d.%d.%d", ring->me, ring->pipe, ring->queue);
> +
> +	irq_type = AMDGPU_CP_IRQ_COMPUTE_MEC1_PIPE0_EOP
> +		+ ((ring->me - 1) * adev->gfx.mec.num_pipe_per_mec)
> +		+ ring->pipe;
> +
> +	/* type-2 packets are deprecated on MEC, use type-3 instead */
> +	r = amdgpu_ring_init(adev, ring, 1024,
> +			     &adev->gfx.eop_irq, irq_type);
> +	if (r)
> +		return r;
> +
> +
> +	return 0;
> +}
> +
>   static int gfx_v9_0_sw_init(void *handle)
>   {
> -	int i, r, ring_id;
> +	int i, j, k, r, ring_id;
>   	struct amdgpu_ring *ring;
>   	struct amdgpu_kiq *kiq;
>   	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
> @@ -1547,69 +1582,23 @@ static int gfx_v9_0_sw_init(void *handle)
>   			return r;
>   	}
>   
> -	/* set up the compute queues */
> -	for (i = 0, ring_id = 0; i < AMDGPU_MAX_COMPUTE_QUEUES; i++) {
> -		unsigned irq_type;
> -
> -		if (!test_bit(i, adev->gfx.mec.queue_bitmap))
> -			continue;
> -
> -		if (WARN_ON(ring_id >= AMDGPU_MAX_COMPUTE_RINGS))
> -			break;
> -
> -		ring = &adev->gfx.compute_ring[ring_id];
> -
> -		/* mec0 is me1 */
> -		ring->me = ((i / adev->gfx.mec.num_queue_per_pipe)
> -				/ adev->gfx.mec.num_pipe_per_mec)
> -				+ 1;
> -		ring->pipe = (i / adev->gfx.mec.num_queue_per_pipe)
> -				% adev->gfx.mec.num_pipe_per_mec;
> -		ring->queue = i % adev->gfx.mec.num_queue_per_pipe;
> -
> -		ring->ring_obj = NULL;
> -		ring->use_doorbell = true;
> -		ring->eop_gpu_addr = adev->gfx.mec.hpd_eop_gpu_addr + (ring_id * GFX9_MEC_HPD_SIZE);
> -		ring->doorbell_index = AMDGPU_DOORBELL_MEC_RING0 + ring_id;
> -		sprintf(ring->name, "comp_%d.%d.%d", ring->me, ring->pipe, ring->queue);
> -
> -		irq_type = AMDGPU_CP_IRQ_COMPUTE_MEC1_PIPE0_EOP
> -			+ ((ring->me - 1) * adev->gfx.mec.num_pipe_per_mec)
> -			+ ring->pipe;
> -
> -		/* type-2 packets are deprecated on MEC, use type-3 instead */
> -		r = amdgpu_ring_init(adev, ring, 1024, &adev->gfx.eop_irq,
> -				     irq_type);
> -		if (r)
> -			return r;
> -
> -		ring_id++;
> -	}
> -
> -	/* set up the compute queues */
> -	for (i = 0, ring_id = 0; i < AMDGPU_MAX_COMPUTE_QUEUES; i++) {
> -		unsigned irq_type;
> -
> -		/* max 32 queues per MEC */
> -		if ((i >= 32) || (i >= AMDGPU_MAX_COMPUTE_RINGS)) {
> -			DRM_ERROR("Too many (%d) compute rings!\n", i);
> -			break;
> +	/* set up the compute queues - allocate horizontally across pipes */
> +	ring_id = 0;
> +	for (i = 0; i < adev->gfx.mec.num_mec; ++i) {
> +		for (j = 0; j < adev->gfx.mec.num_queue_per_pipe; j++) {
> +			for (k = 0; k < adev->gfx.mec.num_pipe_per_mec; k++) {
> +				if (!amdgpu_is_mec_queue_enabled(adev, i, k, j))
> +					continue;
> +
> +				r = gfx_v9_0_compute_ring_init(adev,
> +							       ring_id,
> +							       i, k, j);
> +				if (r)
> +					return r;
> +
> +				ring_id++;
> +			}
>   		}
> -		ring = &adev->gfx.compute_ring[i];
> -		ring->ring_obj = NULL;
> -		ring->use_doorbell = true;
> -		ring->doorbell_index = (AMDGPU_DOORBELL64_MEC_RING0 + i) << 1;
> -		ring->me = 1; /* first MEC */
> -		ring->pipe = i / 8;
> -		ring->queue = i % 8;
> -		ring->eop_gpu_addr = adev->gfx.mec.hpd_eop_gpu_addr + (i * GFX9_MEC_HPD_SIZE);
> -		sprintf(ring->name, "comp_%d.%d.%d", ring->me, ring->pipe, ring->queue);
> -		irq_type = AMDGPU_CP_IRQ_COMPUTE_MEC1_PIPE0_EOP + ring->pipe;
> -		/* type-2 packets are deprecated on MEC, use type-3 instead */
> -		r = amdgpu_ring_init(adev, ring, 1024,
> -				     &adev->gfx.eop_irq, irq_type);
> -		if (r)
> -			return r;
>   	}
>   
>   	r = gfx_v9_0_kiq_init(adev);
> 



[Index of Archives]     [Linux USB Devel]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]

  Powered by Linux