After the ctx mutex is added, the pthread_mutex in libdrm can now be removed.

David Zhou

On 2017-10-11 15:25, Christian König wrote:
> Yes, the mutex is mandatory.
>
> As I explained before, it doesn't matter what userspace is doing; the
> kernel IOCTL must always be thread safe.
>
> Otherwise userspace could force the kernel to run into a BUG_ON() or
> worse.
>
> In addition to that, we already use a CS interface upstream which no
> longer has a pthread_mutex.
>
> Regards,
> Christian.
>
> On 11.10.2017 at 05:28, Liu, Monk wrote:
>> Hi Andrey & Christian,
>>
>> Do we really need the mutex lock here?
>> libdrm_amdgpu already has a pthread_mutex to protect against
>> multi-thread races, so the kernel side should be safe with that.
>>
>> BR Monk
>>
>> -----Original Message-----
>> From: Andrey Grodzovsky [mailto:andrey.grodzovsky at amd.com]
>> Sent: Wednesday, October 11, 2017 4:50 AM
>> To: Koenig, Christian <Christian.Koenig at amd.com>; Liu, Monk <Monk.Liu at amd.com>; amd-gfx at lists.freedesktop.org
>> Cc: Grodzovsky, Andrey <Andrey.Grodzovsky at amd.com>
>> Subject: [PATCH v2 2/2] drm/amdgpu: Move old fence waiting before reservation lock is acquired.
>>
>> Helps avoid a deadlock during GPU reset.
>> Added a mutex to amdgpu_ctx to preserve the order of fences on a ring.
>>
>> v2:
>> Moved the waiting logic into a separate function in amdgpu_ctx.c.
>>
>> Signed-off-by: Andrey Grodzovsky <andrey.grodzovsky at amd.com>
>> ---
>>  drivers/gpu/drm/amd/amdgpu/amdgpu.h     |  4 ++++
>>  drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c  |  8 ++++++--
>>  drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c | 30 ++++++++++++++++++++++++------
>>  3 files changed, 34 insertions(+), 8 deletions(-)
>>
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu.h b/drivers/gpu/drm/amd/amdgpu/amdgpu.h
>> index da48f97..235eca5 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu.h
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu.h
>> @@ -741,6 +741,7 @@ struct amdgpu_ctx {
>>  	bool			preamble_presented;
>>  	enum amd_sched_priority init_priority;
>>  	enum amd_sched_priority override_priority;
>> +	struct mutex		lock;
>>  };
>>
>>  struct amdgpu_ctx_mgr {
>> @@ -763,9 +764,12 @@ void amdgpu_ctx_priority_override(struct amdgpu_ctx *ctx,
>>  int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
>>  		     struct drm_file *filp);
>>
>> +int amdgpu_ctx_wait_prev_fence(struct amdgpu_ctx *ctx, unsigned ring_id);
>> +
>>  void amdgpu_ctx_mgr_init(struct amdgpu_ctx_mgr *mgr);
>>  void amdgpu_ctx_mgr_fini(struct amdgpu_ctx_mgr *mgr);
>>
>> +
>>  /*
>>   * file private structure
>>   */
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
>> index 1a54e53..c36297c 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
>> @@ -90,6 +90,8 @@ static int amdgpu_cs_parser_init(struct amdgpu_cs_parser *p, void *data)
>>  		goto free_chunk;
>>  	}
>>
>> +	mutex_lock(&p->ctx->lock);
>> +
>>  	/* get chunks */
>>  	chunk_array_user = u64_to_user_ptr(cs->in.chunks);
>>  	if (copy_from_user(chunk_array, chunk_array_user,
>> @@ -737,8 +739,10 @@ static void amdgpu_cs_parser_fini(struct amdgpu_cs_parser *parser, int error,
>>
>>  	dma_fence_put(parser->fence);
>>
>> -	if (parser->ctx)
>> +	if (parser->ctx) {
>> +		mutex_unlock(&parser->ctx->lock);
>>  		amdgpu_ctx_put(parser->ctx);
>> +	}
>>
>>  	if (parser->bo_list)
>>  		amdgpu_bo_list_put(parser->bo_list);
>> @@ -992,7 +996,7 @@ static int amdgpu_cs_ib_fill(struct amdgpu_device *adev,
>>  	    parser->job->ring->funcs->type == AMDGPU_RING_TYPE_VCE))
>>  		return -EINVAL;
>>
>> -	return 0;
>> +	return amdgpu_ctx_wait_prev_fence(parser->ctx, parser->job->ring->idx);
>>  }
>>
>>  static int amdgpu_cs_process_fence_dep(struct amdgpu_cs_parser *p,
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c
>> index a78b03f6..4309820 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c
>> @@ -67,6 +67,8 @@ static int amdgpu_ctx_init(struct amdgpu_device *adev,
>>  	if (!ctx->fences)
>>  		return -ENOMEM;
>>
>> +	mutex_init(&ctx->lock);
>> +
>>  	for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
>>  		ctx->rings[i].sequence = 1;
>>  		ctx->rings[i].fences = &ctx->fences[amdgpu_sched_jobs * i];
>> @@ -126,6 +128,8 @@ static void amdgpu_ctx_fini(struct amdgpu_ctx *ctx)
>>  				      &ctx->rings[i].entity);
>>
>>  	amdgpu_queue_mgr_fini(adev, &ctx->queue_mgr);
>> +
>> +	mutex_destroy(&ctx->lock);
>>  }
>>
>>  static int amdgpu_ctx_alloc(struct amdgpu_device *adev,
>> @@ -296,12 +300,8 @@ int amdgpu_ctx_add_fence(struct amdgpu_ctx *ctx, struct amdgpu_ring *ring,
>>
>>  	idx = seq & (amdgpu_sched_jobs - 1);
>>  	other = cring->fences[idx];
>> -	if (other) {
>> -		signed long r;
>> -		r = dma_fence_wait_timeout(other, true, MAX_SCHEDULE_TIMEOUT);
>> -		if (r < 0)
>> -			return r;
>> -	}
>> +	if (other)
>> +		BUG_ON(!dma_fence_is_signaled(other));
>>
>>  	dma_fence_get(fence);
>>
>> @@ -372,6 +372,24 @@ void amdgpu_ctx_priority_override(struct amdgpu_ctx *ctx,
>>  	}
>>  }
>>
>> +int amdgpu_ctx_wait_prev_fence(struct amdgpu_ctx *ctx, unsigned ring_id)
>> +{
>> +	struct amdgpu_ctx_ring *cring = &ctx->rings[ring_id];
>> +	unsigned idx = cring->sequence & (amdgpu_sched_jobs - 1);
>> +	struct dma_fence *other = cring->fences[idx];
>> +
>> +	if (other) {
>> +		signed long r;
>> +		r = dma_fence_wait_timeout(other, false, MAX_SCHEDULE_TIMEOUT);
>> +		if (r < 0) {
>> +			DRM_ERROR("Error (%ld) waiting for fence!\n", r);
>> +			return r;
>> +		}
>> +	}
>> +
>> +	return 0;
>> +}
>> +
>>  void amdgpu_ctx_mgr_init(struct amdgpu_ctx_mgr *mgr)
>>  {
>>  	mutex_init(&mgr->lock);
>> --
>> 2.7.4
>>
>
> _______________________________________________
> amd-gfx mailing list
> amd-gfx at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/amd-gfx
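
To make the locking scheme in the patch concrete: the point is ordering, not merely adding a lock. The potentially unbounded wait for the fence that previously occupied a ring slot is moved in front of the reservation lock, while the new per-context mutex (held from amdgpu_cs_parser_init() through amdgpu_cs_parser_fini()) keeps submissions on a context ordered; that ordering is what lets amdgpu_ctx_add_fence() assert with BUG_ON() that the slot's old fence has already signaled. What follows is a minimal userspace model of that scheme, a sketch only: the names (model_fence, model_ctx, submit, etc.) are invented, condition variables stand in for dma_fence, and a plain pthread mutex stands in for the reservation lock.

    /*
     * Simplified model of the ordering the patch establishes; NOT the
     * real amdgpu code. Build with: cc -pthread model.c
     */
    #include <pthread.h>
    #include <stdbool.h>
    #include <stdio.h>

    #define SCHED_JOBS 4	/* power of two, like amdgpu_sched_jobs */

    struct model_fence {
    	pthread_mutex_t lock;
    	pthread_cond_t signaled_cond;
    	bool signaled;
    };

    struct model_ctx {
    	pthread_mutex_t lock;	/* models the new amdgpu_ctx::lock */
    	unsigned sequence;
    	struct model_fence *fences[SCHED_JOBS];
    };

    /* Models the buffer reservation lock taken during CS. */
    static pthread_mutex_t reservation_lock = PTHREAD_MUTEX_INITIALIZER;

    static void fence_wait(struct model_fence *f)
    {
    	pthread_mutex_lock(&f->lock);
    	while (!f->signaled)
    		pthread_cond_wait(&f->signaled_cond, &f->lock);
    	pthread_mutex_unlock(&f->lock);
    }

    /* Mirrors amdgpu_ctx_wait_prev_fence(): drain the slot we are
     * about to reuse while no reservation lock is held yet. */
    static void wait_prev_fence(struct model_ctx *ctx)
    {
    	unsigned idx = ctx->sequence & (SCHED_JOBS - 1);
    	struct model_fence *other = ctx->fences[idx];

    	if (other)
    		fence_wait(other);
    }

    static void submit(struct model_ctx *ctx, struct model_fence *fence)
    {
    	unsigned idx;

    	pthread_mutex_lock(&ctx->lock);	/* taken early, as in parser_init */

    	wait_prev_fence(ctx);		/* BEFORE the reservation lock */

    	pthread_mutex_lock(&reservation_lock);
    	/* ... validate buffers and push the job to the ring here ... */
    	idx = ctx->sequence++ & (SCHED_JOBS - 1);
    	ctx->fences[idx] = fence;	/* slot is known idle here, matching
    					 * the BUG_ON() in the patched
    					 * amdgpu_ctx_add_fence() */
    	pthread_mutex_unlock(&reservation_lock);

    	pthread_mutex_unlock(&ctx->lock); /* released in parser_fini */
    }

    int main(void)
    {
    	struct model_ctx ctx = { .lock = PTHREAD_MUTEX_INITIALIZER };
    	struct model_fence done = {
    		.lock = PTHREAD_MUTEX_INITIALIZER,
    		.signaled_cond = PTHREAD_COND_INITIALIZER,
    		.signaled = true,	/* pretend each job already ran */
    	};

    	/* Enough submissions to wrap the ring and exercise slot reuse. */
    	for (int i = 0; i < 2 * SCHED_JOBS; i++)
    		submit(&ctx, &done);

    	printf("submitted %u jobs in order\n", ctx.sequence);
    	return 0;
    }

Per the commit message, the payoff is deadlock avoidance during GPU reset: a reset path that needs the reservation lock can no longer queue behind a submitter that holds it while waiting on an unsignaled fence.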