Feel free to merge 1+2 since they don't really depend on any other work in the series and they were previously reviewed. Nicholas Kazlauskas On 4/23/19 8:32 AM, Koenig, Christian wrote: > Well you at least have to give me time till after the holidays to get > going again :) > > Not sure exactly jet why we need patch number 5. > > And we should probably commit patch #1 and #2. > > Christian. > > Am 22.04.19 um 13:54 schrieb Grodzovsky, Andrey: >> Ping for patches 3, new patch 5 and patch 6. >> >> Andrey >> >> On 4/18/19 11:00 AM, Andrey Grodzovsky wrote: >>> Also reject TDRs if another one already running. >>> >>> v2: >>> Stop all schedulers across device and entire XGMI hive before >>> force signaling HW fences. >>> Avoid passing job_signaled to helper fnctions to keep all the decision >>> making about skipping HW reset in one place. >>> >>> v3: >>> Fix SW sched. hang after non HW reset. sched.hw_rq_count has to be balanced >>> against it's decrement in drm_sched_stop in non HW reset case. >>> v4: rebase >>> v5: Revert v3 as we do it now in sceduler code. >>> >>> Signed-off-by: Andrey Grodzovsky <andrey.grodzovsky@xxxxxxx> >>> --- >>> drivers/gpu/drm/amd/amdgpu/amdgpu_device.c | 143 +++++++++++++++++++---------- >>> 1 file changed, 95 insertions(+), 48 deletions(-) >>> >>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c >>> index a0e165c..85f8792 100644 >>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c >>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c >>> @@ -3334,8 +3334,6 @@ static int amdgpu_device_pre_asic_reset(struct amdgpu_device *adev, >>> if (!ring || !ring->sched.thread) >>> continue; >>> >>> - drm_sched_stop(&ring->sched, &job->base); >>> - >>> /* after all hw jobs are reset, hw fence is meaningless, so force_completion */ >>> amdgpu_fence_driver_force_completion(ring); >>> } >>> @@ -3343,6 +3341,7 @@ static int amdgpu_device_pre_asic_reset(struct amdgpu_device *adev, >>> if(job) >>> drm_sched_increase_karma(&job->base); >>> >>> + /* Don't suspend on bare metal if we are not going to HW reset the ASIC */ >>> if (!amdgpu_sriov_vf(adev)) { >>> >>> if (!need_full_reset) >>> @@ -3480,37 +3479,21 @@ static int amdgpu_do_asic_reset(struct amdgpu_hive_info *hive, >>> return r; >>> } >>> >>> -static void amdgpu_device_post_asic_reset(struct amdgpu_device *adev) >>> +static bool amdgpu_device_lock_adev(struct amdgpu_device *adev, bool trylock) >>> { >>> - int i; >>> - >>> - for (i = 0; i < AMDGPU_MAX_RINGS; ++i) { >>> - struct amdgpu_ring *ring = adev->rings[i]; >>> - >>> - if (!ring || !ring->sched.thread) >>> - continue; >>> - >>> - if (!adev->asic_reset_res) >>> - drm_sched_resubmit_jobs(&ring->sched); >>> + if (trylock) { >>> + if (!mutex_trylock(&adev->lock_reset)) >>> + return false; >>> + } else >>> + mutex_lock(&adev->lock_reset); >>> >>> - drm_sched_start(&ring->sched, !adev->asic_reset_res); >>> - } >>> - >>> - if (!amdgpu_device_has_dc_support(adev)) { >>> - drm_helper_resume_force_mode(adev->ddev); >>> - } >>> - >>> - adev->asic_reset_res = 0; >>> -} >>> - >>> -static void amdgpu_device_lock_adev(struct amdgpu_device *adev) >>> -{ >>> - mutex_lock(&adev->lock_reset); >>> atomic_inc(&adev->gpu_reset_counter); >>> adev->in_gpu_reset = 1; >>> /* Block kfd: SRIOV would do it separately */ >>> if (!amdgpu_sriov_vf(adev)) >>> amdgpu_amdkfd_pre_reset(adev); >>> + >>> + return true; >>> } >>> >>> static void amdgpu_device_unlock_adev(struct amdgpu_device *adev) >>> @@ -3538,40 +3521,42 @@ static void amdgpu_device_unlock_adev(struct amdgpu_device *adev) >>> int amdgpu_device_gpu_recover(struct amdgpu_device *adev, >>> struct amdgpu_job *job) >>> { >>> - int r; >>> + struct list_head device_list, *device_list_handle = NULL; >>> + bool need_full_reset, job_signaled; >>> struct amdgpu_hive_info *hive = NULL; >>> - bool need_full_reset = false; >>> struct amdgpu_device *tmp_adev = NULL; >>> - struct list_head device_list, *device_list_handle = NULL; >>> + int i, r = 0; >>> >>> + need_full_reset = job_signaled = false; >>> INIT_LIST_HEAD(&device_list); >>> >>> dev_info(adev->dev, "GPU reset begin!\n"); >>> >>> + hive = amdgpu_get_xgmi_hive(adev, false); >>> + >>> /* >>> - * In case of XGMI hive disallow concurrent resets to be triggered >>> - * by different nodes. No point also since the one node already executing >>> - * reset will also reset all the other nodes in the hive. >>> + * Here we trylock to avoid chain of resets executing from >>> + * either trigger by jobs on different adevs in XGMI hive or jobs on >>> + * different schedulers for same device while this TO handler is running. >>> + * We always reset all schedulers for device and all devices for XGMI >>> + * hive so that should take care of them too. >>> */ >>> - hive = amdgpu_get_xgmi_hive(adev, 0); >>> - if (hive && adev->gmc.xgmi.num_physical_nodes > 1 && >>> - !mutex_trylock(&hive->reset_lock)) >>> + >>> + if (hive && !mutex_trylock(&hive->reset_lock)) { >>> + DRM_INFO("Bailing on TDR for s_job:%llx, hive: %llx as another already in progress", >>> + job->base.id, hive->hive_id); >>> return 0; >>> + } >>> >>> /* Start with adev pre asic reset first for soft reset check.*/ >>> - amdgpu_device_lock_adev(adev); >>> - r = amdgpu_device_pre_asic_reset(adev, >>> - job, >>> - &need_full_reset); >>> - if (r) { >>> - /*TODO Should we stop ?*/ >>> - DRM_ERROR("GPU pre asic reset failed with err, %d for drm dev, %s ", >>> - r, adev->ddev->unique); >>> - adev->asic_reset_res = r; >>> + if (!amdgpu_device_lock_adev(adev, !hive)) { >>> + DRM_INFO("Bailing on TDR for s_job:%llx, as another already in progress", >>> + job->base.id); >>> + return 0; >>> } >>> >>> /* Build list of devices to reset */ >>> - if (need_full_reset && adev->gmc.xgmi.num_physical_nodes > 1) { >>> + if (adev->gmc.xgmi.num_physical_nodes > 1) { >>> if (!hive) { >>> amdgpu_device_unlock_adev(adev); >>> return -ENODEV; >>> @@ -3588,13 +3573,56 @@ int amdgpu_device_gpu_recover(struct amdgpu_device *adev, >>> device_list_handle = &device_list; >>> } >>> >>> + /* block all schedulers and reset given job's ring */ >>> + list_for_each_entry(tmp_adev, device_list_handle, gmc.xgmi.head) { >>> + for (i = 0; i < AMDGPU_MAX_RINGS; ++i) { >>> + struct amdgpu_ring *ring = tmp_adev->rings[i]; >>> + >>> + if (!ring || !ring->sched.thread) >>> + continue; >>> + >>> + drm_sched_stop(&ring->sched, &job->base); >>> + } >>> + } >>> + >>> + >>> + /* >>> + * Must check guilty signal here since after this point all old >>> + * HW fences are force signaled. >>> + * >>> + * job->base holds a reference to parent fence >>> + */ >>> + if (job && job->base.s_fence->parent && >>> + dma_fence_is_signaled(job->base.s_fence->parent)) >>> + job_signaled = true; >>> + >>> + if (!amdgpu_device_ip_need_full_reset(adev)) >>> + device_list_handle = &device_list; >>> + >>> + if (job_signaled) { >>> + dev_info(adev->dev, "Guilty job already signaled, skipping HW reset"); >>> + goto skip_hw_reset; >>> + } >>> + >>> + >>> + /* Guilty job will be freed after this*/ >>> + r = amdgpu_device_pre_asic_reset(adev, >>> + job, >>> + &need_full_reset); >>> + if (r) { >>> + /*TODO Should we stop ?*/ >>> + DRM_ERROR("GPU pre asic reset failed with err, %d for drm dev, %s ", >>> + r, adev->ddev->unique); >>> + adev->asic_reset_res = r; >>> + } >>> + >>> retry: /* Rest of adevs pre asic reset from XGMI hive. */ >>> list_for_each_entry(tmp_adev, device_list_handle, gmc.xgmi.head) { >>> >>> if (tmp_adev == adev) >>> continue; >>> >>> - amdgpu_device_lock_adev(tmp_adev); >>> + amdgpu_device_lock_adev(tmp_adev, false); >>> r = amdgpu_device_pre_asic_reset(tmp_adev, >>> NULL, >>> &need_full_reset); >>> @@ -3618,9 +3646,28 @@ int amdgpu_device_gpu_recover(struct amdgpu_device *adev, >>> goto retry; >>> } >>> >>> +skip_hw_reset: >>> + >>> /* Post ASIC reset for all devs .*/ >>> list_for_each_entry(tmp_adev, device_list_handle, gmc.xgmi.head) { >>> - amdgpu_device_post_asic_reset(tmp_adev); >>> + for (i = 0; i < AMDGPU_MAX_RINGS; ++i) { >>> + struct amdgpu_ring *ring = tmp_adev->rings[i]; >>> + >>> + if (!ring || !ring->sched.thread) >>> + continue; >>> + >>> + /* No point to resubmit jobs if we didn't HW reset*/ >>> + if (!tmp_adev->asic_reset_res && !job_signaled) >>> + drm_sched_resubmit_jobs(&ring->sched); >>> + >>> + drm_sched_start(&ring->sched, !tmp_adev->asic_reset_res); >>> + } >>> + >>> + if (!amdgpu_device_has_dc_support(tmp_adev) && !job_signaled) { >>> + drm_helper_resume_force_mode(tmp_adev->ddev); >>> + } >>> + >>> + tmp_adev->asic_reset_res = 0; >>> >>> if (r) { >>> /* bad news, how to tell it to userspace ? */ >>> @@ -3633,7 +3680,7 @@ int amdgpu_device_gpu_recover(struct amdgpu_device *adev, >>> amdgpu_device_unlock_adev(tmp_adev); >>> } >>> >>> - if (hive && adev->gmc.xgmi.num_physical_nodes > 1) >>> + if (hive) >>> mutex_unlock(&hive->reset_lock); >>> >>> if (r) > > _______________________________________________ > dri-devel mailing list > dri-devel@xxxxxxxxxxxxxxxxxxxxx > https://lists.freedesktop.org/mailman/listinfo/dri-devel > _______________________________________________ amd-gfx mailing list amd-gfx@xxxxxxxxxxxxxxxxxxxxx https://lists.freedesktop.org/mailman/listinfo/amd-gfx