On 2/2/26 23:37, Alex Deucher wrote:
> On Mon, Feb 2, 2026 at 7:51 AM Christian König
> <[email protected]> wrote:
>>
>> That is a really complicated dance and wasn't implemented fully correct.
> 
> I'd suggest elaborating on what was wrong with the previous flow.
> It's not entirely clear from the patch.
> 
>>
>> Signed-off-by: Christian König <[email protected]>
>> ---
>>  drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c            | 2 ++
>>  drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.c | 8 +++++++-
>>  drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.h | 1 +
>>  drivers/gpu/drm/amd/amdgpu/amdgpu_userq.c          | 7 +++++--
>>  drivers/gpu/drm/amd/amdgpu/amdgpu_userq.h          | 1 +
>>  5 files changed, 16 insertions(+), 3 deletions(-)
>>
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c 
>> b/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
>> index 02abe85624a6..9cd44be45861 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
>> @@ -2976,6 +2976,8 @@ static int amdgpu_drm_release(struct inode *inode, 
>> struct file *filp)
>>
>>         if (fpriv && drm_dev_enter(dev, &idx)) {
>>                 amdgpu_evf_mgr_shutdown(&fpriv->evf_mgr);
>> +               amdgpu_userq_mgr_cancel_resume(&fpriv->userq_mgr);
>> +               amdgpu_evf_mgr_flush_suspend(&fpriv->evf_mgr);
>>                 amdgpu_userq_mgr_fini(&fpriv->userq_mgr);
>>                 amdgpu_evf_mgr_fini(&fpriv->evf_mgr);
>>                 drm_dev_exit(idx);
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.c 
>> b/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.c
>> index 8fe9f91f9551..ef4da6f2e2a3 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.c
>> @@ -146,13 +146,19 @@ void amdgpu_evf_mgr_init(struct 
>> amdgpu_eviction_fence_mgr *evf_mgr)
>>  void amdgpu_evf_mgr_shutdown(struct amdgpu_eviction_fence_mgr *evf_mgr)
>>  {
>>         evf_mgr->shutdown = true;
>> +       /* Make sure that the shutdown is visible to the suspend work */
>>         flush_work(&evf_mgr->suspend_work);
>>  }
>>
>> -void amdgpu_evf_mgr_fini(struct amdgpu_eviction_fence_mgr *evf_mgr)
>> +void amdgpu_evf_mgr_flush_suspend(struct amdgpu_eviction_fence_mgr *evf_mgr)
>>  {
>>         dma_fence_wait(rcu_dereference_protected(evf_mgr->ev_fence, true),
>>                        false);
>> +       /* Make sure that we are done with the last suspend work */
>>         flush_work(&evf_mgr->suspend_work);
> 
> Is it intended to flush the work here and in amdgpu_evf_mgr_shutdown()?

Yes, we need both. That's why I added the comments to explain why we have each.

Going to improve the commit message.

Christian.

> 
> Alex
> 
>> +}
>> +
>> +void amdgpu_evf_mgr_fini(struct amdgpu_eviction_fence_mgr *evf_mgr)
>> +{
>>         dma_fence_put(evf_mgr->ev_fence);
>>  }
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.h 
>> b/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.h
>> index 527de3a23583..132a13a5dc1c 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.h
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_eviction_fence.h
>> @@ -66,6 +66,7 @@ void amdgpu_evf_mgr_detach_fence(struct 
>> amdgpu_eviction_fence_mgr *evf_mgr,
>>                                  struct amdgpu_bo *bo);
>>  void amdgpu_evf_mgr_init(struct amdgpu_eviction_fence_mgr *evf_mgr);
>>  void amdgpu_evf_mgr_shutdown(struct amdgpu_eviction_fence_mgr *evf_mgr);
>> +void amdgpu_evf_mgr_flush_suspend(struct amdgpu_eviction_fence_mgr 
>> *evf_mgr);
>>  void amdgpu_evf_mgr_fini(struct amdgpu_eviction_fence_mgr *evf_mgr);
>>
>>  #endif
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_userq.c 
>> b/drivers/gpu/drm/amd/amdgpu/amdgpu_userq.c
>> index e007f10a6c1c..60e8a993557a 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_userq.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_userq.c
>> @@ -1350,13 +1350,16 @@ int amdgpu_userq_mgr_init(struct amdgpu_userq_mgr 
>> *userq_mgr, struct drm_file *f
>>         return 0;
>>  }
>>
>> +void amdgpu_userq_mgr_cancel_resume(struct amdgpu_userq_mgr *userq_mgr)
>> +{
>> +       cancel_delayed_work_sync(&userq_mgr->resume_work);
>> +}
>> +
>>  void amdgpu_userq_mgr_fini(struct amdgpu_userq_mgr *userq_mgr)
>>  {
>>         struct amdgpu_usermode_queue *queue;
>>         unsigned long queue_id;
>>
>> -       cancel_delayed_work_sync(&userq_mgr->resume_work);
>> -
>>         mutex_lock(&userq_mgr->userq_mutex);
>>         amdgpu_userq_detect_and_reset_queues(userq_mgr);
>>         xa_for_each(&userq_mgr->userq_xa, queue_id, queue) {
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_userq.h 
>> b/drivers/gpu/drm/amd/amdgpu/amdgpu_userq.h
>> index 095c09f3d96c..13f4e356728b 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_userq.h
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_userq.h
>> @@ -117,6 +117,7 @@ int amdgpu_userq_ioctl(struct drm_device *dev, void 
>> *data, struct drm_file *filp
>>  int amdgpu_userq_mgr_init(struct amdgpu_userq_mgr *userq_mgr, struct 
>> drm_file *file_priv,
>>                           struct amdgpu_device *adev);
>>
>> +void amdgpu_userq_mgr_cancel_resume(struct amdgpu_userq_mgr *userq_mgr);
>>  void amdgpu_userq_mgr_fini(struct amdgpu_userq_mgr *userq_mgr);
>>
>>  int amdgpu_userq_create_object(struct amdgpu_userq_mgr *uq_mgr,
>> --
>> 2.43.0
>>

Reply via email to