On 18.09.23 at 16:57, Danilo Krummrich wrote:
[SNIP]
What this component should do is push jobs to the hardware and not oversee their execution; that's the job of the driver.

While, generally, I'd agree, I think we can't really get around having something that frees the job once its fence got signaled. This "something" could be the driver, but once it ends up being the same code over and over again for every driver, we're probably back to letting the scheduler do it instead in a common way.

We already have a driver private void* in the scheduler fence. What we could do is to let the scheduler provide a functionality to call a function when it signals.
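For illustration, a minimal sketch of what a driver can already do along these lines with the existing dma_fence_add_callback() on the scheduler's finished fence; my_job and my_job_finished are made-up names, and since the callback runs in fence signalling context, real code may want to defer the actual cleanup to a worker:

	struct my_job {
		struct drm_sched_job base;
		struct dma_fence_cb finished_cb;
	};

	static void my_job_finished(struct dma_fence *f, struct dma_fence_cb *cb)
	{
		struct my_job *job = container_of(cb, struct my_job, finished_cb);

		/* Runs in fence signalling context; defer heavy work if needed. */
		drm_sched_job_cleanup(&job->base);
		kfree(job);
	}

	/* After arming the job; -ENOENT means the fence already signaled
	 * and the callback was not queued, so run it directly.
	 */
	if (dma_fence_add_callback(&job->base.s_fence->finished,
				   &job->finished_cb, my_job_finished))
		my_job_finished(&job->base.s_fence->finished,
				&job->finished_cb);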



In other words, drivers should be able to call drm_sched_fini() while there are still jobs pending on the hardware.

Unless we have a better idea on how to do this, I'd, as mentioned, suggest having something like drm_sched_teardown() and/or drm_sched_teardown_timeout() that waits for pending jobs.

Yeah, something like that. But I think the better functionality would be to provide an iterator to go over the pending fences in the scheduler.

This could then be used for quite a bunch of use cases, e.g. even for signaling the hardware fences etc...

Waiting for the last one is then just a "drm_sched_for_each_pending(...) dma_fence_wait_timeout(pending->finished....);".
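As a rough sketch of what that could look like, assuming a hypothetical drm_sched_for_each_pending() helper that does not exist in the tree today. Note that dma_fence_wait_timeout() sleeps, so a fence has to be referenced under job_list_lock and waited on outside of it:

	/* Hypothetical iterator, not in the tree today. */
	#define drm_sched_for_each_pending(job, sched) \
		list_for_each_entry(job, &(sched)->pending_list, list)

	/* Waiting for the last pending job, without sleeping under the lock: */
	struct drm_sched_job *job;
	struct dma_fence *fence = NULL;

	spin_lock(&sched->job_list_lock);
	job = list_last_entry_or_null(&sched->pending_list,
				      struct drm_sched_job, list);
	if (job)
		fence = dma_fence_get(&job->s_fence->finished);
	spin_unlock(&sched->job_list_lock);

	if (fence) {
		dma_fence_wait_timeout(fence, false, msecs_to_jiffies(500));
		dma_fence_put(fence);
	}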



Also keep in mind that you *can't* wait for all hw operations to finish in your flush or file descriptor close callback, or you create un-killable processes.

Right, that's why in Nouveau I first try to wait for the channel (ring) to go idle, and if that doesn't happen within a "reasonable" amount of time, I kill the fence context, signalling all fences with an error code, and then wait for the scheduler to go idle, which comes down to only waiting for all free_job() callbacks to finish, since all jobs are signaled already.
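Roughly, that teardown sequence could be sketched like this; the my_* names are illustrative placeholders, not the actual Nouveau functions:

	static void my_channel_teardown(struct my_channel *chan)
	{
		/* Give in-flight work a bounded chance to drain on its own. */
		if (!my_channel_wait_idle(chan, msecs_to_jiffies(2000)))
			/*
			 * Timed out: kill the fence context, which signals
			 * all remaining fences with an error code.
			 */
			my_fence_context_kill(chan->fence_ctx, -ECANCELED);

		/*
		 * All fences are signaled at this point, so tearing down the
		 * entity/scheduler only waits for the remaining free_job()
		 * callbacks to finish.
		 */
		drm_sched_entity_destroy(&chan->entity);
		drm_sched_fini(&chan->sched);
	}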

Exactly, that's the right thing to do. Can we please document that somewhere?

Regards,
Christian.






Matt



Signed-off-by: Matthew Brost <matthew.br...@intel.com>
---
   drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c |  2 +-
   drivers/gpu/drm/scheduler/sched_entity.c    |  7 ++-
   drivers/gpu/drm/scheduler/sched_main.c      | 50 ++++++++++++++++++---
   include/drm/gpu_scheduler.h                 | 18 ++++++++
   4 files changed, 70 insertions(+), 7 deletions(-)

diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c
index fb5dad687168..7835c0da65c5 100644
--- a/drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c
+++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c
@@ -1873,7 +1873,7 @@ static void amdgpu_ib_preempt_mark_partial_job(struct amdgpu_ring *ring)
        list_for_each_entry_safe(s_job, tmp, &sched->pending_list, list) {
           if (dma_fence_is_signaled(&s_job->s_fence->finished)) {
               /* remove job from ring_mirror_list */
-            list_del_init(&s_job->list);
+            drm_sched_remove_pending_job(s_job);
               sched->ops->free_job(s_job);
               continue;
           }
diff --git a/drivers/gpu/drm/scheduler/sched_entity.c b/drivers/gpu/drm/scheduler/sched_entity.c
index 1dec97caaba3..37557fbb96d0 100644
--- a/drivers/gpu/drm/scheduler/sched_entity.c
+++ b/drivers/gpu/drm/scheduler/sched_entity.c
@@ -104,9 +104,11 @@ int drm_sched_entity_init(struct drm_sched_entity *entity,
       }
       init_completion(&entity->entity_idle);
+    init_completion(&entity->jobs_done);
-    /* We start in an idle state. */
+    /* We start in an idle and jobs done state. */
       complete_all(&entity->entity_idle);
+    complete_all(&entity->jobs_done);
       spin_lock_init(&entity->rq_lock);
       spsc_queue_init(&entity->job_queue);
@@ -256,6 +258,9 @@ static void drm_sched_entity_kill(struct drm_sched_entity *entity)
        /* Make sure this entity is not used by the scheduler at the moment */
       wait_for_completion(&entity->entity_idle);
+    /* Make sure all pending jobs are done */
+    wait_for_completion(&entity->jobs_done);
+
       /* The entity is guaranteed to not be used by the scheduler */
       prev = rcu_dereference_check(entity->last_scheduled, true);
       dma_fence_get(prev);
diff --git a/drivers/gpu/drm/scheduler/sched_main.c b/drivers/gpu/drm/scheduler/sched_main.c
index 689fb6686e01..ed6f5680793a 100644
--- a/drivers/gpu/drm/scheduler/sched_main.c
+++ b/drivers/gpu/drm/scheduler/sched_main.c
@@ -510,12 +510,52 @@ void drm_sched_resume_timeout(struct drm_gpu_scheduler *sched,
   }
   EXPORT_SYMBOL(drm_sched_resume_timeout);
+/**
+ * drm_sched_add_pending_job - Add pending job to scheduler
+ *
+ * @job: scheduler job to add
+ * @tail: add to tail of pending list
+ */
+void drm_sched_add_pending_job(struct drm_sched_job *job, bool tail)
+{
+    struct drm_gpu_scheduler *sched = job->sched;
+    struct drm_sched_entity *entity = job->entity;
+
+    lockdep_assert_held(&sched->job_list_lock);
+
+    if (tail)
+        list_add_tail(&job->list, &sched->pending_list);
+    else
+        list_add(&job->list, &sched->pending_list);
+    if (!entity->pending_job_count++)
+        reinit_completion(&entity->jobs_done);
+}
+EXPORT_SYMBOL(drm_sched_add_pending_job);
+
+/**
+ * drm_sched_remove_pending_job - Remove pending job from scheduler
+ *
+ * @job: scheduler job to remove
+ */
+void drm_sched_remove_pending_job(struct drm_sched_job *job)
+{
+    struct drm_gpu_scheduler *sched = job->sched;
+    struct drm_sched_entity *entity = job->entity;
+
+    lockdep_assert_held(&sched->job_list_lock);
+
+    list_del_init(&job->list);
+    if (!--entity->pending_job_count)
+        complete_all(&entity->jobs_done);
+}
+EXPORT_SYMBOL(drm_sched_remove_pending_job);
+
   static void drm_sched_job_begin(struct drm_sched_job *s_job)
   {
       struct drm_gpu_scheduler *sched = s_job->sched;
       spin_lock(&sched->job_list_lock);
-    list_add_tail(&s_job->list, &sched->pending_list);
+    drm_sched_add_pending_job(s_job, true);
       spin_unlock(&sched->job_list_lock);
   }
@@ -538,7 +578,7 @@ static void drm_sched_job_timedout(struct work_struct *work)
         * drm_sched_cleanup_jobs. It will be reinserted back after sched->thread
            * is parked at which point it's safe.
            */
-        list_del_init(&job->list);
+        drm_sched_remove_pending_job(job);
           spin_unlock(&sched->job_list_lock);
           status = job->sched->ops->timedout_job(job);
@@ -589,7 +629,7 @@ void drm_sched_stop(struct drm_gpu_scheduler *sched, struct drm_sched_job *bad)
         * Add at the head of the queue to reflect it was the earliest
            * job extracted.
            */
-        list_add(&bad->list, &sched->pending_list);
+        drm_sched_add_pending_job(bad, false);
       /*
     * Iterate the job list from later to earlier one and either deactive
@@ -611,7 +651,7 @@ void drm_sched_stop(struct drm_gpu_scheduler *sched, struct drm_sched_job *bad)
                * Locking here is for concurrent resume timeout
                */
               spin_lock(&sched->job_list_lock);
-            list_del_init(&s_job->list);
+            drm_sched_remove_pending_job(s_job);
            spin_unlock(&sched->job_list_lock);
               /*
@@ -1066,7 +1106,7 @@ drm_sched_get_cleanup_job(struct drm_gpu_scheduler *sched)
       if (job && dma_fence_is_signaled(&job->s_fence->finished)) {
           /* remove job from pending_list */
-        list_del_init(&job->list);
+        drm_sched_remove_pending_job(job);
           /* cancel this job's TO timer */
           cancel_delayed_work(&sched->work_tdr);
diff --git a/include/drm/gpu_scheduler.h b/include/drm/gpu_scheduler.h
index b7b818cd81b6..7c628f36fe78 100644
--- a/include/drm/gpu_scheduler.h
+++ b/include/drm/gpu_scheduler.h
@@ -233,6 +233,21 @@ struct drm_sched_entity {
        */
       struct completion        entity_idle;
+    /**
+     * @pending_job_count:
+     *
+     * Number of pending jobs.
+     */
+    unsigned int                    pending_job_count;
+
+    /**
+     * @jobs_done:
+     *
+     * Signals when entity has no pending jobs, used to sequence entity
+     * cleanup in drm_sched_entity_fini().
+     */
+    struct completion        jobs_done;
+
       /**
        * @oldest_job_waiting:
        *
@@ -656,4 +671,7 @@ struct drm_gpu_scheduler *
   drm_sched_pick_best(struct drm_gpu_scheduler **sched_list,
                unsigned int num_sched_list);
+void drm_sched_add_pending_job(struct drm_sched_job *job, bool tail);
+void drm_sched_remove_pending_job(struct drm_sched_job *job);
+
   #endif




