Re: [RFC 12/18] drm/sched: Move run queue related code into a separate file

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 




On 09/01/2025 13:02, Christian König wrote:
Am 08.01.25 um 19:35 schrieb Tvrtko Ursulin:
Lets move all the code dealing with struct drm_sched_rq into a separate
compilation unit. Advantage being sched_main.c is left with a clearer set
of responsibilities.

Looks like a good idea to me in general, but I would also push to completely remove run queues or at least rename them.

Glad you noticed how this lead to more possbile simplifications and
yes, that was next in my list of goals.

Key is to find test cases to establish more confidence in the absence of regressions with the single rq approach.

Regards,

Tvrtko

We only came up with the run queue object to handle different job priorities.

But with the FIFO approach now used everywhere you can nuke that and just give individual jobs with higher priorities a boost in their FIFO score.

Regards,
Christian.


Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin@xxxxxxxxxx>
Cc: Christian König <christian.koenig@xxxxxxx>
Cc: Danilo Krummrich <dakr@xxxxxxxxxx>
Cc: Matthew Brost <matthew.brost@xxxxxxxxx>
Cc: Philipp Stanner <pstanner@xxxxxxxxxx>
---
  drivers/gpu/drm/scheduler/Makefile     |   2 +-
  drivers/gpu/drm/scheduler/sched_main.c | 210 +------------------------
  drivers/gpu/drm/scheduler/sched_rq.c   | 207 ++++++++++++++++++++++++
  include/drm/gpu_scheduler.h            |  12 ++
  4 files changed, 222 insertions(+), 209 deletions(-)
  create mode 100644 drivers/gpu/drm/scheduler/sched_rq.c

diff --git a/drivers/gpu/drm/scheduler/Makefile b/drivers/gpu/drm/scheduler/Makefile
index 53863621829f..d11d83e285e7 100644
--- a/drivers/gpu/drm/scheduler/Makefile
+++ b/drivers/gpu/drm/scheduler/Makefile
@@ -20,6 +20,6 @@
  # OTHER DEALINGS IN THE SOFTWARE.
  #
  #
-gpu-sched-y := sched_main.o sched_fence.o sched_entity.o
+gpu-sched-y := sched_main.o sched_fence.o sched_entity.o sched_rq.o
  obj-$(CONFIG_DRM_SCHED) += gpu-sched.o
diff --git a/drivers/gpu/drm/scheduler/sched_main.c b/drivers/gpu/drm/scheduler/sched_main.c
index a21376ce859f..a556ee736f9f 100644
--- a/drivers/gpu/drm/scheduler/sched_main.c
+++ b/drivers/gpu/drm/scheduler/sched_main.c
@@ -87,9 +87,6 @@ static struct lockdep_map drm_sched_lockdep_map = {
  };
  #endif
-#define to_drm_sched_job(sched_job)        \
-        container_of((sched_job), struct drm_sched_job, queue_node)
-
  int drm_sched_policy = DRM_SCHED_POLICY_FIFO;
  /**
@@ -118,8 +115,8 @@ static u32 drm_sched_available_credits(struct drm_gpu_scheduler *sched)
   * Return true if we can push at least one more job from @entity, false
   * otherwise.
   */
-static bool drm_sched_can_queue(struct drm_gpu_scheduler *sched,
-                struct drm_sched_entity *entity)
+bool drm_sched_can_queue(struct drm_gpu_scheduler *sched,
+             struct drm_sched_entity *entity)
  {
      struct drm_sched_job *s_job;
@@ -137,209 +134,6 @@ static bool drm_sched_can_queue(struct drm_gpu_scheduler *sched,
      return drm_sched_available_credits(sched) >= s_job->credits;
  }
-static __always_inline bool drm_sched_entity_compare_before(struct rb_node *a,
-                                const struct rb_node *b)
-{
-    struct drm_sched_entity *ent_a =  rb_entry((a), struct drm_sched_entity, rb_tree_node); -    struct drm_sched_entity *ent_b =  rb_entry((b), struct drm_sched_entity, rb_tree_node);
-
-    return ktime_before(ent_a->oldest_job_waiting, ent_b->oldest_job_waiting);
-}
-
-static void __drm_sched_rq_remove_fifo_locked(struct drm_sched_entity *entity,
-                          struct drm_sched_rq *rq)
-{
-    lockdep_assert_held(&entity->lock);
-    lockdep_assert_held(&rq->lock);
-
-    rb_erase_cached(&entity->rb_tree_node, &rq->rb_tree_root);
-    RB_CLEAR_NODE(&entity->rb_tree_node);
-}
-
-static void __drm_sched_rq_add_fifo_locked(struct drm_sched_entity *entity,
-                       struct drm_sched_rq *rq,
-                       ktime_t ts)
-{
-    /*
-     * Both locks need to be grabbed, one to protect from entity->rq change -     * for entity from within concurrent drm_sched_entity_select_rq and the
-     * other to update the rb tree structure.
-     */
-    lockdep_assert_held(&entity->lock);
-    lockdep_assert_held(&rq->lock);
-
-    entity->oldest_job_waiting = ts;
-
-    rb_add_cached(&entity->rb_tree_node, &rq->rb_tree_root,
-              drm_sched_entity_compare_before);
-}
-
-/**
- * drm_sched_rq_init - initialize a given run queue struct
- *
- * @sched: scheduler instance to associate with this run queue
- * @rq: scheduler run queue
- *
- * Initializes a scheduler runqueue.
- */
-static void drm_sched_rq_init(struct drm_gpu_scheduler *sched,
-                  struct drm_sched_rq *rq)
-{
-    spin_lock_init(&rq->lock);
-    INIT_LIST_HEAD(&rq->entities);
-    rq->rb_tree_root = RB_ROOT_CACHED;
-    rq->sched = sched;
-}
-
-static ktime_t
-drm_sched_rq_get_rr_deadline(struct drm_sched_rq *rq)
-{
-    lockdep_assert_held(&rq->lock);
-
-    rq->rr_deadline = ktime_add_ns(rq->rr_deadline, 1);
-
-    return rq->rr_deadline;
-}
-
-/**
- * drm_sched_rq_add_entity - add an entity
- *
- * @rq: scheduler run queue
- * @entity: scheduler entity
- *
- * Adds a scheduler entity to the run queue.
- *
- * Returns a DRM scheduler pre-selected to handle this entity.
- */
-struct drm_gpu_scheduler *
-drm_sched_rq_add_entity(struct drm_sched_rq *rq,
-            struct drm_sched_entity *entity,
-            ktime_t ts)
-{
-    struct drm_gpu_scheduler *sched;
-
-    if (entity->stopped) {
-        DRM_ERROR("Trying to push to a killed entity\n");
-        return NULL;
-    }
-
-    spin_lock(&entity->lock);
-    spin_lock(&rq->lock);
-
-    sched = rq->sched;
-
-    if (!list_empty(&entity->list)) {
-        atomic_inc(sched->score);
-        list_add_tail(&entity->list, &rq->entities);
-    }
-
-    if (drm_sched_policy == DRM_SCHED_POLICY_RR)
-        ts = drm_sched_rq_get_rr_deadline(rq);
-
-    if (!RB_EMPTY_NODE(&entity->rb_tree_node))
-        __drm_sched_rq_remove_fifo_locked(entity, rq);
-    __drm_sched_rq_add_fifo_locked(entity, rq, ts);
-
-    spin_unlock(&rq->lock);
-    spin_unlock(&entity->lock);
-
-    return sched;
-}
-
-/**
- * drm_sched_rq_remove_entity - remove an entity
- *
- * @rq: scheduler run queue
- * @entity: scheduler entity
- *
- * Removes a scheduler entity from the run queue.
- */
-void drm_sched_rq_remove_entity(struct drm_sched_rq *rq,
-                struct drm_sched_entity *entity)
-{
-    lockdep_assert_held(&entity->lock);
-
-    if (list_empty(&entity->list))
-        return;
-
-    spin_lock(&rq->lock);
-
-    atomic_dec(rq->sched->score);
-    list_del_init(&entity->list);
-
-    if (!RB_EMPTY_NODE(&entity->rb_tree_node))
-        __drm_sched_rq_remove_fifo_locked(entity, rq);
-
-    spin_unlock(&rq->lock);
-}
-
-void drm_sched_rq_pop_entity(struct drm_sched_rq *rq,
-                 struct drm_sched_entity *entity)
-{
-    struct drm_sched_job *next_job;
-
-    spin_lock(&entity->lock);
-    spin_lock(&rq->lock);
-    __drm_sched_rq_remove_fifo_locked(entity, rq);
-    next_job = to_drm_sched_job(spsc_queue_peek(&entity->job_queue));
-    if (next_job) {
-        ktime_t ts;
-
-        if (drm_sched_policy == DRM_SCHED_POLICY_FIFO)
-            ts = next_job->submit_ts;
-        else
-            ts = drm_sched_rq_get_rr_deadline(rq);
-
-        __drm_sched_rq_add_fifo_locked(entity, rq, ts);
-    }
-    spin_unlock(&rq->lock);
-    spin_unlock(&entity->lock);
-}
-
-/**
- * drm_sched_rq_select_entity - Select an entity which provides a job to run
- *
- * @sched: the gpu scheduler
- * @rq: scheduler run queue to check.
- *
- * Find oldest waiting ready entity.
- *
- * Return an entity if one is found; return an error-pointer (!NULL) if an - * entity was ready, but the scheduler had insufficient credits to accommodate
- * its job; return NULL, if no ready entity was found.
- */
-static struct drm_sched_entity *
-drm_sched_rq_select_entity(struct drm_gpu_scheduler *sched,
-               struct drm_sched_rq *rq)
-{
-    struct drm_sched_entity *entity = NULL;
-    struct rb_node *rb;
-
-    spin_lock(&rq->lock);
-    for (rb = rb_first_cached(&rq->rb_tree_root); rb; rb = rb_next(rb)) {
-        entity = rb_entry(rb, struct drm_sched_entity, rb_tree_node);
-        if (drm_sched_entity_is_ready(entity))
-            break;
-        else
-            entity = NULL;
-    }
-    spin_unlock(&rq->lock);
-
-    if (!entity)
-        return NULL;
-
-    /*
-     * If scheduler cannot take more jobs signal the caller to not consider
-     * lower priority queues.
-     */
-    if (!drm_sched_can_queue(sched, entity))
-        return ERR_PTR(-ENOSPC);
-
-    reinit_completion(&entity->entity_idle);
-
-    return entity;
-}
-
  /**
   * drm_sched_run_job_queue - enqueue run-job work
   * @sched: scheduler instance
diff --git a/drivers/gpu/drm/scheduler/sched_rq.c b/drivers/gpu/drm/scheduler/sched_rq.c
new file mode 100644
index 000000000000..40f5b770f21a
--- /dev/null
+++ b/drivers/gpu/drm/scheduler/sched_rq.c
@@ -0,0 +1,207 @@
+#include <linux/rbtree.h>
+
+#include <drm/drm_print.h>
+#include <drm/gpu_scheduler.h>
+
+static __always_inline bool drm_sched_entity_compare_before(struct rb_node *a,
+                                const struct rb_node *b)
+{
+    struct drm_sched_entity *ent_a =  rb_entry((a), struct drm_sched_entity, rb_tree_node); +    struct drm_sched_entity *ent_b =  rb_entry((b), struct drm_sched_entity, rb_tree_node);
+
+    return ktime_before(ent_a->oldest_job_waiting, ent_b->oldest_job_waiting);
+}
+
+static void __drm_sched_rq_remove_fifo_locked(struct drm_sched_entity *entity,
+                          struct drm_sched_rq *rq)
+{
+    lockdep_assert_held(&entity->lock);
+    lockdep_assert_held(&rq->lock);
+
+    rb_erase_cached(&entity->rb_tree_node, &rq->rb_tree_root);
+    RB_CLEAR_NODE(&entity->rb_tree_node);
+}
+
+static void __drm_sched_rq_add_fifo_locked(struct drm_sched_entity *entity,
+                       struct drm_sched_rq *rq,
+                       ktime_t ts)
+{
+    /*
+     * Both locks need to be grabbed, one to protect from entity->rq change +     * for entity from within concurrent drm_sched_entity_select_rq and the
+     * other to update the rb tree structure.
+     */
+    lockdep_assert_held(&entity->lock);
+    lockdep_assert_held(&rq->lock);
+
+    entity->oldest_job_waiting = ts;
+    rb_add_cached(&entity->rb_tree_node, &rq->rb_tree_root,
+              drm_sched_entity_compare_before);
+}
+
+/**
+ * drm_sched_rq_init - initialize a given run queue struct
+ *
+ * @sched: scheduler instance to associate with this run queue
+ * @rq: scheduler run queue
+ *
+ * Initializes a scheduler runqueue.
+ */
+void drm_sched_rq_init(struct drm_gpu_scheduler *sched,
+               struct drm_sched_rq *rq)
+{
+    spin_lock_init(&rq->lock);
+    INIT_LIST_HEAD(&rq->entities);
+    rq->rb_tree_root = RB_ROOT_CACHED;
+    rq->sched = sched;
+}
+
+static ktime_t
+drm_sched_rq_get_rr_deadline(struct drm_sched_rq *rq)
+{
+    lockdep_assert_held(&rq->lock);
+
+    rq->rr_deadline = ktime_add_ns(rq->rr_deadline, 1);
+
+    return rq->rr_deadline;
+}
+
+/**
+ * drm_sched_rq_add_entity - add an entity
+ *
+ * @rq: scheduler run queue
+ * @entity: scheduler entity
+ * @ts: submission timestamp
+ *
+ * Adds a scheduler entity to the run queue.
+ *
+ * Returns a DRM scheduler pre-selected to handle this entity.
+ */
+struct drm_gpu_scheduler *
+drm_sched_rq_add_entity(struct drm_sched_rq *rq,
+            struct drm_sched_entity *entity,
+            ktime_t ts)
+{
+    struct drm_gpu_scheduler *sched;
+
+    if (entity->stopped) {
+        DRM_ERROR("Trying to push to a killed entity\n");
+        return NULL;
+    }
+
+    spin_lock(&entity->lock);
+    spin_lock(&rq->lock);
+
+    sched = rq->sched;
+
+    if (!list_empty(&entity->list)) {
+        atomic_inc(sched->score);
+        list_add_tail(&entity->list, &rq->entities);
+    }
+
+    if (drm_sched_policy == DRM_SCHED_POLICY_RR)
+        ts = drm_sched_rq_get_rr_deadline(rq);
+
+    if (!RB_EMPTY_NODE(&entity->rb_tree_node))
+        __drm_sched_rq_remove_fifo_locked(entity, rq);
+    __drm_sched_rq_add_fifo_locked(entity, rq, ts);
+
+    spin_unlock(&rq->lock);
+    spin_unlock(&entity->lock);
+
+    return sched;
+}
+
+/**
+ * drm_sched_rq_remove_entity - remove an entity
+ *
+ * @rq: scheduler run queue
+ * @entity: scheduler entity
+ *
+ * Removes a scheduler entity from the run queue.
+ */
+void drm_sched_rq_remove_entity(struct drm_sched_rq *rq,
+                struct drm_sched_entity *entity)
+{
+    lockdep_assert_held(&entity->lock);
+
+    if (list_empty(&entity->list))
+        return;
+
+    spin_lock(&rq->lock);
+
+    atomic_dec(rq->sched->score);
+    list_del_init(&entity->list);
+
+    if (!RB_EMPTY_NODE(&entity->rb_tree_node))
+        __drm_sched_rq_remove_fifo_locked(entity, rq);
+
+    spin_unlock(&rq->lock);
+}
+
+void drm_sched_rq_pop_entity(struct drm_sched_rq *rq,
+                 struct drm_sched_entity *entity)
+{
+    struct drm_sched_job *next_job;
+
+    spin_lock(&entity->lock);
+    spin_lock(&rq->lock);
+    __drm_sched_rq_remove_fifo_locked(entity, rq);
+    next_job = to_drm_sched_job(spsc_queue_peek(&entity->job_queue));
+    if (next_job) {
+        ktime_t ts;
+
+        if (drm_sched_policy == DRM_SCHED_POLICY_FIFO)
+            ts = next_job->submit_ts;
+        else
+            ts = drm_sched_rq_get_rr_deadline(rq);
+
+        __drm_sched_rq_add_fifo_locked(entity, rq, ts);
+    }
+    spin_unlock(&rq->lock);
+    spin_unlock(&entity->lock);
+}
+
+/**
+ * drm_sched_rq_select_entity - Select an entity which provides a job to run
+ *
+ * @sched: the gpu scheduler
+ * @rq: scheduler run queue to check.
+ *
+ * Find oldest waiting ready entity.
+ *
+ * Return an entity if one is found; return an error-pointer (!NULL) if an + * entity was ready, but the scheduler had insufficient credits to accommodate
+ * its job; return NULL, if no ready entity was found.
+ */
+struct drm_sched_entity *
+drm_sched_rq_select_entity(struct drm_gpu_scheduler *sched,
+               struct drm_sched_rq *rq)
+{
+    struct drm_sched_entity *entity = NULL;
+    struct rb_node *rb;
+
+    spin_lock(&rq->lock);
+    for (rb = rb_first_cached(&rq->rb_tree_root); rb; rb = rb_next(rb)) {
+        entity = rb_entry(rb, struct drm_sched_entity, rb_tree_node);
+        if (drm_sched_entity_is_ready(entity))
+            break;
+        else
+            entity = NULL;
+    }
+    spin_unlock(&rq->lock);
+
+    if (!entity)
+        return NULL;
+
+    /*
+     * If scheduler cannot take more jobs signal the caller to not consider
+     * lower priority queues.
+     */
+    if (!drm_sched_can_queue(sched, entity))
+        return ERR_PTR(-ENOSPC);
+
+    reinit_completion(&entity->entity_idle);
+
+    return entity;
+}
diff --git a/include/drm/gpu_scheduler.h b/include/drm/gpu_scheduler.h
index daf4665f37fa..ccb39e7bf384 100644
--- a/include/drm/gpu_scheduler.h
+++ b/include/drm/gpu_scheduler.h
@@ -386,6 +386,9 @@ struct drm_sched_job {
      ktime_t                         submit_ts;
  };
+#define to_drm_sched_job(sched_job)        \
+        container_of((sched_job), struct drm_sched_job, queue_node)
+
  static inline bool drm_sched_invalidate_job(struct drm_sched_job *s_job,
                          int threshold)
  {
@@ -547,6 +550,9 @@ int drm_sched_init(struct drm_gpu_scheduler *sched,
             atomic_t *score, const char *name, struct device *dev);
  void drm_sched_fini(struct drm_gpu_scheduler *sched);
+bool drm_sched_can_queue(struct drm_gpu_scheduler *sched,
+             struct drm_sched_entity *entity);
+
  int drm_sched_job_init(struct drm_sched_job *job,
                 struct drm_sched_entity *entity,
                 u32 credits, void *owner);
@@ -586,6 +592,9 @@ bool drm_sched_dependency_optimized(struct dma_fence* fence,
                      struct drm_sched_entity *entity);
  void drm_sched_fault(struct drm_gpu_scheduler *sched);
+void drm_sched_rq_init(struct drm_gpu_scheduler *sched,
+               struct drm_sched_rq *rq);
+
  struct drm_gpu_scheduler *
  drm_sched_rq_add_entity(struct drm_sched_rq *rq,
              struct drm_sched_entity *entity,
@@ -595,6 +604,9 @@ void drm_sched_rq_remove_entity(struct drm_sched_rq *rq,
  void drm_sched_rq_pop_entity(struct drm_sched_rq *rq,
                   struct drm_sched_entity *entity);
+struct drm_sched_entity *
+drm_sched_rq_select_entity(struct drm_gpu_scheduler *sched,
+               struct drm_sched_rq *rq);
  int drm_sched_entity_init(struct drm_sched_entity *entity,
                enum drm_sched_priority priority,




[Index of Archives]     [Linux DRI Users]     [Linux Intel Graphics]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]     [XFree86]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Linux Kernel]     [Linux SCSI]     [XFree86]
  Powered by Linux