Message ID: 20250108183528.41007-15-tvrtko.ursulin@igalia.com (mailing list archive)
State: New
Series: Deadline scheduler and other ideas
On 08.01.25 19:35, Tvrtko Ursulin wrote:
> If the new deadline policy is at least as good as FIFO and we can afford
> to remove round-robin, we can simplify the scheduler code by making the
> scheduler to run-queue relationship always 1:1 and remove some code.
>
> Also, now that the FIFO policy is gone the tree of entities is not a FIFO
> tree any more, so rename it to just the tree.

Yeah, that's exactly what I meant with my comment on the other patch.

I'm totally in favor of that, feel free to add my Acked-by to this approach.
I will try to find some time to give it some in-depth review.

Thanks,
Christian.
If the new deadline policy is at least as good as FIFO and we can afford
to remove round-robin, we can simplify the scheduler code by making the
scheduler to run-queue relationship always 1:1 and remove some code.

Also, now that the FIFO policy is gone the tree of entities is not a FIFO
tree any more, so rename it to just the tree.

Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin@igalia.com>
Cc: Christian König <christian.koenig@amd.com>
Cc: Danilo Krummrich <dakr@redhat.com>
Cc: Matthew Brost <matthew.brost@intel.com>
Cc: Philipp Stanner <pstanner@redhat.com>
---
 drivers/gpu/drm/amd/amdgpu/amdgpu_job.c  |  23 ++--
 drivers/gpu/drm/scheduler/sched_entity.c |  30 +----
 drivers/gpu/drm/scheduler/sched_main.c   | 136 ++++++-----------------
 drivers/gpu/drm/scheduler/sched_rq.c     |  36 ++----
 include/drm/gpu_scheduler.h              |  13 +--
 5 files changed, 56 insertions(+), 182 deletions(-)

diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_job.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_job.c
index b9d08bc96581..918b6d4919e1 100644
--- a/drivers/gpu/drm/amd/amdgpu/amdgpu_job.c
+++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_job.c
@@ -418,25 +418,22 @@ static struct dma_fence *amdgpu_job_run(struct drm_sched_job *sched_job)
 
 void amdgpu_job_stop_all_jobs_on_sched(struct drm_gpu_scheduler *sched)
 {
+	struct drm_sched_rq *rq = sched->rq;
+	struct drm_sched_entity *s_entity;
 	struct drm_sched_job *s_job;
-	struct drm_sched_entity *s_entity = NULL;
-	int i;
 
 	/* Signal all jobs not yet scheduled */
-	for (i = DRM_SCHED_PRIORITY_KERNEL; i < sched->num_rqs; i++) {
-		struct drm_sched_rq *rq = sched->sched_rq[i];
-		spin_lock(&rq->lock);
-		list_for_each_entry(s_entity, &rq->entities, list) {
-			while ((s_job = to_drm_sched_job(spsc_queue_pop(&s_entity->job_queue)))) {
-				struct drm_sched_fence *s_fence = s_job->s_fence;
+	spin_lock(&rq->lock);
+	list_for_each_entry(s_entity, &rq->entities, list) {
+		while ((s_job = to_drm_sched_job(spsc_queue_pop(&s_entity->job_queue)))) {
+			struct drm_sched_fence *s_fence = s_job->s_fence;
 
-				dma_fence_signal(&s_fence->scheduled);
-				dma_fence_set_error(&s_fence->finished, -EHWPOISON);
-				dma_fence_signal(&s_fence->finished);
-			}
+			dma_fence_signal(&s_fence->scheduled);
+			dma_fence_set_error(&s_fence->finished, -EHWPOISON);
+			dma_fence_signal(&s_fence->finished);
 		}
-		spin_unlock(&rq->lock);
 	}
+	spin_unlock(&rq->lock);
 
 	/* Signal all jobs already scheduled to HW */
 	list_for_each_entry(s_job, &sched->pending_list, list) {
diff --git a/drivers/gpu/drm/scheduler/sched_entity.c b/drivers/gpu/drm/scheduler/sched_entity.c
index e3c875b0afe8..98c78d1373d8 100644
--- a/drivers/gpu/drm/scheduler/sched_entity.c
+++ b/drivers/gpu/drm/scheduler/sched_entity.c
@@ -71,8 +71,6 @@ int drm_sched_entity_init(struct drm_sched_entity *entity,
 	entity->guilty = guilty;
 	entity->num_sched_list = num_sched_list;
 	entity->priority = priority;
-	entity->rq_priority = drm_sched_policy == DRM_SCHED_POLICY_DEADLINE ?
-			      DRM_SCHED_PRIORITY_KERNEL : priority;
 	/*
 	 * It's perfectly valid to initialize an entity without having a valid
 	 * scheduler attached. It's just not valid to use the scheduler before it
@@ -82,30 +80,14 @@ int drm_sched_entity_init(struct drm_sched_entity *entity,
 	RCU_INIT_POINTER(entity->last_scheduled, NULL);
 	RB_CLEAR_NODE(&entity->rb_tree_node);
 
-	if (num_sched_list && !sched_list[0]->sched_rq) {
+	if (num_sched_list && !sched_list[0]->rq) {
 		/* Since every entry covered by num_sched_list
 		 * should be non-NULL and therefore we warn drivers
 		 * not to do this and to fix their DRM calling order.
 		 */
 		pr_warn("%s: called with uninitialized scheduler\n", __func__);
 	} else if (num_sched_list) {
-		enum drm_sched_priority p = entity->priority;
-
-		/*
-		 * The "priority" of an entity cannot exceed the number of
-		 * run-queues of a scheduler. Protect against num_rqs being 0,
-		 * by converting to signed. Choose the lowest priority
-		 * available.
-		 */
-		if (p >= sched_list[0]->num_user_rqs) {
-			drm_err(sched_list[0], "entity with out-of-bounds priority:%u num_user_rqs:%u\n",
-				p, sched_list[0]->num_user_rqs);
-			p = max_t(s32,
-				  (s32)sched_list[0]->num_user_rqs - 1,
-				  (s32)DRM_SCHED_PRIORITY_KERNEL);
-			entity->priority = p;
-		}
-		entity->rq = sched_list[0]->sched_rq[entity->rq_priority];
+		entity->rq = sched_list[0]->rq;
 	}
 
 	init_completion(&entity->entity_idle);
@@ -575,7 +557,7 @@ void drm_sched_entity_select_rq(struct drm_sched_entity *entity)
 
 	spin_lock(&entity->lock);
 	sched = drm_sched_pick_best(entity->sched_list, entity->num_sched_list);
-	rq = sched ? sched->sched_rq[entity->rq_priority] : NULL;
+	rq = sched ? sched->rq : NULL;
 	if (rq != entity->rq) {
 		drm_sched_rq_remove_entity(entity->rq, entity);
 		entity->rq = rq;
@@ -617,10 +599,8 @@ void drm_sched_entity_push_job(struct drm_sched_job *sched_job)
 	if (first) {
 		struct drm_gpu_scheduler *sched;
 
-		if (drm_sched_policy == DRM_SCHED_POLICY_DEADLINE)
-			submit_ts = __drm_sched_entity_get_job_deadline(entity,
-									submit_ts);
-
+		submit_ts = __drm_sched_entity_get_job_deadline(entity,
+								submit_ts);
 		sched = drm_sched_rq_add_entity(entity->rq, entity, submit_ts);
 		if (sched)
 			drm_sched_wakeup(sched);
diff --git a/drivers/gpu/drm/scheduler/sched_main.c b/drivers/gpu/drm/scheduler/sched_main.c
index e2a67c7fe2d8..f748dcd06774 100644
--- a/drivers/gpu/drm/scheduler/sched_main.c
+++ b/drivers/gpu/drm/scheduler/sched_main.c
@@ -87,15 +87,6 @@ static struct lockdep_map drm_sched_lockdep_map = {
 };
 #endif
 
-int drm_sched_policy = DRM_SCHED_POLICY_DEADLINE;
-
-/**
- * DOC: sched_policy (int)
- * Used to override default entities scheduling policy in a run queue.
- */
-MODULE_PARM_DESC(sched_policy, "Specify the scheduling policy for entities on a run-queue, " __stringify(DRM_SCHED_POLICY_RR) " = Round Robin, " __stringify(DRM_SCHED_POLICY_FIFO) " = FIFO, " __stringify(DRM_SCHED_POLICY_DEADLINE) " = Virtual deadline (default).");
-module_param_named(sched_policy, drm_sched_policy, int, 0444);
-
 static u32 drm_sched_available_credits(struct drm_gpu_scheduler *sched)
 {
 	u32 credits;
@@ -822,34 +813,6 @@ void drm_sched_wakeup(struct drm_gpu_scheduler *sched)
 	drm_sched_run_job_queue(sched);
 }
 
-/**
- * drm_sched_select_entity - Select next entity to process
- *
- * @sched: scheduler instance
- *
- * Return an entity to process or NULL if none are found.
- *
- * Note, that we break out of the for-loop when "entity" is non-null, which can
- * also be an error-pointer--this assures we don't process lower priority
- * run-queues. See comments in the respectively called functions.
- */
-static struct drm_sched_entity *
-drm_sched_select_entity(struct drm_gpu_scheduler *sched)
-{
-	struct drm_sched_entity *entity = NULL;
-	int i;
-
-	/* Start with the highest priority.
-	 */
-	for (i = DRM_SCHED_PRIORITY_KERNEL; i < sched->num_rqs; i++) {
-		entity = drm_sched_rq_select_entity(sched, sched->sched_rq[i]);
-		if (entity)
-			break;
-	}
-
-	return IS_ERR(entity) ? NULL : entity;
-}
-
 /**
  * drm_sched_get_finished_job - fetch the next finished job to be destroyed
  *
@@ -971,8 +934,8 @@ static void drm_sched_run_job_work(struct work_struct *w)
 	int r;
 
 	/* Find entity with a ready job */
-	entity = drm_sched_select_entity(sched);
-	if (!entity)
+	entity = drm_sched_rq_select_entity(sched, sched->rq);
+	if (IS_ERR_OR_NULL(entity))
 		return;	/* No more work */
 
 	sched_job = drm_sched_entity_pop_job(entity);
@@ -1016,7 +979,7 @@
  * @ops: backend operations for this scheduler
  * @submit_wq: workqueue to use for submission. If NULL, an ordered wq is
  *	       allocated and used
- * @num_rqs: number of runqueues, one for each priority, up to DRM_SCHED_PRIORITY_COUNT
+ * @num_rqs: deprecated and ignored
 * @credit_limit: the number of credits this scheduler can hold from all jobs
 * @hang_limit: number of times to allow a job to hang before dropping it
 * @timeout: timeout value in jiffies for the scheduler
@@ -1035,8 +998,6 @@ int drm_sched_init(struct drm_gpu_scheduler *sched,
 		   long timeout, struct workqueue_struct *timeout_wq,
 		   atomic_t *score, const char *name, struct device *dev)
 {
-	int i;
-
 	sched->ops = ops;
 	sched->credit_limit = credit_limit;
 	sched->name = name;
@@ -1046,13 +1007,7 @@ int drm_sched_init(struct drm_gpu_scheduler *sched,
 	sched->score = score ? score : &sched->_score;
 	sched->dev = dev;
 
-	if (num_rqs > DRM_SCHED_PRIORITY_COUNT) {
-		/* This is a gross violation--tell drivers what the problem is.
-		 */
-		drm_err(sched, "%s: num_rqs cannot be greater than DRM_SCHED_PRIORITY_COUNT\n",
-			__func__);
-		return -EINVAL;
-	} else if (sched->sched_rq) {
+	if (sched->rq) {
 		/* Not an error, but warn anyway so drivers can
 		 * fine-tune their DRM calling order, and return all
 		 * is good.
@@ -1078,21 +1033,11 @@ int drm_sched_init(struct drm_gpu_scheduler *sched,
 		sched->own_submit_wq = true;
 	}
 
-	sched->num_user_rqs = num_rqs;
-	sched->num_rqs = drm_sched_policy != DRM_SCHED_POLICY_DEADLINE ?
-			 num_rqs : 1;
-	sched->sched_rq = kmalloc_array(sched->num_rqs,
-					sizeof(*sched->sched_rq),
-					GFP_KERNEL | __GFP_ZERO);
-	if (!sched->sched_rq)
+	sched->rq = kmalloc(sizeof(*sched->rq), GFP_KERNEL | __GFP_ZERO);
+	if (!sched->rq)
 		goto Out_check_own;
 
-	for (i = DRM_SCHED_PRIORITY_KERNEL; i < sched->num_rqs; i++) {
-		sched->sched_rq[i] = kzalloc(sizeof(*sched->sched_rq[i]), GFP_KERNEL);
-		if (!sched->sched_rq[i])
-			goto Out_unroll;
-		drm_sched_rq_init(sched, sched->sched_rq[i]);
-	}
+	drm_sched_rq_init(sched, sched->rq);
 
 	init_waitqueue_head(&sched->job_scheduled);
 	INIT_LIST_HEAD(&sched->pending_list);
@@ -1104,15 +1049,9 @@ int drm_sched_init(struct drm_gpu_scheduler *sched,
 	atomic_set(&sched->_score, 0);
 	atomic64_set(&sched->job_id_count, 0);
 	sched->pause_submit = false;
-
 	sched->ready = true;
 	return 0;
-Out_unroll:
-	for (--i ; i >= DRM_SCHED_PRIORITY_KERNEL; i--)
-		kfree(sched->sched_rq[i]);
 
-	kfree(sched->sched_rq);
-	sched->sched_rq = NULL;
 Out_check_own:
 	if (sched->own_submit_wq)
 		destroy_workqueue(sched->submit_wq);
@@ -1143,25 +1082,21 @@ EXPORT_SYMBOL(drm_sched_init);
  */
 void drm_sched_fini(struct drm_gpu_scheduler *sched)
 {
+
+	struct drm_sched_rq *rq = sched->rq;
 	struct drm_sched_entity *s_entity;
-	int i;
 
 	drm_sched_wqueue_stop(sched);
 
-	for (i = DRM_SCHED_PRIORITY_KERNEL; i < sched->num_rqs; i++) {
-		struct drm_sched_rq *rq = sched->sched_rq[i];
-
-		spin_lock(&rq->lock);
-		list_for_each_entry(s_entity, &rq->entities, list)
-			/*
-			 * Prevents reinsertion and marks job_queue as idle,
-			 * it will be removed from the rq in drm_sched_entity_fini()
-			 * eventually
-			 */
-			s_entity->stopped = true;
-		spin_unlock(&rq->lock);
-		kfree(sched->sched_rq[i]);
-	}
+	spin_lock(&rq->lock);
+	list_for_each_entry(s_entity, &rq->entities, list)
+		/*
+		 * Prevents reinsertion and marks job_queue as idle,
+		 * it will be removed from the rq in drm_sched_entity_fini()
+		 * eventually
+		 */
+		s_entity->stopped = true;
+	spin_unlock(&rq->lock);
 
 	/* Wakeup everyone stuck in drm_sched_entity_flush for this scheduler */
 	wake_up_all(&sched->job_scheduled);
@@ -1172,8 +1107,8 @@ void drm_sched_fini(struct drm_gpu_scheduler *sched)
 	if (sched->own_submit_wq)
 		destroy_workqueue(sched->submit_wq);
 	sched->ready = false;
-	kfree(sched->sched_rq);
-	sched->sched_rq = NULL;
+	kfree(sched->rq);
+	sched->rq = NULL;
 }
 EXPORT_SYMBOL(drm_sched_fini);
 
@@ -1188,35 +1123,28 @@ EXPORT_SYMBOL(drm_sched_fini);
  */
 void drm_sched_increase_karma(struct drm_sched_job *bad)
 {
-	int i;
-	struct drm_sched_entity *tmp;
-	struct drm_sched_entity *entity;
 	struct drm_gpu_scheduler *sched = bad->sched;
+	struct drm_sched_entity *entity, *tmp;
+	struct drm_sched_rq *rq = sched->rq;
 
 	/* don't change @bad's karma if it's from KERNEL RQ,
 	 * because sometimes GPU hang would cause kernel jobs (like VM updating jobs)
 	 * corrupt but keep in mind that kernel jobs always considered good.
 	 */
-	if (bad->s_priority != DRM_SCHED_PRIORITY_KERNEL) {
-		atomic_inc(&bad->karma);
+	if (bad->s_priority == DRM_SCHED_PRIORITY_KERNEL)
+		return;
 
-		for (i = DRM_SCHED_PRIORITY_KERNEL; i < sched->num_rqs; i++) {
-			struct drm_sched_rq *rq = sched->sched_rq[i];
+	atomic_inc(&bad->karma);
 
-			spin_lock(&rq->lock);
-			list_for_each_entry_safe(entity, tmp, &rq->entities, list) {
-				if (bad->s_fence->scheduled.context ==
-				    entity->fence_context) {
-					if (entity->guilty)
-						atomic_set(entity->guilty, 1);
-					break;
-				}
-			}
-			spin_unlock(&rq->lock);
-			if (&entity->list != &rq->entities)
-				break;
+	spin_lock(&rq->lock);
+	list_for_each_entry_safe(entity, tmp, &rq->entities, list) {
+		if (bad->s_fence->scheduled.context == entity->fence_context) {
+			if (entity->guilty)
+				atomic_set(entity->guilty, 1);
+			break;
 		}
 	}
+	spin_unlock(&rq->lock);
 }
 EXPORT_SYMBOL(drm_sched_increase_karma);
 
diff --git a/drivers/gpu/drm/scheduler/sched_rq.c b/drivers/gpu/drm/scheduler/sched_rq.c
index ac28e2877585..d9c854b2e495 100644
--- a/drivers/gpu/drm/scheduler/sched_rq.c
+++ b/drivers/gpu/drm/scheduler/sched_rq.c
@@ -12,7 +12,7 @@ static __always_inline bool drm_sched_entity_compare_before(struct rb_node *a,
 	return ktime_before(ent_a->oldest_job_waiting, ent_b->oldest_job_waiting);
 }
 
-static void __drm_sched_rq_remove_fifo_locked(struct drm_sched_entity *entity,
+static void __drm_sched_rq_remove_tree_locked(struct drm_sched_entity *entity,
 					      struct drm_sched_rq *rq)
 {
 	lockdep_assert_held(&entity->lock);
@@ -22,7 +22,7 @@ static void __drm_sched_rq_remove_fifo_locked(struct drm_sched_entity *entity,
 	RB_CLEAR_NODE(&entity->rb_tree_node);
 }
 
-static void __drm_sched_rq_add_fifo_locked(struct drm_sched_entity *entity,
+static void __drm_sched_rq_add_tree_locked(struct drm_sched_entity *entity,
 					   struct drm_sched_rq *rq,
 					   ktime_t ts)
 {
@@ -56,16 +56,6 @@ void drm_sched_rq_init(struct drm_gpu_scheduler *sched,
 	rq->sched = sched;
 }
 
-static ktime_t
-drm_sched_rq_get_rr_deadline(struct drm_sched_rq *rq)
-{
-	lockdep_assert_held(&rq->lock);
-
-	rq->rr_deadline = ktime_add_ns(rq->rr_deadline, 1);
-
-	return rq->rr_deadline;
-}
-
 /**
  * drm_sched_rq_add_entity - add an entity
  *
@@ -99,12 +89,9 @@ drm_sched_rq_add_entity(struct drm_sched_rq *rq,
 		list_add_tail(&entity->list, &rq->entities);
 	}
 
-	if (drm_sched_policy == DRM_SCHED_POLICY_RR)
-		ts = drm_sched_rq_get_rr_deadline(rq);
-
 	if (!RB_EMPTY_NODE(&entity->rb_tree_node))
-		__drm_sched_rq_remove_fifo_locked(entity, rq);
-	__drm_sched_rq_add_fifo_locked(entity, rq, ts);
+		__drm_sched_rq_remove_tree_locked(entity, rq);
+	__drm_sched_rq_add_tree_locked(entity, rq, ts);
 
 	spin_unlock(&rq->lock);
 	spin_unlock(&entity->lock);
@@ -134,7 +121,7 @@ void drm_sched_rq_remove_entity(struct drm_sched_rq *rq,
 	list_del_init(&entity->list);
 
 	if (!RB_EMPTY_NODE(&entity->rb_tree_node))
-		__drm_sched_rq_remove_fifo_locked(entity, rq);
+		__drm_sched_rq_remove_tree_locked(entity, rq);
 
 	spin_unlock(&rq->lock);
 }
@@ -146,20 +133,13 @@ void drm_sched_rq_pop_entity(struct drm_sched_rq *rq,
 
 	spin_lock(&entity->lock);
 	spin_lock(&rq->lock);
-	__drm_sched_rq_remove_fifo_locked(entity, rq);
+	__drm_sched_rq_remove_tree_locked(entity, rq);
 	next_job = to_drm_sched_job(spsc_queue_peek(&entity->job_queue));
 	if (next_job) {
 		ktime_t ts;
 
-		if (drm_sched_policy == DRM_SCHED_POLICY_DEADLINE)
-			ts = drm_sched_entity_get_job_deadline(entity,
-							       next_job);
-		else if (drm_sched_policy == DRM_SCHED_POLICY_FIFO)
-			ts = next_job->submit_ts;
-		else
-			ts = drm_sched_rq_get_rr_deadline(rq);
-
-		__drm_sched_rq_add_fifo_locked(entity, rq, ts);
+		ts = drm_sched_entity_get_job_deadline(entity, next_job);
+		__drm_sched_rq_add_tree_locked(entity, rq, ts);
 	}
 	spin_unlock(&rq->lock);
 	spin_unlock(&entity->lock);
diff --git a/include/drm/gpu_scheduler.h b/include/drm/gpu_scheduler.h
index a722c5d6e5f9..9f952574efe2 100644
--- a/include/drm/gpu_scheduler.h
+++ b/include/drm/gpu_scheduler.h
@@ -71,13 +71,6 @@ enum drm_sched_priority {
 	DRM_SCHED_PRIORITY_COUNT
 };
 
-/* Used to choose between FIFO and RR job-scheduling */
-extern int drm_sched_policy;
-
-#define DRM_SCHED_POLICY_RR       0
-#define DRM_SCHED_POLICY_FIFO     1
-#define DRM_SCHED_POLICY_DEADLINE 2
-
 /**
  * struct drm_sched_entity - A wrapper around a job queue (typically
 * attached to the DRM file_priv).
@@ -154,8 +147,6 @@ struct drm_sched_entity {
 	 */
 	struct spsc_queue		job_queue;
 
-	enum drm_sched_priority		rq_priority;
-
 	/**
	 * @fence_seq:
	 *
@@ -524,9 +515,7 @@ struct drm_gpu_scheduler {
 	atomic_t			credit_count;
 	long				timeout;
 	const char			*name;
-	u32				num_rqs;
-	u32				num_user_rqs;
-	struct drm_sched_rq		**sched_rq;
+	struct drm_sched_rq		*rq;
 	wait_queue_head_t		job_scheduled;
 	atomic64_t			job_id_count;
 	struct workqueue_struct		*submit_wq;
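To make the scheduling idea easier to picture outside of the kernel, here is a small, self-contained userspace C sketch. It is illustrative only and not part of the patch: every name in it is made up, a plain array scan stands in for the scheduler's rbtree, and the only thing it mirrors from the series is the ordering rule visible in drm_sched_entity_compare_before(), namely that the entity whose oldest waiting job has the earliest deadline is served first by the single run queue.

/*
 * Illustrative userspace sketch only, not kernel code and not part of the
 * patch. One scheduler has exactly one run queue (the 1:1 relationship the
 * commit message describes), and the next entity to run is the one whose
 * oldest waiting job has the earliest deadline. A linear scan stands in
 * for the rbtree the real scheduler keeps.
 */
#include <stdint.h>
#include <stdio.h>

struct entity {
	const char *name;
	int64_t oldest_job_waiting;	/* deadline of the oldest queued job, in ns */
};

/* Pick the entity with the earliest deadline; ties go to the first one found. */
static struct entity *pick_entity(struct entity *rq, size_t count)
{
	struct entity *best = NULL;
	size_t i;

	for (i = 0; i < count; i++) {
		if (!best || rq[i].oldest_job_waiting < best->oldest_job_waiting)
			best = &rq[i];
	}
	return best;
}

int main(void)
{
	/* A single run queue; priority no longer selects a separate rq. */
	struct entity rq[] = {
		{ "compositor",  2000 },
		{ "background",  9000 },
		{ "interactive",  500 },
	};
	struct entity *next = pick_entity(rq, sizeof(rq) / sizeof(rq[0]));

	printf("next entity: %s (deadline %lld ns)\n",
	       next->name, (long long)next->oldest_job_waiting);
	return 0;
}

In the patched scheduler the same ordering is maintained incrementally by the tree helpers renamed in this patch (__drm_sched_rq_add_tree_locked() and __drm_sched_rq_remove_tree_locked()), so the next entity can be taken from the tree without scanning the whole run queue.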