[RFC PATCH] drm/amdgpu: allocate entities on demand

Tue Dec 3 15:02:17 UTC 2019

Hi Christian,

On 12/2/19 3:59 PM, Christian König wrote:
> Am 02.12.19 um 15:43 schrieb Nirmoy:
>>
>> Do you mean something like
>>
>> diff --git a/include/drm/gpu_scheduler.h b/include/drm/gpu_scheduler.h
>> index 684692a8ed76..ac67f8f098fa 100644
>> --- a/include/drm/gpu_scheduler.h
>> +++ b/include/drm/gpu_scheduler.h
>> @@ -81,7 +81,7 @@ enum drm_sched_priority {
>> Â struct drm_sched_entity {
>> Â Â Â Â Â Â Â  struct list_headÂ Â Â Â Â Â Â Â Â Â Â Â Â Â Â  list;
>> Â Â Â Â Â Â Â  struct drm_sched_rqÂ Â Â Â Â Â Â Â Â Â Â Â  *rq;
>> -Â Â Â Â Â Â  struct drm_sched_rqÂ Â Â Â Â Â Â Â Â Â Â Â  **rq_list;
>> +Â Â Â Â Â  struct drm_gpu_schedulerÂ Â Â Â Â Â Â  **sched;
>> Â Â Â Â Â Â Â  unsigned intÂ Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â  num_rq_list;
>> Â Â Â Â Â Â Â  spinlock_tÂ Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â  rq_lock;
>
> Yes, exactly. Problem is that I'm not 100% sure if that really works 
> with all users of the rq_list.

Currently, the users of rq_list perform two main tasks:

1. Change the rq priority for a context on user request.

2. Help the drm scheduler find the rq with the least load.

Can you please check the diff below? It doesn't really work yet, because I
get a kernel panic, but do you think it matches your idea?

test at install:~/linux> git diff drivers/gpu/drm/scheduler/sched_entity.c 
|tee

diff --git a/drivers/gpu/drm/scheduler/sched_entity.c 
b/drivers/gpu/drm/scheduler/sched_entity.c
index 1a5153197fe9..0bbd8ddd6c83 100644
--- a/drivers/gpu/drm/scheduler/sched_entity.c
+++ b/drivers/gpu/drm/scheduler/sched_entity.c
@@ -37,9 +37,9 @@
 Â  * submit to HW ring.
 Â  *
 Â  * @entity: scheduler entity to init
- * @rq_list: the list of run queue on which jobs from this
+ * @sched_list: the list of drm scheds on which jobs from this
 Â  *Â Â Â Â Â Â Â Â Â Â  entity can be submitted
- * @num_rq_list: number of run queue in rq_list
+ * @num_sched_list: number of drm sched in sched_list
 Â  * @guilty: atomic_t set to 1 when a job on this queue
 Â  *Â Â Â Â Â Â Â Â Â  is found to be guilty causing a timeout
 Â  *
@@ -49,30 +49,24 @@
 Â  * Returns 0 on success or a negative error code on failure.
 Â  */
 Â int drm_sched_entity_init(struct drm_sched_entity *entity,
-Â Â  Â Â Â  Â Â Â  Â Â  struct drm_sched_rq **rq_list,
-Â Â  Â Â Â  Â Â Â  Â Â  unsigned int num_rq_list,
-Â Â  Â Â Â  Â Â Â  Â Â  atomic_t *guilty)
+Â Â  Â Â Â  Â Â Â  Â Â  struct drm_gpu_scheduler **sched_list,
+Â Â  Â Â Â  Â Â Â  Â Â  unsigned int num_sched_list,
+Â Â  Â Â Â  Â Â Â  Â Â  atomic_t *guilty, enum drm_sched_priority priority)
 Â {
-Â Â  Â int i;

-Â Â  Â if (!(entity && rq_list && (num_rq_list == 0 || rq_list[0])))
+Â Â  Â if (!(entity && sched_list && (num_sched_list == 0 || sched_list[0])))
 Â Â Â  Â Â Â  Â return -EINVAL;

 Â Â Â  Â memset(entity, 0, sizeof(struct drm_sched_entity));
 Â Â Â  Â INIT_LIST_HEAD(&entity->list);
 Â Â Â  Â entity->rq = NULL;
 Â Â Â  Â entity->guilty = guilty;
-Â Â  Â entity->num_rq_list = num_rq_list;
-Â Â  Â entity->rq_list = kcalloc(num_rq_list, sizeof(struct drm_sched_rq *),
-Â Â  Â Â Â  Â Â Â  Â Â Â  Â GFP_KERNEL);
-Â Â  Â if (!entity->rq_list)
-Â Â  Â Â Â  Â return -ENOMEM;
-
-Â Â  Â for (i = 0; i < num_rq_list; ++i)
-Â Â  Â Â Â  Â entity->rq_list[i] = rq_list[i];
+Â Â  Â entity->num_sched_list = num_sched_list;
+Â Â  Â entity->sched_list =Â  sched_list
+Â Â  Â entity->priority = priority;

-Â Â  Â if (num_rq_list)
-Â Â  Â Â Â  Â entity->rq = rq_list[0];
+Â Â  Â if (num_sched_list)
+Â Â  Â Â Â  Â entity->rq = &entity->sched_list[0]->sched_rq[entity->priority];

 Â Â Â  Â entity->last_scheduled = NULL;

@@ -136,10 +130,10 @@ drm_sched_entity_get_free_sched(struct 
drm_sched_entity *entity)
 Â Â Â  Â unsigned int min_jobs = UINT_MAX, num_jobs;
 Â Â Â  Â int i;

-Â Â  Â for (i = 0; i < entity->num_rq_list; ++i) {
-Â Â  Â Â Â  Â struct drm_gpu_scheduler *sched = entity->rq_list[i]->sched;
+Â Â  Â for (i = 0; i < entity->num_sched_list; ++i) {
+Â Â  Â Â Â  Â struct drm_gpu_scheduler *sched = entity->sched_list[i];

-Â Â  Â Â Â  Â if (!entity->rq_list[i]->sched->ready) {
+Â Â  Â Â Â  Â if (!entity->sched_list[i]->ready) {
 Â Â Â  Â Â Â  Â Â Â  Â DRM_WARN("sched%s is not ready, skipping", sched->name);
 Â Â Â  Â Â Â  Â Â Â  Â continue;
 Â Â Â  Â Â Â  Â }
@@ -147,7 +141,7 @@ drm_sched_entity_get_free_sched(struct 
drm_sched_entity *entity)
 Â Â Â  Â Â Â  Â num_jobs = atomic_read(&sched->num_jobs);
 Â Â Â  Â Â Â  Â if (num_jobs < min_jobs) {
 Â Â Â  Â Â Â  Â Â Â  Â min_jobs = num_jobs;
-Â Â  Â Â Â  Â Â Â  Â rq = entity->rq_list[i];
+Â Â  Â Â Â  Â Â Â  Â rq = &entity->sched_list[i]->sched_rq[entity->priority];
 Â Â Â  Â Â Â  Â }
 Â Â Â  Â }

@@ -304,7 +298,6 @@ void drm_sched_entity_fini(struct drm_sched_entity 
*entity)

 Â Â Â  Â dma_fence_put(entity->last_scheduled);
 Â Â Â  Â entity->last_scheduled = NULL;
-Â Â  Â kfree(entity->rq_list);
 Â }
 Â EXPORT_SYMBOL(drm_sched_entity_fini);

@@ -372,8 +365,9 @@ void drm_sched_entity_set_priority(struct 
drm_sched_entity *entity,
 Â Â Â  Â unsigned int i;

 Â Â Â  Â spin_lock(&entity->rq_lock);
-
-Â Â  Â for (i = 0; i < entity->num_rq_list; ++i)
+//TODO
+/*
+Â Â  Â for (i = 0; i < entity->num_sched_list; ++i)
 Â drm_sched_entity_set_rq_priority(&entity->rq_list[i], priority);

 Â Â Â  Â if (entity->rq) {
@@ -381,7 +375,7 @@ void drm_sched_entity_set_priority(struct 
drm_sched_entity *entity,
 Â Â Â  Â Â Â  Â drm_sched_entity_set_rq_priority(&entity->rq, priority);
 Â Â Â  Â Â Â  Â drm_sched_rq_add_entity(entity->rq, entity);
 Â Â Â  Â }
-
+*/
 Â Â Â  Â spin_unlock(&entity->rq_lock);
 Â }
 Â EXPORT_SYMBOL(drm_sched_entity_set_priority);
@@ -486,7 +480,7 @@ void drm_sched_entity_select_rq(struct 
drm_sched_entity *entity)
 Â Â Â  Â struct dma_fence *fence;
 Â Â Â  Â struct drm_sched_rq *rq;

-Â Â  Â if (spsc_queue_count(&entity->job_queue) || entity->num_rq_list <= 1)
+Â Â  Â if (spsc_queue_count(&entity->job_queue) || entity->num_sched_list 
<= 1)
 Â Â Â  Â Â Â  Â return;

 Â Â Â  Â fence = READ_ONCE(entity->last_scheduled);