[Public]
>-----Original Message-----
>From: Joshi, Mukul <[email protected]>
>Sent: Wednesday, January 28, 2026 12:23 AM
>To: Yu, Lang <[email protected]>; [email protected]
>Cc: Zhang, Hawking <[email protected]>; Deucher, Alexander
><[email protected]>; Belanger, David <[email protected]>
>Subject: RE: [PATCH 4/4] drm/amdkfd: Use AMDGPU_MQD_SIZE_ALIGN in gfx11+
>kfd mqd manager
>
>[AMD Official Use Only - AMD Internal Distribution Only]
>
>> -----Original Message-----
>> From: Yu, Lang <[email protected]>
>> Sent: Monday, January 26, 2026 5:25 AM
>> To: [email protected]
>> Cc: Zhang, Hawking <[email protected]>; Deucher, Alexander
>> <[email protected]>; Joshi, Mukul <[email protected]>;
>> Belanger, David <[email protected]>; Yu, Lang <[email protected]>
>> Subject: [PATCH 4/4] drm/amdkfd: Use AMDGPU_MQD_SIZE_ALIGN in gfx11+
>> kfd mqd manager
>>
>> MES is enabled by default from gfx11+.
>>
>> Signed-off-by: Lang Yu <[email protected]>
>> ---
>> drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager.c | 3 ++
>> .../gpu/drm/amd/amdkfd/kfd_mqd_manager_v11.c | 22 +++-----------
>> .../gpu/drm/amd/amdkfd/kfd_mqd_manager_v12.c | 10 +++----
>> .../drm/amd/amdkfd/kfd_mqd_manager_v12_1.c | 29 ++++---------------
>> 4 files changed, 17 insertions(+), 47 deletions(-)
>>
>> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager.c
>> b/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager.c
>> index ceb6566ff3e1..d88d0de58edd 100644
>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager.c
>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager.c
>> @@ -292,6 +292,9 @@ void kfd_get_hiq_xcc_mqd(struct kfd_node *dev,
>> struct kfd_mem_obj *mqd_mem_obj, uint64_t kfd_mqd_stride(struct
>> mqd_manager *mm,
>> struct queue_properties *q) {
>> + if (KFD_GC_VERSION(mm->dev) >= IP_VERSION(11, 0, 0))
>> + return AMDGPU_MQD_SIZE_ALIGN(mm->mqd_size);
>> +
>> return mm->mqd_size;
>> }
>>
>> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v11.c
>> b/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v11.c
>> index 5c44d0987737..7e5a7ab6d0c0 100644
>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v11.c
>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v11.c
>> @@ -102,20 +102,11 @@ static void set_priority(struct v11_compute_mqd
>> *m, struct queue_properties *q) static struct kfd_mem_obj
>> *allocate_mqd(struct mqd_manager *mm,
>> struct queue_properties *q) {
>> + u32 mqd_size = AMDGPU_MQD_SIZE_ALIGN(mm->mqd_size);
>> struct kfd_node *node = mm->dev;
>> struct kfd_mem_obj *mqd_mem_obj;
>> - int size;
>> -
>> - /*
>> - * MES write to areas beyond MQD size. So allocate
>> - * 1 PAGE_SIZE memory for MQD is MES is enabled.
>> - */
>> - if (node->kfd->shared_resources.enable_mes)
>> - size = PAGE_SIZE;
>> - else
>> - size = sizeof(struct v11_compute_mqd);
>>
>> - if (kfd_gtt_sa_allocate(node, size, &mqd_mem_obj))
>> + if (kfd_gtt_sa_allocate(node, mqd_size, &mqd_mem_obj))
>> return NULL;
>>
>> return mqd_mem_obj;
>> @@ -127,18 +118,13 @@ static void init_mqd(struct mqd_manager *mm,
>> void **mqd, {
>> uint64_t addr;
>> struct v11_compute_mqd *m;
>> - int size;
>> + u32 mqd_size = AMDGPU_MQD_SIZE_ALIGN(mm->mqd_size);
>> uint32_t wa_mask = q->is_dbg_wa ? 0xffff : 0xffffffff;
>>
>> m = (struct v11_compute_mqd *) mqd_mem_obj->cpu_ptr;
>> addr = mqd_mem_obj->gpu_addr;
>>
>> - if (mm->dev->kfd->shared_resources.enable_mes)
>> - size = PAGE_SIZE;
>> - else
>> - size = sizeof(struct v11_compute_mqd);
>> -
>> - memset(m, 0, size);
>> + memset(m, 0, mqd_size);
>>
>> m->header = 0xC0310800;
>> m->compute_pipelinestat_enable = 1; diff --git
>> a/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v12.c
>> b/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v12.c
>> index b7ac2dea8775..a51f217329db 100644
>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v12.c
>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v12.c
>> @@ -83,14 +83,11 @@ static void set_priority(struct v12_compute_mqd
>> *m, struct queue_properties *q) static struct kfd_mem_obj
>> *allocate_mqd(struct mqd_manager *mm,
>> struct queue_properties *q) {
>> + u32 mqd_size = AMDGPU_MQD_SIZE_ALIGN(mm->mqd_size);
>> struct kfd_node *node = mm->dev;
>> struct kfd_mem_obj *mqd_mem_obj;
>>
>> - /*
>> - * Allocate one PAGE_SIZE memory for MQD as MES writes to areas
>> beyond
>> - * struct MQD size.
>> - */
>> - if (kfd_gtt_sa_allocate(node, PAGE_SIZE, &mqd_mem_obj))
>> + if (kfd_gtt_sa_allocate(node, mqd_size, &mqd_mem_obj))
>> return NULL;
>>
>> return mqd_mem_obj;
>> @@ -102,11 +99,12 @@ static void init_mqd(struct mqd_manager *mm, void
>> **mqd, {
>> uint64_t addr;
>> struct v12_compute_mqd *m;
>> + u32 mqd_size = AMDGPU_MQD_SIZE_ALIGN(mm->mqd_size);
>>
>> m = (struct v12_compute_mqd *) mqd_mem_obj->cpu_ptr;
>> addr = mqd_mem_obj->gpu_addr;
>>
>> - memset(m, 0, PAGE_SIZE);
>> + memset(m, 0, mqd_size);
>>
>> m->header = 0xC0310800;
>> m->compute_pipelinestat_enable = 1; diff --git
>> a/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v12_1.c
>> b/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v12_1.c
>> index 0b0d802a0917..d0776ba2cc99 100644
>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v12_1.c
>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_mqd_manager_v12_1.c
>> @@ -32,17 +32,6 @@
>> #include "amdgpu_amdkfd.h"
>> #include "kfd_device_queue_manager.h"
>>
>> -#define MQD_SIZE (2 * PAGE_SIZE)
>> -
>> -static uint64_t mqd_stride_v12_1(struct mqd_manager *mm,
>> - struct queue_properties *q)
>> -{
>> - if (q->type == KFD_QUEUE_TYPE_COMPUTE)
>> - return MQD_SIZE;
>> - else
>> - return PAGE_SIZE;
>> -}
>> -
>> static inline struct v12_1_compute_mqd *get_mqd(void *mqd) {
>> return (struct v12_1_compute_mqd *)mqd; @@ -148,21 +137,14 @@
>> static void set_priority(struct v12_1_compute_mqd *m, struct
>> queue_properties *q static struct kfd_mem_obj *allocate_mqd(struct
>> mqd_manager *mm,
>> struct queue_properties *q) {
>> + u32 mqd_size = AMDGPU_MQD_SIZE_ALIGN(mm->mqd_size);
>> struct kfd_node *node = mm->dev;
>> struct kfd_mem_obj *mqd_mem_obj;
>> - unsigned int size;
>>
>> - /*
>> - * Allocate two PAGE_SIZE memory for Compute MQD as MES writes
>> to areas beyond
>> - * struct MQD size. Size of the Compute MQD is 1 PAGE_SIZE.
>> - * For SDMA MQD, we allocate 1 Page_size.
>> - */
>> if (q->type == KFD_QUEUE_TYPE_COMPUTE)
>> - size = MQD_SIZE * NUM_XCC(node->xcc_mask);
>> - else
>> - size = PAGE_SIZE;
>> + mqd_size *= NUM_XCC(node->xcc_mask);
>>
>
>SDMA MQD allocation is not per XCC in the partition. This wastes a ton of
>memory for
>SDMA queues.
Look carefully: the "if (q->type == KFD_QUEUE_TYPE_COMPUTE)" check is still there,
so the NUM_XCC() multiplication is applied only to compute queues; SDMA MQDs are not scaled per XCC.
Regards,
Lang
>Regards,
>Mukul
>
>> - if (kfd_gtt_sa_allocate(node, size, &mqd_mem_obj))
>> + if (kfd_gtt_sa_allocate(node, mqd_size, &mqd_mem_obj))
>> return NULL;
>>
>> return mqd_mem_obj;
>> @@ -174,11 +156,12 @@ static void init_mqd(struct mqd_manager *mm,
>> void **mqd, {
>> uint64_t addr;
>> struct v12_1_compute_mqd *m;
>> + u32 mqd_size = AMDGPU_MQD_SIZE_ALIGN(mm->mqd_size);
>>
>> m = (struct v12_1_compute_mqd *) mqd_mem_obj->cpu_ptr;
>> addr = mqd_mem_obj->gpu_addr;
>>
>> - memset(m, 0, MQD_SIZE);
>> + memset(m, 0, mqd_size);
>>
>> m->header = 0xC0310800;
>> m->compute_pipelinestat_enable = 1; @@ -681,7 +664,7 @@ struct
>> mqd_manager *mqd_manager_init_v12_1(enum KFD_MQD_TYPE type,
>> mqd->is_occupied = kfd_is_occupied_cp;
>> mqd->mqd_size = sizeof(struct v12_1_compute_mqd);
>> mqd->get_wave_state = get_wave_state_v12_1;
>> - mqd->mqd_stride = mqd_stride_v12_1;
>> + mqd->mqd_stride = kfd_mqd_stride;
>> #if defined(CONFIG_DEBUG_FS)
>> mqd->debugfs_show_mqd = debugfs_show_mqd; #endif
>> --
>> 2.34.1
>