[PATCH 2/2] drm/amdkfd: Adjust weight to represent num_hops info when report xgmi iolink

Kuehling, Felix Felix.Kuehling at amd.com
Tue Apr 23 18:15:44 UTC 2019


On 2019-04-17 2:59 p.m., Liu, Shaoyun wrote:
> Upper level runtime need the xgmi hops info to determine the data path
>
> Change-Id: I969b419eab125157e223e9b03980ca229c1e6af4
> Signed-off-by: shaoyunl <shaoyun.liu at amd.com>
> ---
>   drivers/gpu/drm/amd/amdkfd/kfd_crat.c | 8 ++++++--
>   drivers/gpu/drm/amd/amdkfd/kfd_crat.h | 3 ++-
>   2 files changed, 8 insertions(+), 3 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_crat.c b/drivers/gpu/drm/amd/amdkfd/kfd_crat.c
> index 2e7c449..d48c6c5 100644
> --- a/drivers/gpu/drm/amd/amdkfd/kfd_crat.c
> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_crat.c
> @@ -341,6 +341,7 @@ static int kfd_parse_subtype_cache(struct crat_subtype_cache *cache,
>   	return 0;
>   }
>   
> +
>   /* kfd_parse_subtype_iolink - parse iolink subtypes and attach it to correct
>    * topology device present in the device_list
>    */
> @@ -372,7 +373,7 @@ static int kfd_parse_subtype_iolink(struct crat_subtype_iolink *iolink,
>   			if (props->iolink_type == CRAT_IOLINK_TYPE_PCIEXPRESS)
>   				props->weight = 20;
>   			else if (props->iolink_type == CRAT_IOLINK_TYPE_XGMI)
> -				props->weight = 15;
> +				props->weight = 15 * iolink->num_hops_xgmi;
>   			else
>   				props->weight = node_distance(id_from, id_to);
>   
> @@ -1092,6 +1093,7 @@ static int kfd_fill_gpu_direct_io_link_to_cpu(int *avail_size,
>   
>   static int kfd_fill_gpu_xgmi_link_to_gpu(int *avail_size,
>   			struct kfd_dev *kdev,
> +			struct kfd_dev *peer_kdev,
>   			struct crat_subtype_iolink *sub_type_hdr,
>   			uint32_t proximity_domain_from,
>   			uint32_t proximity_domain_to)
> @@ -1110,6 +1112,8 @@ static int kfd_fill_gpu_xgmi_link_to_gpu(int *avail_size,
>   	sub_type_hdr->io_interface_type = CRAT_IOLINK_TYPE_XGMI;
>   	sub_type_hdr->proximity_domain_from = proximity_domain_from;
>   	sub_type_hdr->proximity_domain_to = proximity_domain_to;
> +	sub_type_hdr->num_hops_xgmi =
> +		amdgpu_amdkfd_get_xgmi_hops_count(kdev->kgd, peer_kdev->kgd);
>   	return 0;
>   }
>   
> @@ -1287,7 +1291,7 @@ static int kfd_create_vcrat_image_gpu(void *pcrat_image,
>   				(char *)sub_type_hdr +
>   				sizeof(struct crat_subtype_iolink));
>   			ret = kfd_fill_gpu_xgmi_link_to_gpu(
> -				&avail_size, kdev,
> +				&avail_size, kdev, peer_dev->gpu,
>   				(struct crat_subtype_iolink *)sub_type_hdr,
>   				proximity_domain, nid);
>   			if (ret < 0)
> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_crat.h b/drivers/gpu/drm/amd/amdkfd/kfd_crat.h
> index 7c3f192..579835c 100644
> --- a/drivers/gpu/drm/amd/amdkfd/kfd_crat.h
> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_crat.h
> @@ -257,7 +257,7 @@ struct crat_subtype_ccompute {
>   #define CRAT_IOLINK_TYPE_OTHER		16
>   #define CRAT_IOLINK_TYPE_MAX		255
>   
> -#define CRAT_IOLINK_RESERVED_LENGTH	24
> +#define CRAT_IOLINK_RESERVED_LENGTH	20
>   
>   struct crat_subtype_iolink {
>   	uint8_t		type;
> @@ -274,6 +274,7 @@ struct crat_subtype_iolink {
>   	uint32_t	minimum_bandwidth_mbs;
>   	uint32_t	maximum_bandwidth_mbs;
>   	uint32_t	recommended_transfer_size;
> +	uint32_t	num_hops_xgmi;
>   	uint8_t		reserved2[CRAT_IOLINK_RESERVED_LENGTH];

It would be safer to add num_hops_xgmi at the end of the reserved space. 
uint8_t is probably enough for the hop count. I'd also not change the 
CRAT_IOLINK_RESERVED_LENGTH. Instead this would work and make it clearer 
that we're appropriating some reserved space:

     ...
     uint8_t    reserved2[CRAT_IOLINK_RESERVED_LENGTH - 1];
     uint8_t    num_hops_xgmi;
};


>   };
>   


More information about the amd-gfx mailing list