<html>
<head>
<meta http-equiv="Content-Type" content="text/html; charset=iso-8859-1">
<style type="text/css" style="display:none;"> P {margin-top:0;margin-bottom:0;} </style>
</head>
<body dir="ltr">
<p style="font-family:Arial;font-size:10pt;color:#0078D7;margin:15pt;" align="Left">
[AMD Official Use Only - Internal Distribution Only]<br>
</p>
<br>
<div>
<div style="font-family: Calibri, Arial, Helvetica, sans-serif; font-size: 12pt; color: rgb(0, 0, 0);">
Thanks very much Christian!<br>
</div>
<div id="appendonsend"></div>
<hr style="display:inline-block;width:98%" tabindex="-1">
<div id="divRplyFwdMsg" dir="ltr"><font face="Calibri, sans-serif" style="font-size:11pt" color="#000000"><b>From:</b> Koenig, Christian &lt;Christian.Koenig@amd.com&gt;<br>
<b>Sent:</b> Tuesday, January 21, 2020 4:52<br>
<b>To:</b> Yin, Tianci (Rico) &lt;Tianci.Yin@amd.com&gt;; amd-gfx@lists.freedesktop.org &lt;amd-gfx@lists.freedesktop.org&gt;<br>
<b>Cc:</b> Tuikov, Luben &lt;Luben.Tuikov@amd.com&gt;; Deucher, Alexander &lt;Alexander.Deucher@amd.com&gt;; Zhang, Hawking &lt;Hawking.Zhang@amd.com&gt;; Xu, Feifei &lt;Feifei.Xu@amd.com&gt;; Yuan, Xiaojie &lt;Xiaojie.Yuan@amd.com&gt;; Long, Gang &lt;Gang.Long@amd.com&gt;; Wang, Kevin(Yang)
 &lt;Kevin1.Wang@amd.com&gt;<br>
<b>Subject:</b> Re: [PATCH 1/2] drm/amdgpu: fix VRAM partially encroached issue in GDDR6 memory training(V2)</font>
<div> </div>
</div>
<div class="BodyFragment"><font size="2"><span style="font-size:11pt;">
<div class="PlainText">Am 21.01.20 um 03:22 schrieb Tianci Yin:<br>
> From: "Tianci.Yin" &lt;tianci.yin@amd.com&gt;<br>
><br>
> [why]<br>
> In GDDR6 BIST training, a certain amount of bottom VRAM will be encroached by<br>
> UMC, that causes problems (like GTT corrupted and page fault observed).<br>
><br>
> [how]<br>
> Saving the content of this bottom VRAM to system memory before training, and<br>
> restoring it after training to avoid VRAM corruption.<br>
><br>
> Change-Id: I04a8a6e8e63b3619f7c693fe67883b229cbf3c53<br>
> Signed-off-by: Tianci.Yin &lt;tianci.yin@amd.com&gt;<br>
<br>
Acked-by: Christian König &lt;christian.koenig@amd.com&gt; for this one and <br>
Reviewed-by: Christian König &lt;christian.koenig@amd.com&gt; for patch #2.<br>
<br>
Regards,<br>
Christian.<br>
<br>
> ---<br>
>   drivers/gpu/drm/amd/amdgpu/amdgpu_psp.h |  2 ++<br>
>   drivers/gpu/drm/amd/amdgpu/psp_v11_0.c  | 36 ++++++++++++++++++++++---<br>
>   2 files changed, 35 insertions(+), 3 deletions(-)<br>
><br>
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_psp.h b/drivers/gpu/drm/amd/amdgpu/amdgpu_psp.h<br>
> index 3265487b859f..611021514c52 100644<br>
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_psp.h<br>
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_psp.h<br>
> @@ -172,6 +172,8 @@ struct psp_dtm_context {<br>
>   #define MEM_TRAIN_SYSTEM_SIGNATURE          0x54534942<br>
>   #define GDDR6_MEM_TRAINING_DATA_SIZE_IN_BYTES       0x1000<br>
>   #define GDDR6_MEM_TRAINING_OFFSET           0x8000<br>
> +/*Define the VRAM size that will be encroached by BIST training.*/<br>
> +#define GDDR6_MEM_TRAINING_ENCROACHED_SIZE   0x2000000<br>
>   <br>
>   enum psp_memory_training_init_flag {<br>
>        PSP_MEM_TRAIN_NOT_SUPPORT       = 0x0,<br>
> diff --git a/drivers/gpu/drm/amd/amdgpu/psp_v11_0.c b/drivers/gpu/drm/amd/amdgpu/psp_v11_0.c<br>
> index 685dd9754c67..ac173d2eb809 100644<br>
> --- a/drivers/gpu/drm/amd/amdgpu/psp_v11_0.c<br>
> +++ b/drivers/gpu/drm/amd/amdgpu/psp_v11_0.c<br>
> @@ -971,10 +971,13 @@ static int psp_v11_0_memory_training_init(struct psp_context *psp)<br>
>    */<br>
>   static int psp_v11_0_memory_training(struct psp_context *psp, uint32_t ops)<br>
>   {<br>
> -     int ret;<br>
> -     uint32_t p2c_header[4];<br>
>        struct psp_memory_training_context *ctx = &psp->mem_train_ctx;<br>
>        uint32_t *pcache = (uint32_t*)ctx->sys_cache;<br>
> +     struct amdgpu_device *adev = psp->adev;<br>
> +     uint32_t p2c_header[4];<br>
> +     uint32_t sz;<br>
> +     void *buf;<br>
> +     int ret;<br>
>   <br>
>        if (ctx->init == PSP_MEM_TRAIN_NOT_SUPPORT) {<br>
>                DRM_DEBUG("Memory training is not supported.\n");<br>
> @@ -989,7 +992,7 @@ static int psp_v11_0_memory_training(struct psp_context *psp, uint32_t ops)<br>
>                return 0;<br>
>        }<br>
>   <br>
> -     amdgpu_device_vram_access(psp->adev, ctx->p2c_train_data_offset, p2c_header, sizeof(p2c_header), false);<br>
> +     amdgpu_device_vram_access(adev, ctx->p2c_train_data_offset, p2c_header, sizeof(p2c_header), false);<br>
>        DRM_DEBUG("sys_cache[%08x,%08x,%08x,%08x] p2c_header[%08x,%08x,%08x,%08x]\n",<br>
>                  pcache[0], pcache[1], pcache[2], pcache[3],<br>
>                  p2c_header[0], p2c_header[1], p2c_header[2], p2c_header[3]);<br>
> @@ -1026,11 +1029,38 @@ static int psp_v11_0_memory_training(struct psp_context *psp, uint32_t ops)<br>
>        DRM_DEBUG("Memory training ops:%x.\n", ops);<br>
>   <br>
>        if (ops & PSP_MEM_TRAIN_SEND_LONG_MSG) {<br>
> +             /*<br>
> +              * Long training will encroach a certain amount of bottom VRAM,<br>
> +              * saving the content of this bottom VRAM to system memory<br>
> +              * before training, and restoring it after training to avoid<br>
> +              * VRAM corruption.<br>
> +              */<br>
> +             sz = GDDR6_MEM_TRAINING_ENCROACHED_SIZE;<br>
> +<br>
> +             if (adev->gmc.visible_vram_size < sz || !adev->mman.aper_base_kaddr) {<br>
> +                     DRM_ERROR("visible_vram_size %llx or aper_base_kaddr %p is not initialized.\n",<br>
> +                               adev->gmc.visible_vram_size,<br>
> +                               adev->mman.aper_base_kaddr);<br>
> +                     return -EINVAL;<br>
> +             }<br>
> +<br>
> +             buf = vmalloc(sz);<br>
> +             if (!buf) {<br>
> +                     DRM_ERROR("failed to allocate system memory.\n");<br>
> +                     return -ENOMEM;<br>
> +             }<br>
> +<br>
> +             memcpy_fromio(buf, adev->mman.aper_base_kaddr, sz);<br>
>                ret = psp_v11_0_memory_training_send_msg(psp, PSP_BL__DRAM_LONG_TRAIN);<br>
>                if (ret) {<br>
>                        DRM_ERROR("Send long training msg failed.\n");<br>
> +                     vfree(buf);<br>
>                        return ret;<br>
>                }<br>
> +<br>
> +             memcpy_toio(adev->mman.aper_base_kaddr, buf, sz);<br>
> +             adev->nbio.funcs->hdp_flush(adev, NULL);<br>
> +             vfree(buf);<br>
>        }<br>
>   <br>
>        if (ops & PSP_MEM_TRAIN_SAVE) {<br>
<br>
</div>
</span></font></div>
</div>
</body>
</html>