[PATCH] drm/amdgpu: fix amdgpu_need_full_reset (v2)
Christian König
deathsimple at vodafone.de
Fri Oct 14 09:23:33 UTC 2016
Am 14.10.2016 um 04:29 schrieb zhoucm1:
>
>
> On 2016年10月14日 05:22, Alex Deucher wrote:
>> IP types are not an index. Each asic may have number and
>> type of IPs. Properly check the the type rather than
>> using the type id as an index.
>>
>> v2: fix all the IPs to not use IP type as an idx as well.
>>
>> Signed-off-by: Alex Deucher <alexander.deucher at amd.com>
>> Cc: stable at vger.kernel.org
> Reviewed-by: Chunming Zhou <david1.zhou at amd.com>
Reviewed-by: Christian König <christian.koenig at amd.com>.
Might also make sense to replace all those special IP handling in the
common code with flags or something similar.
Regards,
Christian.
>> ---
>> drivers/gpu/drm/amd/amdgpu/amdgpu_device.c | 23
>> ++++++++++++++++-------
>> drivers/gpu/drm/amd/amdgpu/dce_v10_0.c | 12 ++----------
>> drivers/gpu/drm/amd/amdgpu/gfx_v8_0.c | 17 +++++++++--------
>> drivers/gpu/drm/amd/amdgpu/gmc_v8_0.c | 13 ++++++-------
>> drivers/gpu/drm/amd/amdgpu/sdma_v3_0.c | 14 ++++++--------
>> drivers/gpu/drm/amd/amdgpu/tonga_ih.c | 14 ++++++--------
>> drivers/gpu/drm/amd/amdgpu/uvd_v6_0.c | 14 +++++++-------
>> drivers/gpu/drm/amd/amdgpu/vce_v3_0.c | 15 +++++++--------
>> drivers/gpu/drm/amd/include/amd_shared.h | 2 +-
>> 9 files changed, 60 insertions(+), 64 deletions(-)
>>
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
>> b/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
>> index 5a99a43..a67a572 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
>> @@ -2128,7 +2128,8 @@ static bool amdgpu_check_soft_reset(struct
>> amdgpu_device *adev)
>> if (!adev->ip_block_status[i].valid)
>> continue;
>> if (adev->ip_blocks[i].funcs->check_soft_reset)
>> - adev->ip_blocks[i].funcs->check_soft_reset(adev);
>> + adev->ip_block_status[i].hang =
>> + adev->ip_blocks[i].funcs->check_soft_reset(adev);
>> if (adev->ip_block_status[i].hang) {
>> DRM_INFO("IP block:%d is hang!\n", i);
>> asic_hang = true;
>> @@ -2157,12 +2158,20 @@ static int amdgpu_pre_soft_reset(struct
>> amdgpu_device *adev)
>> static bool amdgpu_need_full_reset(struct amdgpu_device *adev)
>> {
>> - if (adev->ip_block_status[AMD_IP_BLOCK_TYPE_GMC].hang ||
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_SMC].hang ||
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_ACP].hang ||
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_DCE].hang) {
>> - DRM_INFO("Some block need full reset!\n");
>> - return true;
>> + int i;
>> +
>> + for (i = 0; i < adev->num_ip_blocks; i++) {
>> + if (!adev->ip_block_status[i].valid)
>> + continue;
>> + if ((adev->ip_blocks[i].type == AMD_IP_BLOCK_TYPE_GMC) ||
>> + (adev->ip_blocks[i].type == AMD_IP_BLOCK_TYPE_SMC) ||
>> + (adev->ip_blocks[i].type == AMD_IP_BLOCK_TYPE_ACP) ||
>> + (adev->ip_blocks[i].type == AMD_IP_BLOCK_TYPE_DCE)) {
>> + if (adev->ip_block_status[i].hang) {
>> + DRM_INFO("Some block need full reset!\n");
>> + return true;
>> + }
>> + }
>> }
>> return false;
>> }
>> diff --git a/drivers/gpu/drm/amd/amdgpu/dce_v10_0.c
>> b/drivers/gpu/drm/amd/amdgpu/dce_v10_0.c
>> index bd0ecf4..15c3833 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/dce_v10_0.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/dce_v10_0.c
>> @@ -3104,16 +3104,11 @@ static int dce_v10_0_wait_for_idle(void *handle)
>> return 0;
>> }
>> -static int dce_v10_0_check_soft_reset(void *handle)
>> +static bool dce_v10_0_check_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> - if (dce_v10_0_is_display_hung(adev))
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_DCE].hang = true;
>> - else
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_DCE].hang = false;
>> -
>> - return 0;
>> + return dce_v10_0_is_display_hung(adev);
>> }
>> static int dce_v10_0_soft_reset(void *handle)
>> @@ -3121,9 +3116,6 @@ static int dce_v10_0_soft_reset(void *handle)
>> u32 srbm_soft_reset = 0, tmp;
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_DCE].hang)
>> - return 0;
>> -
>> if (dce_v10_0_is_display_hung(adev))
>> srbm_soft_reset |= SRBM_SOFT_RESET__SOFT_RESET_DC_MASK;
>> diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v8_0.c
>> b/drivers/gpu/drm/amd/amdgpu/gfx_v8_0.c
>> index ed49e33..6f3996f 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/gfx_v8_0.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v8_0.c
>> @@ -5147,7 +5147,7 @@ static int gfx_v8_0_wait_for_idle(void *handle)
>> return -ETIMEDOUT;
>> }
>> -static int gfx_v8_0_check_soft_reset(void *handle)
>> +static bool gfx_v8_0_check_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 grbm_soft_reset = 0, srbm_soft_reset = 0;
>> @@ -5199,16 +5199,14 @@ static int gfx_v8_0_check_soft_reset(void
>> *handle)
>> SRBM_SOFT_RESET, SOFT_RESET_SEM, 1);
>> if (grbm_soft_reset || srbm_soft_reset) {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_GFX].hang = true;
>> adev->gfx.grbm_soft_reset = grbm_soft_reset;
>> adev->gfx.srbm_soft_reset = srbm_soft_reset;
>> + return true;
>> } else {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_GFX].hang = false;
>> adev->gfx.grbm_soft_reset = 0;
>> adev->gfx.srbm_soft_reset = 0;
>> + return false;
>> }
>> -
>> - return 0;
>> }
>> static void gfx_v8_0_inactive_hqd(struct amdgpu_device *adev,
>> @@ -5236,7 +5234,8 @@ static int gfx_v8_0_pre_soft_reset(void *handle)
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 grbm_soft_reset = 0, srbm_soft_reset = 0;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_GFX].hang)
>> + if ((!adev->gfx.grbm_soft_reset) &&
>> + (!adev->gfx.srbm_soft_reset))
>> return 0;
>> grbm_soft_reset = adev->gfx.grbm_soft_reset;
>> @@ -5274,7 +5273,8 @@ static int gfx_v8_0_soft_reset(void *handle)
>> u32 grbm_soft_reset = 0, srbm_soft_reset = 0;
>> u32 tmp;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_GFX].hang)
>> + if ((!adev->gfx.grbm_soft_reset) &&
>> + (!adev->gfx.srbm_soft_reset))
>> return 0;
>> grbm_soft_reset = adev->gfx.grbm_soft_reset;
>> @@ -5344,7 +5344,8 @@ static int gfx_v8_0_post_soft_reset(void *handle)
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 grbm_soft_reset = 0, srbm_soft_reset = 0;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_GFX].hang)
>> + if ((!adev->gfx.grbm_soft_reset) &&
>> + (!adev->gfx.srbm_soft_reset))
>> return 0;
>> grbm_soft_reset = adev->gfx.grbm_soft_reset;
>> diff --git a/drivers/gpu/drm/amd/amdgpu/gmc_v8_0.c
>> b/drivers/gpu/drm/amd/amdgpu/gmc_v8_0.c
>> index 1b319f5..c22ef14 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/gmc_v8_0.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/gmc_v8_0.c
>> @@ -1099,7 +1099,7 @@ static int gmc_v8_0_wait_for_idle(void *handle)
>> }
>> -static int gmc_v8_0_check_soft_reset(void *handle)
>> +static bool gmc_v8_0_check_soft_reset(void *handle)
>> {
>> u32 srbm_soft_reset = 0;
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> @@ -1116,20 +1116,19 @@ static int gmc_v8_0_check_soft_reset(void
>> *handle)
>> SRBM_SOFT_RESET, SOFT_RESET_MC, 1);
>> }
>> if (srbm_soft_reset) {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_GMC].hang = true;
>> adev->mc.srbm_soft_reset = srbm_soft_reset;
>> + return true;
>> } else {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_GMC].hang = false;
>> adev->mc.srbm_soft_reset = 0;
>> + return false;
>> }
>> - return 0;
>> }
>> static int gmc_v8_0_pre_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_GMC].hang)
>> + if (!adev->mc.srbm_soft_reset)
>> return 0;
>> gmc_v8_0_mc_stop(adev, &adev->mc.save);
>> @@ -1145,7 +1144,7 @@ static int gmc_v8_0_soft_reset(void *handle)
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 srbm_soft_reset;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_GMC].hang)
>> + if (!adev->mc.srbm_soft_reset)
>> return 0;
>> srbm_soft_reset = adev->mc.srbm_soft_reset;
>> @@ -1175,7 +1174,7 @@ static int gmc_v8_0_post_soft_reset(void
>> *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_GMC].hang)
>> + if (!adev->mc.srbm_soft_reset)
>> return 0;
>> gmc_v8_0_mc_resume(adev, &adev->mc.save);
>> diff --git a/drivers/gpu/drm/amd/amdgpu/sdma_v3_0.c
>> b/drivers/gpu/drm/amd/amdgpu/sdma_v3_0.c
>> index 6f3a07f..24642f9 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/sdma_v3_0.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/sdma_v3_0.c
>> @@ -1251,7 +1251,7 @@ static int sdma_v3_0_wait_for_idle(void *handle)
>> return -ETIMEDOUT;
>> }
>> -static int sdma_v3_0_check_soft_reset(void *handle)
>> +static bool sdma_v3_0_check_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 srbm_soft_reset = 0;
>> @@ -1264,14 +1264,12 @@ static int sdma_v3_0_check_soft_reset(void
>> *handle)
>> }
>> if (srbm_soft_reset) {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_SDMA].hang = true;
>> adev->sdma.srbm_soft_reset = srbm_soft_reset;
>> + return true;
>> } else {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_SDMA].hang = false;
>> adev->sdma.srbm_soft_reset = 0;
>> + return false;
>> }
>> -
>> - return 0;
>> }
>> static int sdma_v3_0_pre_soft_reset(void *handle)
>> @@ -1279,7 +1277,7 @@ static int sdma_v3_0_pre_soft_reset(void *handle)
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 srbm_soft_reset = 0;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_SDMA].hang)
>> + if (!adev->sdma.srbm_soft_reset)
>> return 0;
>> srbm_soft_reset = adev->sdma.srbm_soft_reset;
>> @@ -1298,7 +1296,7 @@ static int sdma_v3_0_post_soft_reset(void *handle)
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 srbm_soft_reset = 0;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_SDMA].hang)
>> + if (!adev->sdma.srbm_soft_reset)
>> return 0;
>> srbm_soft_reset = adev->sdma.srbm_soft_reset;
>> @@ -1318,7 +1316,7 @@ static int sdma_v3_0_soft_reset(void *handle)
>> u32 srbm_soft_reset = 0;
>> u32 tmp;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_SDMA].hang)
>> + if (!adev->sdma.srbm_soft_reset)
>> return 0;
>> srbm_soft_reset = adev->sdma.srbm_soft_reset;
>> diff --git a/drivers/gpu/drm/amd/amdgpu/tonga_ih.c
>> b/drivers/gpu/drm/amd/amdgpu/tonga_ih.c
>> index d127d59..b4ea229 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/tonga_ih.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/tonga_ih.c
>> @@ -373,7 +373,7 @@ static int tonga_ih_wait_for_idle(void *handle)
>> return -ETIMEDOUT;
>> }
>> -static int tonga_ih_check_soft_reset(void *handle)
>> +static bool tonga_ih_check_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 srbm_soft_reset = 0;
>> @@ -384,21 +384,19 @@ static int tonga_ih_check_soft_reset(void *handle)
>> SOFT_RESET_IH, 1);
>> if (srbm_soft_reset) {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_IH].hang = true;
>> adev->irq.srbm_soft_reset = srbm_soft_reset;
>> + return true;
>> } else {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_IH].hang = false;
>> adev->irq.srbm_soft_reset = 0;
>> + return false;
>> }
>> -
>> - return 0;
>> }
>> static int tonga_ih_pre_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_IH].hang)
>> + if (!adev->irq.srbm_soft_reset)
>> return 0;
>> return tonga_ih_hw_fini(adev);
>> @@ -408,7 +406,7 @@ static int tonga_ih_post_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_IH].hang)
>> + if (!adev->irq.srbm_soft_reset)
>> return 0;
>> return tonga_ih_hw_init(adev);
>> @@ -419,7 +417,7 @@ static int tonga_ih_soft_reset(void *handle)
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 srbm_soft_reset;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_IH].hang)
>> + if (!adev->irq.srbm_soft_reset)
>> return 0;
>> srbm_soft_reset = adev->irq.srbm_soft_reset;
>> diff --git a/drivers/gpu/drm/amd/amdgpu/uvd_v6_0.c
>> b/drivers/gpu/drm/amd/amdgpu/uvd_v6_0.c
>> index 8f8a5dd..be91293 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/uvd_v6_0.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/uvd_v6_0.c
>> @@ -744,7 +744,7 @@ static int uvd_v6_0_wait_for_idle(void *handle)
>> }
>> #define AMDGPU_UVD_STATUS_BUSY_MASK 0xfd
>> -static int uvd_v6_0_check_soft_reset(void *handle)
>> +static bool uvd_v6_0_check_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 srbm_soft_reset = 0;
>> @@ -756,19 +756,19 @@ static int uvd_v6_0_check_soft_reset(void *handle)
>> srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset,
>> SRBM_SOFT_RESET, SOFT_RESET_UVD, 1);
>> if (srbm_soft_reset) {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_UVD].hang = true;
>> adev->uvd.srbm_soft_reset = srbm_soft_reset;
>> + return true;
>> } else {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_UVD].hang = false;
>> adev->uvd.srbm_soft_reset = 0;
>> + return false;
>> }
>> - return 0;
>> }
>> +
>> static int uvd_v6_0_pre_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_UVD].hang)
>> + if (!adev->uvd.srbm_soft_reset)
>> return 0;
>> uvd_v6_0_stop(adev);
>> @@ -780,7 +780,7 @@ static int uvd_v6_0_soft_reset(void *handle)
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 srbm_soft_reset;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_UVD].hang)
>> + if (!adev->uvd.srbm_soft_reset)
>> return 0;
>> srbm_soft_reset = adev->uvd.srbm_soft_reset;
>> @@ -810,7 +810,7 @@ static int uvd_v6_0_post_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_UVD].hang)
>> + if (!adev->uvd.srbm_soft_reset)
>> return 0;
>> mdelay(5);
>> diff --git a/drivers/gpu/drm/amd/amdgpu/vce_v3_0.c
>> b/drivers/gpu/drm/amd/amdgpu/vce_v3_0.c
>> index c7ddbef..589fff1 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/vce_v3_0.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/vce_v3_0.c
>> @@ -560,7 +560,7 @@ static int vce_v3_0_wait_for_idle(void *handle)
>> #define AMDGPU_VCE_STATUS_BUSY_MASK
>> (VCE_STATUS_VCPU_REPORT_AUTO_BUSY_MASK | \
>> VCE_STATUS_VCPU_REPORT_RB0_BUSY_MASK)
>> -static int vce_v3_0_check_soft_reset(void *handle)
>> +static bool vce_v3_0_check_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 srbm_soft_reset = 0;
>> @@ -590,16 +590,15 @@ static int vce_v3_0_check_soft_reset(void *handle)
>> srbm_soft_reset = REG_SET_FIELD(srbm_soft_reset,
>> SRBM_SOFT_RESET, SOFT_RESET_VCE1, 1);
>> }
>> WREG32_FIELD(GRBM_GFX_INDEX, INSTANCE_INDEX, 0);
>> + mutex_unlock(&adev->grbm_idx_mutex);
>> if (srbm_soft_reset) {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_VCE].hang = true;
>> adev->vce.srbm_soft_reset = srbm_soft_reset;
>> + return true;
>> } else {
>> - adev->ip_block_status[AMD_IP_BLOCK_TYPE_VCE].hang = false;
>> adev->vce.srbm_soft_reset = 0;
>> + return false;
>> }
>> - mutex_unlock(&adev->grbm_idx_mutex);
>> - return 0;
>> }
>> static int vce_v3_0_soft_reset(void *handle)
>> @@ -607,7 +606,7 @@ static int vce_v3_0_soft_reset(void *handle)
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> u32 srbm_soft_reset;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_VCE].hang)
>> + if (!adev->vce.srbm_soft_reset)
>> return 0;
>> srbm_soft_reset = adev->vce.srbm_soft_reset;
>> @@ -637,7 +636,7 @@ static int vce_v3_0_pre_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_VCE].hang)
>> + if (!adev->vce.srbm_soft_reset)
>> return 0;
>> mdelay(5);
>> @@ -650,7 +649,7 @@ static int vce_v3_0_post_soft_reset(void *handle)
>> {
>> struct amdgpu_device *adev = (struct amdgpu_device *)handle;
>> - if (!adev->ip_block_status[AMD_IP_BLOCK_TYPE_VCE].hang)
>> + if (!adev->vce.srbm_soft_reset)
>> return 0;
>> mdelay(5);
>> diff --git a/drivers/gpu/drm/amd/include/amd_shared.h
>> b/drivers/gpu/drm/amd/include/amd_shared.h
>> index 94ebc32..d198627 100644
>> --- a/drivers/gpu/drm/amd/include/amd_shared.h
>> +++ b/drivers/gpu/drm/amd/include/amd_shared.h
>> @@ -188,7 +188,7 @@ struct amd_ip_funcs {
>> /* poll for idle */
>> int (*wait_for_idle)(void *handle);
>> /* check soft reset the IP block */
>> - int (*check_soft_reset)(void *handle);
>> + bool (*check_soft_reset)(void *handle);
>> /* pre soft reset the IP block */
>> int (*pre_soft_reset)(void *handle);
>> /* soft reset the IP block */
>
> _______________________________________________
> amd-gfx mailing list
> amd-gfx at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/amd-gfx
More information about the amd-gfx
mailing list