[PATCH] drm/amdgpu: Delay unmapping MMIO VRAM to amdgpu_ttm_fini() in GPU initialization failure
Andrey Grodzovsky
andrey.grodzovsky at amd.com
Tue Jan 4 15:40:00 UTC 2022
On 2022-01-03 9:30 p.m., Leslie Shi wrote:
> If the driver fails to load during hw_init(), defer unmapping the MMIO VRAM until amdgpu_ttm_fini().
> This prevents accessing an invalid memory address in vcn_v3_0_sw_fini().
>
> Signed-off-by: Leslie Shi <Yuliang.Shi at amd.com>
> ---
> drivers/gpu/drm/amd/amdgpu/amdgpu_device.c | 16 +++++++++-------
> drivers/gpu/drm/amd/amdgpu/amdgpu_ttm.c | 4 ++++
> 2 files changed, 13 insertions(+), 7 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
> index ce93a304292c..d6006de57af5 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
> @@ -3830,7 +3830,7 @@ int amdgpu_device_init(struct amdgpu_device *adev,
> return r;
> }
>
> -static void amdgpu_device_unmap_mmio(struct amdgpu_device *adev)
> +static void amdgpu_device_unmap_mmio(struct amdgpu_device *adev, bool unmap_mmio_vram)
> {
> /* Clear all CPU mappings pointing to this device */
> unmap_mapping_range(adev->ddev.anon_inode->i_mapping, 0, 0, 1);
> @@ -3840,9 +3840,12 @@ static void amdgpu_device_unmap_mmio(struct amdgpu_device *adev)
>
> iounmap(adev->rmmio);
> adev->rmmio = NULL;
> - if (adev->mman.aper_base_kaddr)
> - iounmap(adev->mman.aper_base_kaddr);
> - adev->mman.aper_base_kaddr = NULL;
Why only VRAM? Why not the register BAR above? In general, I don't see why
we shouldn't just follow
what I suggested here: https://www.spinics.net/lists/amd-gfx/msg72217.html
Andrey
> +
> + if (unmap_mmio_vram) {
> + if (adev->mman.aper_base_kaddr)
> + iounmap(adev->mman.aper_base_kaddr);
> + adev->mman.aper_base_kaddr = NULL;
> + }
>
> /* Memory manager related */
> if (!adev->gmc.xgmi.connected_to_cpu) {
> @@ -3905,8 +3908,7 @@ void amdgpu_device_fini_hw(struct amdgpu_device *adev)
>
> amdgpu_gart_dummy_page_fini(adev);
>
> - if (drm_dev_is_unplugged(adev_to_drm(adev)))
> - amdgpu_device_unmap_mmio(adev);
> + amdgpu_device_unmap_mmio(adev, drm_dev_is_unplugged(adev_to_drm(adev)));
>
> }
>
> @@ -5727,7 +5729,7 @@ void amdgpu_device_halt(struct amdgpu_device *adev)
>
> adev->no_hw_access = true;
>
> - amdgpu_device_unmap_mmio(adev);
> + amdgpu_device_unmap_mmio(adev, true);
>
> pci_disable_device(pdev);
> pci_wait_for_pending_transaction(pdev);
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_ttm.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_ttm.c
> index 367abed1d6e6..67cd12caf019 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_ttm.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_ttm.c
> @@ -1815,6 +1815,10 @@ void amdgpu_ttm_fini(struct amdgpu_device *adev)
> NULL, NULL);
> amdgpu_ttm_fw_reserve_vram_fini(adev);
>
> + if (adev->mman.aper_base_kaddr)
> + iounmap(adev->mman.aper_base_kaddr);
> + adev->mman.aper_base_kaddr = NULL;
> +
> amdgpu_vram_mgr_fini(adev);
> amdgpu_gtt_mgr_fini(adev);
> amdgpu_preempt_mgr_fini(adev);
More information about the amd-gfx
mailing list