[PATCH] drm/amd: fix debugfs access for discovery blob
Mario Limonciello
mario.limonciello at amd.com
Tue Aug 8 16:26:54 UTC 2023
On 8/7/2023 10:20, Alex Deucher wrote:
> On Tue, Aug 1, 2023 at 4:15 PM Mario Limonciello
> <mario.limonciello at amd.com> wrote:
>>
>> Accessing the blob for amdgpu discovery from debugfs triggers:
>>
>> [ 1924.487667] kernel BUG at mm/usercopy.c:102!
>>
>> usercopy_abort() explains that it needs to be solved by creating
>> a cache to store the data.
>>
>> Link: https://gitlab.freedesktop.org/drm/amd/-/issues/2748#note_2023519
>> Signed-off-by: Mario Limonciello <mario.limonciello at amd.com>
>
> Reviewed-by: Alex Deucher <alexander.deucher at amd.com>
>
Although this avoids the issue; I've concluded it's an inappropriate fix
and will abandon it. It turns out to spit out 64k discovery blobs that
should have been 8k.
6.5-rc and ASDN already picked up a better solution.
db3b5cb64a9c ("drm/amdgpu: Use apt name for FW reserved region")
>> ---
>> drivers/gpu/drm/amd/amdgpu/amdgpu.h | 7 +++++--
>> drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c | 17 ++++++++++++++++-
>> drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c | 2 ++
>> 3 files changed, 23 insertions(+), 3 deletions(-)
>>
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu.h b/drivers/gpu/drm/amd/amdgpu/amdgpu.h
>> index a3b86b86dc477..66a2251bdeba4 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu.h
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu.h
>> @@ -791,8 +791,11 @@ struct amdgpu_device {
>> bool accel_working;
>> struct notifier_block acpi_nb;
>> struct amdgpu_i2c_chan *i2c_bus[AMDGPU_MAX_I2C_BUS];
>> - struct debugfs_blob_wrapper debugfs_vbios_blob;
>> - struct debugfs_blob_wrapper debugfs_discovery_blob;
>> +#if defined(CONFIG_DEBUG_FS)
>> + struct debugfs_blob_wrapper debugfs_vbios_blob;
>> + struct debugfs_blob_wrapper debugfs_discovery_blob;
>> + struct kmem_cache *discovery_blob_cache;
>> +#endif
>> struct mutex srbm_mutex;
>> /* GRBM index mutex. Protects concurrent access to GRBM index */
>> struct mutex grbm_idx_mutex;
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c
>> index 56e89e76ff179..55ea5be14b188 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_debugfs.c
>> @@ -2180,7 +2180,15 @@ int amdgpu_debugfs_init(struct amdgpu_device *adev)
>> debugfs_create_blob("amdgpu_vbios", 0444, root,
>> &adev->debugfs_vbios_blob);
>>
>> - adev->debugfs_discovery_blob.data = adev->mman.discovery_bin;
>> +
>> + adev->discovery_blob_cache = kmem_cache_create_usercopy("amdgpu_discovery",
>> + adev->mman.discovery_tmr_size,
>> + 0, 0, 0,
>> + adev->mman.discovery_tmr_size,
>> + NULL);
>> + adev->debugfs_discovery_blob.data = kmem_cache_alloc(adev->discovery_blob_cache, GFP_KERNEL);
>> + memcpy(adev->debugfs_discovery_blob.data, adev->mman.discovery_bin,
>> + adev->mman.discovery_tmr_size);
>> adev->debugfs_discovery_blob.size = adev->mman.discovery_tmr_size;
>> debugfs_create_blob("amdgpu_discovery", 0444, root,
>> &adev->debugfs_discovery_blob);
>> @@ -2188,6 +2196,12 @@ int amdgpu_debugfs_init(struct amdgpu_device *adev)
>> return 0;
>> }
>>
>> +void amdgpu_debugfs_fini(struct amdgpu_device *adev)
>> +{
>> + kmem_cache_free(adev->discovery_blob_cache, adev->debugfs_discovery_blob.data);
>> + kmem_cache_destroy(adev->discovery_blob_cache);
>> +}
>> +
>> #else
>> int amdgpu_debugfs_init(struct amdgpu_device *adev)
>> {
>> @@ -2197,4 +2211,5 @@ int amdgpu_debugfs_regs_init(struct amdgpu_device *adev)
>> {
>> return 0;
>> }
>> +inline void amdgpu_debugfs_fini(struct amdgpu_device *adev) {}
>> #endif
>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
>> index 0593ef8fe0a63..1a3b30dff5171 100644
>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
>> @@ -2276,6 +2276,8 @@ amdgpu_pci_remove(struct pci_dev *pdev)
>> struct drm_device *dev = pci_get_drvdata(pdev);
>> struct amdgpu_device *adev = drm_to_adev(dev);
>>
>> + amdgpu_debugfs_fini(adev);
>> +
>> amdgpu_xcp_dev_unplug(adev);
>> drm_dev_unplug(dev);
>>
>> --
>> 2.34.1
>>
More information about the amd-gfx
mailing list