[PATCH v3 6/6] drm/amdgpu: add RAS POISON interrupt funcs for jpeg_v4_0
Zhou1, Tao
Tao.Zhou1 at amd.com
Tue May 16 06:31:09 UTC 2023
[AMD Official Use Only - General]
The series is:
Reviewed-by: Tao Zhou <tao.zhou1 at amd.com>
> -----Original Message-----
> From: amd-gfx <amd-gfx-bounces at lists.freedesktop.org> On Behalf Of Horatio
> Zhang
> Sent: Tuesday, May 16, 2023 1:04 PM
> To: amd-gfx at lists.freedesktop.org
> Cc: Liu, HaoPing (Alan) <HaoPing.Liu at amd.com>; Zhou, Bob
> <Bob.Zhou at amd.com>; Zhang, Horatio <Hongkun.Zhang at amd.com>; Xu, Feifei
> <Feifei.Xu at amd.com>; Zhou1, Tao <Tao.Zhou1 at amd.com>; Jiang, Sonny
> <Sonny.Jiang at amd.com>; Limonciello, Mario <Mario.Limonciello at amd.com>;
> Liu, Leo <Leo.Liu at amd.com>; Zhang, Hawking <Hawking.Zhang at amd.com>
> Subject: [PATCH v3 6/6] drm/amdgpu: add RAS POISON interrupt funcs for
> jpeg_v4_0
>
> Add ras_poison_irq and functions. And fix the amdgpu_irq_put call trace in
> jpeg_v4_0_hw_fini.
>
> [ 50.497562] RIP: 0010:amdgpu_irq_put+0xa4/0xc0 [amdgpu]
> [ 50.497619] RSP: 0018:ffffaa2400fcfcb0 EFLAGS: 00010246
> [ 50.497620] RAX: 0000000000000000 RBX: 0000000000000001 RCX:
> 0000000000000000
> [ 50.497621] RDX: 0000000000000000 RSI: 0000000000000000 RDI:
> 0000000000000000
> [ 50.497621] RBP: ffffaa2400fcfcd0 R08: 0000000000000000 R09:
> 0000000000000000
> [ 50.497622] R10: 0000000000000000 R11: 0000000000000000 R12:
> ffff99b2105242d8
> [ 50.497622] R13: 0000000000000000 R14: ffff99b210500000 R15:
> ffff99b210500000
> [ 50.497623] FS: 0000000000000000(0000) GS:ffff99b518480000(0000)
> knlGS:0000000000000000
> [ 50.497623] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033
> [ 50.497624] CR2: 00007f9d32aa91e8 CR3: 00000001ba210000 CR4:
> 0000000000750ee0
> [ 50.497624] PKRU: 55555554
> [ 50.497625] Call Trace:
> [ 50.497625] <TASK>
> [ 50.497627] jpeg_v4_0_hw_fini+0x43/0xc0 [amdgpu]
> [ 50.497693] jpeg_v4_0_suspend+0x13/0x30 [amdgpu]
> [ 50.497751] amdgpu_device_ip_suspend_phase2+0x240/0x470 [amdgpu]
> [ 50.497802] amdgpu_device_ip_suspend+0x41/0x80 [amdgpu]
> [ 50.497854] amdgpu_device_pre_asic_reset+0xd9/0x4a0 [amdgpu]
> [ 50.497905] amdgpu_device_gpu_recover.cold+0x548/0xcf1 [amdgpu]
> [ 50.498005] amdgpu_debugfs_reset_work+0x4c/0x80 [amdgpu]
> [ 50.498060] process_one_work+0x21f/0x400
> [ 50.498063] worker_thread+0x200/0x3f0
> [ 50.498064] ? process_one_work+0x400/0x400
> [ 50.498065] kthread+0xee/0x120
> [ 50.498067] ? kthread_complete_and_exit+0x20/0x20
> [ 50.498068] ret_from_fork+0x22/0x30
>
> Suggested-by: Hawking Zhang <Hawking.Zhang at amd.com>
> Signed-off-by: Horatio Zhang <Hongkun.Zhang at amd.com>
> ---
> drivers/gpu/drm/amd/amdgpu/jpeg_v4_0.c | 27 +++++++++++++++++++-------
> 1 file changed, 20 insertions(+), 7 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdgpu/jpeg_v4_0.c
> b/drivers/gpu/drm/amd/amdgpu/jpeg_v4_0.c
> index 495facb885f4..8690467b3285 100644
> --- a/drivers/gpu/drm/amd/amdgpu/jpeg_v4_0.c
> +++ b/drivers/gpu/drm/amd/amdgpu/jpeg_v4_0.c
> @@ -87,13 +87,13 @@ static int jpeg_v4_0_sw_init(void *handle)
>
> /* JPEG DJPEG POISON EVENT */
> r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN,
> - VCN_4_0__SRCID_DJPEG0_POISON, &adev->jpeg.inst-
> >irq);
> + VCN_4_0__SRCID_DJPEG0_POISON, &adev->jpeg.inst-
> >ras_poison_irq);
> if (r)
> return r;
>
> /* JPEG EJPEG POISON EVENT */
> r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_VCN,
> - VCN_4_0__SRCID_EJPEG0_POISON, &adev->jpeg.inst-
> >irq);
> + VCN_4_0__SRCID_EJPEG0_POISON, &adev->jpeg.inst-
> >ras_poison_irq);
> if (r)
> return r;
>
> @@ -202,7 +202,8 @@ static int jpeg_v4_0_hw_fini(void *handle)
> RREG32_SOC15(JPEG, 0, regUVD_JRBC_STATUS))
> jpeg_v4_0_set_powergating_state(adev,
> AMD_PG_STATE_GATE);
> }
> - amdgpu_irq_put(adev, &adev->jpeg.inst->irq, 0);
> + if (amdgpu_ras_is_supported(adev, AMDGPU_RAS_BLOCK__JPEG))
> + amdgpu_irq_put(adev, &adev->jpeg.inst->ras_poison_irq, 0);
>
> return 0;
> }
> @@ -670,6 +671,14 @@ static int jpeg_v4_0_set_interrupt_state(struct
> amdgpu_device *adev,
> return 0;
> }
>
> +static int jpeg_v4_0_set_ras_interrupt_state(struct amdgpu_device *adev,
> + struct amdgpu_irq_src *source,
> + unsigned int type,
> + enum amdgpu_interrupt_state state) {
> + return 0;
> +}
> +
> static int jpeg_v4_0_process_interrupt(struct amdgpu_device *adev,
> struct amdgpu_irq_src *source,
> struct amdgpu_iv_entry *entry) @@ -680,10
> +689,6 @@ static int jpeg_v4_0_process_interrupt(struct amdgpu_device *adev,
> case VCN_4_0__SRCID__JPEG_DECODE:
> amdgpu_fence_process(adev->jpeg.inst->ring_dec);
> break;
> - case VCN_4_0__SRCID_DJPEG0_POISON:
> - case VCN_4_0__SRCID_EJPEG0_POISON:
> - amdgpu_jpeg_process_poison_irq(adev, source, entry);
> - break;
> default:
> DRM_DEV_ERROR(adev->dev, "Unhandled interrupt: %d %d\n",
> entry->src_id, entry->src_data[0]); @@ -753,10
> +758,18 @@ static const struct amdgpu_irq_src_funcs jpeg_v4_0_irq_funcs = {
> .process = jpeg_v4_0_process_interrupt, };
>
> +static const struct amdgpu_irq_src_funcs jpeg_v4_0_ras_irq_funcs = {
> + .set = jpeg_v4_0_set_ras_interrupt_state,
> + .process = amdgpu_jpeg_process_poison_irq, };
> +
> static void jpeg_v4_0_set_irq_funcs(struct amdgpu_device *adev) {
> adev->jpeg.inst->irq.num_types = 1;
> adev->jpeg.inst->irq.funcs = &jpeg_v4_0_irq_funcs;
> +
> + adev->jpeg.inst->ras_poison_irq.num_types = 1;
> + adev->jpeg.inst->ras_poison_irq.funcs = &jpeg_v4_0_ras_irq_funcs;
> }
>
> const struct amdgpu_ip_block_version jpeg_v4_0_ip_block = {
> --
> 2.34.1
More information about the amd-gfx
mailing list