[PATCH 1/3] drm/amdgpu: move umc late init from gmc to umc block

Zhou1, Tao Tao.Zhou1 at amd.com
Fri Sep 6 10:55:58 UTC 2019



> -----Original Message-----
> From: Chen, Guchun <Guchun.Chen at amd.com>
> Sent: 2019年9月6日 18:01
> To: Zhou1, Tao <Tao.Zhou1 at amd.com>; amd-gfx at lists.freedesktop.org;
> Zhang, Hawking <Hawking.Zhang at amd.com>
> Subject: RE: [PATCH 1/3] drm/amdgpu: move umc late init from gmc to umc
> block
> 
> 
> 
> -----Original Message-----
> From: Zhou1, Tao <Tao.Zhou1 at amd.com>
> Sent: Friday, September 6, 2019 5:01 PM
> To: amd-gfx at lists.freedesktop.org; Zhang, Hawking
> <Hawking.Zhang at amd.com>; Chen, Guchun <Guchun.Chen at amd.com>
> Cc: Zhou1, Tao <Tao.Zhou1 at amd.com>
> Subject: [PATCH 1/3] drm/amdgpu: move umc late init from gmc to umc
> block
> 
> umc late init is umc specific, it's more suitable to be put in umc block
> 
> Signed-off-by: Tao Zhou <tao.zhou1 at amd.com>
> ---
>  drivers/gpu/drm/amd/amdgpu/Makefile     |  2 +-
>  drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.c | 48 ----------------
> drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.h |  2 -
> drivers/gpu/drm/amd/amdgpu/amdgpu_umc.c | 73
> +++++++++++++++++++++++++
> drivers/gpu/drm/amd/amdgpu/amdgpu_umc.h |  2 +
>  drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c   |  8 ++-
>  drivers/gpu/drm/amd/amdgpu/umc_v6_1.c   |  1 +
>  7 files changed, 82 insertions(+), 54 deletions(-)  create mode 100644
> drivers/gpu/drm/amd/amdgpu/amdgpu_umc.c
> 
> diff --git a/drivers/gpu/drm/amd/amdgpu/Makefile
> b/drivers/gpu/drm/amd/amdgpu/Makefile
> index 84614a71bb4d..91369c823ce2 100644
> --- a/drivers/gpu/drm/amd/amdgpu/Makefile
> +++ b/drivers/gpu/drm/amd/amdgpu/Makefile
> @@ -55,7 +55,7 @@ amdgpu-y += amdgpu_device.o amdgpu_kms.o \
>  	amdgpu_vf_error.o amdgpu_sched.o amdgpu_debugfs.o
> amdgpu_ids.o \
>  	amdgpu_gmc.o amdgpu_mmhub.o amdgpu_xgmi.o amdgpu_csa.o
> amdgpu_ras.o amdgpu_vm_cpu.o \
>  	amdgpu_vm_sdma.o amdgpu_pmu.o amdgpu_discovery.o
> amdgpu_ras_eeprom.o amdgpu_nbio.o \
> -	smu_v11_0_i2c.o
> +	amdgpu_umc.o smu_v11_0_i2c.o
> 
>  amdgpu-$(CONFIG_PERF_EVENTS) += amdgpu_pmu.o
> 
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.c
> b/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.c
> index 51890b1d8522..dc044eec188e 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.c
> @@ -304,51 +304,3 @@ bool amdgpu_gmc_filter_faults(struct
> amdgpu_device *adev, uint64_t addr,
>  	gmc->fault_hash[hash].idx = gmc->last_fault++;
>  	return false;
>  }
> -
> -int amdgpu_gmc_ras_late_init(struct amdgpu_device *adev,
> -			     void *ras_ih_info)
> -{
> -	int r;
> -	struct ras_ih_if *ih_info = (struct ras_ih_if *)ras_ih_info;
> -	struct ras_fs_if fs_info = {
> -		.sysfs_name = "umc_err_count",
> -		.debugfs_name = "umc_err_inject",
> -	};
> -
> -	if (!ih_info)
> -		return -EINVAL;
> -
> -	if (!adev->gmc.umc_ras_if) {
> -		adev->gmc.umc_ras_if = kmalloc(sizeof(struct
> ras_common_if), GFP_KERNEL);
> -		if (!adev->gmc.umc_ras_if)
> -			return -ENOMEM;
> -		adev->gmc.umc_ras_if->block = AMDGPU_RAS_BLOCK__UMC;
> -		adev->gmc.umc_ras_if->type =
> AMDGPU_RAS_ERROR__MULTI_UNCORRECTABLE;
> -		adev->gmc.umc_ras_if->sub_block_index = 0;
> -		strcpy(adev->gmc.umc_ras_if->name, "umc");
> -	}
> -	ih_info->head = fs_info.head = *adev->gmc.umc_ras_if;
> -
> -	r = amdgpu_ras_late_init(adev, adev->gmc.umc_ras_if,
> -				 &fs_info, ih_info);
> -	if (r)
> -		goto free;
> -
> -	if (amdgpu_ras_is_supported(adev, adev->gmc.umc_ras_if->block)) {
> -		r = amdgpu_irq_get(adev, &adev->gmc.ecc_irq, 0);
> -		if (r)
> -			goto late_fini;
> -	} else {
> -		r = 0;
> -		goto free;
> -	}
> -
> -	return 0;
> -
> -late_fini:
> -	amdgpu_ras_late_fini(adev, adev->gmc.umc_ras_if, ih_info);
> -free:
> -	kfree(adev->gmc.umc_ras_if);
> -	adev->gmc.umc_ras_if = NULL;
> -	return r;
> -}
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.h
> b/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.h
> index 331ce50a3a9e..b6e1d98ef01e 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.h
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.h
> @@ -230,7 +230,5 @@ void amdgpu_gmc_agp_location(struct
> amdgpu_device *adev,
>  			     struct amdgpu_gmc *mc);
>  bool amdgpu_gmc_filter_faults(struct amdgpu_device *adev, uint64_t addr,
>  			      uint16_t pasid, uint64_t timestamp); -int
> amdgpu_gmc_ras_late_init(struct amdgpu_device *adev,
> -			     void *ih_info);
> 
>  #endif
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_umc.c
> b/drivers/gpu/drm/amd/amdgpu/amdgpu_umc.c
> new file mode 100644
> index 000000000000..c8de127097ab
> --- /dev/null
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_umc.c
> @@ -0,0 +1,73 @@
> +/*
> + * Copyright 2019 Advanced Micro Devices, Inc.
> + *
> + * Permission is hereby granted, free of charge, to any person
> +obtaining a
> + * copy of this software and associated documentation files (the
> +"Software"),
> + * to deal in the Software without restriction, including without
> +limitation
> + * the rights to use, copy, modify, merge, publish, distribute,
> +sublicense,
> + * and/or sell copies of the Software, and to permit persons to whom
> +the
> + * Software is furnished to do so, subject to the following conditions:
> + *
> + * The above copyright notice and this permission notice shall be
> +included in
> + * all copies or substantial portions of the Software.
> + *
> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
> +EXPRESS OR
> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
> +MERCHANTABILITY,
> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO
> EVENT
> +SHALL
> + * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM,
> +DAMAGES OR
> + * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
> +OTHERWISE,
> + * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR
> THE USE
> +OR
> + * OTHER DEALINGS IN THE SOFTWARE.
> + *
> + */
> +
> +#include "amdgpu.h"
> +#include "amdgpu_ras.h"
> +
> +int amdgpu_umc_ras_late_init(struct amdgpu_device *adev, void
> +*ras_ih_info) {
> +	int r;
> +	struct ras_ih_if *ih_info = (struct ras_ih_if *)ras_ih_info;
> +	struct ras_fs_if fs_info = {
> +		.sysfs_name = "umc_err_count",
> +		.debugfs_name = "umc_err_inject",
> +	};
> +
> +	if (!ih_info)
> +		return -EINVAL;
> +
> +	if (!adev->gmc.umc_ras_if) {
> +		adev->gmc.umc_ras_if =
> +			kmalloc(sizeof(struct ras_common_if), GFP_KERNEL);
> +		if (!adev->gmc.umc_ras_if)
> +			return -ENOMEM;
> +		adev->gmc.umc_ras_if->block = AMDGPU_RAS_BLOCK__UMC;
> +		adev->gmc.umc_ras_if->type =
> AMDGPU_RAS_ERROR__MULTI_UNCORRECTABLE;
> +		adev->gmc.umc_ras_if->sub_block_index = 0;
> +		strcpy(adev->gmc.umc_ras_if->name, "umc");
> +	}
> +	ih_info->head = fs_info.head = *adev->gmc.umc_ras_if;
> [Guchun]We have one amdgpu_umc member in adev structure, so is it
> reasonable to move umc_ras_if from gmc to this umc specific structure?

[Tao] In fact, the refinement is not finished, I also consider moving the call back of ecc_irq to common file. I'll continue to refine ras code (including your suggestion) in future's new patch.

> 
> +	r = amdgpu_ras_late_init(adev, adev->gmc.umc_ras_if,
> +				 &fs_info, ih_info);
> +	if (r)
> +		goto free;
> +
> +	if (amdgpu_ras_is_supported(adev, adev->gmc.umc_ras_if->block)) {
> +		r = amdgpu_irq_get(adev, &adev->gmc.ecc_irq, 0);
> +		if (r)
> +			goto late_fini;
> +	} else {
> +		r = 0;
> +		goto free;
> +	}
> +
> +	return 0;
> +
> +late_fini:
> +	amdgpu_ras_late_fini(adev, adev->gmc.umc_ras_if, ih_info);
> +free:
> +	kfree(adev->gmc.umc_ras_if);
> +	adev->gmc.umc_ras_if = NULL;
> +	return r;
> +}
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_umc.h
> b/drivers/gpu/drm/amd/amdgpu/amdgpu_umc.h
> index 975afa04df09..6f22c9704555 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_umc.h
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_umc.h
> @@ -55,6 +55,7 @@
> 
>  struct amdgpu_umc_funcs {
>  	void (*ras_init)(struct amdgpu_device *adev);
> +	int (*ras_late_init)(struct amdgpu_device *adev, void *ras_ih_info);
>  	void (*query_ras_error_count)(struct amdgpu_device *adev,
>  					void *ras_error_status);
>  	void (*query_ras_error_address)(struct amdgpu_device *adev, @@ -
> 79,4 +80,5 @@ struct amdgpu_umc {
>  	const struct amdgpu_umc_funcs *funcs;
>  };
> 
> +int amdgpu_umc_ras_late_init(struct amdgpu_device *adev, void
> +*ras_ih_info);
>  #endif
> diff --git a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
> b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
> index beb6c84ab9e2..3db40342b6c3 100644
> --- a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
> +++ b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
> @@ -793,9 +793,11 @@ static int gmc_v9_0_ecc_late_init(void *handle)
>  		.cb = gmc_v9_0_process_ras_data_cb,
>  	};
> 
> -	r = amdgpu_gmc_ras_late_init(adev, &umc_ih_info);
> -	if (r)
> -		return r;
> +	if (adev->umc.funcs && adev->umc.funcs->ras_late_init) {
> +		r = adev->umc.funcs->ras_late_init(adev, &umc_ih_info);
> +		if (r)
> +			return r;
> +	}
> 
>  	if (adev->mmhub_funcs && adev->mmhub_funcs->ras_late_init) {
>  		r = adev->mmhub_funcs->ras_late_init(adev);
> diff --git a/drivers/gpu/drm/amd/amdgpu/umc_v6_1.c
> b/drivers/gpu/drm/amd/amdgpu/umc_v6_1.c
> index 09e316a22f1a..4cdb5c04cd17 100644
> --- a/drivers/gpu/drm/amd/amdgpu/umc_v6_1.c
> +++ b/drivers/gpu/drm/amd/amdgpu/umc_v6_1.c
> @@ -273,6 +273,7 @@ static void umc_v6_1_ras_init(struct amdgpu_device
> *adev)
> 
>  const struct amdgpu_umc_funcs umc_v6_1_funcs = {
>  	.ras_init = umc_v6_1_ras_init,
> +	.ras_late_init = amdgpu_umc_ras_late_init,
>  	.query_ras_error_count = umc_v6_1_query_ras_error_count,
>  	.query_ras_error_address = umc_v6_1_query_ras_error_address,
>  	.enable_umc_index_mode = umc_v6_1_enable_umc_index_mode,
> --
> 2.17.1



More information about the amd-gfx mailing list