[PATCH V2 7/8] accel/amdxdna: Read firmware interface version from registers

Mario Limonciello mario.limonciello at amd.com
Wed Dec 11 00:20:10 UTC 2024


On 12/6/2024 16:00, Lizhi Hou wrote:
> The latest released firmware supports reading firmware interface version
> from registers directly. The driver's probe routine reads the major and
> minor version numbers. If the firmware interface does not compatible with
s/does/is/
> the driver, the driver's probe routine returns failure.
> 
> Co-developed-by: Min Ma <min.ma at amd.com>
> Signed-off-by: Min Ma <min.ma at amd.com>
> Signed-off-by: Lizhi Hou <lizhi.hou at amd.com>

Just to confirm you're not backing yourself into a corner the plan is 
not to bump this major version any time soon for anything already 
supported by the driver; right?

Because once you do that this is going to get messy quickly.

Reviewed-by: Mario Limonciello <mario.limonciello at amd.com>
> ---
>   drivers/accel/amdxdna/aie2_message.c | 26 ----------
>   drivers/accel/amdxdna/aie2_pci.c     | 74 ++++++++++++++++++++++------
>   drivers/accel/amdxdna/aie2_pci.h     |  6 +--
>   drivers/accel/amdxdna/npu1_regs.c    |  2 +-
>   drivers/accel/amdxdna/npu2_regs.c    |  2 +-
>   drivers/accel/amdxdna/npu4_regs.c    |  2 +-
>   drivers/accel/amdxdna/npu5_regs.c    |  2 +-
>   7 files changed, 64 insertions(+), 50 deletions(-)
> 
> diff --git a/drivers/accel/amdxdna/aie2_message.c b/drivers/accel/amdxdna/aie2_message.c
> index 13b5a96f8d25..f6d46e1e5086 100644
> --- a/drivers/accel/amdxdna/aie2_message.c
> +++ b/drivers/accel/amdxdna/aie2_message.c
> @@ -100,32 +100,6 @@ int aie2_get_runtime_cfg(struct amdxdna_dev_hdl *ndev, u32 type, u64 *value)
>   	return 0;
>   }
>   
> -int aie2_check_protocol_version(struct amdxdna_dev_hdl *ndev)
> -{
> -	DECLARE_AIE2_MSG(protocol_version, MSG_OP_GET_PROTOCOL_VERSION);
> -	struct amdxdna_dev *xdna = ndev->xdna;
> -	int ret;
> -
> -	ret = aie2_send_mgmt_msg_wait(ndev, &msg);
> -	if (ret) {
> -		XDNA_ERR(xdna, "Failed to get protocol version, ret %d", ret);
> -		return ret;
> -	}
> -
> -	if (resp.major != ndev->priv->protocol_major) {
> -		XDNA_ERR(xdna, "Incompatible firmware protocol version major %d minor %d",
> -			 resp.major, resp.minor);
> -		return -EINVAL;
> -	}
> -
> -	if (resp.minor < ndev->priv->protocol_minor) {
> -		XDNA_ERR(xdna, "Firmware minor version smaller than supported");
> -		return -EINVAL;
> -	}
> -
> -	return 0;
> -}
> -
>   int aie2_assign_mgmt_pasid(struct amdxdna_dev_hdl *ndev, u16 pasid)
>   {
>   	DECLARE_AIE2_MSG(assign_mgmt_pasid, MSG_OP_ASSIGN_MGMT_PASID);
> diff --git a/drivers/accel/amdxdna/aie2_pci.c b/drivers/accel/amdxdna/aie2_pci.c
> index 489744a2e226..2d2b6b66617a 100644
> --- a/drivers/accel/amdxdna/aie2_pci.c
> +++ b/drivers/accel/amdxdna/aie2_pci.c
> @@ -33,17 +33,51 @@ MODULE_PARM_DESC(aie2_max_col, "Maximum column could be used");
>    * The related register and ring buffer information is on SRAM BAR.
>    * This struct is the register layout.
>    */
> +#define MGMT_MBOX_MAGIC 0x55504e5f /* _NPU */
>   struct mgmt_mbox_chann_info {
> -	u32	x2i_tail;
> -	u32	x2i_head;
> -	u32	x2i_buf;
> -	u32	x2i_buf_sz;
> -	u32	i2x_tail;
> -	u32	i2x_head;
> -	u32	i2x_buf;
> -	u32	i2x_buf_sz;
> +	__u32	x2i_tail;
> +	__u32	x2i_head;
> +	__u32	x2i_buf;
> +	__u32	x2i_buf_sz;
> +	__u32	i2x_tail;
> +	__u32	i2x_head;
> +	__u32	i2x_buf;
> +	__u32	i2x_buf_sz;
> +	__u32	magic;
> +	__u32	msi_id;
> +	__u32	prot_major;
> +	__u32	prot_minor;
> +	__u32	rsvd[4];
>   };
>   
> +static int aie2_check_protocol(struct amdxdna_dev_hdl *ndev, u32 fw_major, u32 fw_minor)
> +{
> +	struct amdxdna_dev *xdna = ndev->xdna;
> +
> +	/*
> +	 * The driver supported mailbox behavior is defined by
> +	 * ndev->priv->protocol_major and protocol_minor.
> +	 *
> +	 * When protocol_major and fw_major are different, it means driver
> +	 * and firmware are incompatible.
> +	 */
> +	if (ndev->priv->protocol_major != fw_major) {
> +		XDNA_ERR(xdna, "Incompatible firmware protocol major %d minor %d",
> +			 fw_major, fw_minor);
> +		return -EINVAL;
> +	}
> +
> +	/*
> +	 * When protocol_minor is greater then fw_minor, that means driver
> +	 * relies on operation the installed firmware does not support.
> +	 */
> +	if (ndev->priv->protocol_minor > fw_minor) {
> +		XDNA_ERR(xdna, "Firmware minor version smaller than supported");
> +		return -EINVAL;
> +	}
> +	return 0;
> +}
> +
>   static void aie2_dump_chann_info_debug(struct amdxdna_dev_hdl *ndev)
>   {
>   	struct amdxdna_dev *xdna = ndev->xdna;
> @@ -57,6 +91,8 @@ static void aie2_dump_chann_info_debug(struct amdxdna_dev_hdl *ndev)
>   	XDNA_DBG(xdna, "x2i ringbuf 0x%x", ndev->mgmt_x2i.rb_start_addr);
>   	XDNA_DBG(xdna, "x2i rsize   0x%x", ndev->mgmt_x2i.rb_size);
>   	XDNA_DBG(xdna, "x2i chann index 0x%x", ndev->mgmt_chan_idx);
> +	XDNA_DBG(xdna, "mailbox protocol major 0x%x", ndev->mgmt_prot_major);
> +	XDNA_DBG(xdna, "mailbox protocol minor 0x%x", ndev->mgmt_prot_minor);
>   }
>   
>   static int aie2_get_mgmt_chann_info(struct amdxdna_dev_hdl *ndev)
> @@ -87,6 +123,12 @@ static int aie2_get_mgmt_chann_info(struct amdxdna_dev_hdl *ndev)
>   	for (i = 0; i < sizeof(info_regs) / sizeof(u32); i++)
>   		reg[i] = readl(ndev->sram_base + off + i * sizeof(u32));
>   
> +	if (info_regs.magic != MGMT_MBOX_MAGIC) {
> +		XDNA_ERR(ndev->xdna, "Invalid mbox magic 0x%x", info_regs.magic);
> +		ret = -EINVAL;
> +		goto done;
> +	}
> +
>   	i2x = &ndev->mgmt_i2x;
>   	x2i = &ndev->mgmt_x2i;
>   
> @@ -99,14 +141,20 @@ static int aie2_get_mgmt_chann_info(struct amdxdna_dev_hdl *ndev)
>   	x2i->mb_tail_ptr_reg = AIE2_MBOX_OFF(ndev, info_regs.x2i_tail);
>   	x2i->rb_start_addr   = AIE2_SRAM_OFF(ndev, info_regs.x2i_buf);
>   	x2i->rb_size         = info_regs.x2i_buf_sz;
> -	ndev->mgmt_chan_idx  = CHANN_INDEX(ndev, x2i->rb_start_addr);
>   
> +	ndev->mgmt_chan_idx  = info_regs.msi_id;
> +	ndev->mgmt_prot_major = info_regs.prot_major;
> +	ndev->mgmt_prot_minor = info_regs.prot_minor;
> +
> +	ret = aie2_check_protocol(ndev, ndev->mgmt_prot_major, ndev->mgmt_prot_minor);
> +
> +done:
>   	aie2_dump_chann_info_debug(ndev);
>   
>   	/* Must clear address at FW_ALIVE_OFF */
>   	writel(0, SRAM_GET_ADDR(ndev, FW_ALIVE_OFF));
>   
> -	return 0;
> +	return ret;
>   }
>   
>   int aie2_runtime_cfg(struct amdxdna_dev_hdl *ndev,
> @@ -155,12 +203,6 @@ static int aie2_mgmt_fw_init(struct amdxdna_dev_hdl *ndev)
>   {
>   	int ret;
>   
> -	ret = aie2_check_protocol_version(ndev);
> -	if (ret) {
> -		XDNA_ERR(ndev->xdna, "Check header hash failed");
> -		return ret;
> -	}
> -
>   	ret = aie2_runtime_cfg(ndev, AIE2_RT_CFG_INIT, NULL);
>   	if (ret) {
>   		XDNA_ERR(ndev->xdna, "Runtime config failed");
> diff --git a/drivers/accel/amdxdna/aie2_pci.h b/drivers/accel/amdxdna/aie2_pci.h
> index 8c17b74654ce..cc159cadff9f 100644
> --- a/drivers/accel/amdxdna/aie2_pci.h
> +++ b/drivers/accel/amdxdna/aie2_pci.h
> @@ -39,9 +39,6 @@
>   })
>   
>   #define CHAN_SLOT_SZ SZ_8K
> -#define CHANN_INDEX(ndev, rbuf_off) \
> -	(((rbuf_off) - SRAM_REG_OFF((ndev), MBOX_CHANN_OFF)) / CHAN_SLOT_SZ)
> -
>   #define MBOX_SIZE(ndev) \
>   ({ \
>   	typeof(ndev) _ndev = (ndev); \
> @@ -170,6 +167,8 @@ struct amdxdna_dev_hdl {
>   	struct xdna_mailbox_chann_res	mgmt_x2i;
>   	struct xdna_mailbox_chann_res	mgmt_i2x;
>   	u32				mgmt_chan_idx;
> +	u32				mgmt_prot_major;
> +	u32				mgmt_prot_minor;
>   
>   	u32				total_col;
>   	struct aie_version		version;
> @@ -262,7 +261,6 @@ int aie2_suspend_fw(struct amdxdna_dev_hdl *ndev);
>   int aie2_resume_fw(struct amdxdna_dev_hdl *ndev);
>   int aie2_set_runtime_cfg(struct amdxdna_dev_hdl *ndev, u32 type, u64 value);
>   int aie2_get_runtime_cfg(struct amdxdna_dev_hdl *ndev, u32 type, u64 *value);
> -int aie2_check_protocol_version(struct amdxdna_dev_hdl *ndev);
>   int aie2_assign_mgmt_pasid(struct amdxdna_dev_hdl *ndev, u16 pasid);
>   int aie2_query_aie_version(struct amdxdna_dev_hdl *ndev, struct aie_version *version);
>   int aie2_query_aie_metadata(struct amdxdna_dev_hdl *ndev, struct aie_metadata *metadata);
> diff --git a/drivers/accel/amdxdna/npu1_regs.c b/drivers/accel/amdxdna/npu1_regs.c
> index c8f4d1cac65d..e408af57e378 100644
> --- a/drivers/accel/amdxdna/npu1_regs.c
> +++ b/drivers/accel/amdxdna/npu1_regs.c
> @@ -65,7 +65,7 @@ const struct dpm_clk_freq npu1_dpm_clk_table[] = {
>   const struct amdxdna_dev_priv npu1_dev_priv = {
>   	.fw_path        = "amdnpu/1502_00/npu.sbin",
>   	.protocol_major = 0x5,
> -	.protocol_minor = 0x1,
> +	.protocol_minor = 0x7,
>   	.rt_config	= npu1_default_rt_cfg,
>   	.dpm_clk_tbl	= npu1_dpm_clk_table,
>   	.col_align	= COL_ALIGN_NONE,
> diff --git a/drivers/accel/amdxdna/npu2_regs.c b/drivers/accel/amdxdna/npu2_regs.c
> index ac63131f9c7c..286bd0d475e2 100644
> --- a/drivers/accel/amdxdna/npu2_regs.c
> +++ b/drivers/accel/amdxdna/npu2_regs.c
> @@ -64,7 +64,7 @@
>   const struct amdxdna_dev_priv npu2_dev_priv = {
>   	.fw_path        = "amdnpu/17f0_00/npu.sbin",
>   	.protocol_major = 0x6,
> -	.protocol_minor = 0x1,
> +	.protocol_minor = 0x6,
>   	.rt_config	= npu4_default_rt_cfg,
>   	.dpm_clk_tbl	= npu4_dpm_clk_table,
>   	.col_align	= COL_ALIGN_NATURE,
> diff --git a/drivers/accel/amdxdna/npu4_regs.c b/drivers/accel/amdxdna/npu4_regs.c
> index a713ac18adfc..00c52833ce89 100644
> --- a/drivers/accel/amdxdna/npu4_regs.c
> +++ b/drivers/accel/amdxdna/npu4_regs.c
> @@ -85,7 +85,7 @@ const struct dpm_clk_freq npu4_dpm_clk_table[] = {
>   const struct amdxdna_dev_priv npu4_dev_priv = {
>   	.fw_path        = "amdnpu/17f0_10/npu.sbin",
>   	.protocol_major = 0x6,
> -	.protocol_minor = 0x1,
> +	.protocol_minor = 12,
>   	.rt_config	= npu4_default_rt_cfg,
>   	.dpm_clk_tbl	= npu4_dpm_clk_table,
>   	.col_align	= COL_ALIGN_NATURE,
> diff --git a/drivers/accel/amdxdna/npu5_regs.c b/drivers/accel/amdxdna/npu5_regs.c
> index 67a5d5bc8a49..118849272f27 100644
> --- a/drivers/accel/amdxdna/npu5_regs.c
> +++ b/drivers/accel/amdxdna/npu5_regs.c
> @@ -64,7 +64,7 @@
>   const struct amdxdna_dev_priv npu5_dev_priv = {
>   	.fw_path        = "amdnpu/17f0_11/npu.sbin",
>   	.protocol_major = 0x6,
> -	.protocol_minor = 0x1,
> +	.protocol_minor = 12,
>   	.rt_config	= npu4_default_rt_cfg,
>   	.dpm_clk_tbl	= npu4_dpm_clk_table,
>   	.col_align	= COL_ALIGN_NATURE,



More information about the dri-devel mailing list