[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <760fa2c5-7de0-4f95-a8dd-966003a30d47@amd.com>
Date: Tue, 10 Dec 2024 18:30:18 -0600
From: Mario Limonciello <mario.limonciello@....com>
To: Lizhi Hou <lizhi.hou@....com>, ogabbay@...nel.org,
quic_jhugo@...cinc.com, dri-devel@...ts.freedesktop.org
Cc: linux-kernel@...r.kernel.org, min.ma@....com, max.zhen@....com,
sonal.santan@....com, king.tam@....com, Xiaoming Ren <xiaoming.ren@....com>
Subject: Re: [PATCH V2 3/8] accel/amdxdna: Add RyzenAI-npu6 support
On 12/6/2024 15:59, Lizhi Hou wrote:
> Add NPU6 registers and other private configurations.
>
> Co-developed-by: Xiaoming Ren <xiaoming.ren@....com>
> Signed-off-by: Xiaoming Ren <xiaoming.ren@....com>
> Signed-off-by: Lizhi Hou <lizhi.hou@....com>
Reviewed-by: Mario Limonciello <mario.limonciello@....com>
> ---
> drivers/accel/amdxdna/Makefile | 3 +-
> drivers/accel/amdxdna/npu6_regs.c | 121 ++++++++++++++++++++++++++++++
> 2 files changed, 123 insertions(+), 1 deletion(-)
> create mode 100644 drivers/accel/amdxdna/npu6_regs.c
>
> diff --git a/drivers/accel/amdxdna/Makefile b/drivers/accel/amdxdna/Makefile
> index ed6f87910880..6baf181298de 100644
> --- a/drivers/accel/amdxdna/Makefile
> +++ b/drivers/accel/amdxdna/Makefile
> @@ -17,5 +17,6 @@ amdxdna-y := \
> npu1_regs.o \
> npu2_regs.o \
> npu4_regs.o \
> - npu5_regs.o
> + npu5_regs.o \
> + npu6_regs.o
> obj-$(CONFIG_DRM_ACCEL_AMDXDNA) = amdxdna.o
> diff --git a/drivers/accel/amdxdna/npu6_regs.c b/drivers/accel/amdxdna/npu6_regs.c
> new file mode 100644
> index 000000000000..d1168fc55533
> --- /dev/null
> +++ b/drivers/accel/amdxdna/npu6_regs.c
> @@ -0,0 +1,121 @@
> +// SPDX-License-Identifier: GPL-2.0
> +/*
> + * Copyright (C) 2024, Advanced Micro Devices, Inc.
> + */
> +
> +#include <drm/amdxdna_accel.h>
> +#include <drm/drm_device.h>
> +#include <drm/gpu_scheduler.h>
> +#include <linux/sizes.h>
> +
> +#include "aie2_pci.h"
> +#include "amdxdna_mailbox.h"
> +#include "amdxdna_pci_drv.h"
> +
> +/* NPU Public Registers on MpNPUAxiXbar (refer to Diag npu_registers.h) */
> +#define MPNPU_PUB_SEC_INTR 0x3010060
> +#define MPNPU_PUB_PWRMGMT_INTR 0x3010064
> +#define MPNPU_PUB_SCRATCH0 0x301006C
> +#define MPNPU_PUB_SCRATCH1 0x3010070
> +#define MPNPU_PUB_SCRATCH2 0x3010074
> +#define MPNPU_PUB_SCRATCH3 0x3010078
> +#define MPNPU_PUB_SCRATCH4 0x301007C
> +#define MPNPU_PUB_SCRATCH5 0x3010080
> +#define MPNPU_PUB_SCRATCH6 0x3010084
> +#define MPNPU_PUB_SCRATCH7 0x3010088
> +#define MPNPU_PUB_SCRATCH8 0x301008C
> +#define MPNPU_PUB_SCRATCH9 0x3010090
> +#define MPNPU_PUB_SCRATCH10 0x3010094
> +#define MPNPU_PUB_SCRATCH11 0x3010098
> +#define MPNPU_PUB_SCRATCH12 0x301009C
> +#define MPNPU_PUB_SCRATCH13 0x30100A0
> +#define MPNPU_PUB_SCRATCH14 0x30100A4
> +#define MPNPU_PUB_SCRATCH15 0x30100A8
> +#define MP0_C2PMSG_73 0x3810A24
> +#define MP0_C2PMSG_123 0x3810AEC
> +
> +#define MP1_C2PMSG_0 0x3B10900
> +#define MP1_C2PMSG_60 0x3B109F0
> +#define MP1_C2PMSG_61 0x3B109F4
> +
> +#define MPNPU_SRAM_X2I_MAILBOX_0 0x3600000
> +#define MPNPU_SRAM_X2I_MAILBOX_15 0x361E000
> +#define MPNPU_SRAM_X2I_MAILBOX_31 0x363E000
> +#define MPNPU_SRAM_I2X_MAILBOX_31 0x363F000
> +
> +#define MMNPU_APERTURE0_BASE 0x3000000
> +#define MMNPU_APERTURE1_BASE 0x3600000
> +#define MMNPU_APERTURE3_BASE 0x3810000
> +#define MMNPU_APERTURE4_BASE 0x3B10000
> +
> +/* PCIe BAR Index for NPU6 */
> +#define NPU6_REG_BAR_INDEX 0
> +#define NPU6_MBOX_BAR_INDEX 0
> +#define NPU6_PSP_BAR_INDEX 4
> +#define NPU6_SMU_BAR_INDEX 5
> +#define NPU6_SRAM_BAR_INDEX 2
> +/* Associated BARs and Apertures */
> +#define NPU6_REG_BAR_BASE MMNPU_APERTURE0_BASE
> +#define NPU6_MBOX_BAR_BASE MMNPU_APERTURE0_BASE
> +#define NPU6_PSP_BAR_BASE MMNPU_APERTURE3_BASE
> +#define NPU6_SMU_BAR_BASE MMNPU_APERTURE4_BASE
> +#define NPU6_SRAM_BAR_BASE MMNPU_APERTURE1_BASE
> +
> +#define NPU6_RT_CFG_TYPE_PDI_LOAD 5
> +#define NPU6_RT_CFG_TYPE_DEBUG_BO 10
> +
> +#define NPU6_RT_CFG_VAL_PDI_LOAD_MGMT 0
> +#define NPU6_RT_CFG_VAL_PDI_LOAD_APP 1
> +
> +#define NPU6_RT_CFG_VAL_DEBUG_BO_DEFAULT 0
> +#define NPU6_RT_CFG_VAL_DEBUG_BO_LARGE 1
> +
> +#define NPU6_MPNPUCLK_FREQ_MAX 1267
> +#define NPU6_HCLK_FREQ_MAX 1800
> +
> +const struct amdxdna_dev_priv npu6_dev_priv = {
> + .fw_path = "amdnpu/17f0_10/npu.sbin",
> + .protocol_major = 0x6,
> + .protocol_minor = 12,
> + .rt_config = {NPU6_RT_CFG_TYPE_PDI_LOAD, NPU6_RT_CFG_VAL_PDI_LOAD_APP},
> + .col_align = COL_ALIGN_NATURE,
> + .mbox_dev_addr = NPU6_MBOX_BAR_BASE,
> + .mbox_size = 0, /* Use BAR size */
> + .sram_dev_addr = NPU6_SRAM_BAR_BASE,
> + .sram_offs = {
> + DEFINE_BAR_OFFSET(MBOX_CHANN_OFF, NPU6_SRAM, MPNPU_SRAM_X2I_MAILBOX_0),
> + DEFINE_BAR_OFFSET(FW_ALIVE_OFF, NPU6_SRAM, MPNPU_SRAM_X2I_MAILBOX_15),
> + },
> + .psp_regs_off = {
> + DEFINE_BAR_OFFSET(PSP_CMD_REG, NPU6_PSP, MP0_C2PMSG_123),
> + DEFINE_BAR_OFFSET(PSP_ARG0_REG, NPU6_REG, MPNPU_PUB_SCRATCH3),
> + DEFINE_BAR_OFFSET(PSP_ARG1_REG, NPU6_REG, MPNPU_PUB_SCRATCH4),
> + DEFINE_BAR_OFFSET(PSP_ARG2_REG, NPU6_REG, MPNPU_PUB_SCRATCH9),
> + DEFINE_BAR_OFFSET(PSP_INTR_REG, NPU6_PSP, MP0_C2PMSG_73),
> + DEFINE_BAR_OFFSET(PSP_STATUS_REG, NPU6_PSP, MP0_C2PMSG_123),
> + DEFINE_BAR_OFFSET(PSP_RESP_REG, NPU6_REG, MPNPU_PUB_SCRATCH3),
> + },
> + .smu_regs_off = {
> + DEFINE_BAR_OFFSET(SMU_CMD_REG, NPU6_SMU, MP1_C2PMSG_0),
> + DEFINE_BAR_OFFSET(SMU_ARG_REG, NPU6_SMU, MP1_C2PMSG_60),
> + DEFINE_BAR_OFFSET(SMU_INTR_REG, NPU6_SMU, MMNPU_APERTURE4_BASE),
> + DEFINE_BAR_OFFSET(SMU_RESP_REG, NPU6_SMU, MP1_C2PMSG_61),
> + DEFINE_BAR_OFFSET(SMU_OUT_REG, NPU6_SMU, MP1_C2PMSG_60),
> + },
> +};
> +
> +const struct amdxdna_dev_info dev_npu6_info = {
> + .reg_bar = NPU6_REG_BAR_INDEX,
> + .mbox_bar = NPU6_MBOX_BAR_INDEX,
> + .sram_bar = NPU6_SRAM_BAR_INDEX,
> + .psp_bar = NPU6_PSP_BAR_INDEX,
> + .smu_bar = NPU6_SMU_BAR_INDEX,
> + .first_col = 0,
> + .dev_mem_buf_shift = 15, /* 32 KiB aligned */
> + .dev_mem_base = AIE2_DEVM_BASE,
> + .dev_mem_size = AIE2_DEVM_SIZE,
> + .vbnv = "RyzenAI-npu6",
> + .device_type = AMDXDNA_DEV_TYPE_KMQ,
> + .dev_priv = &npu6_dev_priv,
> + .ops = &aie2_ops,
> +};
Powered by blists - more mailing lists