Message ID | 20241206220001.164049-4-lizhi.hou@amd.com (mailing list archive) |
---|---|
State | New, archived |
Headers | show |
Series | AMD NPU driver improvements | expand |
On 12/6/2024 15:59, Lizhi Hou wrote: > Add NPU6 registers and other private configurations. > > Co-developed-by: Xiaoming Ren <xiaoming.ren@amd.com> > Signed-off-by: Xiaoming Ren <xiaoming.ren@amd.com> > Signed-off-by: Lizhi Hou <lizhi.hou@amd.com> Reviewed-by: Mario Limonciello <mario.limonciello@amd.com> > --- > drivers/accel/amdxdna/Makefile | 3 +- > drivers/accel/amdxdna/npu6_regs.c | 121 ++++++++++++++++++++++++++++++ > 2 files changed, 123 insertions(+), 1 deletion(-) > create mode 100644 drivers/accel/amdxdna/npu6_regs.c > > diff --git a/drivers/accel/amdxdna/Makefile b/drivers/accel/amdxdna/Makefile > index ed6f87910880..6baf181298de 100644 > --- a/drivers/accel/amdxdna/Makefile > +++ b/drivers/accel/amdxdna/Makefile > @@ -17,5 +17,6 @@ amdxdna-y := \ > npu1_regs.o \ > npu2_regs.o \ > npu4_regs.o \ > - npu5_regs.o > + npu5_regs.o \ > + npu6_regs.o > obj-$(CONFIG_DRM_ACCEL_AMDXDNA) = amdxdna.o > diff --git a/drivers/accel/amdxdna/npu6_regs.c b/drivers/accel/amdxdna/npu6_regs.c > new file mode 100644 > index 000000000000..d1168fc55533 > --- /dev/null > +++ b/drivers/accel/amdxdna/npu6_regs.c > @@ -0,0 +1,121 @@ > +// SPDX-License-Identifier: GPL-2.0 > +/* > + * Copyright (C) 2024, Advanced Micro Devices, Inc. > + */ > + > +#include <drm/amdxdna_accel.h> > +#include <drm/drm_device.h> > +#include <drm/gpu_scheduler.h> > +#include <linux/sizes.h> > + > +#include "aie2_pci.h" > +#include "amdxdna_mailbox.h" > +#include "amdxdna_pci_drv.h" > + > +/* NPU Public Registers on MpNPUAxiXbar (refer to Diag npu_registers.h) */ > +#define MPNPU_PUB_SEC_INTR 0x3010060 > +#define MPNPU_PUB_PWRMGMT_INTR 0x3010064 > +#define MPNPU_PUB_SCRATCH0 0x301006C > +#define MPNPU_PUB_SCRATCH1 0x3010070 > +#define MPNPU_PUB_SCRATCH2 0x3010074 > +#define MPNPU_PUB_SCRATCH3 0x3010078 > +#define MPNPU_PUB_SCRATCH4 0x301007C > +#define MPNPU_PUB_SCRATCH5 0x3010080 > +#define MPNPU_PUB_SCRATCH6 0x3010084 > +#define MPNPU_PUB_SCRATCH7 0x3010088 > +#define MPNPU_PUB_SCRATCH8 0x301008C > +#define MPNPU_PUB_SCRATCH9 0x3010090 > +#define MPNPU_PUB_SCRATCH10 0x3010094 > +#define MPNPU_PUB_SCRATCH11 0x3010098 > +#define MPNPU_PUB_SCRATCH12 0x301009C > +#define MPNPU_PUB_SCRATCH13 0x30100A0 > +#define MPNPU_PUB_SCRATCH14 0x30100A4 > +#define MPNPU_PUB_SCRATCH15 0x30100A8 > +#define MP0_C2PMSG_73 0x3810A24 > +#define MP0_C2PMSG_123 0x3810AEC > + > +#define MP1_C2PMSG_0 0x3B10900 > +#define MP1_C2PMSG_60 0x3B109F0 > +#define MP1_C2PMSG_61 0x3B109F4 > + > +#define MPNPU_SRAM_X2I_MAILBOX_0 0x3600000 > +#define MPNPU_SRAM_X2I_MAILBOX_15 0x361E000 > +#define MPNPU_SRAM_X2I_MAILBOX_31 0x363E000 > +#define MPNPU_SRAM_I2X_MAILBOX_31 0x363F000 > + > +#define MMNPU_APERTURE0_BASE 0x3000000 > +#define MMNPU_APERTURE1_BASE 0x3600000 > +#define MMNPU_APERTURE3_BASE 0x3810000 > +#define MMNPU_APERTURE4_BASE 0x3B10000 > + > +/* PCIe BAR Index for NPU6 */ > +#define NPU6_REG_BAR_INDEX 0 > +#define NPU6_MBOX_BAR_INDEX 0 > +#define NPU6_PSP_BAR_INDEX 4 > +#define NPU6_SMU_BAR_INDEX 5 > +#define NPU6_SRAM_BAR_INDEX 2 > +/* Associated BARs and Apertures */ > +#define NPU6_REG_BAR_BASE MMNPU_APERTURE0_BASE > +#define NPU6_MBOX_BAR_BASE MMNPU_APERTURE0_BASE > +#define NPU6_PSP_BAR_BASE MMNPU_APERTURE3_BASE > +#define NPU6_SMU_BAR_BASE MMNPU_APERTURE4_BASE > +#define NPU6_SRAM_BAR_BASE MMNPU_APERTURE1_BASE > + > +#define NPU6_RT_CFG_TYPE_PDI_LOAD 5 > +#define NPU6_RT_CFG_TYPE_DEBUG_BO 10 > + > +#define NPU6_RT_CFG_VAL_PDI_LOAD_MGMT 0 > +#define NPU6_RT_CFG_VAL_PDI_LOAD_APP 1 > + > +#define NPU6_RT_CFG_VAL_DEBUG_BO_DEFAULT 0 > +#define NPU6_RT_CFG_VAL_DEBUG_BO_LARGE 1 > + > +#define NPU6_MPNPUCLK_FREQ_MAX 1267 > +#define NPU6_HCLK_FREQ_MAX 1800 > + > +const struct amdxdna_dev_priv npu6_dev_priv = { > + .fw_path = "amdnpu/17f0_10/npu.sbin", > + .protocol_major = 0x6, > + .protocol_minor = 12, > + .rt_config = {NPU6_RT_CFG_TYPE_PDI_LOAD, NPU6_RT_CFG_VAL_PDI_LOAD_APP}, > + .col_align = COL_ALIGN_NATURE, > + .mbox_dev_addr = NPU6_MBOX_BAR_BASE, > + .mbox_size = 0, /* Use BAR size */ > + .sram_dev_addr = NPU6_SRAM_BAR_BASE, > + .sram_offs = { > + DEFINE_BAR_OFFSET(MBOX_CHANN_OFF, NPU6_SRAM, MPNPU_SRAM_X2I_MAILBOX_0), > + DEFINE_BAR_OFFSET(FW_ALIVE_OFF, NPU6_SRAM, MPNPU_SRAM_X2I_MAILBOX_15), > + }, > + .psp_regs_off = { > + DEFINE_BAR_OFFSET(PSP_CMD_REG, NPU6_PSP, MP0_C2PMSG_123), > + DEFINE_BAR_OFFSET(PSP_ARG0_REG, NPU6_REG, MPNPU_PUB_SCRATCH3), > + DEFINE_BAR_OFFSET(PSP_ARG1_REG, NPU6_REG, MPNPU_PUB_SCRATCH4), > + DEFINE_BAR_OFFSET(PSP_ARG2_REG, NPU6_REG, MPNPU_PUB_SCRATCH9), > + DEFINE_BAR_OFFSET(PSP_INTR_REG, NPU6_PSP, MP0_C2PMSG_73), > + DEFINE_BAR_OFFSET(PSP_STATUS_REG, NPU6_PSP, MP0_C2PMSG_123), > + DEFINE_BAR_OFFSET(PSP_RESP_REG, NPU6_REG, MPNPU_PUB_SCRATCH3), > + }, > + .smu_regs_off = { > + DEFINE_BAR_OFFSET(SMU_CMD_REG, NPU6_SMU, MP1_C2PMSG_0), > + DEFINE_BAR_OFFSET(SMU_ARG_REG, NPU6_SMU, MP1_C2PMSG_60), > + DEFINE_BAR_OFFSET(SMU_INTR_REG, NPU6_SMU, MMNPU_APERTURE4_BASE), > + DEFINE_BAR_OFFSET(SMU_RESP_REG, NPU6_SMU, MP1_C2PMSG_61), > + DEFINE_BAR_OFFSET(SMU_OUT_REG, NPU6_SMU, MP1_C2PMSG_60), > + }, > +}; > + > +const struct amdxdna_dev_info dev_npu6_info = { > + .reg_bar = NPU6_REG_BAR_INDEX, > + .mbox_bar = NPU6_MBOX_BAR_INDEX, > + .sram_bar = NPU6_SRAM_BAR_INDEX, > + .psp_bar = NPU6_PSP_BAR_INDEX, > + .smu_bar = NPU6_SMU_BAR_INDEX, > + .first_col = 0, > + .dev_mem_buf_shift = 15, /* 32 KiB aligned */ > + .dev_mem_base = AIE2_DEVM_BASE, > + .dev_mem_size = AIE2_DEVM_SIZE, > + .vbnv = "RyzenAI-npu6", > + .device_type = AMDXDNA_DEV_TYPE_KMQ, > + .dev_priv = &npu6_dev_priv, > + .ops = &aie2_ops, > +};
On 12/6/2024 2:59 PM, Lizhi Hou wrote: > Add NPU6 registers and other private configurations. > > Co-developed-by: Xiaoming Ren <xiaoming.ren@amd.com> > Signed-off-by: Xiaoming Ren <xiaoming.ren@amd.com> > Signed-off-by: Lizhi Hou <lizhi.hou@amd.com> > --- > drivers/accel/amdxdna/Makefile | 3 +- > drivers/accel/amdxdna/npu6_regs.c | 121 ++++++++++++++++++++++++++++++ This looks like dead code to me. I would expect somewhere else in the driver, dev_npu6_info would be used, but that is not the case. What am I missing? -Jeff
On 12/13/24 08:37, Jeffrey Hugo wrote: > On 12/6/2024 2:59 PM, Lizhi Hou wrote: >> Add NPU6 registers and other private configurations. >> >> Co-developed-by: Xiaoming Ren <xiaoming.ren@amd.com> >> Signed-off-by: Xiaoming Ren <xiaoming.ren@amd.com> >> Signed-off-by: Lizhi Hou <lizhi.hou@amd.com> >> --- >> drivers/accel/amdxdna/Makefile | 3 +- >> drivers/accel/amdxdna/npu6_regs.c | 121 ++++++++++++++++++++++++++++++ > > This looks like dead code to me. I would expect somewhere else in the > driver, dev_npu6_info would be used, but that is not the case. What > am I missing? You are correct. I miss merged one line to the patch in amdxdna_idx[].. Thanks a lot. Lizhi > > -Jeff
diff --git a/drivers/accel/amdxdna/Makefile b/drivers/accel/amdxdna/Makefile index ed6f87910880..6baf181298de 100644 --- a/drivers/accel/amdxdna/Makefile +++ b/drivers/accel/amdxdna/Makefile @@ -17,5 +17,6 @@ amdxdna-y := \ npu1_regs.o \ npu2_regs.o \ npu4_regs.o \ - npu5_regs.o + npu5_regs.o \ + npu6_regs.o obj-$(CONFIG_DRM_ACCEL_AMDXDNA) = amdxdna.o diff --git a/drivers/accel/amdxdna/npu6_regs.c b/drivers/accel/amdxdna/npu6_regs.c new file mode 100644 index 000000000000..d1168fc55533 --- /dev/null +++ b/drivers/accel/amdxdna/npu6_regs.c @@ -0,0 +1,121 @@ +// SPDX-License-Identifier: GPL-2.0 +/* + * Copyright (C) 2024, Advanced Micro Devices, Inc. + */ + +#include <drm/amdxdna_accel.h> +#include <drm/drm_device.h> +#include <drm/gpu_scheduler.h> +#include <linux/sizes.h> + +#include "aie2_pci.h" +#include "amdxdna_mailbox.h" +#include "amdxdna_pci_drv.h" + +/* NPU Public Registers on MpNPUAxiXbar (refer to Diag npu_registers.h) */ +#define MPNPU_PUB_SEC_INTR 0x3010060 +#define MPNPU_PUB_PWRMGMT_INTR 0x3010064 +#define MPNPU_PUB_SCRATCH0 0x301006C +#define MPNPU_PUB_SCRATCH1 0x3010070 +#define MPNPU_PUB_SCRATCH2 0x3010074 +#define MPNPU_PUB_SCRATCH3 0x3010078 +#define MPNPU_PUB_SCRATCH4 0x301007C +#define MPNPU_PUB_SCRATCH5 0x3010080 +#define MPNPU_PUB_SCRATCH6 0x3010084 +#define MPNPU_PUB_SCRATCH7 0x3010088 +#define MPNPU_PUB_SCRATCH8 0x301008C +#define MPNPU_PUB_SCRATCH9 0x3010090 +#define MPNPU_PUB_SCRATCH10 0x3010094 +#define MPNPU_PUB_SCRATCH11 0x3010098 +#define MPNPU_PUB_SCRATCH12 0x301009C +#define MPNPU_PUB_SCRATCH13 0x30100A0 +#define MPNPU_PUB_SCRATCH14 0x30100A4 +#define MPNPU_PUB_SCRATCH15 0x30100A8 +#define MP0_C2PMSG_73 0x3810A24 +#define MP0_C2PMSG_123 0x3810AEC + +#define MP1_C2PMSG_0 0x3B10900 +#define MP1_C2PMSG_60 0x3B109F0 +#define MP1_C2PMSG_61 0x3B109F4 + +#define MPNPU_SRAM_X2I_MAILBOX_0 0x3600000 +#define MPNPU_SRAM_X2I_MAILBOX_15 0x361E000 +#define MPNPU_SRAM_X2I_MAILBOX_31 0x363E000 +#define MPNPU_SRAM_I2X_MAILBOX_31 0x363F000 + +#define MMNPU_APERTURE0_BASE 0x3000000 +#define MMNPU_APERTURE1_BASE 0x3600000 +#define MMNPU_APERTURE3_BASE 0x3810000 +#define MMNPU_APERTURE4_BASE 0x3B10000 + +/* PCIe BAR Index for NPU6 */ +#define NPU6_REG_BAR_INDEX 0 +#define NPU6_MBOX_BAR_INDEX 0 +#define NPU6_PSP_BAR_INDEX 4 +#define NPU6_SMU_BAR_INDEX 5 +#define NPU6_SRAM_BAR_INDEX 2 +/* Associated BARs and Apertures */ +#define NPU6_REG_BAR_BASE MMNPU_APERTURE0_BASE +#define NPU6_MBOX_BAR_BASE MMNPU_APERTURE0_BASE +#define NPU6_PSP_BAR_BASE MMNPU_APERTURE3_BASE +#define NPU6_SMU_BAR_BASE MMNPU_APERTURE4_BASE +#define NPU6_SRAM_BAR_BASE MMNPU_APERTURE1_BASE + +#define NPU6_RT_CFG_TYPE_PDI_LOAD 5 +#define NPU6_RT_CFG_TYPE_DEBUG_BO 10 + +#define NPU6_RT_CFG_VAL_PDI_LOAD_MGMT 0 +#define NPU6_RT_CFG_VAL_PDI_LOAD_APP 1 + +#define NPU6_RT_CFG_VAL_DEBUG_BO_DEFAULT 0 +#define NPU6_RT_CFG_VAL_DEBUG_BO_LARGE 1 + +#define NPU6_MPNPUCLK_FREQ_MAX 1267 +#define NPU6_HCLK_FREQ_MAX 1800 + +const struct amdxdna_dev_priv npu6_dev_priv = { + .fw_path = "amdnpu/17f0_10/npu.sbin", + .protocol_major = 0x6, + .protocol_minor = 12, + .rt_config = {NPU6_RT_CFG_TYPE_PDI_LOAD, NPU6_RT_CFG_VAL_PDI_LOAD_APP}, + .col_align = COL_ALIGN_NATURE, + .mbox_dev_addr = NPU6_MBOX_BAR_BASE, + .mbox_size = 0, /* Use BAR size */ + .sram_dev_addr = NPU6_SRAM_BAR_BASE, + .sram_offs = { + DEFINE_BAR_OFFSET(MBOX_CHANN_OFF, NPU6_SRAM, MPNPU_SRAM_X2I_MAILBOX_0), + DEFINE_BAR_OFFSET(FW_ALIVE_OFF, NPU6_SRAM, MPNPU_SRAM_X2I_MAILBOX_15), + }, + .psp_regs_off = { + DEFINE_BAR_OFFSET(PSP_CMD_REG, NPU6_PSP, MP0_C2PMSG_123), + DEFINE_BAR_OFFSET(PSP_ARG0_REG, NPU6_REG, MPNPU_PUB_SCRATCH3), + DEFINE_BAR_OFFSET(PSP_ARG1_REG, NPU6_REG, MPNPU_PUB_SCRATCH4), + DEFINE_BAR_OFFSET(PSP_ARG2_REG, NPU6_REG, MPNPU_PUB_SCRATCH9), + DEFINE_BAR_OFFSET(PSP_INTR_REG, NPU6_PSP, MP0_C2PMSG_73), + DEFINE_BAR_OFFSET(PSP_STATUS_REG, NPU6_PSP, MP0_C2PMSG_123), + DEFINE_BAR_OFFSET(PSP_RESP_REG, NPU6_REG, MPNPU_PUB_SCRATCH3), + }, + .smu_regs_off = { + DEFINE_BAR_OFFSET(SMU_CMD_REG, NPU6_SMU, MP1_C2PMSG_0), + DEFINE_BAR_OFFSET(SMU_ARG_REG, NPU6_SMU, MP1_C2PMSG_60), + DEFINE_BAR_OFFSET(SMU_INTR_REG, NPU6_SMU, MMNPU_APERTURE4_BASE), + DEFINE_BAR_OFFSET(SMU_RESP_REG, NPU6_SMU, MP1_C2PMSG_61), + DEFINE_BAR_OFFSET(SMU_OUT_REG, NPU6_SMU, MP1_C2PMSG_60), + }, +}; + +const struct amdxdna_dev_info dev_npu6_info = { + .reg_bar = NPU6_REG_BAR_INDEX, + .mbox_bar = NPU6_MBOX_BAR_INDEX, + .sram_bar = NPU6_SRAM_BAR_INDEX, + .psp_bar = NPU6_PSP_BAR_INDEX, + .smu_bar = NPU6_SMU_BAR_INDEX, + .first_col = 0, + .dev_mem_buf_shift = 15, /* 32 KiB aligned */ + .dev_mem_base = AIE2_DEVM_BASE, + .dev_mem_size = AIE2_DEVM_SIZE, + .vbnv = "RyzenAI-npu6", + .device_type = AMDXDNA_DEV_TYPE_KMQ, + .dev_priv = &npu6_dev_priv, + .ops = &aie2_ops, +};