Skip to content

Commit 273b517

Browse files
houlz0507 authored and superm1 committed
accel/amdxdna: Add RyzenAI-npu6 support
Add NPU6 registers and other private configurations.

Co-developed-by: Xiaoming Ren <xiaoming.ren@amd.com>
Signed-off-by: Xiaoming Ren <xiaoming.ren@amd.com>
Reviewed-by: Mario Limonciello <mario.limonciello@amd.com>
Signed-off-by: Lizhi Hou <lizhi.hou@amd.com>
Signed-off-by: Mario Limonciello <mario.limonciello@amd.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20241213232933.1545388-2-lizhi.hou@amd.com
1 parent 81a9a93 commit 273b517

File tree

4 files changed

+125
-1
lines changed

4 files changed

+125
-1
lines changed

drivers/accel/amdxdna/Makefile

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,5 +17,6 @@ amdxdna-y := \
1717
npu1_regs.o \
1818
npu2_regs.o \
1919
npu4_regs.o \
20-
npu5_regs.o
20+
npu5_regs.o \
21+
npu6_regs.o
2122
obj-$(CONFIG_DRM_ACCEL_AMDXDNA) = amdxdna.o

drivers/accel/amdxdna/amdxdna_pci_drv.c

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,7 @@ static const struct amdxdna_device_id amdxdna_ids[] = {
3939
{ 0x17f0, 0x0, &dev_npu2_info },
4040
{ 0x17f0, 0x10, &dev_npu4_info },
4141
{ 0x17f0, 0x11, &dev_npu5_info },
42+
{ 0x17f0, 0x20, &dev_npu6_info },
4243
{0}
4344
};
4445

drivers/accel/amdxdna/amdxdna_pci_drv.h

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -116,6 +116,7 @@ extern const struct amdxdna_dev_info dev_npu1_info;
116116
extern const struct amdxdna_dev_info dev_npu2_info;
117117
extern const struct amdxdna_dev_info dev_npu4_info;
118118
extern const struct amdxdna_dev_info dev_npu5_info;
119+
extern const struct amdxdna_dev_info dev_npu6_info;
119120

120121
int amdxdna_sysfs_init(struct amdxdna_dev *xdna);
121122
void amdxdna_sysfs_fini(struct amdxdna_dev *xdna);

drivers/accel/amdxdna/npu6_regs.c

Lines changed: 121 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,121 @@
1+
// SPDX-License-Identifier: GPL-2.0
2+
/*
3+
* Copyright (C) 2024, Advanced Micro Devices, Inc.
4+
*/
5+
6+
#include <drm/amdxdna_accel.h>
7+
#include <drm/drm_device.h>
8+
#include <drm/gpu_scheduler.h>
9+
#include <linux/sizes.h>
10+
11+
#include "aie2_pci.h"
12+
#include "amdxdna_mailbox.h"
13+
#include "amdxdna_pci_drv.h"
14+
15+
/* NPU Public Registers on MpNPUAxiXbar (refer to Diag npu_registers.h) */
#define MPNPU_PUB_SEC_INTR			0x3010060
#define MPNPU_PUB_PWRMGMT_INTR			0x3010064
#define MPNPU_PUB_SCRATCH0			0x301006C
#define MPNPU_PUB_SCRATCH1			0x3010070
#define MPNPU_PUB_SCRATCH2			0x3010074
#define MPNPU_PUB_SCRATCH3			0x3010078
#define MPNPU_PUB_SCRATCH4			0x301007C
#define MPNPU_PUB_SCRATCH5			0x3010080
#define MPNPU_PUB_SCRATCH6			0x3010084
#define MPNPU_PUB_SCRATCH7			0x3010088
#define MPNPU_PUB_SCRATCH8			0x301008C
#define MPNPU_PUB_SCRATCH9			0x3010090
#define MPNPU_PUB_SCRATCH10			0x3010094
#define MPNPU_PUB_SCRATCH11			0x3010098
#define MPNPU_PUB_SCRATCH12			0x301009C
#define MPNPU_PUB_SCRATCH13			0x30100A0
#define MPNPU_PUB_SCRATCH14			0x30100A4
#define MPNPU_PUB_SCRATCH15			0x30100A8

/* MP0 C2PMSG registers; this file uses them for the PSP register table */
#define MP0_C2PMSG_73				0x3810A24
#define MP0_C2PMSG_123				0x3810AEC

/* MP1 C2PMSG registers; this file uses them for the SMU register table */
#define MP1_C2PMSG_0				0x3B10900
#define MP1_C2PMSG_60				0x3B109F0
#define MP1_C2PMSG_61				0x3B109F4

/* Mailbox locations in NPU SRAM */
#define MPNPU_SRAM_X2I_MAILBOX_0		0x3600000
#define MPNPU_SRAM_X2I_MAILBOX_15		0x361E000
#define MPNPU_SRAM_X2I_MAILBOX_31		0x363E000
#define MPNPU_SRAM_I2X_MAILBOX_31		0x363F000

/* Aperture base addresses */
#define MMNPU_APERTURE0_BASE			0x3000000
#define MMNPU_APERTURE1_BASE			0x3600000
#define MMNPU_APERTURE3_BASE			0x3810000
#define MMNPU_APERTURE4_BASE			0x3B10000

/* PCIe BAR index for NPU6, each paired with its associated aperture base */
#define NPU6_REG_BAR_INDEX			0
#define NPU6_REG_BAR_BASE			MMNPU_APERTURE0_BASE

#define NPU6_MBOX_BAR_INDEX			0
#define NPU6_MBOX_BAR_BASE			MMNPU_APERTURE0_BASE

#define NPU6_PSP_BAR_INDEX			4
#define NPU6_PSP_BAR_BASE			MMNPU_APERTURE3_BASE

#define NPU6_SMU_BAR_INDEX			5
#define NPU6_SMU_BAR_BASE			MMNPU_APERTURE4_BASE

#define NPU6_SRAM_BAR_INDEX			2
#define NPU6_SRAM_BAR_BASE			MMNPU_APERTURE1_BASE

/* Runtime configuration: type identifiers */
#define NPU6_RT_CFG_TYPE_PDI_LOAD		5
#define NPU6_RT_CFG_TYPE_DEBUG_BO		10

/* Runtime configuration: values for NPU6_RT_CFG_TYPE_PDI_LOAD */
#define NPU6_RT_CFG_VAL_PDI_LOAD_MGMT		0
#define NPU6_RT_CFG_VAL_PDI_LOAD_APP		1

/* Runtime configuration: values for NPU6_RT_CFG_TYPE_DEBUG_BO */
#define NPU6_RT_CFG_VAL_DEBUG_BO_DEFAULT	0
#define NPU6_RT_CFG_VAL_DEBUG_BO_LARGE		1

/* Clock frequency ceilings (units are not stated in this file) */
#define NPU6_MPNPUCLK_FREQ_MAX			1267
#define NPU6_HCLK_FREQ_MAX			1800
75+
76+
const struct amdxdna_dev_priv npu6_dev_priv = {
77+
.fw_path = "amdnpu/17f0_10/npu.sbin",
78+
.protocol_major = 0x6,
79+
.protocol_minor = 12,
80+
.rt_config = {NPU6_RT_CFG_TYPE_PDI_LOAD, NPU6_RT_CFG_VAL_PDI_LOAD_APP},
81+
.col_align = COL_ALIGN_NATURE,
82+
.mbox_dev_addr = NPU6_MBOX_BAR_BASE,
83+
.mbox_size = 0, /* Use BAR size */
84+
.sram_dev_addr = NPU6_SRAM_BAR_BASE,
85+
.sram_offs = {
86+
DEFINE_BAR_OFFSET(MBOX_CHANN_OFF, NPU6_SRAM, MPNPU_SRAM_X2I_MAILBOX_0),
87+
DEFINE_BAR_OFFSET(FW_ALIVE_OFF, NPU6_SRAM, MPNPU_SRAM_X2I_MAILBOX_15),
88+
},
89+
.psp_regs_off = {
90+
DEFINE_BAR_OFFSET(PSP_CMD_REG, NPU6_PSP, MP0_C2PMSG_123),
91+
DEFINE_BAR_OFFSET(PSP_ARG0_REG, NPU6_REG, MPNPU_PUB_SCRATCH3),
92+
DEFINE_BAR_OFFSET(PSP_ARG1_REG, NPU6_REG, MPNPU_PUB_SCRATCH4),
93+
DEFINE_BAR_OFFSET(PSP_ARG2_REG, NPU6_REG, MPNPU_PUB_SCRATCH9),
94+
DEFINE_BAR_OFFSET(PSP_INTR_REG, NPU6_PSP, MP0_C2PMSG_73),
95+
DEFINE_BAR_OFFSET(PSP_STATUS_REG, NPU6_PSP, MP0_C2PMSG_123),
96+
DEFINE_BAR_OFFSET(PSP_RESP_REG, NPU6_REG, MPNPU_PUB_SCRATCH3),
97+
},
98+
.smu_regs_off = {
99+
DEFINE_BAR_OFFSET(SMU_CMD_REG, NPU6_SMU, MP1_C2PMSG_0),
100+
DEFINE_BAR_OFFSET(SMU_ARG_REG, NPU6_SMU, MP1_C2PMSG_60),
101+
DEFINE_BAR_OFFSET(SMU_INTR_REG, NPU6_SMU, MMNPU_APERTURE4_BASE),
102+
DEFINE_BAR_OFFSET(SMU_RESP_REG, NPU6_SMU, MP1_C2PMSG_61),
103+
DEFINE_BAR_OFFSET(SMU_OUT_REG, NPU6_SMU, MP1_C2PMSG_60),
104+
},
105+
};
106+
107+
const struct amdxdna_dev_info dev_npu6_info = {
108+
.reg_bar = NPU6_REG_BAR_INDEX,
109+
.mbox_bar = NPU6_MBOX_BAR_INDEX,
110+
.sram_bar = NPU6_SRAM_BAR_INDEX,
111+
.psp_bar = NPU6_PSP_BAR_INDEX,
112+
.smu_bar = NPU6_SMU_BAR_INDEX,
113+
.first_col = 0,
114+
.dev_mem_buf_shift = 15, /* 32 KiB aligned */
115+
.dev_mem_base = AIE2_DEVM_BASE,
116+
.dev_mem_size = AIE2_DEVM_SIZE,
117+
.vbnv = "RyzenAI-npu6",
118+
.device_type = AMDXDNA_DEV_TYPE_KMQ,
119+
.dev_priv = &npu6_dev_priv,
120+
.ops = &aie2_ops,
121+
};

0 commit comments

Comments
 (0)