|
| 1 | +// SPDX-License-Identifier: GPL-2.0 |
| 2 | +/* |
| 3 | + * Copyright (C) 2024, Advanced Micro Devices, Inc. |
| 4 | + */ |
| 5 | + |
| 6 | +#include <drm/amdxdna_accel.h> |
| 7 | +#include <drm/drm_device.h> |
| 8 | +#include <drm/gpu_scheduler.h> |
| 9 | +#include <linux/sizes.h> |
| 10 | + |
| 11 | +#include "aie2_pci.h" |
| 12 | +#include "amdxdna_mailbox.h" |
| 13 | +#include "amdxdna_pci_drv.h" |
| 14 | + |
| 15 | +/* NPU Public Registers on MpNPUAxiXbar (refer to Diag npu_registers.h) */ |
| 16 | +#define MPNPU_PUB_SEC_INTR 0x3010060 |
| 17 | +#define MPNPU_PUB_PWRMGMT_INTR 0x3010064 |
| 18 | +#define MPNPU_PUB_SCRATCH0 0x301006C |
| 19 | +#define MPNPU_PUB_SCRATCH1 0x3010070 |
| 20 | +#define MPNPU_PUB_SCRATCH2 0x3010074 |
| 21 | +#define MPNPU_PUB_SCRATCH3 0x3010078 |
| 22 | +#define MPNPU_PUB_SCRATCH4 0x301007C |
| 23 | +#define MPNPU_PUB_SCRATCH5 0x3010080 |
| 24 | +#define MPNPU_PUB_SCRATCH6 0x3010084 |
| 25 | +#define MPNPU_PUB_SCRATCH7 0x3010088 |
| 26 | +#define MPNPU_PUB_SCRATCH8 0x301008C |
| 27 | +#define MPNPU_PUB_SCRATCH9 0x3010090 |
| 28 | +#define MPNPU_PUB_SCRATCH10 0x3010094 |
| 29 | +#define MPNPU_PUB_SCRATCH11 0x3010098 |
| 30 | +#define MPNPU_PUB_SCRATCH12 0x301009C |
| 31 | +#define MPNPU_PUB_SCRATCH13 0x30100A0 |
| 32 | +#define MPNPU_PUB_SCRATCH14 0x30100A4 |
| 33 | +#define MPNPU_PUB_SCRATCH15 0x30100A8 |
| 34 | +#define MP0_C2PMSG_73 0x3810A24 |
| 35 | +#define MP0_C2PMSG_123 0x3810AEC |
| 36 | + |
| 37 | +#define MP1_C2PMSG_0 0x3B10900 |
| 38 | +#define MP1_C2PMSG_60 0x3B109F0 |
| 39 | +#define MP1_C2PMSG_61 0x3B109F4 |
| 40 | + |
| 41 | +#define MPNPU_SRAM_X2I_MAILBOX_0 0x3600000 |
| 42 | +#define MPNPU_SRAM_X2I_MAILBOX_15 0x361E000 |
| 43 | +#define MPNPU_SRAM_X2I_MAILBOX_31 0x363E000 |
| 44 | +#define MPNPU_SRAM_I2X_MAILBOX_31 0x363F000 |
| 45 | + |
| 46 | +#define MMNPU_APERTURE0_BASE 0x3000000 |
| 47 | +#define MMNPU_APERTURE1_BASE 0x3600000 |
| 48 | +#define MMNPU_APERTURE3_BASE 0x3810000 |
| 49 | +#define MMNPU_APERTURE4_BASE 0x3B10000 |
| 50 | + |
| 51 | +/* PCIe BAR Index for NPU6 */ |
| 52 | +#define NPU6_REG_BAR_INDEX 0 |
| 53 | +#define NPU6_MBOX_BAR_INDEX 0 |
| 54 | +#define NPU6_PSP_BAR_INDEX 4 |
| 55 | +#define NPU6_SMU_BAR_INDEX 5 |
| 56 | +#define NPU6_SRAM_BAR_INDEX 2 |
| 57 | +/* Associated BARs and Apertures */ |
| 58 | +#define NPU6_REG_BAR_BASE MMNPU_APERTURE0_BASE |
| 59 | +#define NPU6_MBOX_BAR_BASE MMNPU_APERTURE0_BASE |
| 60 | +#define NPU6_PSP_BAR_BASE MMNPU_APERTURE3_BASE |
| 61 | +#define NPU6_SMU_BAR_BASE MMNPU_APERTURE4_BASE |
| 62 | +#define NPU6_SRAM_BAR_BASE MMNPU_APERTURE1_BASE |
| 63 | + |
| 64 | +#define NPU6_RT_CFG_TYPE_PDI_LOAD 5 |
| 65 | +#define NPU6_RT_CFG_TYPE_DEBUG_BO 10 |
| 66 | + |
| 67 | +#define NPU6_RT_CFG_VAL_PDI_LOAD_MGMT 0 |
| 68 | +#define NPU6_RT_CFG_VAL_PDI_LOAD_APP 1 |
| 69 | + |
| 70 | +#define NPU6_RT_CFG_VAL_DEBUG_BO_DEFAULT 0 |
| 71 | +#define NPU6_RT_CFG_VAL_DEBUG_BO_LARGE 1 |
| 72 | + |
| 73 | +#define NPU6_MPNPUCLK_FREQ_MAX 1267 |
| 74 | +#define NPU6_HCLK_FREQ_MAX 1800 |
| 75 | + |
| 76 | +const struct amdxdna_dev_priv npu6_dev_priv = { |
| 77 | + .fw_path = "amdnpu/17f0_10/npu.sbin", |
| 78 | + .protocol_major = 0x6, |
| 79 | + .protocol_minor = 12, |
| 80 | + .rt_config = {NPU6_RT_CFG_TYPE_PDI_LOAD, NPU6_RT_CFG_VAL_PDI_LOAD_APP}, |
| 81 | + .col_align = COL_ALIGN_NATURE, |
| 82 | + .mbox_dev_addr = NPU6_MBOX_BAR_BASE, |
| 83 | + .mbox_size = 0, /* Use BAR size */ |
| 84 | + .sram_dev_addr = NPU6_SRAM_BAR_BASE, |
| 85 | + .sram_offs = { |
| 86 | + DEFINE_BAR_OFFSET(MBOX_CHANN_OFF, NPU6_SRAM, MPNPU_SRAM_X2I_MAILBOX_0), |
| 87 | + DEFINE_BAR_OFFSET(FW_ALIVE_OFF, NPU6_SRAM, MPNPU_SRAM_X2I_MAILBOX_15), |
| 88 | + }, |
| 89 | + .psp_regs_off = { |
| 90 | + DEFINE_BAR_OFFSET(PSP_CMD_REG, NPU6_PSP, MP0_C2PMSG_123), |
| 91 | + DEFINE_BAR_OFFSET(PSP_ARG0_REG, NPU6_REG, MPNPU_PUB_SCRATCH3), |
| 92 | + DEFINE_BAR_OFFSET(PSP_ARG1_REG, NPU6_REG, MPNPU_PUB_SCRATCH4), |
| 93 | + DEFINE_BAR_OFFSET(PSP_ARG2_REG, NPU6_REG, MPNPU_PUB_SCRATCH9), |
| 94 | + DEFINE_BAR_OFFSET(PSP_INTR_REG, NPU6_PSP, MP0_C2PMSG_73), |
| 95 | + DEFINE_BAR_OFFSET(PSP_STATUS_REG, NPU6_PSP, MP0_C2PMSG_123), |
| 96 | + DEFINE_BAR_OFFSET(PSP_RESP_REG, NPU6_REG, MPNPU_PUB_SCRATCH3), |
| 97 | + }, |
| 98 | + .smu_regs_off = { |
| 99 | + DEFINE_BAR_OFFSET(SMU_CMD_REG, NPU6_SMU, MP1_C2PMSG_0), |
| 100 | + DEFINE_BAR_OFFSET(SMU_ARG_REG, NPU6_SMU, MP1_C2PMSG_60), |
| 101 | + DEFINE_BAR_OFFSET(SMU_INTR_REG, NPU6_SMU, MMNPU_APERTURE4_BASE), |
| 102 | + DEFINE_BAR_OFFSET(SMU_RESP_REG, NPU6_SMU, MP1_C2PMSG_61), |
| 103 | + DEFINE_BAR_OFFSET(SMU_OUT_REG, NPU6_SMU, MP1_C2PMSG_60), |
| 104 | + }, |
| 105 | +}; |
| 106 | + |
| 107 | +const struct amdxdna_dev_info dev_npu6_info = { |
| 108 | + .reg_bar = NPU6_REG_BAR_INDEX, |
| 109 | + .mbox_bar = NPU6_MBOX_BAR_INDEX, |
| 110 | + .sram_bar = NPU6_SRAM_BAR_INDEX, |
| 111 | + .psp_bar = NPU6_PSP_BAR_INDEX, |
| 112 | + .smu_bar = NPU6_SMU_BAR_INDEX, |
| 113 | + .first_col = 0, |
| 114 | + .dev_mem_buf_shift = 15, /* 32 KiB aligned */ |
| 115 | + .dev_mem_base = AIE2_DEVM_BASE, |
| 116 | + .dev_mem_size = AIE2_DEVM_SIZE, |
| 117 | + .vbnv = "RyzenAI-npu6", |
| 118 | + .device_type = AMDXDNA_DEV_TYPE_KMQ, |
| 119 | + .dev_priv = &npu6_dev_priv, |
| 120 | + .ops = &aie2_ops, |
| 121 | +}; |
0 commit comments