18c9ff1b1SLizhi Hou // SPDX-License-Identifier: GPL-2.0 28c9ff1b1SLizhi Hou /* 38c9ff1b1SLizhi Hou * Copyright (C) 2023-2024, Advanced Micro Devices, Inc. 48c9ff1b1SLizhi Hou */ 58c9ff1b1SLizhi Hou 68c9ff1b1SLizhi Hou #include <drm/amdxdna_accel.h> 78c9ff1b1SLizhi Hou #include <drm/drm_device.h> 8aac24309SLizhi Hou #include <drm/gpu_scheduler.h> 98c9ff1b1SLizhi Hou #include <linux/sizes.h> 108c9ff1b1SLizhi Hou 118c9ff1b1SLizhi Hou #include "aie2_pci.h" 12b87f920bSLizhi Hou #include "amdxdna_mailbox.h" 138c9ff1b1SLizhi Hou #include "amdxdna_pci_drv.h" 148c9ff1b1SLizhi Hou 158c9ff1b1SLizhi Hou /* NPU Public Registers on MpNPUAxiXbar (refer to Diag npu_registers.h) */ 168c9ff1b1SLizhi Hou #define MPNPU_PUB_SEC_INTR 0x3010060 178c9ff1b1SLizhi Hou #define MPNPU_PUB_PWRMGMT_INTR 0x3010064 188c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH0 0x301006C 198c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH1 0x3010070 208c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH2 0x3010074 218c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH3 0x3010078 228c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH4 0x301007C 238c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH5 0x3010080 248c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH6 0x3010084 258c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH7 0x3010088 268c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH8 0x301008C 278c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH9 0x3010090 288c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH10 0x3010094 298c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH11 0x3010098 308c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH12 0x301009C 318c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH13 0x30100A0 328c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH14 0x30100A4 338c9ff1b1SLizhi Hou #define MPNPU_PUB_SCRATCH15 0x30100A8 348c9ff1b1SLizhi Hou #define MP0_C2PMSG_73 0x3810A24 358c9ff1b1SLizhi Hou #define MP0_C2PMSG_123 0x3810AEC 368c9ff1b1SLizhi Hou 378c9ff1b1SLizhi Hou #define MP1_C2PMSG_0 0x3B10900 388c9ff1b1SLizhi Hou #define MP1_C2PMSG_60 0x3B109F0 398c9ff1b1SLizhi Hou #define MP1_C2PMSG_61 0x3B109F4 408c9ff1b1SLizhi Hou 418c9ff1b1SLizhi Hou #define MPNPU_SRAM_X2I_MAILBOX_0 0x3600000 428c9ff1b1SLizhi Hou #define MPNPU_SRAM_X2I_MAILBOX_15 0x361E000 438c9ff1b1SLizhi Hou #define MPNPU_SRAM_X2I_MAILBOX_31 0x363E000 448c9ff1b1SLizhi Hou #define MPNPU_SRAM_I2X_MAILBOX_31 0x363F000 458c9ff1b1SLizhi Hou 468c9ff1b1SLizhi Hou #define MMNPU_APERTURE0_BASE 0x3000000 478c9ff1b1SLizhi Hou #define MMNPU_APERTURE1_BASE 0x3600000 488c9ff1b1SLizhi Hou #define MMNPU_APERTURE3_BASE 0x3810000 498c9ff1b1SLizhi Hou #define MMNPU_APERTURE4_BASE 0x3B10000 508c9ff1b1SLizhi Hou 518c9ff1b1SLizhi Hou /* PCIe BAR Index for NPU4 */ 528c9ff1b1SLizhi Hou #define NPU4_REG_BAR_INDEX 0 538c9ff1b1SLizhi Hou #define NPU4_MBOX_BAR_INDEX 0 548c9ff1b1SLizhi Hou #define NPU4_PSP_BAR_INDEX 4 558c9ff1b1SLizhi Hou #define NPU4_SMU_BAR_INDEX 5 568c9ff1b1SLizhi Hou #define NPU4_SRAM_BAR_INDEX 2 578c9ff1b1SLizhi Hou /* Associated BARs and Apertures */ 588c9ff1b1SLizhi Hou #define NPU4_REG_BAR_BASE MMNPU_APERTURE0_BASE 598c9ff1b1SLizhi Hou #define NPU4_MBOX_BAR_BASE MMNPU_APERTURE0_BASE 608c9ff1b1SLizhi Hou #define NPU4_PSP_BAR_BASE MMNPU_APERTURE3_BASE 618c9ff1b1SLizhi Hou #define NPU4_SMU_BAR_BASE MMNPU_APERTURE4_BASE 628c9ff1b1SLizhi Hou #define NPU4_SRAM_BAR_BASE MMNPU_APERTURE1_BASE 638c9ff1b1SLizhi Hou 64f4d7b8a6SLizhi Hou const struct rt_config npu4_default_rt_cfg[] = { 65f4d7b8a6SLizhi Hou { 5, 1, AIE2_RT_CFG_INIT }, /* PDI APP LOAD MODE */ 66f4d7b8a6SLizhi Hou { 1, 1, AIE2_RT_CFG_CLK_GATING }, /* Clock gating on */ 67f4d7b8a6SLizhi Hou { 2, 1, AIE2_RT_CFG_CLK_GATING }, /* Clock gating on */ 68f4d7b8a6SLizhi Hou { 3, 1, AIE2_RT_CFG_CLK_GATING }, /* Clock gating on */ 69f4d7b8a6SLizhi Hou { 4, 1, AIE2_RT_CFG_CLK_GATING }, /* Clock gating on */ 70f4d7b8a6SLizhi Hou { 0 }, 71f4d7b8a6SLizhi Hou }; 728c9ff1b1SLizhi Hou 73f4d7b8a6SLizhi Hou const struct dpm_clk_freq npu4_dpm_clk_table[] = { 74f4d7b8a6SLizhi Hou {396, 792}, 75f4d7b8a6SLizhi Hou {600, 1056}, 76f4d7b8a6SLizhi Hou {792, 1152}, 77f4d7b8a6SLizhi Hou {975, 1267}, 78f4d7b8a6SLizhi Hou {975, 1267}, 79f4d7b8a6SLizhi Hou {1056, 1408}, 80f4d7b8a6SLizhi Hou {1152, 1584}, 81f4d7b8a6SLizhi Hou {1267, 1800}, 82f4d7b8a6SLizhi Hou { 0 } 83f4d7b8a6SLizhi Hou }; 848c9ff1b1SLizhi Hou 85*71486e48SLizhi Hou static const struct amdxdna_dev_priv npu4_dev_priv = { 868c9ff1b1SLizhi Hou .fw_path = "amdnpu/17f0_10/npu.sbin", 878c9ff1b1SLizhi Hou .protocol_major = 0x6, 88b1dcfe62SLizhi Hou .protocol_minor = 12, 89f4d7b8a6SLizhi Hou .rt_config = npu4_default_rt_cfg, 90f4d7b8a6SLizhi Hou .dpm_clk_tbl = npu4_dpm_clk_table, 918c9ff1b1SLizhi Hou .col_align = COL_ALIGN_NATURE, 928c9ff1b1SLizhi Hou .mbox_dev_addr = NPU4_MBOX_BAR_BASE, 938c9ff1b1SLizhi Hou .mbox_size = 0, /* Use BAR size */ 948c9ff1b1SLizhi Hou .sram_dev_addr = NPU4_SRAM_BAR_BASE, 958c9ff1b1SLizhi Hou .sram_offs = { 968c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(MBOX_CHANN_OFF, NPU4_SRAM, MPNPU_SRAM_X2I_MAILBOX_0), 978c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(FW_ALIVE_OFF, NPU4_SRAM, MPNPU_SRAM_X2I_MAILBOX_15), 988c9ff1b1SLizhi Hou }, 998c9ff1b1SLizhi Hou .psp_regs_off = { 1008c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(PSP_CMD_REG, NPU4_PSP, MP0_C2PMSG_123), 1018c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(PSP_ARG0_REG, NPU4_REG, MPNPU_PUB_SCRATCH3), 1028c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(PSP_ARG1_REG, NPU4_REG, MPNPU_PUB_SCRATCH4), 1038c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(PSP_ARG2_REG, NPU4_REG, MPNPU_PUB_SCRATCH9), 1048c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(PSP_INTR_REG, NPU4_PSP, MP0_C2PMSG_73), 1058c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(PSP_STATUS_REG, NPU4_PSP, MP0_C2PMSG_123), 1068c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(PSP_RESP_REG, NPU4_REG, MPNPU_PUB_SCRATCH3), 1078c9ff1b1SLizhi Hou }, 1088c9ff1b1SLizhi Hou .smu_regs_off = { 1098c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(SMU_CMD_REG, NPU4_SMU, MP1_C2PMSG_0), 1108c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(SMU_ARG_REG, NPU4_SMU, MP1_C2PMSG_60), 1118c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(SMU_INTR_REG, NPU4_SMU, MMNPU_APERTURE4_BASE), 1128c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(SMU_RESP_REG, NPU4_SMU, MP1_C2PMSG_61), 1138c9ff1b1SLizhi Hou DEFINE_BAR_OFFSET(SMU_OUT_REG, NPU4_SMU, MP1_C2PMSG_60), 1148c9ff1b1SLizhi Hou }, 115f4d7b8a6SLizhi Hou .hw_ops = { 116f4d7b8a6SLizhi Hou .set_dpm = npu4_set_dpm, 117f4d7b8a6SLizhi Hou }, 1188c9ff1b1SLizhi Hou }; 1198c9ff1b1SLizhi Hou 1208c9ff1b1SLizhi Hou const struct amdxdna_dev_info dev_npu4_info = { 1218c9ff1b1SLizhi Hou .reg_bar = NPU4_REG_BAR_INDEX, 1228c9ff1b1SLizhi Hou .mbox_bar = NPU4_MBOX_BAR_INDEX, 1238c9ff1b1SLizhi Hou .sram_bar = NPU4_SRAM_BAR_INDEX, 1248c9ff1b1SLizhi Hou .psp_bar = NPU4_PSP_BAR_INDEX, 1258c9ff1b1SLizhi Hou .smu_bar = NPU4_SMU_BAR_INDEX, 1268c9ff1b1SLizhi Hou .first_col = 0, 1278c9ff1b1SLizhi Hou .dev_mem_buf_shift = 15, /* 32 KiB aligned */ 1288c9ff1b1SLizhi Hou .dev_mem_base = AIE2_DEVM_BASE, 1298c9ff1b1SLizhi Hou .dev_mem_size = AIE2_DEVM_SIZE, 1308c9ff1b1SLizhi Hou .vbnv = "RyzenAI-npu4", 1318c9ff1b1SLizhi Hou .device_type = AMDXDNA_DEV_TYPE_KMQ, 1328c9ff1b1SLizhi Hou .dev_priv = &npu4_dev_priv, 1338c9ff1b1SLizhi Hou .ops = &aie2_ops, /* NPU4 can share NPU1's callback */ 1348c9ff1b1SLizhi Hou }; 135