npu1_regs.c 4.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Copyright (C) 2023-2024, Advanced Micro Devices, Inc.
  4. */
  5. #include <drm/amdxdna_accel.h>
  6. #include <drm/drm_device.h>
  7. #include <drm/gpu_scheduler.h>
  8. #include <linux/bits.h>
  9. #include <linux/sizes.h>
  10. #include "aie2_pci.h"
  11. #include "amdxdna_mailbox.h"
  12. #include "amdxdna_pci_drv.h"
  13. /* Address definition from NPU1 docs */
  14. #define MPNPU_PWAITMODE 0x3010034
  15. #define MPNPU_PUB_SEC_INTR 0x3010090
  16. #define MPNPU_PUB_PWRMGMT_INTR 0x3010094
  17. #define MPNPU_PUB_SCRATCH2 0x30100A0
  18. #define MPNPU_PUB_SCRATCH3 0x30100A4
  19. #define MPNPU_PUB_SCRATCH4 0x30100A8
  20. #define MPNPU_PUB_SCRATCH5 0x30100AC
  21. #define MPNPU_PUB_SCRATCH6 0x30100B0
  22. #define MPNPU_PUB_SCRATCH7 0x30100B4
  23. #define MPNPU_PUB_SCRATCH9 0x30100BC
  24. #define MPNPU_SRAM_X2I_MAILBOX_0 0x30A0000
  25. #define MPNPU_SRAM_X2I_MAILBOX_1 0x30A2000
  26. #define MPNPU_SRAM_I2X_MAILBOX_15 0x30BF000
  27. #define MPNPU_APERTURE0_BASE 0x3000000
  28. #define MPNPU_APERTURE1_BASE 0x3080000
  29. #define MPNPU_APERTURE2_BASE 0x30C0000
  30. /* PCIe BAR Index for NPU1 */
  31. #define NPU1_REG_BAR_INDEX 0
  32. #define NPU1_MBOX_BAR_INDEX 4
  33. #define NPU1_PSP_BAR_INDEX 0
  34. #define NPU1_SMU_BAR_INDEX 0
  35. #define NPU1_SRAM_BAR_INDEX 2
  36. /* Associated BARs and Apertures */
  37. #define NPU1_REG_BAR_BASE MPNPU_APERTURE0_BASE
  38. #define NPU1_MBOX_BAR_BASE MPNPU_APERTURE2_BASE
  39. #define NPU1_PSP_BAR_BASE MPNPU_APERTURE0_BASE
  40. #define NPU1_SMU_BAR_BASE MPNPU_APERTURE0_BASE
  41. #define NPU1_SRAM_BAR_BASE MPNPU_APERTURE1_BASE
  42. const struct rt_config npu1_default_rt_cfg[] = {
  43. { 2, 1, AIE2_RT_CFG_INIT }, /* PDI APP LOAD MODE */
  44. { 4, 1, AIE2_RT_CFG_INIT }, /* Debug BO */
  45. { 1, 1, AIE2_RT_CFG_CLK_GATING }, /* Clock gating on */
  46. { 0 },
  47. };
  48. const struct dpm_clk_freq npu1_dpm_clk_table[] = {
  49. {400, 800},
  50. {600, 1024},
  51. {600, 1024},
  52. {600, 1024},
  53. {600, 1024},
  54. {720, 1309},
  55. {720, 1309},
  56. {847, 1600},
  57. { 0 }
  58. };
  59. static const struct aie2_fw_feature_tbl npu1_fw_feature_table[] = {
  60. { .major = 5, .min_minor = 7 },
  61. { .features = BIT_U64(AIE2_NPU_COMMAND), .major = 5, .min_minor = 8 },
  62. { 0 }
  63. };
  64. static const struct amdxdna_dev_priv npu1_dev_priv = {
  65. .fw_path = "amdnpu/1502_00/",
  66. .rt_config = npu1_default_rt_cfg,
  67. .dpm_clk_tbl = npu1_dpm_clk_table,
  68. .fw_feature_tbl = npu1_fw_feature_table,
  69. .col_align = COL_ALIGN_NONE,
  70. .mbox_dev_addr = NPU1_MBOX_BAR_BASE,
  71. .mbox_size = 0, /* Use BAR size */
  72. .sram_dev_addr = NPU1_SRAM_BAR_BASE,
  73. .hwctx_limit = 6,
  74. .sram_offs = {
  75. DEFINE_BAR_OFFSET(MBOX_CHANN_OFF, NPU1_SRAM, MPNPU_SRAM_X2I_MAILBOX_0),
  76. DEFINE_BAR_OFFSET(FW_ALIVE_OFF, NPU1_SRAM, MPNPU_SRAM_I2X_MAILBOX_15),
  77. },
  78. .psp_regs_off = {
  79. DEFINE_BAR_OFFSET(PSP_CMD_REG, NPU1_PSP, MPNPU_PUB_SCRATCH2),
  80. DEFINE_BAR_OFFSET(PSP_ARG0_REG, NPU1_PSP, MPNPU_PUB_SCRATCH3),
  81. DEFINE_BAR_OFFSET(PSP_ARG1_REG, NPU1_PSP, MPNPU_PUB_SCRATCH4),
  82. DEFINE_BAR_OFFSET(PSP_ARG2_REG, NPU1_PSP, MPNPU_PUB_SCRATCH9),
  83. DEFINE_BAR_OFFSET(PSP_INTR_REG, NPU1_PSP, MPNPU_PUB_SEC_INTR),
  84. DEFINE_BAR_OFFSET(PSP_STATUS_REG, NPU1_PSP, MPNPU_PUB_SCRATCH2),
  85. DEFINE_BAR_OFFSET(PSP_RESP_REG, NPU1_PSP, MPNPU_PUB_SCRATCH3),
  86. DEFINE_BAR_OFFSET(PSP_PWAITMODE_REG, NPU1_PSP, MPNPU_PWAITMODE),
  87. },
  88. .smu_regs_off = {
  89. DEFINE_BAR_OFFSET(SMU_CMD_REG, NPU1_SMU, MPNPU_PUB_SCRATCH5),
  90. DEFINE_BAR_OFFSET(SMU_ARG_REG, NPU1_SMU, MPNPU_PUB_SCRATCH7),
  91. DEFINE_BAR_OFFSET(SMU_INTR_REG, NPU1_SMU, MPNPU_PUB_PWRMGMT_INTR),
  92. DEFINE_BAR_OFFSET(SMU_RESP_REG, NPU1_SMU, MPNPU_PUB_SCRATCH6),
  93. DEFINE_BAR_OFFSET(SMU_OUT_REG, NPU1_SMU, MPNPU_PUB_SCRATCH7),
  94. },
  95. .hw_ops = {
  96. .set_dpm = npu1_set_dpm,
  97. },
  98. };
  99. const struct amdxdna_dev_info dev_npu1_info = {
  100. .reg_bar = NPU1_REG_BAR_INDEX,
  101. .mbox_bar = NPU1_MBOX_BAR_INDEX,
  102. .sram_bar = NPU1_SRAM_BAR_INDEX,
  103. .psp_bar = NPU1_PSP_BAR_INDEX,
  104. .smu_bar = NPU1_SMU_BAR_INDEX,
  105. .first_col = 1,
  106. .dev_mem_buf_shift = 15, /* 32 KiB aligned */
  107. .dev_mem_base = AIE2_DEVM_BASE,
  108. .dev_mem_size = AIE2_DEVM_SIZE,
  109. .vbnv = "RyzenAI-npu1",
  110. .device_type = AMDXDNA_DEV_TYPE_KMQ,
  111. .dev_priv = &npu1_dev_priv,
  112. .ops = &aie2_ops,
  113. };