// SPDX-License-Identifier: GPL-2.0

/*
 * Copyright 2020-2022 HabanaLabs, Ltd.
 * All Rights Reserved.
 */

#include "gaudi2P.h"
#include "gaudi2_masks.h"
#include "../include/gaudi2/gaudi2_special_blocks.h"
#include "../include/hw_ip/mmu/mmu_general.h"
#include "../include/hw_ip/mmu/mmu_v2_0.h"
#include "../include/gaudi2/gaudi2_packets.h"
#include "../include/gaudi2/gaudi2_reg_map.h"
#include "../include/gaudi2/gaudi2_async_ids_map_extended.h"
#include "../include/gaudi2/arc/gaudi2_arc_common_packets.h"

#include <linux/module.h>
#include <linux/pci.h>
#include <linux/hwmon.h>
#include <linux/iommu.h>

#define GAUDI2_DMA_POOL_BLK_SIZE		SZ_256 /* 256 bytes */

#define GAUDI2_RESET_TIMEOUT_MSEC		2000 /* 2000ms */

#define GAUDI2_RESET_POLL_TIMEOUT_USEC		500000 /* 500ms */
#define GAUDI2_PLDM_HRESET_TIMEOUT_MSEC		25000 /* 25s */
#define GAUDI2_PLDM_SRESET_TIMEOUT_MSEC		25000 /* 25s */
#define GAUDI2_PLDM_RESET_POLL_TIMEOUT_USEC	3000000 /* 3s */
#define GAUDI2_RESET_POLL_CNT			3
#define GAUDI2_RESET_WAIT_MSEC			1 /* 1ms */
#define GAUDI2_CPU_RESET_WAIT_MSEC		100 /* 100ms */
#define GAUDI2_PLDM_RESET_WAIT_MSEC		1000 /* 1s */
#define GAUDI2_CB_POOL_CB_CNT			512
#define GAUDI2_CB_POOL_CB_SIZE			SZ_128K /* 128KB */
#define GAUDI2_MSG_TO_CPU_TIMEOUT_USEC		4000000 /* 4s */
#define GAUDI2_WAIT_FOR_BL_TIMEOUT_USEC		25000000 /* 25s */
#define GAUDI2_TEST_QUEUE_WAIT_USEC		100000 /* 100ms */
#define GAUDI2_PLDM_TEST_QUEUE_WAIT_USEC	1000000 /* 1s */

#define GAUDI2_ALLOC_CPU_MEM_RETRY_CNT		3

/*
 * Since the code already has built-in support for binning of up to MAX_FAULTY_TPCS TPCs
 * and relies on that value (for array sizes etc.), we define another value for the
 * maximum number of faulty TPCs which reflects the cluster binning requirements.
 */
#define MAX_CLUSTER_BINNING_FAULTY_TPCS		1
#define MAX_FAULTY_XBARS			1
#define MAX_FAULTY_EDMAS			1
#define MAX_FAULTY_DECODERS			1

#define GAUDI2_TPC_FULL_MASK			0x1FFFFFF
#define GAUDI2_HIF_HMMU_FULL_MASK		0xFFFF
#define GAUDI2_DECODER_FULL_MASK		0x3FF

#define GAUDI2_NA_EVENT_CAUSE			0xFF
#define GAUDI2_NUM_OF_QM_ERR_CAUSE		18
#define GAUDI2_NUM_OF_LOWER_QM_ERR_CAUSE	25
#define GAUDI2_NUM_OF_QM_ARB_ERR_CAUSE		3
#define GAUDI2_NUM_OF_ARC_SEI_ERR_CAUSE		14
#define GAUDI2_NUM_OF_CPU_SEI_ERR_CAUSE		3
#define GAUDI2_NUM_OF_QM_SEI_ERR_CAUSE		2
#define GAUDI2_NUM_OF_ROT_ERR_CAUSE		22
#define GAUDI2_NUM_OF_TPC_INTR_CAUSE		31
#define GAUDI2_NUM_OF_DEC_ERR_CAUSE		25
#define GAUDI2_NUM_OF_MME_ERR_CAUSE		16
#define GAUDI2_NUM_OF_MME_WAP_ERR_CAUSE		7
#define GAUDI2_NUM_OF_DMA_CORE_INTR_CAUSE	8
#define GAUDI2_NUM_OF_MMU_SPI_SEI_CAUSE		19
#define GAUDI2_NUM_OF_HBM_SEI_CAUSE		9
#define GAUDI2_NUM_OF_SM_SEI_ERR_CAUSE		3
#define GAUDI2_NUM_OF_PCIE_ADDR_DEC_ERR_CAUSE	3
#define GAUDI2_NUM_OF_PMMU_FATAL_ERR_CAUSE	2
#define GAUDI2_NUM_OF_HIF_FATAL_ERR_CAUSE	2
#define GAUDI2_NUM_OF_AXI_DRAIN_ERR_CAUSE	2
#define GAUDI2_NUM_OF_HBM_MC_SPI_CAUSE		5

#define GAUDI2_MMU_CACHE_INV_TIMEOUT_USEC	(MMU_CONFIG_TIMEOUT_USEC * 10)
#define GAUDI2_PLDM_MMU_TIMEOUT_USEC		(MMU_CONFIG_TIMEOUT_USEC * 200)
#define GAUDI2_ARB_WDT_TIMEOUT			(0x1000000)

#define GAUDI2_VDEC_TIMEOUT_USEC		10000 /* 10ms */
#define GAUDI2_PLDM_VDEC_TIMEOUT_USEC		(GAUDI2_VDEC_TIMEOUT_USEC * 100)

#define KDMA_TIMEOUT_USEC			USEC_PER_SEC

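/*
 * Idle/halt helpers: an engine is considered idle when the relevant busy bits
 * in its status register(s) are clear; a QMAN is idle only when its global
 * status, ARC status and CGM status all match the *_IDLE_MASK values below.
 */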
#define IS_DMA_IDLE(dma_core_sts0)	\
	(!((dma_core_sts0) & (DCORE0_EDMA0_CORE_STS0_BUSY_MASK)))

#define IS_DMA_HALTED(dma_core_sts1)	\
	((dma_core_sts1) & (DCORE0_EDMA0_CORE_STS1_IS_HALT_MASK))

#define IS_MME_IDLE(mme_arch_sts) (((mme_arch_sts) & MME_ARCH_IDLE_MASK) == MME_ARCH_IDLE_MASK)

#define IS_TPC_IDLE(tpc_cfg_sts) (((tpc_cfg_sts) & (TPC_IDLE_MASK)) == (TPC_IDLE_MASK))

#define IS_QM_IDLE(qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts) \
	((((qm_glbl_sts0) & (QM_IDLE_MASK)) == (QM_IDLE_MASK)) && \
	(((qm_glbl_sts1) & (QM_ARC_IDLE_MASK)) == (QM_ARC_IDLE_MASK)) && \
	(((qm_cgm_sts) & (CGM_IDLE_MASK)) == (CGM_IDLE_MASK)))

#define PCIE_DEC_EN_MASK			0x300
#define DEC_WORK_STATE_IDLE			0
#define DEC_WORK_STATE_PEND			3
#define IS_DEC_IDLE(dec_swreg15) \
	(((dec_swreg15) & DCORE0_DEC0_CMD_SWREG15_SW_WORK_STATE_MASK) == DEC_WORK_STATE_IDLE || \
	((dec_swreg15) & DCORE0_DEC0_CMD_SWREG15_SW_WORK_STATE_MASK) == DEC_WORK_STATE_PEND)

/* HBM MMU address scrambling parameters */
#define GAUDI2_HBM_MMU_SCRM_MEM_SIZE		SZ_8M
#define GAUDI2_HBM_MMU_SCRM_DIV_SHIFT		26
#define GAUDI2_HBM_MMU_SCRM_MOD_SHIFT		0
#define GAUDI2_HBM_MMU_SCRM_ADDRESS_MASK	DRAM_VA_HINT_MASK
#define GAUDI2_COMPENSATE_TLB_PAGE_SIZE_FACTOR	16
#define MMU_RANGE_INV_VA_LSB_SHIFT		12
#define MMU_RANGE_INV_VA_MSB_SHIFT		44
#define MMU_RANGE_INV_EN_SHIFT			0
#define MMU_RANGE_INV_ASID_EN_SHIFT		1
#define MMU_RANGE_INV_ASID_SHIFT		2

/* The last SPI_SEI cause bit, "burst_fifo_full", is expected to be triggered in PMMU because it has
 * a 2-entry FIFO, and hence it is not enabled for it.
 */
#define GAUDI2_PMMU_SPI_SEI_ENABLE_MASK		GENMASK(GAUDI2_NUM_OF_MMU_SPI_SEI_CAUSE - 2, 0)
#define GAUDI2_HMMU_SPI_SEI_ENABLE_MASK		GENMASK(GAUDI2_NUM_OF_MMU_SPI_SEI_CAUSE - 1, 0)

#define GAUDI2_MAX_STRING_LEN			64

#define GAUDI2_VDEC_MSIX_ENTRIES		(GAUDI2_IRQ_NUM_SHARED_DEC1_ABNRM - \
							GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM + 1)

#define ENGINE_ID_DCORE_OFFSET (GAUDI2_DCORE1_ENGINE_ID_EDMA_0 - GAUDI2_DCORE0_ENGINE_ID_EDMA_0)

/* RAZWI initiator coordinates */
#define RAZWI_GET_AXUSER_XY(x) \
	((x & 0xF8001FF0) >> 4)

#define RAZWI_GET_AXUSER_LOW_XY(x) \
	((x & 0x00001FF0) >> 4)

#define RAZWI_INITIATOR_AXUER_L_X_SHIFT		0
#define RAZWI_INITIATOR_AXUER_L_X_MASK		0x1F
#define RAZWI_INITIATOR_AXUER_L_Y_SHIFT		5
#define RAZWI_INITIATOR_AXUER_L_Y_MASK		0xF

#define RAZWI_INITIATOR_AXUER_H_X_SHIFT		23
#define RAZWI_INITIATOR_AXUER_H_X_MASK		0x1F

#define RAZWI_INITIATOR_ID_X_Y_LOW(x, y) \
	((((y) & RAZWI_INITIATOR_AXUER_L_Y_MASK) << RAZWI_INITIATOR_AXUER_L_Y_SHIFT) | \
		(((x) & RAZWI_INITIATOR_AXUER_L_X_MASK) << RAZWI_INITIATOR_AXUER_L_X_SHIFT))

#define RAZWI_INITIATOR_ID_X_HIGH(x) \
	(((x) & RAZWI_INITIATOR_AXUER_H_X_MASK) << RAZWI_INITIATOR_AXUER_H_X_SHIFT)

#define RAZWI_INITIATOR_ID_X_Y(xl, yl, xh) \
	(RAZWI_INITIATOR_ID_X_Y_LOW(xl, yl) | RAZWI_INITIATOR_ID_X_HIGH(xh))

#define PSOC_RAZWI_ENG_STR_SIZE			128
#define PSOC_RAZWI_MAX_ENG_PER_RTR		5

/* HW scrambles only bits 0-25 */
#define HW_UNSCRAMBLED_BITS_MASK		GENMASK_ULL(63, 26)

#define GAUDI2_GLBL_ERR_MAX_CAUSE_NUM		17

struct gaudi2_razwi_info {
	u32 axuser_xy;
	u32 rtr_ctrl;
	u16 eng_id;
	char *eng_name;
};

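/*
 * Lookup from a RAZWI initiator's AXUSER X/Y coordinates to the associated
 * RTR control block base, engine ID and printable engine name. The axuser_xy
 * values are built with RAZWI_INITIATOR_ID_X_Y(): low X in bits [4:0], low Y
 * in bits [8:5] and high X in bits [27:23], which lines up with what
 * RAZWI_GET_AXUSER_XY() extracts from the captured AXUSER value
 * (e.g. RAZWI_INITIATOR_ID_X_Y(2, 4, 0) == 0x82). Initiators that do not map
 * to a user-visible engine (PMMU, PCIE, HMMUs) use GAUDI2_ENGINE_ID_SIZE as
 * their engine ID.
 */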
static struct gaudi2_razwi_info common_razwi_info[] = {
	{RAZWI_INITIATOR_ID_X_Y(2, 4, 0), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_DEC_0, "DEC0"},
	{RAZWI_INITIATOR_ID_X_Y(2, 4, 4), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_DEC_1, "DEC1"},
	{RAZWI_INITIATOR_ID_X_Y(17, 4, 18), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_DEC_0, "DEC2"},
	{RAZWI_INITIATOR_ID_X_Y(17, 4, 14), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_DEC_1, "DEC3"},
	{RAZWI_INITIATOR_ID_X_Y(2, 11, 0), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_DEC_0, "DEC4"},
	{RAZWI_INITIATOR_ID_X_Y(2, 11, 4), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_DEC_1, "DEC5"},
	{RAZWI_INITIATOR_ID_X_Y(17, 11, 18), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_DEC_0, "DEC6"},
	{RAZWI_INITIATOR_ID_X_Y(17, 11, 14), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_DEC_1, "DEC7"},
	{RAZWI_INITIATOR_ID_X_Y(2, 4, 6), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_PCIE_ENGINE_ID_DEC_0, "DEC8"},
	{RAZWI_INITIATOR_ID_X_Y(2, 4, 7), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_PCIE_ENGINE_ID_DEC_0, "DEC9"},
	{RAZWI_INITIATOR_ID_X_Y(3, 4, 2), mmDCORE0_RTR1_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_TPC_0, "TPC0"},
	{RAZWI_INITIATOR_ID_X_Y(3, 4, 4), mmDCORE0_RTR1_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_TPC_1, "TPC1"},
	{RAZWI_INITIATOR_ID_X_Y(4, 4, 2), mmDCORE0_RTR2_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_TPC_2, "TPC2"},
	{RAZWI_INITIATOR_ID_X_Y(4, 4, 4), mmDCORE0_RTR2_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_TPC_3, "TPC3"},
	{RAZWI_INITIATOR_ID_X_Y(5, 4, 2), mmDCORE0_RTR3_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_TPC_4, "TPC4"},
	{RAZWI_INITIATOR_ID_X_Y(5, 4, 4), mmDCORE0_RTR3_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_TPC_5, "TPC5"},
	{RAZWI_INITIATOR_ID_X_Y(16, 4, 14), mmDCORE1_RTR6_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_TPC_0, "TPC6"},
	{RAZWI_INITIATOR_ID_X_Y(16, 4, 16), mmDCORE1_RTR6_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_TPC_1, "TPC7"},
	{RAZWI_INITIATOR_ID_X_Y(15, 4, 14), mmDCORE1_RTR5_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_TPC_2, "TPC8"},
	{RAZWI_INITIATOR_ID_X_Y(15, 4, 16), mmDCORE1_RTR5_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_TPC_3, "TPC9"},
	{RAZWI_INITIATOR_ID_X_Y(14, 4, 14), mmDCORE1_RTR4_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_TPC_4, "TPC10"},
	{RAZWI_INITIATOR_ID_X_Y(14, 4, 16), mmDCORE1_RTR4_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_TPC_5, "TPC11"},
	{RAZWI_INITIATOR_ID_X_Y(5, 11, 2), mmDCORE2_RTR3_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_TPC_0, "TPC12"},
	{RAZWI_INITIATOR_ID_X_Y(5, 11, 4), mmDCORE2_RTR3_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_TPC_1, "TPC13"},
	{RAZWI_INITIATOR_ID_X_Y(4, 11, 2), mmDCORE2_RTR2_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_TPC_2, "TPC14"},
	{RAZWI_INITIATOR_ID_X_Y(4, 11, 4), mmDCORE2_RTR2_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_TPC_3, "TPC15"},
	{RAZWI_INITIATOR_ID_X_Y(3, 11, 2), mmDCORE2_RTR1_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_TPC_4, "TPC16"},
	{RAZWI_INITIATOR_ID_X_Y(3, 11, 4), mmDCORE2_RTR1_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_TPC_5, "TPC17"},
	{RAZWI_INITIATOR_ID_X_Y(14, 11, 14), mmDCORE3_RTR4_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_TPC_0, "TPC18"},
	{RAZWI_INITIATOR_ID_X_Y(14, 11, 16), mmDCORE3_RTR4_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_TPC_1, "TPC19"},
	{RAZWI_INITIATOR_ID_X_Y(15, 11, 14), mmDCORE3_RTR5_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_TPC_2, "TPC20"},
	{RAZWI_INITIATOR_ID_X_Y(15, 11, 16), mmDCORE3_RTR5_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_TPC_3, "TPC21"},
	{RAZWI_INITIATOR_ID_X_Y(16, 11, 14), mmDCORE3_RTR6_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_TPC_4, "TPC22"},
	{RAZWI_INITIATOR_ID_X_Y(16, 11, 16), mmDCORE3_RTR6_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_TPC_5, "TPC23"},
	{RAZWI_INITIATOR_ID_X_Y(2, 4, 2), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_TPC_5, "TPC24"},
	{RAZWI_INITIATOR_ID_X_Y(17, 4, 8), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC0_0, "NIC0"},
	{RAZWI_INITIATOR_ID_X_Y(17, 4, 10), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC0_1, "NIC1"},
	{RAZWI_INITIATOR_ID_X_Y(17, 4, 12), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC1_0, "NIC2"},
	{RAZWI_INITIATOR_ID_X_Y(17, 4, 14), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC1_1, "NIC3"},
	{RAZWI_INITIATOR_ID_X_Y(17, 4, 15), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC2_0, "NIC4"},
	{RAZWI_INITIATOR_ID_X_Y(2, 11, 2), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC2_1, "NIC5"},
	{RAZWI_INITIATOR_ID_X_Y(2, 11, 4), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC3_0, "NIC6"},
	{RAZWI_INITIATOR_ID_X_Y(2, 11, 6), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC3_1, "NIC7"},
	{RAZWI_INITIATOR_ID_X_Y(2, 11, 8), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC4_0, "NIC8"},
	{RAZWI_INITIATOR_ID_X_Y(17, 11, 12), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC4_1, "NIC9"},
	{RAZWI_INITIATOR_ID_X_Y(17, 11, 14), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC5_0, "NIC10"},
	{RAZWI_INITIATOR_ID_X_Y(17, 11, 16), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_NIC5_1, "NIC11"},
	{RAZWI_INITIATOR_ID_X_Y(2, 4, 2), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_PDMA_0, "PDMA0"},
	{RAZWI_INITIATOR_ID_X_Y(2, 4, 3), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_PDMA_1, "PDMA1"},
	{RAZWI_INITIATOR_ID_X_Y(2, 4, 4), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "PMMU"},
	{RAZWI_INITIATOR_ID_X_Y(2, 4, 5), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "PCIE"},
	{RAZWI_INITIATOR_ID_X_Y(17, 4, 16), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_ARC_FARM, "ARC_FARM"},
	{RAZWI_INITIATOR_ID_X_Y(17, 4, 17), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_KDMA, "KDMA"},
	{RAZWI_INITIATOR_ID_X_Y(1, 5, 1), mmSFT0_HBW_RTR_IF1_RTR_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_EDMA_0, "EDMA0"},
	{RAZWI_INITIATOR_ID_X_Y(1, 5, 1), mmSFT0_HBW_RTR_IF0_RTR_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_EDMA_1, "EDMA1"},
	{RAZWI_INITIATOR_ID_X_Y(18, 5, 18), mmSFT1_HBW_RTR_IF1_RTR_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_EDMA_0, "EDMA2"},
	{RAZWI_INITIATOR_ID_X_Y(18, 5, 18), mmSFT1_HBW_RTR_IF0_RTR_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_EDMA_1, "EDMA3"},
	{RAZWI_INITIATOR_ID_X_Y(1, 10, 1), mmSFT2_HBW_RTR_IF0_RTR_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_EDMA_0, "EDMA4"},
	{RAZWI_INITIATOR_ID_X_Y(1, 10, 1), mmSFT2_HBW_RTR_IF1_RTR_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_EDMA_1, "EDMA5"},
	{RAZWI_INITIATOR_ID_X_Y(18, 10, 18), mmSFT2_HBW_RTR_IF0_RTR_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_EDMA_0, "EDMA6"},
	{RAZWI_INITIATOR_ID_X_Y(18, 10, 18), mmSFT2_HBW_RTR_IF1_RTR_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_EDMA_1, "EDMA7"},
	{RAZWI_INITIATOR_ID_X_Y(1, 5, 0), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU0"},
	{RAZWI_INITIATOR_ID_X_Y(18, 5, 19), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU1"},
	{RAZWI_INITIATOR_ID_X_Y(1, 5, 0), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU2"},
	{RAZWI_INITIATOR_ID_X_Y(18, 5, 19), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU3"},
	{RAZWI_INITIATOR_ID_X_Y(1, 5, 0), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU4"},
	{RAZWI_INITIATOR_ID_X_Y(18, 5, 19), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU5"},
	{RAZWI_INITIATOR_ID_X_Y(1, 5, 0), mmDCORE0_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU6"},
	{RAZWI_INITIATOR_ID_X_Y(18, 5, 19), mmDCORE1_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU7"},
	{RAZWI_INITIATOR_ID_X_Y(1, 10, 0), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU8"},
	{RAZWI_INITIATOR_ID_X_Y(18, 10, 19), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU9"},
	{RAZWI_INITIATOR_ID_X_Y(1, 10, 0), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU10"},
	{RAZWI_INITIATOR_ID_X_Y(18, 10, 19), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU11"},
	{RAZWI_INITIATOR_ID_X_Y(1, 10, 0), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU12"},
	{RAZWI_INITIATOR_ID_X_Y(18, 10, 19), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU13"},
	{RAZWI_INITIATOR_ID_X_Y(1, 10, 0), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU14"},
	{RAZWI_INITIATOR_ID_X_Y(18, 10, 19), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_SIZE, "HMMU15"},
	{RAZWI_INITIATOR_ID_X_Y(2, 11, 2), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_ROT_0, "ROT0"},
	{RAZWI_INITIATOR_ID_X_Y(17, 11, 16), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_ROT_1, "ROT1"},
	{RAZWI_INITIATOR_ID_X_Y(2, 11, 2), mmDCORE2_RTR0_CTRL_BASE,
		GAUDI2_ENGINE_ID_PSOC, "CPU"},
	{RAZWI_INITIATOR_ID_X_Y(17, 11, 11), mmDCORE3_RTR7_CTRL_BASE,
		GAUDI2_ENGINE_ID_PSOC, "PSOC"}
};

static struct gaudi2_razwi_info mme_razwi_info[] = {
	/* MME X high coordinate is N/A, hence using only low coordinates */
	{RAZWI_INITIATOR_ID_X_Y_LOW(7, 4), mmDCORE0_RTR5_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_MME, "MME0_WAP0"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(9, 4), mmDCORE0_RTR7_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_MME, "MME0_WAP1"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(8, 4), mmDCORE0_RTR6_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_MME, "MME0_CTRL_WR"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(9, 4), mmDCORE0_RTR7_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_MME, "MME0_CTRL_RD"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(6, 4), mmDCORE0_RTR4_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_MME, "MME0_SBTE0"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(6, 4), mmDCORE0_RTR4_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_MME, "MME0_SBTE1"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(7, 4), mmDCORE0_RTR5_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_MME, "MME0_SBTE2"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(8, 4), mmDCORE0_RTR6_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_MME, "MME0_SBTE3"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(9, 4), mmDCORE0_RTR7_CTRL_BASE,
		GAUDI2_DCORE0_ENGINE_ID_MME, "MME0_SBTE4"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(12, 4), mmDCORE1_RTR2_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_MME, "MME1_WAP0"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(10, 4), mmDCORE1_RTR0_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_MME, "MME1_WAP1"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(11, 4), mmDCORE1_RTR1_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_MME, "MME1_CTRL_WR"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(10, 4), mmDCORE1_RTR0_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_MME, "MME1_CTRL_RD"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(13, 4), mmDCORE1_RTR3_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_MME, "MME1_SBTE0"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(13, 4), mmDCORE1_RTR3_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_MME, "MME1_SBTE1"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(12, 4), mmDCORE1_RTR2_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_MME, "MME1_SBTE2"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(11, 4), mmDCORE1_RTR1_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_MME, "MME1_SBTE3"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(10, 4), mmDCORE1_RTR0_CTRL_BASE,
		GAUDI2_DCORE1_ENGINE_ID_MME, "MME1_SBTE4"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(7, 11), mmDCORE2_RTR5_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_MME, "MME2_WAP0"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(9, 11), mmDCORE2_RTR7_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_MME, "MME2_WAP1"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(8, 11), mmDCORE2_RTR6_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_MME, "MME2_CTRL_WR"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(9, 11), mmDCORE2_RTR7_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_MME, "MME2_CTRL_RD"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(6, 11), mmDCORE2_RTR4_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_MME, "MME2_SBTE0"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(6, 11), mmDCORE2_RTR4_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_MME, "MME2_SBTE1"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(7, 11), mmDCORE2_RTR5_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_MME, "MME2_SBTE2"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(8, 11), mmDCORE2_RTR6_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_MME, "MME2_SBTE3"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(9, 11), mmDCORE2_RTR7_CTRL_BASE,
		GAUDI2_DCORE2_ENGINE_ID_MME, "MME2_SBTE4"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(12, 11), mmDCORE3_RTR2_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_MME, "MME3_WAP0"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(10, 11), mmDCORE3_RTR0_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_MME, "MME3_WAP1"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(11, 11), mmDCORE3_RTR1_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_MME, "MME3_CTRL_WR"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(10, 11), mmDCORE3_RTR0_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_MME, "MME3_CTRL_RD"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(13, 11), mmDCORE3_RTR3_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_MME, "MME3_SBTE0"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(13, 11), mmDCORE3_RTR3_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_MME, "MME3_SBTE1"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(12, 11), mmDCORE3_RTR2_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_MME, "MME3_SBTE2"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(11, 11), mmDCORE3_RTR1_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_MME, "MME3_SBTE3"},
	{RAZWI_INITIATOR_ID_X_Y_LOW(10, 11), mmDCORE3_RTR0_CTRL_BASE,
		GAUDI2_DCORE3_ENGINE_ID_MME, "MME3_SBTE4"}
};

enum hl_pmmu_fatal_cause {
	LATENCY_RD_OUT_FIFO_OVERRUN,
	LATENCY_WR_OUT_FIFO_OVERRUN,
};

enum hl_pcie_drain_ind_cause {
	LBW_AXI_DRAIN_IND,
	HBW_AXI_DRAIN_IND
};

static const u32 cluster_hmmu_hif_enabled_mask[GAUDI2_HBM_NUM] = {
	[HBM_ID0] = 0xFFFC,
	[HBM_ID1] = 0xFFCF,
	[HBM_ID2] = 0xF7F7,
	[HBM_ID3] = 0x7F7F,
	[HBM_ID4] = 0xFCFF,
	[HBM_ID5] = 0xCFFF,
};

static const u8 xbar_edge_to_hbm_cluster[EDMA_ID_SIZE] = {
	[0] = HBM_ID0,
	[1] = HBM_ID1,
	[2] = HBM_ID4,
	[3] = HBM_ID5,
};

static const u8 edma_to_hbm_cluster[EDMA_ID_SIZE] = {
	[EDMA_ID_DCORE0_INSTANCE0] = HBM_ID0,
	[EDMA_ID_DCORE0_INSTANCE1] = HBM_ID2,
	[EDMA_ID_DCORE1_INSTANCE0] = HBM_ID1,
	[EDMA_ID_DCORE1_INSTANCE1] = HBM_ID3,
	[EDMA_ID_DCORE2_INSTANCE0] = HBM_ID2,
	[EDMA_ID_DCORE2_INSTANCE1] = HBM_ID4,
	[EDMA_ID_DCORE3_INSTANCE0] = HBM_ID3,
	[EDMA_ID_DCORE3_INSTANCE1] = HBM_ID5,
};

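/*
 * Async event ID reported for each queue's QMAN: the four hardware queues of
 * a QMAN all map to the same QM event.
 */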
static const int gaudi2_qman_async_event_id[] = {
	[GAUDI2_QUEUE_ID_PDMA_0_0] = GAUDI2_EVENT_PDMA0_QM,
	[GAUDI2_QUEUE_ID_PDMA_0_1] = GAUDI2_EVENT_PDMA0_QM,
	[GAUDI2_QUEUE_ID_PDMA_0_2] = GAUDI2_EVENT_PDMA0_QM,
	[GAUDI2_QUEUE_ID_PDMA_0_3] = GAUDI2_EVENT_PDMA0_QM,
	[GAUDI2_QUEUE_ID_PDMA_1_0] = GAUDI2_EVENT_PDMA1_QM,
	[GAUDI2_QUEUE_ID_PDMA_1_1] = GAUDI2_EVENT_PDMA1_QM,
	[GAUDI2_QUEUE_ID_PDMA_1_2] = GAUDI2_EVENT_PDMA1_QM,
	[GAUDI2_QUEUE_ID_PDMA_1_3] = GAUDI2_EVENT_PDMA1_QM,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0] = GAUDI2_EVENT_HDMA0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_0_1] = GAUDI2_EVENT_HDMA0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_0_2] = GAUDI2_EVENT_HDMA0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_0_3] = GAUDI2_EVENT_HDMA0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_1_0] = GAUDI2_EVENT_HDMA1_QM,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_1_1] = GAUDI2_EVENT_HDMA1_QM,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_1_2] = GAUDI2_EVENT_HDMA1_QM,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_1_3] = GAUDI2_EVENT_HDMA1_QM,
	[GAUDI2_QUEUE_ID_DCORE0_MME_0_0] = GAUDI2_EVENT_MME0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_MME_0_1] = GAUDI2_EVENT_MME0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_MME_0_2] = GAUDI2_EVENT_MME0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_MME_0_3] = GAUDI2_EVENT_MME0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_0_0] = GAUDI2_EVENT_TPC0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_0_1] = GAUDI2_EVENT_TPC0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_0_2] = GAUDI2_EVENT_TPC0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_0_3] = GAUDI2_EVENT_TPC0_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_1_0] = GAUDI2_EVENT_TPC1_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_1_1] = GAUDI2_EVENT_TPC1_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_1_2] = GAUDI2_EVENT_TPC1_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_1_3] = GAUDI2_EVENT_TPC1_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_2_0] = GAUDI2_EVENT_TPC2_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_2_1] = GAUDI2_EVENT_TPC2_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_2_2] = GAUDI2_EVENT_TPC2_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_2_3] = GAUDI2_EVENT_TPC2_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_3_0] = GAUDI2_EVENT_TPC3_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_3_1] = GAUDI2_EVENT_TPC3_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_3_2] = GAUDI2_EVENT_TPC3_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_3_3] = GAUDI2_EVENT_TPC3_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_4_0] = GAUDI2_EVENT_TPC4_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_4_1] = GAUDI2_EVENT_TPC4_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_4_2] = GAUDI2_EVENT_TPC4_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_4_3] = GAUDI2_EVENT_TPC4_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_5_0] = GAUDI2_EVENT_TPC5_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_5_1] = GAUDI2_EVENT_TPC5_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_5_2] = GAUDI2_EVENT_TPC5_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_5_3] = GAUDI2_EVENT_TPC5_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_6_0] = GAUDI2_EVENT_TPC24_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_6_1] = GAUDI2_EVENT_TPC24_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_6_2] = GAUDI2_EVENT_TPC24_QM,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_6_3] = GAUDI2_EVENT_TPC24_QM,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0] = GAUDI2_EVENT_HDMA2_QM,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_0_1] = GAUDI2_EVENT_HDMA2_QM,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_0_2] = GAUDI2_EVENT_HDMA2_QM,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_0_3] = GAUDI2_EVENT_HDMA2_QM,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_1_0] = GAUDI2_EVENT_HDMA3_QM,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_1_1] = GAUDI2_EVENT_HDMA3_QM,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_1_2] = GAUDI2_EVENT_HDMA3_QM,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_1_3] = GAUDI2_EVENT_HDMA3_QM,
	[GAUDI2_QUEUE_ID_DCORE1_MME_0_0] = GAUDI2_EVENT_MME1_QM,
	[GAUDI2_QUEUE_ID_DCORE1_MME_0_1] = GAUDI2_EVENT_MME1_QM,
	[GAUDI2_QUEUE_ID_DCORE1_MME_0_2] = GAUDI2_EVENT_MME1_QM,
	[GAUDI2_QUEUE_ID_DCORE1_MME_0_3] = GAUDI2_EVENT_MME1_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_0_0] = GAUDI2_EVENT_TPC6_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_0_1] = GAUDI2_EVENT_TPC6_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_0_2] = GAUDI2_EVENT_TPC6_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_0_3] = GAUDI2_EVENT_TPC6_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_1_0] = GAUDI2_EVENT_TPC7_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_1_1] = GAUDI2_EVENT_TPC7_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_1_2] = GAUDI2_EVENT_TPC7_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_1_3] = GAUDI2_EVENT_TPC7_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_2_0] = GAUDI2_EVENT_TPC8_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_2_1] = GAUDI2_EVENT_TPC8_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_2_2] = GAUDI2_EVENT_TPC8_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_2_3] = GAUDI2_EVENT_TPC8_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_3_0] = GAUDI2_EVENT_TPC9_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_3_1] = GAUDI2_EVENT_TPC9_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_3_2] = GAUDI2_EVENT_TPC9_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_3_3] = GAUDI2_EVENT_TPC9_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_4_0] = GAUDI2_EVENT_TPC10_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_4_1] = GAUDI2_EVENT_TPC10_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_4_2] = GAUDI2_EVENT_TPC10_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_4_3] = GAUDI2_EVENT_TPC10_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_5_0] = GAUDI2_EVENT_TPC11_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_5_1] = GAUDI2_EVENT_TPC11_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_5_2] = GAUDI2_EVENT_TPC11_QM,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_5_3] = GAUDI2_EVENT_TPC11_QM,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0] = GAUDI2_EVENT_HDMA4_QM,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_0_1] = GAUDI2_EVENT_HDMA4_QM,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_0_2] = GAUDI2_EVENT_HDMA4_QM,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_0_3] = GAUDI2_EVENT_HDMA4_QM,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_1_0] = GAUDI2_EVENT_HDMA5_QM,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_1_1] = GAUDI2_EVENT_HDMA5_QM,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_1_2] = GAUDI2_EVENT_HDMA5_QM,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_1_3] = GAUDI2_EVENT_HDMA5_QM,
	[GAUDI2_QUEUE_ID_DCORE2_MME_0_0] = GAUDI2_EVENT_MME2_QM,
	[GAUDI2_QUEUE_ID_DCORE2_MME_0_1] = GAUDI2_EVENT_MME2_QM,
	[GAUDI2_QUEUE_ID_DCORE2_MME_0_2] = GAUDI2_EVENT_MME2_QM,
	[GAUDI2_QUEUE_ID_DCORE2_MME_0_3] = GAUDI2_EVENT_MME2_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_0_0] = GAUDI2_EVENT_TPC12_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_0_1] = GAUDI2_EVENT_TPC12_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_0_2] = GAUDI2_EVENT_TPC12_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_0_3] = GAUDI2_EVENT_TPC12_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_1_0] = GAUDI2_EVENT_TPC13_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_1_1] = GAUDI2_EVENT_TPC13_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_1_2] = GAUDI2_EVENT_TPC13_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_1_3] = GAUDI2_EVENT_TPC13_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_2_0] = GAUDI2_EVENT_TPC14_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_2_1] = GAUDI2_EVENT_TPC14_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_2_2] = GAUDI2_EVENT_TPC14_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_2_3] = GAUDI2_EVENT_TPC14_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_3_0] = GAUDI2_EVENT_TPC15_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_3_1] = GAUDI2_EVENT_TPC15_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_3_2] = GAUDI2_EVENT_TPC15_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_3_3] = GAUDI2_EVENT_TPC15_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_4_0] = GAUDI2_EVENT_TPC16_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_4_1] = GAUDI2_EVENT_TPC16_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_4_2] = GAUDI2_EVENT_TPC16_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_4_3] = GAUDI2_EVENT_TPC16_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_5_0] = GAUDI2_EVENT_TPC17_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_5_1] = GAUDI2_EVENT_TPC17_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_5_2] = GAUDI2_EVENT_TPC17_QM,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_5_3] = GAUDI2_EVENT_TPC17_QM,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0] = GAUDI2_EVENT_HDMA6_QM,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_0_1] = GAUDI2_EVENT_HDMA6_QM,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_0_2] = GAUDI2_EVENT_HDMA6_QM,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_0_3] = GAUDI2_EVENT_HDMA6_QM,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_0] = GAUDI2_EVENT_HDMA7_QM,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_1] = GAUDI2_EVENT_HDMA7_QM,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_2] = GAUDI2_EVENT_HDMA7_QM,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_3] = GAUDI2_EVENT_HDMA7_QM,
	[GAUDI2_QUEUE_ID_DCORE3_MME_0_0] = GAUDI2_EVENT_MME3_QM,
	[GAUDI2_QUEUE_ID_DCORE3_MME_0_1] = GAUDI2_EVENT_MME3_QM,
	[GAUDI2_QUEUE_ID_DCORE3_MME_0_2] = GAUDI2_EVENT_MME3_QM,
	[GAUDI2_QUEUE_ID_DCORE3_MME_0_3] = GAUDI2_EVENT_MME3_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_0_0] = GAUDI2_EVENT_TPC18_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_0_1] = GAUDI2_EVENT_TPC18_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_0_2] = GAUDI2_EVENT_TPC18_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_0_3] = GAUDI2_EVENT_TPC18_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_1_0] = GAUDI2_EVENT_TPC19_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_1_1] = GAUDI2_EVENT_TPC19_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_1_2] = GAUDI2_EVENT_TPC19_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_1_3] = GAUDI2_EVENT_TPC19_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_2_0] = GAUDI2_EVENT_TPC20_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_2_1] = GAUDI2_EVENT_TPC20_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_2_2] = GAUDI2_EVENT_TPC20_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_2_3] = GAUDI2_EVENT_TPC20_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_3_0] = GAUDI2_EVENT_TPC21_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_3_1] = GAUDI2_EVENT_TPC21_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_3_2] = GAUDI2_EVENT_TPC21_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_3_3] = GAUDI2_EVENT_TPC21_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_4_0] = GAUDI2_EVENT_TPC22_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_4_1] = GAUDI2_EVENT_TPC22_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_4_2] = GAUDI2_EVENT_TPC22_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_4_3] = GAUDI2_EVENT_TPC22_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_5_0] = GAUDI2_EVENT_TPC23_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_5_1] = GAUDI2_EVENT_TPC23_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_5_2] = GAUDI2_EVENT_TPC23_QM,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_5_3] = GAUDI2_EVENT_TPC23_QM,
	[GAUDI2_QUEUE_ID_NIC_0_0] = GAUDI2_EVENT_NIC0_QM0,
	[GAUDI2_QUEUE_ID_NIC_0_1] = GAUDI2_EVENT_NIC0_QM0,
	[GAUDI2_QUEUE_ID_NIC_0_2] = GAUDI2_EVENT_NIC0_QM0,
	[GAUDI2_QUEUE_ID_NIC_0_3] = GAUDI2_EVENT_NIC0_QM0,
	[GAUDI2_QUEUE_ID_NIC_1_0] = GAUDI2_EVENT_NIC0_QM1,
	[GAUDI2_QUEUE_ID_NIC_1_1] = GAUDI2_EVENT_NIC0_QM1,
	[GAUDI2_QUEUE_ID_NIC_1_2] = GAUDI2_EVENT_NIC0_QM1,
	[GAUDI2_QUEUE_ID_NIC_1_3] = GAUDI2_EVENT_NIC0_QM1,
	[GAUDI2_QUEUE_ID_NIC_2_0] = GAUDI2_EVENT_NIC1_QM0,
	[GAUDI2_QUEUE_ID_NIC_2_1] = GAUDI2_EVENT_NIC1_QM0,
	[GAUDI2_QUEUE_ID_NIC_2_2] = GAUDI2_EVENT_NIC1_QM0,
	[GAUDI2_QUEUE_ID_NIC_2_3] = GAUDI2_EVENT_NIC1_QM0,
	[GAUDI2_QUEUE_ID_NIC_3_0] = GAUDI2_EVENT_NIC1_QM1,
	[GAUDI2_QUEUE_ID_NIC_3_1] = GAUDI2_EVENT_NIC1_QM1,
	[GAUDI2_QUEUE_ID_NIC_3_2] = GAUDI2_EVENT_NIC1_QM1,
	[GAUDI2_QUEUE_ID_NIC_3_3] = GAUDI2_EVENT_NIC1_QM1,
	[GAUDI2_QUEUE_ID_NIC_4_0] = GAUDI2_EVENT_NIC2_QM0,
	[GAUDI2_QUEUE_ID_NIC_4_1] = GAUDI2_EVENT_NIC2_QM0,
	[GAUDI2_QUEUE_ID_NIC_4_2] = GAUDI2_EVENT_NIC2_QM0,
	[GAUDI2_QUEUE_ID_NIC_4_3] = GAUDI2_EVENT_NIC2_QM0,
	[GAUDI2_QUEUE_ID_NIC_5_0] = GAUDI2_EVENT_NIC2_QM1,
	[GAUDI2_QUEUE_ID_NIC_5_1] = GAUDI2_EVENT_NIC2_QM1,
	[GAUDI2_QUEUE_ID_NIC_5_2] = GAUDI2_EVENT_NIC2_QM1,
	[GAUDI2_QUEUE_ID_NIC_5_3] = GAUDI2_EVENT_NIC2_QM1,
	[GAUDI2_QUEUE_ID_NIC_6_0] = GAUDI2_EVENT_NIC3_QM0,
	[GAUDI2_QUEUE_ID_NIC_6_1] = GAUDI2_EVENT_NIC3_QM0,
	[GAUDI2_QUEUE_ID_NIC_6_2] = GAUDI2_EVENT_NIC3_QM0,
	[GAUDI2_QUEUE_ID_NIC_6_3] = GAUDI2_EVENT_NIC3_QM0,
	[GAUDI2_QUEUE_ID_NIC_7_0] = GAUDI2_EVENT_NIC3_QM1,
	[GAUDI2_QUEUE_ID_NIC_7_1] = GAUDI2_EVENT_NIC3_QM1,
	[GAUDI2_QUEUE_ID_NIC_7_2] = GAUDI2_EVENT_NIC3_QM1,
	[GAUDI2_QUEUE_ID_NIC_7_3] = GAUDI2_EVENT_NIC3_QM1,
	[GAUDI2_QUEUE_ID_NIC_8_0] = GAUDI2_EVENT_NIC4_QM0,
	[GAUDI2_QUEUE_ID_NIC_8_1] = GAUDI2_EVENT_NIC4_QM0,
	[GAUDI2_QUEUE_ID_NIC_8_2] = GAUDI2_EVENT_NIC4_QM0,
	[GAUDI2_QUEUE_ID_NIC_8_3] = GAUDI2_EVENT_NIC4_QM0,
	[GAUDI2_QUEUE_ID_NIC_9_0] = GAUDI2_EVENT_NIC4_QM1,
	[GAUDI2_QUEUE_ID_NIC_9_1] = GAUDI2_EVENT_NIC4_QM1,
	[GAUDI2_QUEUE_ID_NIC_9_2] = GAUDI2_EVENT_NIC4_QM1,
	[GAUDI2_QUEUE_ID_NIC_9_3] = GAUDI2_EVENT_NIC4_QM1,
	[GAUDI2_QUEUE_ID_NIC_10_0] = GAUDI2_EVENT_NIC5_QM0,
	[GAUDI2_QUEUE_ID_NIC_10_1] = GAUDI2_EVENT_NIC5_QM0,
	[GAUDI2_QUEUE_ID_NIC_10_2] = GAUDI2_EVENT_NIC5_QM0,
	[GAUDI2_QUEUE_ID_NIC_10_3] = GAUDI2_EVENT_NIC5_QM0,
	[GAUDI2_QUEUE_ID_NIC_11_0] = GAUDI2_EVENT_NIC5_QM1,
	[GAUDI2_QUEUE_ID_NIC_11_1] = GAUDI2_EVENT_NIC5_QM1,
	[GAUDI2_QUEUE_ID_NIC_11_2] = GAUDI2_EVENT_NIC5_QM1,
	[GAUDI2_QUEUE_ID_NIC_11_3] = GAUDI2_EVENT_NIC5_QM1,
	[GAUDI2_QUEUE_ID_NIC_12_0] = GAUDI2_EVENT_NIC6_QM0,
	[GAUDI2_QUEUE_ID_NIC_12_1] = GAUDI2_EVENT_NIC6_QM0,
	[GAUDI2_QUEUE_ID_NIC_12_2] = GAUDI2_EVENT_NIC6_QM0,
	[GAUDI2_QUEUE_ID_NIC_12_3] = GAUDI2_EVENT_NIC6_QM0,
	[GAUDI2_QUEUE_ID_NIC_13_0] = GAUDI2_EVENT_NIC6_QM1,
	[GAUDI2_QUEUE_ID_NIC_13_1] = GAUDI2_EVENT_NIC6_QM1,
	[GAUDI2_QUEUE_ID_NIC_13_2] = GAUDI2_EVENT_NIC6_QM1,
	[GAUDI2_QUEUE_ID_NIC_13_3] = GAUDI2_EVENT_NIC6_QM1,
	[GAUDI2_QUEUE_ID_NIC_14_0] = GAUDI2_EVENT_NIC7_QM0,
	[GAUDI2_QUEUE_ID_NIC_14_1] = GAUDI2_EVENT_NIC7_QM0,
	[GAUDI2_QUEUE_ID_NIC_14_2] = GAUDI2_EVENT_NIC7_QM0,
	[GAUDI2_QUEUE_ID_NIC_14_3] = GAUDI2_EVENT_NIC7_QM0,
	[GAUDI2_QUEUE_ID_NIC_15_0] = GAUDI2_EVENT_NIC7_QM1,
	[GAUDI2_QUEUE_ID_NIC_15_1] = GAUDI2_EVENT_NIC7_QM1,
	[GAUDI2_QUEUE_ID_NIC_15_2] = GAUDI2_EVENT_NIC7_QM1,
	[GAUDI2_QUEUE_ID_NIC_15_3] = GAUDI2_EVENT_NIC7_QM1,
	[GAUDI2_QUEUE_ID_NIC_16_0] = GAUDI2_EVENT_NIC8_QM0,
	[GAUDI2_QUEUE_ID_NIC_16_1] = GAUDI2_EVENT_NIC8_QM0,
	[GAUDI2_QUEUE_ID_NIC_16_2] = GAUDI2_EVENT_NIC8_QM0,
	[GAUDI2_QUEUE_ID_NIC_16_3] = GAUDI2_EVENT_NIC8_QM0,
	[GAUDI2_QUEUE_ID_NIC_17_0] = GAUDI2_EVENT_NIC8_QM1,
	[GAUDI2_QUEUE_ID_NIC_17_1] = GAUDI2_EVENT_NIC8_QM1,
	[GAUDI2_QUEUE_ID_NIC_17_2] = GAUDI2_EVENT_NIC8_QM1,
	[GAUDI2_QUEUE_ID_NIC_17_3] = GAUDI2_EVENT_NIC8_QM1,
	[GAUDI2_QUEUE_ID_NIC_18_0] = GAUDI2_EVENT_NIC9_QM0,
	[GAUDI2_QUEUE_ID_NIC_18_1] = GAUDI2_EVENT_NIC9_QM0,
	[GAUDI2_QUEUE_ID_NIC_18_2] = GAUDI2_EVENT_NIC9_QM0,
	[GAUDI2_QUEUE_ID_NIC_18_3] = GAUDI2_EVENT_NIC9_QM0,
	[GAUDI2_QUEUE_ID_NIC_19_0] = GAUDI2_EVENT_NIC9_QM1,
	[GAUDI2_QUEUE_ID_NIC_19_1] = GAUDI2_EVENT_NIC9_QM1,
	[GAUDI2_QUEUE_ID_NIC_19_2] = GAUDI2_EVENT_NIC9_QM1,
	[GAUDI2_QUEUE_ID_NIC_19_3] = GAUDI2_EVENT_NIC9_QM1,
	[GAUDI2_QUEUE_ID_NIC_20_0] = GAUDI2_EVENT_NIC10_QM0,
	[GAUDI2_QUEUE_ID_NIC_20_1] = GAUDI2_EVENT_NIC10_QM0,
	[GAUDI2_QUEUE_ID_NIC_20_2] = GAUDI2_EVENT_NIC10_QM0,
	[GAUDI2_QUEUE_ID_NIC_20_3] = GAUDI2_EVENT_NIC10_QM0,
	[GAUDI2_QUEUE_ID_NIC_21_0] = GAUDI2_EVENT_NIC10_QM1,
	[GAUDI2_QUEUE_ID_NIC_21_1] = GAUDI2_EVENT_NIC10_QM1,
	[GAUDI2_QUEUE_ID_NIC_21_2] = GAUDI2_EVENT_NIC10_QM1,
	[GAUDI2_QUEUE_ID_NIC_21_3] = GAUDI2_EVENT_NIC10_QM1,
	[GAUDI2_QUEUE_ID_NIC_22_0] = GAUDI2_EVENT_NIC11_QM0,
	[GAUDI2_QUEUE_ID_NIC_22_1] = GAUDI2_EVENT_NIC11_QM0,
	[GAUDI2_QUEUE_ID_NIC_22_2] = GAUDI2_EVENT_NIC11_QM0,
	[GAUDI2_QUEUE_ID_NIC_22_3] = GAUDI2_EVENT_NIC11_QM0,
	[GAUDI2_QUEUE_ID_NIC_23_0] = GAUDI2_EVENT_NIC11_QM1,
	[GAUDI2_QUEUE_ID_NIC_23_1] = GAUDI2_EVENT_NIC11_QM1,
	[GAUDI2_QUEUE_ID_NIC_23_2] = GAUDI2_EVENT_NIC11_QM1,
	[GAUDI2_QUEUE_ID_NIC_23_3] = GAUDI2_EVENT_NIC11_QM1,
	[GAUDI2_QUEUE_ID_ROT_0_0] = GAUDI2_EVENT_ROTATOR0_ROT0_QM,
	[GAUDI2_QUEUE_ID_ROT_0_1] = GAUDI2_EVENT_ROTATOR0_ROT0_QM,
	[GAUDI2_QUEUE_ID_ROT_0_2] = GAUDI2_EVENT_ROTATOR0_ROT0_QM,
	[GAUDI2_QUEUE_ID_ROT_0_3] = GAUDI2_EVENT_ROTATOR0_ROT0_QM,
	[GAUDI2_QUEUE_ID_ROT_1_0] = GAUDI2_EVENT_ROTATOR1_ROT1_QM,
	[GAUDI2_QUEUE_ID_ROT_1_1] = GAUDI2_EVENT_ROTATOR1_ROT1_QM,
	[GAUDI2_QUEUE_ID_ROT_1_2] = GAUDI2_EVENT_ROTATOR1_ROT1_QM,
	[GAUDI2_QUEUE_ID_ROT_1_3] = GAUDI2_EVENT_ROTATOR1_ROT1_QM
};

static const int gaudi2_dma_core_async_event_id[] = {
	[DMA_CORE_ID_EDMA0] = GAUDI2_EVENT_HDMA0_CORE,
	[DMA_CORE_ID_EDMA1] = GAUDI2_EVENT_HDMA1_CORE,
	[DMA_CORE_ID_EDMA2] = GAUDI2_EVENT_HDMA2_CORE,
	[DMA_CORE_ID_EDMA3] = GAUDI2_EVENT_HDMA3_CORE,
	[DMA_CORE_ID_EDMA4] = GAUDI2_EVENT_HDMA4_CORE,
	[DMA_CORE_ID_EDMA5] = GAUDI2_EVENT_HDMA5_CORE,
	[DMA_CORE_ID_EDMA6] = GAUDI2_EVENT_HDMA6_CORE,
	[DMA_CORE_ID_EDMA7] = GAUDI2_EVENT_HDMA7_CORE,
	[DMA_CORE_ID_PDMA0] = GAUDI2_EVENT_PDMA0_CORE,
	[DMA_CORE_ID_PDMA1] = GAUDI2_EVENT_PDMA1_CORE,
	[DMA_CORE_ID_KDMA] = GAUDI2_EVENT_KDMA0_CORE,
};

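/*
 * Human-readable cause strings for the various error/SEI interrupts; each
 * array is sized by the matching GAUDI2_NUM_OF_*_CAUSE define above.
 */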
static const char * const gaudi2_qm_sei_error_cause[GAUDI2_NUM_OF_QM_SEI_ERR_CAUSE] = {
	"qman sei intr",
	"arc sei intr"
};

static const char * const gaudi2_cpu_sei_error_cause[GAUDI2_NUM_OF_CPU_SEI_ERR_CAUSE] = {
	"AXI_TERMINATOR WR",
	"AXI_TERMINATOR RD",
	"AXI SPLIT SEI Status"
};

static const char * const gaudi2_arc_sei_error_cause[GAUDI2_NUM_OF_ARC_SEI_ERR_CAUSE] = {
	"cbu_bresp_sei_intr_cause",
	"cbu_rresp_sei_intr_cause",
	"lbu_bresp_sei_intr_cause",
	"lbu_rresp_sei_intr_cause",
	"cbu_axi_split_intr_cause",
	"lbu_axi_split_intr_cause",
	"arc_ip_excptn_sei_intr_cause",
	"dmi_bresp_sei_intr_cause",
	"aux2apb_err_sei_intr_cause",
	"cfg_lbw_wr_terminated_intr_cause",
	"cfg_lbw_rd_terminated_intr_cause",
	"cfg_dccm_wr_terminated_intr_cause",
	"cfg_dccm_rd_terminated_intr_cause",
	"cfg_hbw_rd_terminated_intr_cause"
};

static const char * const gaudi2_dec_error_cause[GAUDI2_NUM_OF_DEC_ERR_CAUSE] = {
	"msix_vcd_hbw_sei",
	"msix_l2c_hbw_sei",
	"msix_nrm_hbw_sei",
	"msix_abnrm_hbw_sei",
	"msix_vcd_lbw_sei",
	"msix_l2c_lbw_sei",
	"msix_nrm_lbw_sei",
	"msix_abnrm_lbw_sei",
	"apb_vcd_lbw_sei",
	"apb_l2c_lbw_sei",
	"apb_nrm_lbw_sei",
	"apb_abnrm_lbw_sei",
	"dec_sei",
	"dec_apb_sei",
	"trc_apb_sei",
	"lbw_mstr_if_sei",
	"axi_split_bresp_err_sei",
	"hbw_axi_wr_viol_sei",
	"hbw_axi_rd_viol_sei",
	"lbw_axi_wr_viol_sei",
	"lbw_axi_rd_viol_sei",
	"vcd_spi",
	"l2c_spi",
	"nrm_spi",
	"abnrm_spi",
};

static const char * const gaudi2_qman_error_cause[GAUDI2_NUM_OF_QM_ERR_CAUSE] = {
	"PQ AXI HBW error",
	"CQ AXI HBW error",
	"CP AXI HBW error",
	"CP error due to undefined OPCODE",
	"CP encountered STOP OPCODE",
	"CP AXI LBW error",
	"CP WRREG32 or WRBULK returned error",
	"N/A",
	"FENCE 0 inc over max value and clipped",
	"FENCE 1 inc over max value and clipped",
	"FENCE 2 inc over max value and clipped",
	"FENCE 3 inc over max value and clipped",
	"FENCE 0 dec under min value and clipped",
	"FENCE 1 dec under min value and clipped",
	"FENCE 2 dec under min value and clipped",
	"FENCE 3 dec under min value and clipped",
	"CPDMA Up overflow",
	"PQC L2H error"
};

static const char * const gaudi2_lower_qman_error_cause[GAUDI2_NUM_OF_LOWER_QM_ERR_CAUSE] = {
	"RSVD0",
	"CQ AXI HBW error",
	"CP AXI HBW error",
	"CP error due to undefined OPCODE",
	"CP encountered STOP OPCODE",
	"CP AXI LBW error",
	"CP WRREG32 or WRBULK returned error",
	"N/A",
	"FENCE 0 inc over max value and clipped",
	"FENCE 1 inc over max value and clipped",
	"FENCE 2 inc over max value and clipped",
	"FENCE 3 inc over max value and clipped",
	"FENCE 0 dec under min value and clipped",
	"FENCE 1 dec under min value and clipped",
	"FENCE 2 dec under min value and clipped",
	"FENCE 3 dec under min value and clipped",
	"CPDMA Up overflow",
	"RSVD17",
	"CQ_WR_IFIFO_CI_ERR",
	"CQ_WR_CTL_CI_ERR",
	"ARC_CQF_RD_ERR",
	"ARC_CQ_WR_IFIFO_CI_ERR",
	"ARC_CQ_WR_CTL_CI_ERR",
	"ARC_AXI_ERR",
	"CP_SWITCH_WDT_ERR"
};

static const char * const gaudi2_qman_arb_error_cause[GAUDI2_NUM_OF_QM_ARB_ERR_CAUSE] = {
	"Choice push while full error",
	"Choice Q watchdog error",
	"MSG AXI LBW returned with error"
};

static const char * const guadi2_rot_error_cause[GAUDI2_NUM_OF_ROT_ERR_CAUSE] = {
	"qm_axi_err",
	"qm_trace_fence_events",
	"qm_sw_err",
	"qm_cp_sw_stop",
	"lbw_mstr_rresp_err",
	"lbw_mstr_bresp_err",
	"lbw_msg_slverr",
	"hbw_msg_slverr",
	"wbc_slverr",
	"hbw_mstr_rresp_err",
	"hbw_mstr_bresp_err",
	"sb_resp_intr",
	"mrsb_resp_intr",
	"core_dw_status_0",
	"core_dw_status_1",
	"core_dw_status_2",
	"core_dw_status_3",
	"core_dw_status_4",
	"core_dw_status_5",
	"core_dw_status_6",
	"core_dw_status_7",
	"async_arc2cpu_sei_intr",
};

static const char * const gaudi2_tpc_interrupts_cause[GAUDI2_NUM_OF_TPC_INTR_CAUSE] = {
	"tpc_address_exceed_slm",
	"tpc_div_by_0",
	"tpc_spu_mac_overflow",
	"tpc_spu_addsub_overflow",
	"tpc_spu_abs_overflow",
	"tpc_spu_fma_fp_dst_nan",
	"tpc_spu_fma_fp_dst_inf",
	"tpc_spu_convert_fp_dst_nan",
	"tpc_spu_convert_fp_dst_inf",
	"tpc_spu_fp_dst_denorm",
	"tpc_vpu_mac_overflow",
	"tpc_vpu_addsub_overflow",
	"tpc_vpu_abs_overflow",
	"tpc_vpu_convert_fp_dst_nan",
	"tpc_vpu_convert_fp_dst_inf",
	"tpc_vpu_fma_fp_dst_nan",
	"tpc_vpu_fma_fp_dst_inf",
	"tpc_vpu_fp_dst_denorm",
	"tpc_assertions",
	"tpc_illegal_instruction",
	"tpc_pc_wrap_around",
	"tpc_qm_sw_err",
	"tpc_hbw_rresp_err",
	"tpc_hbw_bresp_err",
	"tpc_lbw_rresp_err",
	"tpc_lbw_bresp_err",
	"st_unlock_already_locked",
	"invalid_lock_access",
	"LD_L protection violation",
	"ST_L protection violation",
	"D$ L0CS mismatch",
};

static const char * const guadi2_mme_error_cause[GAUDI2_NUM_OF_MME_ERR_CAUSE] = {
	"agu_resp_intr",
	"qman_axi_err",
	"wap sei (wbc axi err)",
	"arc sei",
	"cfg access error",
	"qm_sw_err",
	"sbte_dbg_intr_0",
	"sbte_dbg_intr_1",
	"sbte_dbg_intr_2",
	"sbte_dbg_intr_3",
	"sbte_dbg_intr_4",
	"sbte_prtn_intr_0",
	"sbte_prtn_intr_1",
	"sbte_prtn_intr_2",
	"sbte_prtn_intr_3",
	"sbte_prtn_intr_4",
};

static const char * const guadi2_mme_wap_error_cause[GAUDI2_NUM_OF_MME_WAP_ERR_CAUSE] = {
	"WBC ERR RESP_0",
	"WBC ERR RESP_1",
	"AP SOURCE POS INF",
	"AP SOURCE NEG INF",
	"AP SOURCE NAN",
	"AP RESULT POS INF",
	"AP RESULT NEG INF",
};

static const char * const gaudi2_dma_core_interrupts_cause[GAUDI2_NUM_OF_DMA_CORE_INTR_CAUSE] = {
	"HBW Read returned with error RRESP",
	"HBW write returned with error BRESP",
	"LBW write returned with error BRESP",
	"descriptor_fifo_overflow",
	"KDMA SB LBW Read returned with error",
	"KDMA WBC LBW Write returned with error",
	"TRANSPOSE ENGINE DESC FIFO OVERFLOW",
	"WRONG CFG FOR COMMIT IN LIN DMA"
};

static const char * const gaudi2_kdma_core_interrupts_cause[GAUDI2_NUM_OF_DMA_CORE_INTR_CAUSE] = {
	"HBW/LBW Read returned with error RRESP",
	"HBW/LBW write returned with error BRESP",
	"LBW write returned with error BRESP",
	"descriptor_fifo_overflow",
	"KDMA SB LBW Read returned with error",
	"KDMA WBC LBW Write returned with error",
	"TRANSPOSE ENGINE DESC FIFO OVERFLOW",
	"WRONG CFG FOR COMMIT IN LIN DMA"
};

struct gaudi2_sm_sei_cause_data {
	const char *cause_name;
	const char *log_name;
};

static const struct gaudi2_sm_sei_cause_data
gaudi2_sm_sei_cause[GAUDI2_NUM_OF_SM_SEI_ERR_CAUSE] = {
	{"calculated SO value overflow/underflow", "SOB ID"},
	{"payload address of monitor is not aligned to 4B", "monitor addr"},
	{"armed monitor write got BRESP (SLVERR or DECERR)", "AXI id"},
};

static const char * const
gaudi2_pmmu_fatal_interrupts_cause[GAUDI2_NUM_OF_PMMU_FATAL_ERR_CAUSE] = {
	"LATENCY_RD_OUT_FIFO_OVERRUN",
	"LATENCY_WR_OUT_FIFO_OVERRUN",
};

static const char * const
gaudi2_hif_fatal_interrupts_cause[GAUDI2_NUM_OF_HIF_FATAL_ERR_CAUSE] = {
	"LATENCY_RD_OUT_FIFO_OVERRUN",
	"LATENCY_WR_OUT_FIFO_OVERRUN",
};

static const char * const
gaudi2_psoc_axi_drain_interrupts_cause[GAUDI2_NUM_OF_AXI_DRAIN_ERR_CAUSE] = {
	"AXI drain HBW",
	"AXI drain LBW",
};

static const char * const
gaudi2_pcie_addr_dec_error_cause[GAUDI2_NUM_OF_PCIE_ADDR_DEC_ERR_CAUSE] = {
	"HBW error response",
	"LBW error response",
	"TLP is blocked by RR"
};

static const int gaudi2_queue_id_to_engine_id[] = {
	[GAUDI2_QUEUE_ID_PDMA_0_0...GAUDI2_QUEUE_ID_PDMA_0_3] = GAUDI2_ENGINE_ID_PDMA_0,
	[GAUDI2_QUEUE_ID_PDMA_1_0...GAUDI2_QUEUE_ID_PDMA_1_3] = GAUDI2_ENGINE_ID_PDMA_1,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE0_EDMA_0_3] =
							GAUDI2_DCORE0_ENGINE_ID_EDMA_0,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_1_0...GAUDI2_QUEUE_ID_DCORE0_EDMA_1_3] =
							GAUDI2_DCORE0_ENGINE_ID_EDMA_1,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE1_EDMA_0_3] =
							GAUDI2_DCORE1_ENGINE_ID_EDMA_0,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_1_0...GAUDI2_QUEUE_ID_DCORE1_EDMA_1_3] =
							GAUDI2_DCORE1_ENGINE_ID_EDMA_1,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE2_EDMA_0_3] =
							GAUDI2_DCORE2_ENGINE_ID_EDMA_0,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_1_0...GAUDI2_QUEUE_ID_DCORE2_EDMA_1_3] =
							GAUDI2_DCORE2_ENGINE_ID_EDMA_1,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE3_EDMA_0_3] =
							GAUDI2_DCORE3_ENGINE_ID_EDMA_0,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_0...GAUDI2_QUEUE_ID_DCORE3_EDMA_1_3] =
							GAUDI2_DCORE3_ENGINE_ID_EDMA_1,
	[GAUDI2_QUEUE_ID_DCORE0_MME_0_0...GAUDI2_QUEUE_ID_DCORE0_MME_0_3] =
							GAUDI2_DCORE0_ENGINE_ID_MME,
	[GAUDI2_QUEUE_ID_DCORE1_MME_0_0...GAUDI2_QUEUE_ID_DCORE1_MME_0_3] =
							GAUDI2_DCORE1_ENGINE_ID_MME,
	[GAUDI2_QUEUE_ID_DCORE2_MME_0_0...GAUDI2_QUEUE_ID_DCORE2_MME_0_3] =
							GAUDI2_DCORE2_ENGINE_ID_MME,
	[GAUDI2_QUEUE_ID_DCORE3_MME_0_0...GAUDI2_QUEUE_ID_DCORE3_MME_0_3] =
							GAUDI2_DCORE3_ENGINE_ID_MME,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_0_0...GAUDI2_QUEUE_ID_DCORE0_TPC_0_3] =
							GAUDI2_DCORE0_ENGINE_ID_TPC_0,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_1_0...GAUDI2_QUEUE_ID_DCORE0_TPC_1_3] =
							GAUDI2_DCORE0_ENGINE_ID_TPC_1,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_2_0...GAUDI2_QUEUE_ID_DCORE0_TPC_2_3] =
							GAUDI2_DCORE0_ENGINE_ID_TPC_2,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_3_0...GAUDI2_QUEUE_ID_DCORE0_TPC_3_3] =
							GAUDI2_DCORE0_ENGINE_ID_TPC_3,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_4_0...GAUDI2_QUEUE_ID_DCORE0_TPC_4_3] =
							GAUDI2_DCORE0_ENGINE_ID_TPC_4,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_5_0...GAUDI2_QUEUE_ID_DCORE0_TPC_5_3] =
							GAUDI2_DCORE0_ENGINE_ID_TPC_5,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_6_0...GAUDI2_QUEUE_ID_DCORE0_TPC_6_3] =
							GAUDI2_DCORE0_ENGINE_ID_TPC_6,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_0_0...GAUDI2_QUEUE_ID_DCORE1_TPC_0_3] =
							GAUDI2_DCORE1_ENGINE_ID_TPC_0,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_1_0...GAUDI2_QUEUE_ID_DCORE1_TPC_1_3] =
							GAUDI2_DCORE1_ENGINE_ID_TPC_1,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_2_0...GAUDI2_QUEUE_ID_DCORE1_TPC_2_3] =
							GAUDI2_DCORE1_ENGINE_ID_TPC_2,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_3_0...GAUDI2_QUEUE_ID_DCORE1_TPC_3_3] =
							GAUDI2_DCORE1_ENGINE_ID_TPC_3,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_4_0...GAUDI2_QUEUE_ID_DCORE1_TPC_4_3] =
							GAUDI2_DCORE1_ENGINE_ID_TPC_4,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_5_0...GAUDI2_QUEUE_ID_DCORE1_TPC_5_3] =
							GAUDI2_DCORE1_ENGINE_ID_TPC_5,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_0_0...GAUDI2_QUEUE_ID_DCORE2_TPC_0_3] =
							GAUDI2_DCORE2_ENGINE_ID_TPC_0,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_1_0...GAUDI2_QUEUE_ID_DCORE2_TPC_1_3] =
							GAUDI2_DCORE2_ENGINE_ID_TPC_1,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_2_0...GAUDI2_QUEUE_ID_DCORE2_TPC_2_3] =
							GAUDI2_DCORE2_ENGINE_ID_TPC_2,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_3_0...GAUDI2_QUEUE_ID_DCORE2_TPC_3_3] =
							GAUDI2_DCORE2_ENGINE_ID_TPC_3,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_4_0...GAUDI2_QUEUE_ID_DCORE2_TPC_4_3] =
							GAUDI2_DCORE2_ENGINE_ID_TPC_4,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_5_0...GAUDI2_QUEUE_ID_DCORE2_TPC_5_3] =
							GAUDI2_DCORE2_ENGINE_ID_TPC_5,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_0_0...GAUDI2_QUEUE_ID_DCORE3_TPC_0_3] =
							GAUDI2_DCORE3_ENGINE_ID_TPC_0,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_1_0...GAUDI2_QUEUE_ID_DCORE3_TPC_1_3] =
							GAUDI2_DCORE3_ENGINE_ID_TPC_1,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_2_0...GAUDI2_QUEUE_ID_DCORE3_TPC_2_3] =
							GAUDI2_DCORE3_ENGINE_ID_TPC_2,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_3_0...GAUDI2_QUEUE_ID_DCORE3_TPC_3_3] =
							GAUDI2_DCORE3_ENGINE_ID_TPC_3,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_4_0...GAUDI2_QUEUE_ID_DCORE3_TPC_4_3] =
							GAUDI2_DCORE3_ENGINE_ID_TPC_4,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_5_0...GAUDI2_QUEUE_ID_DCORE3_TPC_5_3] =
							GAUDI2_DCORE3_ENGINE_ID_TPC_5,
	[GAUDI2_QUEUE_ID_NIC_0_0...GAUDI2_QUEUE_ID_NIC_0_3] = GAUDI2_ENGINE_ID_NIC0_0,
	[GAUDI2_QUEUE_ID_NIC_1_0...GAUDI2_QUEUE_ID_NIC_1_3] = GAUDI2_ENGINE_ID_NIC0_1,
	[GAUDI2_QUEUE_ID_NIC_2_0...GAUDI2_QUEUE_ID_NIC_2_3] = GAUDI2_ENGINE_ID_NIC1_0,
	[GAUDI2_QUEUE_ID_NIC_3_0...GAUDI2_QUEUE_ID_NIC_3_3] = GAUDI2_ENGINE_ID_NIC1_1,
	[GAUDI2_QUEUE_ID_NIC_4_0...GAUDI2_QUEUE_ID_NIC_4_3] = GAUDI2_ENGINE_ID_NIC2_0,
	[GAUDI2_QUEUE_ID_NIC_5_0...GAUDI2_QUEUE_ID_NIC_5_3] = GAUDI2_ENGINE_ID_NIC2_1,
	[GAUDI2_QUEUE_ID_NIC_6_0...GAUDI2_QUEUE_ID_NIC_6_3] = GAUDI2_ENGINE_ID_NIC3_0,
	[GAUDI2_QUEUE_ID_NIC_7_0...GAUDI2_QUEUE_ID_NIC_7_3] = GAUDI2_ENGINE_ID_NIC3_1,
	[GAUDI2_QUEUE_ID_NIC_8_0...GAUDI2_QUEUE_ID_NIC_8_3] = GAUDI2_ENGINE_ID_NIC4_0,
	[GAUDI2_QUEUE_ID_NIC_9_0...GAUDI2_QUEUE_ID_NIC_9_3] = GAUDI2_ENGINE_ID_NIC4_1,
	[GAUDI2_QUEUE_ID_NIC_10_0...GAUDI2_QUEUE_ID_NIC_10_3] = GAUDI2_ENGINE_ID_NIC5_0,
	[GAUDI2_QUEUE_ID_NIC_11_0...GAUDI2_QUEUE_ID_NIC_11_3] = GAUDI2_ENGINE_ID_NIC5_1,
	[GAUDI2_QUEUE_ID_NIC_12_0...GAUDI2_QUEUE_ID_NIC_12_3] = GAUDI2_ENGINE_ID_NIC6_0,
	[GAUDI2_QUEUE_ID_NIC_13_0...GAUDI2_QUEUE_ID_NIC_13_3] = GAUDI2_ENGINE_ID_NIC6_1,
	[GAUDI2_QUEUE_ID_NIC_14_0...GAUDI2_QUEUE_ID_NIC_14_3] = GAUDI2_ENGINE_ID_NIC7_0,
	[GAUDI2_QUEUE_ID_NIC_15_0...GAUDI2_QUEUE_ID_NIC_15_3] = GAUDI2_ENGINE_ID_NIC7_1,
	[GAUDI2_QUEUE_ID_NIC_16_0...GAUDI2_QUEUE_ID_NIC_16_3] = GAUDI2_ENGINE_ID_NIC8_0,
	[GAUDI2_QUEUE_ID_NIC_17_0...GAUDI2_QUEUE_ID_NIC_17_3] = GAUDI2_ENGINE_ID_NIC8_1,
	[GAUDI2_QUEUE_ID_NIC_18_0...GAUDI2_QUEUE_ID_NIC_18_3] = GAUDI2_ENGINE_ID_NIC9_0,
	[GAUDI2_QUEUE_ID_NIC_19_0...GAUDI2_QUEUE_ID_NIC_19_3] = GAUDI2_ENGINE_ID_NIC9_1,
	[GAUDI2_QUEUE_ID_NIC_20_0...GAUDI2_QUEUE_ID_NIC_20_3] = GAUDI2_ENGINE_ID_NIC10_0,
	[GAUDI2_QUEUE_ID_NIC_21_0...GAUDI2_QUEUE_ID_NIC_21_3] = GAUDI2_ENGINE_ID_NIC10_1,
	[GAUDI2_QUEUE_ID_NIC_22_0...GAUDI2_QUEUE_ID_NIC_22_3] = GAUDI2_ENGINE_ID_NIC11_0,
	[GAUDI2_QUEUE_ID_NIC_23_0...GAUDI2_QUEUE_ID_NIC_23_3] = GAUDI2_ENGINE_ID_NIC11_1,
	[GAUDI2_QUEUE_ID_ROT_0_0...GAUDI2_QUEUE_ID_ROT_0_3] = GAUDI2_ENGINE_ID_ROT_0,
	[GAUDI2_QUEUE_ID_ROT_1_0...GAUDI2_QUEUE_ID_ROT_1_3] = GAUDI2_ENGINE_ID_ROT_1,
};

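/*
 * QM block MMIO base address for every queue; the four queues of a QMAN share
 * the same base.
 */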
const u32 gaudi2_qm_blocks_bases[GAUDI2_QUEUE_ID_SIZE] = {
	[GAUDI2_QUEUE_ID_PDMA_0_0] = mmPDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_PDMA_0_1] = mmPDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_PDMA_0_2] = mmPDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_PDMA_0_3] = mmPDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_PDMA_1_0] = mmPDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_PDMA_1_1] = mmPDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_PDMA_1_2] = mmPDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_PDMA_1_3] = mmPDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0] = mmDCORE0_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_0_1] = mmDCORE0_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_0_2] = mmDCORE0_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_0_3] = mmDCORE0_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_1_0] = mmDCORE0_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_1_1] = mmDCORE0_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_1_2] = mmDCORE0_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_EDMA_1_3] = mmDCORE0_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_MME_0_0] = mmDCORE0_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_MME_0_1] = mmDCORE0_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_MME_0_2] = mmDCORE0_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_MME_0_3] = mmDCORE0_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_0_0] = mmDCORE0_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_0_1] = mmDCORE0_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_0_2] = mmDCORE0_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_0_3] = mmDCORE0_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_1_0] = mmDCORE0_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_1_1] = mmDCORE0_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_1_2] = mmDCORE0_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_1_3] = mmDCORE0_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_2_0] = mmDCORE0_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_2_1] = mmDCORE0_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_2_2] = mmDCORE0_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_2_3] = mmDCORE0_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_3_0] = mmDCORE0_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_3_1] = mmDCORE0_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_3_2] = mmDCORE0_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_3_3] = mmDCORE0_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_4_0] = mmDCORE0_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_4_1] = mmDCORE0_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_4_2] = mmDCORE0_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_4_3] = mmDCORE0_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_5_0] = mmDCORE0_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_5_1] = mmDCORE0_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_5_2] = mmDCORE0_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_5_3] = mmDCORE0_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_6_0] = mmDCORE0_TPC6_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_6_1] = mmDCORE0_TPC6_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_6_2] = mmDCORE0_TPC6_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE0_TPC_6_3] = mmDCORE0_TPC6_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0] = mmDCORE1_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_0_1] = mmDCORE1_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_0_2] = mmDCORE1_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_0_3] = mmDCORE1_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_1_0] = mmDCORE1_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_1_1] = mmDCORE1_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_1_2] = mmDCORE1_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_EDMA_1_3] = mmDCORE1_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_MME_0_0] = mmDCORE1_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_MME_0_1] = mmDCORE1_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_MME_0_2] = mmDCORE1_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_MME_0_3] = mmDCORE1_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_0_0] = mmDCORE1_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_0_1] = mmDCORE1_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_0_2] = mmDCORE1_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_0_3] = mmDCORE1_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_1_0] = mmDCORE1_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_1_1] = mmDCORE1_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_1_2] = mmDCORE1_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_1_3] = mmDCORE1_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_2_0] = mmDCORE1_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_2_1] = mmDCORE1_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_2_2] = mmDCORE1_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_2_3] = mmDCORE1_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_3_0] = mmDCORE1_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_3_1] = mmDCORE1_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_3_2] = mmDCORE1_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_3_3] = mmDCORE1_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_4_0] = mmDCORE1_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_4_1] = mmDCORE1_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_4_2] = mmDCORE1_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_4_3] = mmDCORE1_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_5_0] = mmDCORE1_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_5_1] = mmDCORE1_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_5_2] = mmDCORE1_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE1_TPC_5_3] = mmDCORE1_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0] = mmDCORE2_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_0_1] = mmDCORE2_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_0_2] = mmDCORE2_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_0_3] = mmDCORE2_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_1_0] = mmDCORE2_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_1_1] = mmDCORE2_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_1_2] = mmDCORE2_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_EDMA_1_3] = mmDCORE2_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_MME_0_0] = mmDCORE2_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_MME_0_1] = mmDCORE2_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_MME_0_2] = mmDCORE2_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_MME_0_3] = mmDCORE2_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_0_0] = mmDCORE2_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_0_1] = mmDCORE2_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_0_2] = mmDCORE2_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_0_3] = mmDCORE2_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_1_0] = mmDCORE2_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_1_1] = mmDCORE2_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_1_2] = mmDCORE2_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_1_3] = mmDCORE2_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_2_0] = mmDCORE2_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_2_1] = mmDCORE2_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_2_2] = mmDCORE2_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_2_3] = mmDCORE2_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_3_0] = mmDCORE2_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_3_1] = mmDCORE2_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_3_2] = mmDCORE2_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_3_3] = mmDCORE2_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_4_0] = mmDCORE2_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_4_1] = mmDCORE2_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_4_2] = mmDCORE2_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_4_3] = mmDCORE2_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_5_0] = mmDCORE2_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_5_1] = mmDCORE2_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_5_2] = mmDCORE2_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE2_TPC_5_3] = mmDCORE2_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0] = mmDCORE3_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_0_1] = mmDCORE3_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_0_2] = mmDCORE3_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_0_3] = mmDCORE3_EDMA0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_0] = mmDCORE3_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_1] = mmDCORE3_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_2] = mmDCORE3_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_3] = mmDCORE3_EDMA1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_MME_0_0] = mmDCORE3_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_MME_0_1] = mmDCORE3_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_MME_0_2] = mmDCORE3_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_MME_0_3] = mmDCORE3_MME_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_0_0] = mmDCORE3_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_0_1] = mmDCORE3_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_0_2] = mmDCORE3_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_0_3] = mmDCORE3_TPC0_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_1_0] = mmDCORE3_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_1_1] = mmDCORE3_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_1_2] = mmDCORE3_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_1_3] = mmDCORE3_TPC1_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_2_0] = mmDCORE3_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_2_1] = mmDCORE3_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_2_2] = mmDCORE3_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_2_3] = mmDCORE3_TPC2_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_3_0] = mmDCORE3_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_3_1] = mmDCORE3_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_3_2] = mmDCORE3_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_3_3] = mmDCORE3_TPC3_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_4_0] = mmDCORE3_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_4_1] = mmDCORE3_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_4_2] = mmDCORE3_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_4_3] = mmDCORE3_TPC4_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_5_0] = mmDCORE3_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_5_1] = mmDCORE3_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_5_2] = mmDCORE3_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_DCORE3_TPC_5_3] = mmDCORE3_TPC5_QM_BASE,
	[GAUDI2_QUEUE_ID_NIC_0_0] = mmNIC0_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_0_1] = mmNIC0_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_0_2] = mmNIC0_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_0_3] = mmNIC0_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_1_0] = mmNIC0_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_1_1] = mmNIC0_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_1_2] = mmNIC0_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_1_3] = mmNIC0_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_2_0] = mmNIC1_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_2_1] = mmNIC1_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_2_2] = mmNIC1_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_2_3] = mmNIC1_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_3_0] = mmNIC1_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_3_1] = mmNIC1_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_3_2] = mmNIC1_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_3_3] = mmNIC1_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_4_0] = mmNIC2_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_4_1] = mmNIC2_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_4_2] = mmNIC2_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_4_3] = mmNIC2_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_5_0] = mmNIC2_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_5_1] = mmNIC2_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_5_2] = mmNIC2_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_5_3] = mmNIC2_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_6_0] = mmNIC3_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_6_1] = mmNIC3_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_6_2] = mmNIC3_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_6_3] = mmNIC3_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_7_0] = mmNIC3_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_7_1] = mmNIC3_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_7_2] = mmNIC3_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_7_3] = mmNIC3_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_8_0] = mmNIC4_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_8_1] = mmNIC4_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_8_2] = mmNIC4_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_8_3] = mmNIC4_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_9_0] = mmNIC4_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_9_1] = mmNIC4_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_9_2] = mmNIC4_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_9_3] = mmNIC4_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_10_0] = mmNIC5_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_10_1] = mmNIC5_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_10_2] = mmNIC5_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_10_3] = mmNIC5_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_11_0] = mmNIC5_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_11_1] = mmNIC5_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_11_2] = mmNIC5_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_11_3] = mmNIC5_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_12_0] = mmNIC6_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_12_1] = mmNIC6_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_12_2] = mmNIC6_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_12_3] = mmNIC6_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_13_0] = mmNIC6_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_13_1] = mmNIC6_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_13_2] = mmNIC6_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_13_3] = mmNIC6_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_14_0] = mmNIC7_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_14_1] = mmNIC7_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_14_2] = mmNIC7_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_14_3] = mmNIC7_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_15_0] = mmNIC7_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_15_1] = mmNIC7_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_15_2] = mmNIC7_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_15_3] = mmNIC7_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_16_0] = mmNIC8_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_16_1] = mmNIC8_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_16_2] = mmNIC8_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_16_3] = mmNIC8_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_17_0] = mmNIC8_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_17_1] = mmNIC8_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_17_2] = mmNIC8_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_17_3] = mmNIC8_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_18_0] = mmNIC9_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_18_1] = mmNIC9_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_18_2] = mmNIC9_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_18_3] = mmNIC9_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_19_0] = mmNIC9_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_19_1] = mmNIC9_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_19_2] = mmNIC9_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_19_3] = mmNIC9_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_20_0] = mmNIC10_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_20_1] = mmNIC10_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_20_2] = mmNIC10_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_20_3] = mmNIC10_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_21_0] = mmNIC10_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_21_1] = mmNIC10_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_21_2] = mmNIC10_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_21_3] = mmNIC10_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_22_0] = mmNIC11_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_22_1] = mmNIC11_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_22_2] = mmNIC11_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_22_3] = mmNIC11_QM0_BASE,
	[GAUDI2_QUEUE_ID_NIC_23_0] = mmNIC11_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_23_1] = mmNIC11_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_23_2] = mmNIC11_QM1_BASE,
	[GAUDI2_QUEUE_ID_NIC_23_3] = mmNIC11_QM1_BASE,
	[GAUDI2_QUEUE_ID_ROT_0_0] = mmROT0_QM_BASE,
	[GAUDI2_QUEUE_ID_ROT_0_1] = mmROT0_QM_BASE,
	[GAUDI2_QUEUE_ID_ROT_0_2] = mmROT0_QM_BASE,
	[GAUDI2_QUEUE_ID_ROT_0_3] = mmROT0_QM_BASE,
	[GAUDI2_QUEUE_ID_ROT_1_0] = mmROT1_QM_BASE,
	[GAUDI2_QUEUE_ID_ROT_1_1] = mmROT1_QM_BASE,
	[GAUDI2_QUEUE_ID_ROT_1_2] = mmROT1_QM_BASE,
	[GAUDI2_QUEUE_ID_ROT_1_3] = mmROT1_QM_BASE
};

mmNIC6_QM1_BASE, 1305 [GAUDI2_QUEUE_ID_NIC_13_2] = mmNIC6_QM1_BASE, 1306 [GAUDI2_QUEUE_ID_NIC_13_3] = mmNIC6_QM1_BASE, 1307 [GAUDI2_QUEUE_ID_NIC_14_0] = mmNIC7_QM0_BASE, 1308 [GAUDI2_QUEUE_ID_NIC_14_1] = mmNIC7_QM0_BASE, 1309 [GAUDI2_QUEUE_ID_NIC_14_2] = mmNIC7_QM0_BASE, 1310 [GAUDI2_QUEUE_ID_NIC_14_3] = mmNIC7_QM0_BASE, 1311 [GAUDI2_QUEUE_ID_NIC_15_0] = mmNIC7_QM1_BASE, 1312 [GAUDI2_QUEUE_ID_NIC_15_1] = mmNIC7_QM1_BASE, 1313 [GAUDI2_QUEUE_ID_NIC_15_2] = mmNIC7_QM1_BASE, 1314 [GAUDI2_QUEUE_ID_NIC_15_3] = mmNIC7_QM1_BASE, 1315 [GAUDI2_QUEUE_ID_NIC_16_0] = mmNIC8_QM0_BASE, 1316 [GAUDI2_QUEUE_ID_NIC_16_1] = mmNIC8_QM0_BASE, 1317 [GAUDI2_QUEUE_ID_NIC_16_2] = mmNIC8_QM0_BASE, 1318 [GAUDI2_QUEUE_ID_NIC_16_3] = mmNIC8_QM0_BASE, 1319 [GAUDI2_QUEUE_ID_NIC_17_0] = mmNIC8_QM1_BASE, 1320 [GAUDI2_QUEUE_ID_NIC_17_1] = mmNIC8_QM1_BASE, 1321 [GAUDI2_QUEUE_ID_NIC_17_2] = mmNIC8_QM1_BASE, 1322 [GAUDI2_QUEUE_ID_NIC_17_3] = mmNIC8_QM1_BASE, 1323 [GAUDI2_QUEUE_ID_NIC_18_0] = mmNIC9_QM0_BASE, 1324 [GAUDI2_QUEUE_ID_NIC_18_1] = mmNIC9_QM0_BASE, 1325 [GAUDI2_QUEUE_ID_NIC_18_2] = mmNIC9_QM0_BASE, 1326 [GAUDI2_QUEUE_ID_NIC_18_3] = mmNIC9_QM0_BASE, 1327 [GAUDI2_QUEUE_ID_NIC_19_0] = mmNIC9_QM1_BASE, 1328 [GAUDI2_QUEUE_ID_NIC_19_1] = mmNIC9_QM1_BASE, 1329 [GAUDI2_QUEUE_ID_NIC_19_2] = mmNIC9_QM1_BASE, 1330 [GAUDI2_QUEUE_ID_NIC_19_3] = mmNIC9_QM1_BASE, 1331 [GAUDI2_QUEUE_ID_NIC_20_0] = mmNIC10_QM0_BASE, 1332 [GAUDI2_QUEUE_ID_NIC_20_1] = mmNIC10_QM0_BASE, 1333 [GAUDI2_QUEUE_ID_NIC_20_2] = mmNIC10_QM0_BASE, 1334 [GAUDI2_QUEUE_ID_NIC_20_3] = mmNIC10_QM0_BASE, 1335 [GAUDI2_QUEUE_ID_NIC_21_0] = mmNIC10_QM1_BASE, 1336 [GAUDI2_QUEUE_ID_NIC_21_1] = mmNIC10_QM1_BASE, 1337 [GAUDI2_QUEUE_ID_NIC_21_2] = mmNIC10_QM1_BASE, 1338 [GAUDI2_QUEUE_ID_NIC_21_3] = mmNIC10_QM1_BASE, 1339 [GAUDI2_QUEUE_ID_NIC_22_0] = mmNIC11_QM0_BASE, 1340 [GAUDI2_QUEUE_ID_NIC_22_1] = mmNIC11_QM0_BASE, 1341 [GAUDI2_QUEUE_ID_NIC_22_2] = mmNIC11_QM0_BASE, 1342 [GAUDI2_QUEUE_ID_NIC_22_3] = mmNIC11_QM0_BASE, 1343 [GAUDI2_QUEUE_ID_NIC_23_0] = mmNIC11_QM1_BASE, 1344 [GAUDI2_QUEUE_ID_NIC_23_1] = mmNIC11_QM1_BASE, 1345 [GAUDI2_QUEUE_ID_NIC_23_2] = mmNIC11_QM1_BASE, 1346 [GAUDI2_QUEUE_ID_NIC_23_3] = mmNIC11_QM1_BASE, 1347 [GAUDI2_QUEUE_ID_ROT_0_0] = mmROT0_QM_BASE, 1348 [GAUDI2_QUEUE_ID_ROT_0_1] = mmROT0_QM_BASE, 1349 [GAUDI2_QUEUE_ID_ROT_0_2] = mmROT0_QM_BASE, 1350 [GAUDI2_QUEUE_ID_ROT_0_3] = mmROT0_QM_BASE, 1351 [GAUDI2_QUEUE_ID_ROT_1_0] = mmROT1_QM_BASE, 1352 [GAUDI2_QUEUE_ID_ROT_1_1] = mmROT1_QM_BASE, 1353 [GAUDI2_QUEUE_ID_ROT_1_2] = mmROT1_QM_BASE, 1354 [GAUDI2_QUEUE_ID_ROT_1_3] = mmROT1_QM_BASE 1355 }; 1356 1357 static const u32 gaudi2_arc_blocks_bases[NUM_ARC_CPUS] = { 1358 [CPU_ID_SCHED_ARC0] = mmARC_FARM_ARC0_AUX_BASE, 1359 [CPU_ID_SCHED_ARC1] = mmARC_FARM_ARC1_AUX_BASE, 1360 [CPU_ID_SCHED_ARC2] = mmARC_FARM_ARC2_AUX_BASE, 1361 [CPU_ID_SCHED_ARC3] = mmARC_FARM_ARC3_AUX_BASE, 1362 [CPU_ID_SCHED_ARC4] = mmDCORE1_MME_QM_ARC_AUX_BASE, 1363 [CPU_ID_SCHED_ARC5] = mmDCORE3_MME_QM_ARC_AUX_BASE, 1364 [CPU_ID_TPC_QMAN_ARC0] = mmDCORE0_TPC0_QM_ARC_AUX_BASE, 1365 [CPU_ID_TPC_QMAN_ARC1] = mmDCORE0_TPC1_QM_ARC_AUX_BASE, 1366 [CPU_ID_TPC_QMAN_ARC2] = mmDCORE0_TPC2_QM_ARC_AUX_BASE, 1367 [CPU_ID_TPC_QMAN_ARC3] = mmDCORE0_TPC3_QM_ARC_AUX_BASE, 1368 [CPU_ID_TPC_QMAN_ARC4] = mmDCORE0_TPC4_QM_ARC_AUX_BASE, 1369 [CPU_ID_TPC_QMAN_ARC5] = mmDCORE0_TPC5_QM_ARC_AUX_BASE, 1370 [CPU_ID_TPC_QMAN_ARC6] = mmDCORE1_TPC0_QM_ARC_AUX_BASE, 1371 [CPU_ID_TPC_QMAN_ARC7] = mmDCORE1_TPC1_QM_ARC_AUX_BASE, 1372 [CPU_ID_TPC_QMAN_ARC8] = mmDCORE1_TPC2_QM_ARC_AUX_BASE, 1373 [CPU_ID_TPC_QMAN_ARC9] = 
mmDCORE1_TPC3_QM_ARC_AUX_BASE, 1374 [CPU_ID_TPC_QMAN_ARC10] = mmDCORE1_TPC4_QM_ARC_AUX_BASE, 1375 [CPU_ID_TPC_QMAN_ARC11] = mmDCORE1_TPC5_QM_ARC_AUX_BASE, 1376 [CPU_ID_TPC_QMAN_ARC12] = mmDCORE2_TPC0_QM_ARC_AUX_BASE, 1377 [CPU_ID_TPC_QMAN_ARC13] = mmDCORE2_TPC1_QM_ARC_AUX_BASE, 1378 [CPU_ID_TPC_QMAN_ARC14] = mmDCORE2_TPC2_QM_ARC_AUX_BASE, 1379 [CPU_ID_TPC_QMAN_ARC15] = mmDCORE2_TPC3_QM_ARC_AUX_BASE, 1380 [CPU_ID_TPC_QMAN_ARC16] = mmDCORE2_TPC4_QM_ARC_AUX_BASE, 1381 [CPU_ID_TPC_QMAN_ARC17] = mmDCORE2_TPC5_QM_ARC_AUX_BASE, 1382 [CPU_ID_TPC_QMAN_ARC18] = mmDCORE3_TPC0_QM_ARC_AUX_BASE, 1383 [CPU_ID_TPC_QMAN_ARC19] = mmDCORE3_TPC1_QM_ARC_AUX_BASE, 1384 [CPU_ID_TPC_QMAN_ARC20] = mmDCORE3_TPC2_QM_ARC_AUX_BASE, 1385 [CPU_ID_TPC_QMAN_ARC21] = mmDCORE3_TPC3_QM_ARC_AUX_BASE, 1386 [CPU_ID_TPC_QMAN_ARC22] = mmDCORE3_TPC4_QM_ARC_AUX_BASE, 1387 [CPU_ID_TPC_QMAN_ARC23] = mmDCORE3_TPC5_QM_ARC_AUX_BASE, 1388 [CPU_ID_TPC_QMAN_ARC24] = mmDCORE0_TPC6_QM_ARC_AUX_BASE, 1389 [CPU_ID_MME_QMAN_ARC0] = mmDCORE0_MME_QM_ARC_AUX_BASE, 1390 [CPU_ID_MME_QMAN_ARC1] = mmDCORE2_MME_QM_ARC_AUX_BASE, 1391 [CPU_ID_EDMA_QMAN_ARC0] = mmDCORE0_EDMA0_QM_ARC_AUX_BASE, 1392 [CPU_ID_EDMA_QMAN_ARC1] = mmDCORE0_EDMA1_QM_ARC_AUX_BASE, 1393 [CPU_ID_EDMA_QMAN_ARC2] = mmDCORE1_EDMA0_QM_ARC_AUX_BASE, 1394 [CPU_ID_EDMA_QMAN_ARC3] = mmDCORE1_EDMA1_QM_ARC_AUX_BASE, 1395 [CPU_ID_EDMA_QMAN_ARC4] = mmDCORE2_EDMA0_QM_ARC_AUX_BASE, 1396 [CPU_ID_EDMA_QMAN_ARC5] = mmDCORE2_EDMA1_QM_ARC_AUX_BASE, 1397 [CPU_ID_EDMA_QMAN_ARC6] = mmDCORE3_EDMA0_QM_ARC_AUX_BASE, 1398 [CPU_ID_EDMA_QMAN_ARC7] = mmDCORE3_EDMA1_QM_ARC_AUX_BASE, 1399 [CPU_ID_PDMA_QMAN_ARC0] = mmPDMA0_QM_ARC_AUX_BASE, 1400 [CPU_ID_PDMA_QMAN_ARC1] = mmPDMA1_QM_ARC_AUX_BASE, 1401 [CPU_ID_ROT_QMAN_ARC0] = mmROT0_QM_ARC_AUX_BASE, 1402 [CPU_ID_ROT_QMAN_ARC1] = mmROT1_QM_ARC_AUX_BASE, 1403 [CPU_ID_NIC_QMAN_ARC0] = mmNIC0_QM_ARC_AUX0_BASE, 1404 [CPU_ID_NIC_QMAN_ARC1] = mmNIC0_QM_ARC_AUX1_BASE, 1405 [CPU_ID_NIC_QMAN_ARC2] = mmNIC1_QM_ARC_AUX0_BASE, 1406 [CPU_ID_NIC_QMAN_ARC3] = mmNIC1_QM_ARC_AUX1_BASE, 1407 [CPU_ID_NIC_QMAN_ARC4] = mmNIC2_QM_ARC_AUX0_BASE, 1408 [CPU_ID_NIC_QMAN_ARC5] = mmNIC2_QM_ARC_AUX1_BASE, 1409 [CPU_ID_NIC_QMAN_ARC6] = mmNIC3_QM_ARC_AUX0_BASE, 1410 [CPU_ID_NIC_QMAN_ARC7] = mmNIC3_QM_ARC_AUX1_BASE, 1411 [CPU_ID_NIC_QMAN_ARC8] = mmNIC4_QM_ARC_AUX0_BASE, 1412 [CPU_ID_NIC_QMAN_ARC9] = mmNIC4_QM_ARC_AUX1_BASE, 1413 [CPU_ID_NIC_QMAN_ARC10] = mmNIC5_QM_ARC_AUX0_BASE, 1414 [CPU_ID_NIC_QMAN_ARC11] = mmNIC5_QM_ARC_AUX1_BASE, 1415 [CPU_ID_NIC_QMAN_ARC12] = mmNIC6_QM_ARC_AUX0_BASE, 1416 [CPU_ID_NIC_QMAN_ARC13] = mmNIC6_QM_ARC_AUX1_BASE, 1417 [CPU_ID_NIC_QMAN_ARC14] = mmNIC7_QM_ARC_AUX0_BASE, 1418 [CPU_ID_NIC_QMAN_ARC15] = mmNIC7_QM_ARC_AUX1_BASE, 1419 [CPU_ID_NIC_QMAN_ARC16] = mmNIC8_QM_ARC_AUX0_BASE, 1420 [CPU_ID_NIC_QMAN_ARC17] = mmNIC8_QM_ARC_AUX1_BASE, 1421 [CPU_ID_NIC_QMAN_ARC18] = mmNIC9_QM_ARC_AUX0_BASE, 1422 [CPU_ID_NIC_QMAN_ARC19] = mmNIC9_QM_ARC_AUX1_BASE, 1423 [CPU_ID_NIC_QMAN_ARC20] = mmNIC10_QM_ARC_AUX0_BASE, 1424 [CPU_ID_NIC_QMAN_ARC21] = mmNIC10_QM_ARC_AUX1_BASE, 1425 [CPU_ID_NIC_QMAN_ARC22] = mmNIC11_QM_ARC_AUX0_BASE, 1426 [CPU_ID_NIC_QMAN_ARC23] = mmNIC11_QM_ARC_AUX1_BASE, 1427 }; 1428 1429 static const u32 gaudi2_arc_dccm_bases[NUM_ARC_CPUS] = { 1430 [CPU_ID_SCHED_ARC0] = mmARC_FARM_ARC0_DCCM0_BASE, 1431 [CPU_ID_SCHED_ARC1] = mmARC_FARM_ARC1_DCCM0_BASE, 1432 [CPU_ID_SCHED_ARC2] = mmARC_FARM_ARC2_DCCM0_BASE, 1433 [CPU_ID_SCHED_ARC3] = mmARC_FARM_ARC3_DCCM0_BASE, 1434 [CPU_ID_SCHED_ARC4] = mmDCORE1_MME_QM_ARC_DCCM_BASE, 1435 [CPU_ID_SCHED_ARC5] = mmDCORE3_MME_QM_ARC_DCCM_BASE, 
1436 [CPU_ID_TPC_QMAN_ARC0] = mmDCORE0_TPC0_QM_DCCM_BASE, 1437 [CPU_ID_TPC_QMAN_ARC1] = mmDCORE0_TPC1_QM_DCCM_BASE, 1438 [CPU_ID_TPC_QMAN_ARC2] = mmDCORE0_TPC2_QM_DCCM_BASE, 1439 [CPU_ID_TPC_QMAN_ARC3] = mmDCORE0_TPC3_QM_DCCM_BASE, 1440 [CPU_ID_TPC_QMAN_ARC4] = mmDCORE0_TPC4_QM_DCCM_BASE, 1441 [CPU_ID_TPC_QMAN_ARC5] = mmDCORE0_TPC5_QM_DCCM_BASE, 1442 [CPU_ID_TPC_QMAN_ARC6] = mmDCORE1_TPC0_QM_DCCM_BASE, 1443 [CPU_ID_TPC_QMAN_ARC7] = mmDCORE1_TPC1_QM_DCCM_BASE, 1444 [CPU_ID_TPC_QMAN_ARC8] = mmDCORE1_TPC2_QM_DCCM_BASE, 1445 [CPU_ID_TPC_QMAN_ARC9] = mmDCORE1_TPC3_QM_DCCM_BASE, 1446 [CPU_ID_TPC_QMAN_ARC10] = mmDCORE1_TPC4_QM_DCCM_BASE, 1447 [CPU_ID_TPC_QMAN_ARC11] = mmDCORE1_TPC5_QM_DCCM_BASE, 1448 [CPU_ID_TPC_QMAN_ARC12] = mmDCORE2_TPC0_QM_DCCM_BASE, 1449 [CPU_ID_TPC_QMAN_ARC13] = mmDCORE2_TPC1_QM_DCCM_BASE, 1450 [CPU_ID_TPC_QMAN_ARC14] = mmDCORE2_TPC2_QM_DCCM_BASE, 1451 [CPU_ID_TPC_QMAN_ARC15] = mmDCORE2_TPC3_QM_DCCM_BASE, 1452 [CPU_ID_TPC_QMAN_ARC16] = mmDCORE2_TPC4_QM_DCCM_BASE, 1453 [CPU_ID_TPC_QMAN_ARC17] = mmDCORE2_TPC5_QM_DCCM_BASE, 1454 [CPU_ID_TPC_QMAN_ARC18] = mmDCORE3_TPC0_QM_DCCM_BASE, 1455 [CPU_ID_TPC_QMAN_ARC19] = mmDCORE3_TPC1_QM_DCCM_BASE, 1456 [CPU_ID_TPC_QMAN_ARC20] = mmDCORE3_TPC2_QM_DCCM_BASE, 1457 [CPU_ID_TPC_QMAN_ARC21] = mmDCORE3_TPC3_QM_DCCM_BASE, 1458 [CPU_ID_TPC_QMAN_ARC22] = mmDCORE3_TPC4_QM_DCCM_BASE, 1459 [CPU_ID_TPC_QMAN_ARC23] = mmDCORE3_TPC5_QM_DCCM_BASE, 1460 [CPU_ID_TPC_QMAN_ARC24] = mmDCORE0_TPC6_QM_DCCM_BASE, 1461 [CPU_ID_MME_QMAN_ARC0] = mmDCORE0_MME_QM_ARC_DCCM_BASE, 1462 [CPU_ID_MME_QMAN_ARC1] = mmDCORE2_MME_QM_ARC_DCCM_BASE, 1463 [CPU_ID_EDMA_QMAN_ARC0] = mmDCORE0_EDMA0_QM_DCCM_BASE, 1464 [CPU_ID_EDMA_QMAN_ARC1] = mmDCORE0_EDMA1_QM_DCCM_BASE, 1465 [CPU_ID_EDMA_QMAN_ARC2] = mmDCORE1_EDMA0_QM_DCCM_BASE, 1466 [CPU_ID_EDMA_QMAN_ARC3] = mmDCORE1_EDMA1_QM_DCCM_BASE, 1467 [CPU_ID_EDMA_QMAN_ARC4] = mmDCORE2_EDMA0_QM_DCCM_BASE, 1468 [CPU_ID_EDMA_QMAN_ARC5] = mmDCORE2_EDMA1_QM_DCCM_BASE, 1469 [CPU_ID_EDMA_QMAN_ARC6] = mmDCORE3_EDMA0_QM_DCCM_BASE, 1470 [CPU_ID_EDMA_QMAN_ARC7] = mmDCORE3_EDMA1_QM_DCCM_BASE, 1471 [CPU_ID_PDMA_QMAN_ARC0] = mmPDMA0_QM_ARC_DCCM_BASE, 1472 [CPU_ID_PDMA_QMAN_ARC1] = mmPDMA1_QM_ARC_DCCM_BASE, 1473 [CPU_ID_ROT_QMAN_ARC0] = mmROT0_QM_ARC_DCCM_BASE, 1474 [CPU_ID_ROT_QMAN_ARC1] = mmROT1_QM_ARC_DCCM_BASE, 1475 [CPU_ID_NIC_QMAN_ARC0] = mmNIC0_QM_DCCM0_BASE, 1476 [CPU_ID_NIC_QMAN_ARC1] = mmNIC0_QM_DCCM1_BASE, 1477 [CPU_ID_NIC_QMAN_ARC2] = mmNIC1_QM_DCCM0_BASE, 1478 [CPU_ID_NIC_QMAN_ARC3] = mmNIC1_QM_DCCM1_BASE, 1479 [CPU_ID_NIC_QMAN_ARC4] = mmNIC2_QM_DCCM0_BASE, 1480 [CPU_ID_NIC_QMAN_ARC5] = mmNIC2_QM_DCCM1_BASE, 1481 [CPU_ID_NIC_QMAN_ARC6] = mmNIC3_QM_DCCM0_BASE, 1482 [CPU_ID_NIC_QMAN_ARC7] = mmNIC3_QM_DCCM1_BASE, 1483 [CPU_ID_NIC_QMAN_ARC8] = mmNIC4_QM_DCCM0_BASE, 1484 [CPU_ID_NIC_QMAN_ARC9] = mmNIC4_QM_DCCM1_BASE, 1485 [CPU_ID_NIC_QMAN_ARC10] = mmNIC5_QM_DCCM0_BASE, 1486 [CPU_ID_NIC_QMAN_ARC11] = mmNIC5_QM_DCCM1_BASE, 1487 [CPU_ID_NIC_QMAN_ARC12] = mmNIC6_QM_DCCM0_BASE, 1488 [CPU_ID_NIC_QMAN_ARC13] = mmNIC6_QM_DCCM1_BASE, 1489 [CPU_ID_NIC_QMAN_ARC14] = mmNIC7_QM_DCCM0_BASE, 1490 [CPU_ID_NIC_QMAN_ARC15] = mmNIC7_QM_DCCM1_BASE, 1491 [CPU_ID_NIC_QMAN_ARC16] = mmNIC8_QM_DCCM0_BASE, 1492 [CPU_ID_NIC_QMAN_ARC17] = mmNIC8_QM_DCCM1_BASE, 1493 [CPU_ID_NIC_QMAN_ARC18] = mmNIC9_QM_DCCM0_BASE, 1494 [CPU_ID_NIC_QMAN_ARC19] = mmNIC9_QM_DCCM1_BASE, 1495 [CPU_ID_NIC_QMAN_ARC20] = mmNIC10_QM_DCCM0_BASE, 1496 [CPU_ID_NIC_QMAN_ARC21] = mmNIC10_QM_DCCM1_BASE, 1497 [CPU_ID_NIC_QMAN_ARC22] = mmNIC11_QM_DCCM0_BASE, 1498 [CPU_ID_NIC_QMAN_ARC23] = 
mmNIC11_QM_DCCM1_BASE, 1499 }; 1500 1501 const u32 gaudi2_mme_ctrl_lo_blocks_bases[MME_ID_SIZE] = { 1502 [MME_ID_DCORE0] = mmDCORE0_MME_CTRL_LO_BASE, 1503 [MME_ID_DCORE1] = mmDCORE1_MME_CTRL_LO_BASE, 1504 [MME_ID_DCORE2] = mmDCORE2_MME_CTRL_LO_BASE, 1505 [MME_ID_DCORE3] = mmDCORE3_MME_CTRL_LO_BASE, 1506 }; 1507 1508 static const u32 gaudi2_queue_id_to_arc_id[GAUDI2_QUEUE_ID_SIZE] = { 1509 [GAUDI2_QUEUE_ID_PDMA_0_0] = CPU_ID_PDMA_QMAN_ARC0, 1510 [GAUDI2_QUEUE_ID_PDMA_0_1] = CPU_ID_PDMA_QMAN_ARC0, 1511 [GAUDI2_QUEUE_ID_PDMA_0_2] = CPU_ID_PDMA_QMAN_ARC0, 1512 [GAUDI2_QUEUE_ID_PDMA_0_3] = CPU_ID_PDMA_QMAN_ARC0, 1513 [GAUDI2_QUEUE_ID_PDMA_1_0] = CPU_ID_PDMA_QMAN_ARC1, 1514 [GAUDI2_QUEUE_ID_PDMA_1_1] = CPU_ID_PDMA_QMAN_ARC1, 1515 [GAUDI2_QUEUE_ID_PDMA_1_2] = CPU_ID_PDMA_QMAN_ARC1, 1516 [GAUDI2_QUEUE_ID_PDMA_1_3] = CPU_ID_PDMA_QMAN_ARC1, 1517 [GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0] = CPU_ID_EDMA_QMAN_ARC0, 1518 [GAUDI2_QUEUE_ID_DCORE0_EDMA_0_1] = CPU_ID_EDMA_QMAN_ARC0, 1519 [GAUDI2_QUEUE_ID_DCORE0_EDMA_0_2] = CPU_ID_EDMA_QMAN_ARC0, 1520 [GAUDI2_QUEUE_ID_DCORE0_EDMA_0_3] = CPU_ID_EDMA_QMAN_ARC0, 1521 [GAUDI2_QUEUE_ID_DCORE0_EDMA_1_0] = CPU_ID_EDMA_QMAN_ARC1, 1522 [GAUDI2_QUEUE_ID_DCORE0_EDMA_1_1] = CPU_ID_EDMA_QMAN_ARC1, 1523 [GAUDI2_QUEUE_ID_DCORE0_EDMA_1_2] = CPU_ID_EDMA_QMAN_ARC1, 1524 [GAUDI2_QUEUE_ID_DCORE0_EDMA_1_3] = CPU_ID_EDMA_QMAN_ARC1, 1525 [GAUDI2_QUEUE_ID_DCORE0_MME_0_0] = CPU_ID_MME_QMAN_ARC0, 1526 [GAUDI2_QUEUE_ID_DCORE0_MME_0_1] = CPU_ID_MME_QMAN_ARC0, 1527 [GAUDI2_QUEUE_ID_DCORE0_MME_0_2] = CPU_ID_MME_QMAN_ARC0, 1528 [GAUDI2_QUEUE_ID_DCORE0_MME_0_3] = CPU_ID_MME_QMAN_ARC0, 1529 [GAUDI2_QUEUE_ID_DCORE0_TPC_0_0] = CPU_ID_TPC_QMAN_ARC0, 1530 [GAUDI2_QUEUE_ID_DCORE0_TPC_0_1] = CPU_ID_TPC_QMAN_ARC0, 1531 [GAUDI2_QUEUE_ID_DCORE0_TPC_0_2] = CPU_ID_TPC_QMAN_ARC0, 1532 [GAUDI2_QUEUE_ID_DCORE0_TPC_0_3] = CPU_ID_TPC_QMAN_ARC0, 1533 [GAUDI2_QUEUE_ID_DCORE0_TPC_1_0] = CPU_ID_TPC_QMAN_ARC1, 1534 [GAUDI2_QUEUE_ID_DCORE0_TPC_1_1] = CPU_ID_TPC_QMAN_ARC1, 1535 [GAUDI2_QUEUE_ID_DCORE0_TPC_1_2] = CPU_ID_TPC_QMAN_ARC1, 1536 [GAUDI2_QUEUE_ID_DCORE0_TPC_1_3] = CPU_ID_TPC_QMAN_ARC1, 1537 [GAUDI2_QUEUE_ID_DCORE0_TPC_2_0] = CPU_ID_TPC_QMAN_ARC2, 1538 [GAUDI2_QUEUE_ID_DCORE0_TPC_2_1] = CPU_ID_TPC_QMAN_ARC2, 1539 [GAUDI2_QUEUE_ID_DCORE0_TPC_2_2] = CPU_ID_TPC_QMAN_ARC2, 1540 [GAUDI2_QUEUE_ID_DCORE0_TPC_2_3] = CPU_ID_TPC_QMAN_ARC2, 1541 [GAUDI2_QUEUE_ID_DCORE0_TPC_3_0] = CPU_ID_TPC_QMAN_ARC3, 1542 [GAUDI2_QUEUE_ID_DCORE0_TPC_3_1] = CPU_ID_TPC_QMAN_ARC3, 1543 [GAUDI2_QUEUE_ID_DCORE0_TPC_3_2] = CPU_ID_TPC_QMAN_ARC3, 1544 [GAUDI2_QUEUE_ID_DCORE0_TPC_3_3] = CPU_ID_TPC_QMAN_ARC3, 1545 [GAUDI2_QUEUE_ID_DCORE0_TPC_4_0] = CPU_ID_TPC_QMAN_ARC4, 1546 [GAUDI2_QUEUE_ID_DCORE0_TPC_4_1] = CPU_ID_TPC_QMAN_ARC4, 1547 [GAUDI2_QUEUE_ID_DCORE0_TPC_4_2] = CPU_ID_TPC_QMAN_ARC4, 1548 [GAUDI2_QUEUE_ID_DCORE0_TPC_4_3] = CPU_ID_TPC_QMAN_ARC4, 1549 [GAUDI2_QUEUE_ID_DCORE0_TPC_5_0] = CPU_ID_TPC_QMAN_ARC5, 1550 [GAUDI2_QUEUE_ID_DCORE0_TPC_5_1] = CPU_ID_TPC_QMAN_ARC5, 1551 [GAUDI2_QUEUE_ID_DCORE0_TPC_5_2] = CPU_ID_TPC_QMAN_ARC5, 1552 [GAUDI2_QUEUE_ID_DCORE0_TPC_5_3] = CPU_ID_TPC_QMAN_ARC5, 1553 [GAUDI2_QUEUE_ID_DCORE0_TPC_6_0] = CPU_ID_TPC_QMAN_ARC24, 1554 [GAUDI2_QUEUE_ID_DCORE0_TPC_6_1] = CPU_ID_TPC_QMAN_ARC24, 1555 [GAUDI2_QUEUE_ID_DCORE0_TPC_6_2] = CPU_ID_TPC_QMAN_ARC24, 1556 [GAUDI2_QUEUE_ID_DCORE0_TPC_6_3] = CPU_ID_TPC_QMAN_ARC24, 1557 [GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0] = CPU_ID_EDMA_QMAN_ARC2, 1558 [GAUDI2_QUEUE_ID_DCORE1_EDMA_0_1] = CPU_ID_EDMA_QMAN_ARC2, 1559 [GAUDI2_QUEUE_ID_DCORE1_EDMA_0_2] = CPU_ID_EDMA_QMAN_ARC2, 1560 
[GAUDI2_QUEUE_ID_DCORE1_EDMA_0_3] = CPU_ID_EDMA_QMAN_ARC2, 1561 [GAUDI2_QUEUE_ID_DCORE1_EDMA_1_0] = CPU_ID_EDMA_QMAN_ARC3, 1562 [GAUDI2_QUEUE_ID_DCORE1_EDMA_1_1] = CPU_ID_EDMA_QMAN_ARC3, 1563 [GAUDI2_QUEUE_ID_DCORE1_EDMA_1_2] = CPU_ID_EDMA_QMAN_ARC3, 1564 [GAUDI2_QUEUE_ID_DCORE1_EDMA_1_3] = CPU_ID_EDMA_QMAN_ARC3, 1565 [GAUDI2_QUEUE_ID_DCORE1_MME_0_0] = CPU_ID_SCHED_ARC4, 1566 [GAUDI2_QUEUE_ID_DCORE1_MME_0_1] = CPU_ID_SCHED_ARC4, 1567 [GAUDI2_QUEUE_ID_DCORE1_MME_0_2] = CPU_ID_SCHED_ARC4, 1568 [GAUDI2_QUEUE_ID_DCORE1_MME_0_3] = CPU_ID_SCHED_ARC4, 1569 [GAUDI2_QUEUE_ID_DCORE1_TPC_0_0] = CPU_ID_TPC_QMAN_ARC6, 1570 [GAUDI2_QUEUE_ID_DCORE1_TPC_0_1] = CPU_ID_TPC_QMAN_ARC6, 1571 [GAUDI2_QUEUE_ID_DCORE1_TPC_0_2] = CPU_ID_TPC_QMAN_ARC6, 1572 [GAUDI2_QUEUE_ID_DCORE1_TPC_0_3] = CPU_ID_TPC_QMAN_ARC6, 1573 [GAUDI2_QUEUE_ID_DCORE1_TPC_1_0] = CPU_ID_TPC_QMAN_ARC7, 1574 [GAUDI2_QUEUE_ID_DCORE1_TPC_1_1] = CPU_ID_TPC_QMAN_ARC7, 1575 [GAUDI2_QUEUE_ID_DCORE1_TPC_1_2] = CPU_ID_TPC_QMAN_ARC7, 1576 [GAUDI2_QUEUE_ID_DCORE1_TPC_1_3] = CPU_ID_TPC_QMAN_ARC7, 1577 [GAUDI2_QUEUE_ID_DCORE1_TPC_2_0] = CPU_ID_TPC_QMAN_ARC8, 1578 [GAUDI2_QUEUE_ID_DCORE1_TPC_2_1] = CPU_ID_TPC_QMAN_ARC8, 1579 [GAUDI2_QUEUE_ID_DCORE1_TPC_2_2] = CPU_ID_TPC_QMAN_ARC8, 1580 [GAUDI2_QUEUE_ID_DCORE1_TPC_2_3] = CPU_ID_TPC_QMAN_ARC8, 1581 [GAUDI2_QUEUE_ID_DCORE1_TPC_3_0] = CPU_ID_TPC_QMAN_ARC9, 1582 [GAUDI2_QUEUE_ID_DCORE1_TPC_3_1] = CPU_ID_TPC_QMAN_ARC9, 1583 [GAUDI2_QUEUE_ID_DCORE1_TPC_3_2] = CPU_ID_TPC_QMAN_ARC9, 1584 [GAUDI2_QUEUE_ID_DCORE1_TPC_3_3] = CPU_ID_TPC_QMAN_ARC9, 1585 [GAUDI2_QUEUE_ID_DCORE1_TPC_4_0] = CPU_ID_TPC_QMAN_ARC10, 1586 [GAUDI2_QUEUE_ID_DCORE1_TPC_4_1] = CPU_ID_TPC_QMAN_ARC10, 1587 [GAUDI2_QUEUE_ID_DCORE1_TPC_4_2] = CPU_ID_TPC_QMAN_ARC10, 1588 [GAUDI2_QUEUE_ID_DCORE1_TPC_4_3] = CPU_ID_TPC_QMAN_ARC10, 1589 [GAUDI2_QUEUE_ID_DCORE1_TPC_5_0] = CPU_ID_TPC_QMAN_ARC11, 1590 [GAUDI2_QUEUE_ID_DCORE1_TPC_5_1] = CPU_ID_TPC_QMAN_ARC11, 1591 [GAUDI2_QUEUE_ID_DCORE1_TPC_5_2] = CPU_ID_TPC_QMAN_ARC11, 1592 [GAUDI2_QUEUE_ID_DCORE1_TPC_5_3] = CPU_ID_TPC_QMAN_ARC11, 1593 [GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0] = CPU_ID_EDMA_QMAN_ARC4, 1594 [GAUDI2_QUEUE_ID_DCORE2_EDMA_0_1] = CPU_ID_EDMA_QMAN_ARC4, 1595 [GAUDI2_QUEUE_ID_DCORE2_EDMA_0_2] = CPU_ID_EDMA_QMAN_ARC4, 1596 [GAUDI2_QUEUE_ID_DCORE2_EDMA_0_3] = CPU_ID_EDMA_QMAN_ARC4, 1597 [GAUDI2_QUEUE_ID_DCORE2_EDMA_1_0] = CPU_ID_EDMA_QMAN_ARC5, 1598 [GAUDI2_QUEUE_ID_DCORE2_EDMA_1_1] = CPU_ID_EDMA_QMAN_ARC5, 1599 [GAUDI2_QUEUE_ID_DCORE2_EDMA_1_2] = CPU_ID_EDMA_QMAN_ARC5, 1600 [GAUDI2_QUEUE_ID_DCORE2_EDMA_1_3] = CPU_ID_EDMA_QMAN_ARC5, 1601 [GAUDI2_QUEUE_ID_DCORE2_MME_0_0] = CPU_ID_MME_QMAN_ARC1, 1602 [GAUDI2_QUEUE_ID_DCORE2_MME_0_1] = CPU_ID_MME_QMAN_ARC1, 1603 [GAUDI2_QUEUE_ID_DCORE2_MME_0_2] = CPU_ID_MME_QMAN_ARC1, 1604 [GAUDI2_QUEUE_ID_DCORE2_MME_0_3] = CPU_ID_MME_QMAN_ARC1, 1605 [GAUDI2_QUEUE_ID_DCORE2_TPC_0_0] = CPU_ID_TPC_QMAN_ARC12, 1606 [GAUDI2_QUEUE_ID_DCORE2_TPC_0_1] = CPU_ID_TPC_QMAN_ARC12, 1607 [GAUDI2_QUEUE_ID_DCORE2_TPC_0_2] = CPU_ID_TPC_QMAN_ARC12, 1608 [GAUDI2_QUEUE_ID_DCORE2_TPC_0_3] = CPU_ID_TPC_QMAN_ARC12, 1609 [GAUDI2_QUEUE_ID_DCORE2_TPC_1_0] = CPU_ID_TPC_QMAN_ARC13, 1610 [GAUDI2_QUEUE_ID_DCORE2_TPC_1_1] = CPU_ID_TPC_QMAN_ARC13, 1611 [GAUDI2_QUEUE_ID_DCORE2_TPC_1_2] = CPU_ID_TPC_QMAN_ARC13, 1612 [GAUDI2_QUEUE_ID_DCORE2_TPC_1_3] = CPU_ID_TPC_QMAN_ARC13, 1613 [GAUDI2_QUEUE_ID_DCORE2_TPC_2_0] = CPU_ID_TPC_QMAN_ARC14, 1614 [GAUDI2_QUEUE_ID_DCORE2_TPC_2_1] = CPU_ID_TPC_QMAN_ARC14, 1615 [GAUDI2_QUEUE_ID_DCORE2_TPC_2_2] = CPU_ID_TPC_QMAN_ARC14, 1616 [GAUDI2_QUEUE_ID_DCORE2_TPC_2_3] = 
CPU_ID_TPC_QMAN_ARC14, 1617 [GAUDI2_QUEUE_ID_DCORE2_TPC_3_0] = CPU_ID_TPC_QMAN_ARC15, 1618 [GAUDI2_QUEUE_ID_DCORE2_TPC_3_1] = CPU_ID_TPC_QMAN_ARC15, 1619 [GAUDI2_QUEUE_ID_DCORE2_TPC_3_2] = CPU_ID_TPC_QMAN_ARC15, 1620 [GAUDI2_QUEUE_ID_DCORE2_TPC_3_3] = CPU_ID_TPC_QMAN_ARC15, 1621 [GAUDI2_QUEUE_ID_DCORE2_TPC_4_0] = CPU_ID_TPC_QMAN_ARC16, 1622 [GAUDI2_QUEUE_ID_DCORE2_TPC_4_1] = CPU_ID_TPC_QMAN_ARC16, 1623 [GAUDI2_QUEUE_ID_DCORE2_TPC_4_2] = CPU_ID_TPC_QMAN_ARC16, 1624 [GAUDI2_QUEUE_ID_DCORE2_TPC_4_3] = CPU_ID_TPC_QMAN_ARC16, 1625 [GAUDI2_QUEUE_ID_DCORE2_TPC_5_0] = CPU_ID_TPC_QMAN_ARC17, 1626 [GAUDI2_QUEUE_ID_DCORE2_TPC_5_1] = CPU_ID_TPC_QMAN_ARC17, 1627 [GAUDI2_QUEUE_ID_DCORE2_TPC_5_2] = CPU_ID_TPC_QMAN_ARC17, 1628 [GAUDI2_QUEUE_ID_DCORE2_TPC_5_3] = CPU_ID_TPC_QMAN_ARC17, 1629 [GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0] = CPU_ID_EDMA_QMAN_ARC6, 1630 [GAUDI2_QUEUE_ID_DCORE3_EDMA_0_1] = CPU_ID_EDMA_QMAN_ARC6, 1631 [GAUDI2_QUEUE_ID_DCORE3_EDMA_0_2] = CPU_ID_EDMA_QMAN_ARC6, 1632 [GAUDI2_QUEUE_ID_DCORE3_EDMA_0_3] = CPU_ID_EDMA_QMAN_ARC6, 1633 [GAUDI2_QUEUE_ID_DCORE3_EDMA_1_0] = CPU_ID_EDMA_QMAN_ARC7, 1634 [GAUDI2_QUEUE_ID_DCORE3_EDMA_1_1] = CPU_ID_EDMA_QMAN_ARC7, 1635 [GAUDI2_QUEUE_ID_DCORE3_EDMA_1_2] = CPU_ID_EDMA_QMAN_ARC7, 1636 [GAUDI2_QUEUE_ID_DCORE3_EDMA_1_3] = CPU_ID_EDMA_QMAN_ARC7, 1637 [GAUDI2_QUEUE_ID_DCORE3_MME_0_0] = CPU_ID_SCHED_ARC5, 1638 [GAUDI2_QUEUE_ID_DCORE3_MME_0_1] = CPU_ID_SCHED_ARC5, 1639 [GAUDI2_QUEUE_ID_DCORE3_MME_0_2] = CPU_ID_SCHED_ARC5, 1640 [GAUDI2_QUEUE_ID_DCORE3_MME_0_3] = CPU_ID_SCHED_ARC5, 1641 [GAUDI2_QUEUE_ID_DCORE3_TPC_0_0] = CPU_ID_TPC_QMAN_ARC18, 1642 [GAUDI2_QUEUE_ID_DCORE3_TPC_0_1] = CPU_ID_TPC_QMAN_ARC18, 1643 [GAUDI2_QUEUE_ID_DCORE3_TPC_0_2] = CPU_ID_TPC_QMAN_ARC18, 1644 [GAUDI2_QUEUE_ID_DCORE3_TPC_0_3] = CPU_ID_TPC_QMAN_ARC18, 1645 [GAUDI2_QUEUE_ID_DCORE3_TPC_1_0] = CPU_ID_TPC_QMAN_ARC19, 1646 [GAUDI2_QUEUE_ID_DCORE3_TPC_1_1] = CPU_ID_TPC_QMAN_ARC19, 1647 [GAUDI2_QUEUE_ID_DCORE3_TPC_1_2] = CPU_ID_TPC_QMAN_ARC19, 1648 [GAUDI2_QUEUE_ID_DCORE3_TPC_1_3] = CPU_ID_TPC_QMAN_ARC19, 1649 [GAUDI2_QUEUE_ID_DCORE3_TPC_2_0] = CPU_ID_TPC_QMAN_ARC20, 1650 [GAUDI2_QUEUE_ID_DCORE3_TPC_2_1] = CPU_ID_TPC_QMAN_ARC20, 1651 [GAUDI2_QUEUE_ID_DCORE3_TPC_2_2] = CPU_ID_TPC_QMAN_ARC20, 1652 [GAUDI2_QUEUE_ID_DCORE3_TPC_2_3] = CPU_ID_TPC_QMAN_ARC20, 1653 [GAUDI2_QUEUE_ID_DCORE3_TPC_3_0] = CPU_ID_TPC_QMAN_ARC21, 1654 [GAUDI2_QUEUE_ID_DCORE3_TPC_3_1] = CPU_ID_TPC_QMAN_ARC21, 1655 [GAUDI2_QUEUE_ID_DCORE3_TPC_3_2] = CPU_ID_TPC_QMAN_ARC21, 1656 [GAUDI2_QUEUE_ID_DCORE3_TPC_3_3] = CPU_ID_TPC_QMAN_ARC21, 1657 [GAUDI2_QUEUE_ID_DCORE3_TPC_4_0] = CPU_ID_TPC_QMAN_ARC22, 1658 [GAUDI2_QUEUE_ID_DCORE3_TPC_4_1] = CPU_ID_TPC_QMAN_ARC22, 1659 [GAUDI2_QUEUE_ID_DCORE3_TPC_4_2] = CPU_ID_TPC_QMAN_ARC22, 1660 [GAUDI2_QUEUE_ID_DCORE3_TPC_4_3] = CPU_ID_TPC_QMAN_ARC22, 1661 [GAUDI2_QUEUE_ID_DCORE3_TPC_5_0] = CPU_ID_TPC_QMAN_ARC23, 1662 [GAUDI2_QUEUE_ID_DCORE3_TPC_5_1] = CPU_ID_TPC_QMAN_ARC23, 1663 [GAUDI2_QUEUE_ID_DCORE3_TPC_5_2] = CPU_ID_TPC_QMAN_ARC23, 1664 [GAUDI2_QUEUE_ID_DCORE3_TPC_5_3] = CPU_ID_TPC_QMAN_ARC23, 1665 [GAUDI2_QUEUE_ID_NIC_0_0] = CPU_ID_NIC_QMAN_ARC0, 1666 [GAUDI2_QUEUE_ID_NIC_0_1] = CPU_ID_NIC_QMAN_ARC0, 1667 [GAUDI2_QUEUE_ID_NIC_0_2] = CPU_ID_NIC_QMAN_ARC0, 1668 [GAUDI2_QUEUE_ID_NIC_0_3] = CPU_ID_NIC_QMAN_ARC0, 1669 [GAUDI2_QUEUE_ID_NIC_1_0] = CPU_ID_NIC_QMAN_ARC1, 1670 [GAUDI2_QUEUE_ID_NIC_1_1] = CPU_ID_NIC_QMAN_ARC1, 1671 [GAUDI2_QUEUE_ID_NIC_1_2] = CPU_ID_NIC_QMAN_ARC1, 1672 [GAUDI2_QUEUE_ID_NIC_1_3] = CPU_ID_NIC_QMAN_ARC1, 1673 [GAUDI2_QUEUE_ID_NIC_2_0] = CPU_ID_NIC_QMAN_ARC2, 1674 
[GAUDI2_QUEUE_ID_NIC_2_1] = CPU_ID_NIC_QMAN_ARC2, 1675 [GAUDI2_QUEUE_ID_NIC_2_2] = CPU_ID_NIC_QMAN_ARC2, 1676 [GAUDI2_QUEUE_ID_NIC_2_3] = CPU_ID_NIC_QMAN_ARC2, 1677 [GAUDI2_QUEUE_ID_NIC_3_0] = CPU_ID_NIC_QMAN_ARC3, 1678 [GAUDI2_QUEUE_ID_NIC_3_1] = CPU_ID_NIC_QMAN_ARC3, 1679 [GAUDI2_QUEUE_ID_NIC_3_2] = CPU_ID_NIC_QMAN_ARC3, 1680 [GAUDI2_QUEUE_ID_NIC_3_3] = CPU_ID_NIC_QMAN_ARC3, 1681 [GAUDI2_QUEUE_ID_NIC_4_0] = CPU_ID_NIC_QMAN_ARC4, 1682 [GAUDI2_QUEUE_ID_NIC_4_1] = CPU_ID_NIC_QMAN_ARC4, 1683 [GAUDI2_QUEUE_ID_NIC_4_2] = CPU_ID_NIC_QMAN_ARC4, 1684 [GAUDI2_QUEUE_ID_NIC_4_3] = CPU_ID_NIC_QMAN_ARC4, 1685 [GAUDI2_QUEUE_ID_NIC_5_0] = CPU_ID_NIC_QMAN_ARC5, 1686 [GAUDI2_QUEUE_ID_NIC_5_1] = CPU_ID_NIC_QMAN_ARC5, 1687 [GAUDI2_QUEUE_ID_NIC_5_2] = CPU_ID_NIC_QMAN_ARC5, 1688 [GAUDI2_QUEUE_ID_NIC_5_3] = CPU_ID_NIC_QMAN_ARC5, 1689 [GAUDI2_QUEUE_ID_NIC_6_0] = CPU_ID_NIC_QMAN_ARC6, 1690 [GAUDI2_QUEUE_ID_NIC_6_1] = CPU_ID_NIC_QMAN_ARC6, 1691 [GAUDI2_QUEUE_ID_NIC_6_2] = CPU_ID_NIC_QMAN_ARC6, 1692 [GAUDI2_QUEUE_ID_NIC_6_3] = CPU_ID_NIC_QMAN_ARC6, 1693 [GAUDI2_QUEUE_ID_NIC_7_0] = CPU_ID_NIC_QMAN_ARC7, 1694 [GAUDI2_QUEUE_ID_NIC_7_1] = CPU_ID_NIC_QMAN_ARC7, 1695 [GAUDI2_QUEUE_ID_NIC_7_2] = CPU_ID_NIC_QMAN_ARC7, 1696 [GAUDI2_QUEUE_ID_NIC_7_3] = CPU_ID_NIC_QMAN_ARC7, 1697 [GAUDI2_QUEUE_ID_NIC_8_0] = CPU_ID_NIC_QMAN_ARC8, 1698 [GAUDI2_QUEUE_ID_NIC_8_1] = CPU_ID_NIC_QMAN_ARC8, 1699 [GAUDI2_QUEUE_ID_NIC_8_2] = CPU_ID_NIC_QMAN_ARC8, 1700 [GAUDI2_QUEUE_ID_NIC_8_3] = CPU_ID_NIC_QMAN_ARC8, 1701 [GAUDI2_QUEUE_ID_NIC_9_0] = CPU_ID_NIC_QMAN_ARC9, 1702 [GAUDI2_QUEUE_ID_NIC_9_1] = CPU_ID_NIC_QMAN_ARC9, 1703 [GAUDI2_QUEUE_ID_NIC_9_2] = CPU_ID_NIC_QMAN_ARC9, 1704 [GAUDI2_QUEUE_ID_NIC_9_3] = CPU_ID_NIC_QMAN_ARC9, 1705 [GAUDI2_QUEUE_ID_NIC_10_0] = CPU_ID_NIC_QMAN_ARC10, 1706 [GAUDI2_QUEUE_ID_NIC_10_1] = CPU_ID_NIC_QMAN_ARC10, 1707 [GAUDI2_QUEUE_ID_NIC_10_2] = CPU_ID_NIC_QMAN_ARC10, 1708 [GAUDI2_QUEUE_ID_NIC_10_3] = CPU_ID_NIC_QMAN_ARC10, 1709 [GAUDI2_QUEUE_ID_NIC_11_0] = CPU_ID_NIC_QMAN_ARC11, 1710 [GAUDI2_QUEUE_ID_NIC_11_1] = CPU_ID_NIC_QMAN_ARC11, 1711 [GAUDI2_QUEUE_ID_NIC_11_2] = CPU_ID_NIC_QMAN_ARC11, 1712 [GAUDI2_QUEUE_ID_NIC_11_3] = CPU_ID_NIC_QMAN_ARC11, 1713 [GAUDI2_QUEUE_ID_NIC_12_0] = CPU_ID_NIC_QMAN_ARC12, 1714 [GAUDI2_QUEUE_ID_NIC_12_1] = CPU_ID_NIC_QMAN_ARC12, 1715 [GAUDI2_QUEUE_ID_NIC_12_2] = CPU_ID_NIC_QMAN_ARC12, 1716 [GAUDI2_QUEUE_ID_NIC_12_3] = CPU_ID_NIC_QMAN_ARC12, 1717 [GAUDI2_QUEUE_ID_NIC_13_0] = CPU_ID_NIC_QMAN_ARC13, 1718 [GAUDI2_QUEUE_ID_NIC_13_1] = CPU_ID_NIC_QMAN_ARC13, 1719 [GAUDI2_QUEUE_ID_NIC_13_2] = CPU_ID_NIC_QMAN_ARC13, 1720 [GAUDI2_QUEUE_ID_NIC_13_3] = CPU_ID_NIC_QMAN_ARC13, 1721 [GAUDI2_QUEUE_ID_NIC_14_0] = CPU_ID_NIC_QMAN_ARC14, 1722 [GAUDI2_QUEUE_ID_NIC_14_1] = CPU_ID_NIC_QMAN_ARC14, 1723 [GAUDI2_QUEUE_ID_NIC_14_2] = CPU_ID_NIC_QMAN_ARC14, 1724 [GAUDI2_QUEUE_ID_NIC_14_3] = CPU_ID_NIC_QMAN_ARC14, 1725 [GAUDI2_QUEUE_ID_NIC_15_0] = CPU_ID_NIC_QMAN_ARC15, 1726 [GAUDI2_QUEUE_ID_NIC_15_1] = CPU_ID_NIC_QMAN_ARC15, 1727 [GAUDI2_QUEUE_ID_NIC_15_2] = CPU_ID_NIC_QMAN_ARC15, 1728 [GAUDI2_QUEUE_ID_NIC_15_3] = CPU_ID_NIC_QMAN_ARC15, 1729 [GAUDI2_QUEUE_ID_NIC_16_0] = CPU_ID_NIC_QMAN_ARC16, 1730 [GAUDI2_QUEUE_ID_NIC_16_1] = CPU_ID_NIC_QMAN_ARC16, 1731 [GAUDI2_QUEUE_ID_NIC_16_2] = CPU_ID_NIC_QMAN_ARC16, 1732 [GAUDI2_QUEUE_ID_NIC_16_3] = CPU_ID_NIC_QMAN_ARC16, 1733 [GAUDI2_QUEUE_ID_NIC_17_0] = CPU_ID_NIC_QMAN_ARC17, 1734 [GAUDI2_QUEUE_ID_NIC_17_1] = CPU_ID_NIC_QMAN_ARC17, 1735 [GAUDI2_QUEUE_ID_NIC_17_2] = CPU_ID_NIC_QMAN_ARC17, 1736 [GAUDI2_QUEUE_ID_NIC_17_3] = CPU_ID_NIC_QMAN_ARC17, 1737 
[GAUDI2_QUEUE_ID_NIC_18_0] = CPU_ID_NIC_QMAN_ARC18, 1738 [GAUDI2_QUEUE_ID_NIC_18_1] = CPU_ID_NIC_QMAN_ARC18, 1739 [GAUDI2_QUEUE_ID_NIC_18_2] = CPU_ID_NIC_QMAN_ARC18, 1740 [GAUDI2_QUEUE_ID_NIC_18_3] = CPU_ID_NIC_QMAN_ARC18, 1741 [GAUDI2_QUEUE_ID_NIC_19_0] = CPU_ID_NIC_QMAN_ARC19, 1742 [GAUDI2_QUEUE_ID_NIC_19_1] = CPU_ID_NIC_QMAN_ARC19, 1743 [GAUDI2_QUEUE_ID_NIC_19_2] = CPU_ID_NIC_QMAN_ARC19, 1744 [GAUDI2_QUEUE_ID_NIC_19_3] = CPU_ID_NIC_QMAN_ARC19, 1745 [GAUDI2_QUEUE_ID_NIC_20_0] = CPU_ID_NIC_QMAN_ARC20, 1746 [GAUDI2_QUEUE_ID_NIC_20_1] = CPU_ID_NIC_QMAN_ARC20, 1747 [GAUDI2_QUEUE_ID_NIC_20_2] = CPU_ID_NIC_QMAN_ARC20, 1748 [GAUDI2_QUEUE_ID_NIC_20_3] = CPU_ID_NIC_QMAN_ARC20, 1749 [GAUDI2_QUEUE_ID_NIC_21_0] = CPU_ID_NIC_QMAN_ARC21, 1750 [GAUDI2_QUEUE_ID_NIC_21_1] = CPU_ID_NIC_QMAN_ARC21, 1751 [GAUDI2_QUEUE_ID_NIC_21_2] = CPU_ID_NIC_QMAN_ARC21, 1752 [GAUDI2_QUEUE_ID_NIC_21_3] = CPU_ID_NIC_QMAN_ARC21, 1753 [GAUDI2_QUEUE_ID_NIC_22_0] = CPU_ID_NIC_QMAN_ARC22, 1754 [GAUDI2_QUEUE_ID_NIC_22_1] = CPU_ID_NIC_QMAN_ARC22, 1755 [GAUDI2_QUEUE_ID_NIC_22_2] = CPU_ID_NIC_QMAN_ARC22, 1756 [GAUDI2_QUEUE_ID_NIC_22_3] = CPU_ID_NIC_QMAN_ARC22, 1757 [GAUDI2_QUEUE_ID_NIC_23_0] = CPU_ID_NIC_QMAN_ARC23, 1758 [GAUDI2_QUEUE_ID_NIC_23_1] = CPU_ID_NIC_QMAN_ARC23, 1759 [GAUDI2_QUEUE_ID_NIC_23_2] = CPU_ID_NIC_QMAN_ARC23, 1760 [GAUDI2_QUEUE_ID_NIC_23_3] = CPU_ID_NIC_QMAN_ARC23, 1761 [GAUDI2_QUEUE_ID_ROT_0_0] = CPU_ID_ROT_QMAN_ARC0, 1762 [GAUDI2_QUEUE_ID_ROT_0_1] = CPU_ID_ROT_QMAN_ARC0, 1763 [GAUDI2_QUEUE_ID_ROT_0_2] = CPU_ID_ROT_QMAN_ARC0, 1764 [GAUDI2_QUEUE_ID_ROT_0_3] = CPU_ID_ROT_QMAN_ARC0, 1765 [GAUDI2_QUEUE_ID_ROT_1_0] = CPU_ID_ROT_QMAN_ARC1, 1766 [GAUDI2_QUEUE_ID_ROT_1_1] = CPU_ID_ROT_QMAN_ARC1, 1767 [GAUDI2_QUEUE_ID_ROT_1_2] = CPU_ID_ROT_QMAN_ARC1, 1768 [GAUDI2_QUEUE_ID_ROT_1_3] = CPU_ID_ROT_QMAN_ARC1 1769 }; 1770 1771 const u32 gaudi2_dma_core_blocks_bases[DMA_CORE_ID_SIZE] = { 1772 [DMA_CORE_ID_PDMA0] = mmPDMA0_CORE_BASE, 1773 [DMA_CORE_ID_PDMA1] = mmPDMA1_CORE_BASE, 1774 [DMA_CORE_ID_EDMA0] = mmDCORE0_EDMA0_CORE_BASE, 1775 [DMA_CORE_ID_EDMA1] = mmDCORE0_EDMA1_CORE_BASE, 1776 [DMA_CORE_ID_EDMA2] = mmDCORE1_EDMA0_CORE_BASE, 1777 [DMA_CORE_ID_EDMA3] = mmDCORE1_EDMA1_CORE_BASE, 1778 [DMA_CORE_ID_EDMA4] = mmDCORE2_EDMA0_CORE_BASE, 1779 [DMA_CORE_ID_EDMA5] = mmDCORE2_EDMA1_CORE_BASE, 1780 [DMA_CORE_ID_EDMA6] = mmDCORE3_EDMA0_CORE_BASE, 1781 [DMA_CORE_ID_EDMA7] = mmDCORE3_EDMA1_CORE_BASE, 1782 [DMA_CORE_ID_KDMA] = mmARC_FARM_KDMA_BASE 1783 }; 1784 1785 const u32 gaudi2_mme_acc_blocks_bases[MME_ID_SIZE] = { 1786 [MME_ID_DCORE0] = mmDCORE0_MME_ACC_BASE, 1787 [MME_ID_DCORE1] = mmDCORE1_MME_ACC_BASE, 1788 [MME_ID_DCORE2] = mmDCORE2_MME_ACC_BASE, 1789 [MME_ID_DCORE3] = mmDCORE3_MME_ACC_BASE 1790 }; 1791 1792 static const u32 gaudi2_tpc_cfg_blocks_bases[TPC_ID_SIZE] = { 1793 [TPC_ID_DCORE0_TPC0] = mmDCORE0_TPC0_CFG_BASE, 1794 [TPC_ID_DCORE0_TPC1] = mmDCORE0_TPC1_CFG_BASE, 1795 [TPC_ID_DCORE0_TPC2] = mmDCORE0_TPC2_CFG_BASE, 1796 [TPC_ID_DCORE0_TPC3] = mmDCORE0_TPC3_CFG_BASE, 1797 [TPC_ID_DCORE0_TPC4] = mmDCORE0_TPC4_CFG_BASE, 1798 [TPC_ID_DCORE0_TPC5] = mmDCORE0_TPC5_CFG_BASE, 1799 [TPC_ID_DCORE1_TPC0] = mmDCORE1_TPC0_CFG_BASE, 1800 [TPC_ID_DCORE1_TPC1] = mmDCORE1_TPC1_CFG_BASE, 1801 [TPC_ID_DCORE1_TPC2] = mmDCORE1_TPC2_CFG_BASE, 1802 [TPC_ID_DCORE1_TPC3] = mmDCORE1_TPC3_CFG_BASE, 1803 [TPC_ID_DCORE1_TPC4] = mmDCORE1_TPC4_CFG_BASE, 1804 [TPC_ID_DCORE1_TPC5] = mmDCORE1_TPC5_CFG_BASE, 1805 [TPC_ID_DCORE2_TPC0] = mmDCORE2_TPC0_CFG_BASE, 1806 [TPC_ID_DCORE2_TPC1] = mmDCORE2_TPC1_CFG_BASE, 1807 [TPC_ID_DCORE2_TPC2] = 
mmDCORE2_TPC2_CFG_BASE, 1808 [TPC_ID_DCORE2_TPC3] = mmDCORE2_TPC3_CFG_BASE, 1809 [TPC_ID_DCORE2_TPC4] = mmDCORE2_TPC4_CFG_BASE, 1810 [TPC_ID_DCORE2_TPC5] = mmDCORE2_TPC5_CFG_BASE, 1811 [TPC_ID_DCORE3_TPC0] = mmDCORE3_TPC0_CFG_BASE, 1812 [TPC_ID_DCORE3_TPC1] = mmDCORE3_TPC1_CFG_BASE, 1813 [TPC_ID_DCORE3_TPC2] = mmDCORE3_TPC2_CFG_BASE, 1814 [TPC_ID_DCORE3_TPC3] = mmDCORE3_TPC3_CFG_BASE, 1815 [TPC_ID_DCORE3_TPC4] = mmDCORE3_TPC4_CFG_BASE, 1816 [TPC_ID_DCORE3_TPC5] = mmDCORE3_TPC5_CFG_BASE, 1817 [TPC_ID_DCORE0_TPC6] = mmDCORE0_TPC6_CFG_BASE, 1818 }; 1819 1820 static const u32 gaudi2_tpc_eml_cfg_blocks_bases[TPC_ID_SIZE] = { 1821 [TPC_ID_DCORE0_TPC0] = mmDCORE0_TPC0_EML_CFG_BASE, 1822 [TPC_ID_DCORE0_TPC1] = mmDCORE0_TPC1_EML_CFG_BASE, 1823 [TPC_ID_DCORE0_TPC2] = mmDCORE0_TPC2_EML_CFG_BASE, 1824 [TPC_ID_DCORE0_TPC3] = mmDCORE0_TPC3_EML_CFG_BASE, 1825 [TPC_ID_DCORE0_TPC4] = mmDCORE0_TPC4_EML_CFG_BASE, 1826 [TPC_ID_DCORE0_TPC5] = mmDCORE0_TPC5_EML_CFG_BASE, 1827 [TPC_ID_DCORE1_TPC0] = mmDCORE1_TPC0_EML_CFG_BASE, 1828 [TPC_ID_DCORE1_TPC1] = mmDCORE1_TPC1_EML_CFG_BASE, 1829 [TPC_ID_DCORE1_TPC2] = mmDCORE1_TPC2_EML_CFG_BASE, 1830 [TPC_ID_DCORE1_TPC3] = mmDCORE1_TPC3_EML_CFG_BASE, 1831 [TPC_ID_DCORE1_TPC4] = mmDCORE1_TPC4_EML_CFG_BASE, 1832 [TPC_ID_DCORE1_TPC5] = mmDCORE1_TPC5_EML_CFG_BASE, 1833 [TPC_ID_DCORE2_TPC0] = mmDCORE2_TPC0_EML_CFG_BASE, 1834 [TPC_ID_DCORE2_TPC1] = mmDCORE2_TPC1_EML_CFG_BASE, 1835 [TPC_ID_DCORE2_TPC2] = mmDCORE2_TPC2_EML_CFG_BASE, 1836 [TPC_ID_DCORE2_TPC3] = mmDCORE2_TPC3_EML_CFG_BASE, 1837 [TPC_ID_DCORE2_TPC4] = mmDCORE2_TPC4_EML_CFG_BASE, 1838 [TPC_ID_DCORE2_TPC5] = mmDCORE2_TPC5_EML_CFG_BASE, 1839 [TPC_ID_DCORE3_TPC0] = mmDCORE3_TPC0_EML_CFG_BASE, 1840 [TPC_ID_DCORE3_TPC1] = mmDCORE3_TPC1_EML_CFG_BASE, 1841 [TPC_ID_DCORE3_TPC2] = mmDCORE3_TPC2_EML_CFG_BASE, 1842 [TPC_ID_DCORE3_TPC3] = mmDCORE3_TPC3_EML_CFG_BASE, 1843 [TPC_ID_DCORE3_TPC4] = mmDCORE3_TPC4_EML_CFG_BASE, 1844 [TPC_ID_DCORE3_TPC5] = mmDCORE3_TPC5_EML_CFG_BASE, 1845 [TPC_ID_DCORE0_TPC6] = mmDCORE0_TPC6_EML_CFG_BASE, 1846 }; 1847 1848 const u32 gaudi2_rot_blocks_bases[ROTATOR_ID_SIZE] = { 1849 [ROTATOR_ID_0] = mmROT0_BASE, 1850 [ROTATOR_ID_1] = mmROT1_BASE 1851 }; 1852 1853 static const u32 gaudi2_tpc_id_to_queue_id[TPC_ID_SIZE] = { 1854 [TPC_ID_DCORE0_TPC0] = GAUDI2_QUEUE_ID_DCORE0_TPC_0_0, 1855 [TPC_ID_DCORE0_TPC1] = GAUDI2_QUEUE_ID_DCORE0_TPC_1_0, 1856 [TPC_ID_DCORE0_TPC2] = GAUDI2_QUEUE_ID_DCORE0_TPC_2_0, 1857 [TPC_ID_DCORE0_TPC3] = GAUDI2_QUEUE_ID_DCORE0_TPC_3_0, 1858 [TPC_ID_DCORE0_TPC4] = GAUDI2_QUEUE_ID_DCORE0_TPC_4_0, 1859 [TPC_ID_DCORE0_TPC5] = GAUDI2_QUEUE_ID_DCORE0_TPC_5_0, 1860 [TPC_ID_DCORE1_TPC0] = GAUDI2_QUEUE_ID_DCORE1_TPC_0_0, 1861 [TPC_ID_DCORE1_TPC1] = GAUDI2_QUEUE_ID_DCORE1_TPC_1_0, 1862 [TPC_ID_DCORE1_TPC2] = GAUDI2_QUEUE_ID_DCORE1_TPC_2_0, 1863 [TPC_ID_DCORE1_TPC3] = GAUDI2_QUEUE_ID_DCORE1_TPC_3_0, 1864 [TPC_ID_DCORE1_TPC4] = GAUDI2_QUEUE_ID_DCORE1_TPC_4_0, 1865 [TPC_ID_DCORE1_TPC5] = GAUDI2_QUEUE_ID_DCORE1_TPC_5_0, 1866 [TPC_ID_DCORE2_TPC0] = GAUDI2_QUEUE_ID_DCORE2_TPC_0_0, 1867 [TPC_ID_DCORE2_TPC1] = GAUDI2_QUEUE_ID_DCORE2_TPC_1_0, 1868 [TPC_ID_DCORE2_TPC2] = GAUDI2_QUEUE_ID_DCORE2_TPC_2_0, 1869 [TPC_ID_DCORE2_TPC3] = GAUDI2_QUEUE_ID_DCORE2_TPC_3_0, 1870 [TPC_ID_DCORE2_TPC4] = GAUDI2_QUEUE_ID_DCORE2_TPC_4_0, 1871 [TPC_ID_DCORE2_TPC5] = GAUDI2_QUEUE_ID_DCORE2_TPC_5_0, 1872 [TPC_ID_DCORE3_TPC0] = GAUDI2_QUEUE_ID_DCORE3_TPC_0_0, 1873 [TPC_ID_DCORE3_TPC1] = GAUDI2_QUEUE_ID_DCORE3_TPC_1_0, 1874 [TPC_ID_DCORE3_TPC2] = GAUDI2_QUEUE_ID_DCORE3_TPC_2_0, 1875 [TPC_ID_DCORE3_TPC3] = 
GAUDI2_QUEUE_ID_DCORE3_TPC_3_0, 1876 [TPC_ID_DCORE3_TPC4] = GAUDI2_QUEUE_ID_DCORE3_TPC_4_0, 1877 [TPC_ID_DCORE3_TPC5] = GAUDI2_QUEUE_ID_DCORE3_TPC_5_0, 1878 [TPC_ID_DCORE0_TPC6] = GAUDI2_QUEUE_ID_DCORE0_TPC_6_0, 1879 }; 1880 1881 static const u32 gaudi2_rot_id_to_queue_id[ROTATOR_ID_SIZE] = { 1882 [ROTATOR_ID_0] = GAUDI2_QUEUE_ID_ROT_0_0, 1883 [ROTATOR_ID_1] = GAUDI2_QUEUE_ID_ROT_1_0, 1884 }; 1885 1886 static const u32 gaudi2_tpc_engine_id_to_tpc_id[] = { 1887 [GAUDI2_DCORE0_ENGINE_ID_TPC_0] = TPC_ID_DCORE0_TPC0, 1888 [GAUDI2_DCORE0_ENGINE_ID_TPC_1] = TPC_ID_DCORE0_TPC1, 1889 [GAUDI2_DCORE0_ENGINE_ID_TPC_2] = TPC_ID_DCORE0_TPC2, 1890 [GAUDI2_DCORE0_ENGINE_ID_TPC_3] = TPC_ID_DCORE0_TPC3, 1891 [GAUDI2_DCORE0_ENGINE_ID_TPC_4] = TPC_ID_DCORE0_TPC4, 1892 [GAUDI2_DCORE0_ENGINE_ID_TPC_5] = TPC_ID_DCORE0_TPC5, 1893 [GAUDI2_DCORE1_ENGINE_ID_TPC_0] = TPC_ID_DCORE1_TPC0, 1894 [GAUDI2_DCORE1_ENGINE_ID_TPC_1] = TPC_ID_DCORE1_TPC1, 1895 [GAUDI2_DCORE1_ENGINE_ID_TPC_2] = TPC_ID_DCORE1_TPC2, 1896 [GAUDI2_DCORE1_ENGINE_ID_TPC_3] = TPC_ID_DCORE1_TPC3, 1897 [GAUDI2_DCORE1_ENGINE_ID_TPC_4] = TPC_ID_DCORE1_TPC4, 1898 [GAUDI2_DCORE1_ENGINE_ID_TPC_5] = TPC_ID_DCORE1_TPC5, 1899 [GAUDI2_DCORE2_ENGINE_ID_TPC_0] = TPC_ID_DCORE2_TPC0, 1900 [GAUDI2_DCORE2_ENGINE_ID_TPC_1] = TPC_ID_DCORE2_TPC1, 1901 [GAUDI2_DCORE2_ENGINE_ID_TPC_2] = TPC_ID_DCORE2_TPC2, 1902 [GAUDI2_DCORE2_ENGINE_ID_TPC_3] = TPC_ID_DCORE2_TPC3, 1903 [GAUDI2_DCORE2_ENGINE_ID_TPC_4] = TPC_ID_DCORE2_TPC4, 1904 [GAUDI2_DCORE2_ENGINE_ID_TPC_5] = TPC_ID_DCORE2_TPC5, 1905 [GAUDI2_DCORE3_ENGINE_ID_TPC_0] = TPC_ID_DCORE3_TPC0, 1906 [GAUDI2_DCORE3_ENGINE_ID_TPC_1] = TPC_ID_DCORE3_TPC1, 1907 [GAUDI2_DCORE3_ENGINE_ID_TPC_2] = TPC_ID_DCORE3_TPC2, 1908 [GAUDI2_DCORE3_ENGINE_ID_TPC_3] = TPC_ID_DCORE3_TPC3, 1909 [GAUDI2_DCORE3_ENGINE_ID_TPC_4] = TPC_ID_DCORE3_TPC4, 1910 [GAUDI2_DCORE3_ENGINE_ID_TPC_5] = TPC_ID_DCORE3_TPC5, 1911 /* the PCI TPC is placed last (mapped liked HW) */ 1912 [GAUDI2_DCORE0_ENGINE_ID_TPC_6] = TPC_ID_DCORE0_TPC6, 1913 }; 1914 1915 static const u32 gaudi2_mme_engine_id_to_mme_id[] = { 1916 [GAUDI2_DCORE0_ENGINE_ID_MME] = MME_ID_DCORE0, 1917 [GAUDI2_DCORE1_ENGINE_ID_MME] = MME_ID_DCORE1, 1918 [GAUDI2_DCORE2_ENGINE_ID_MME] = MME_ID_DCORE2, 1919 [GAUDI2_DCORE3_ENGINE_ID_MME] = MME_ID_DCORE3, 1920 }; 1921 1922 static const u32 gaudi2_edma_engine_id_to_edma_id[] = { 1923 [GAUDI2_ENGINE_ID_PDMA_0] = DMA_CORE_ID_PDMA0, 1924 [GAUDI2_ENGINE_ID_PDMA_1] = DMA_CORE_ID_PDMA1, 1925 [GAUDI2_DCORE0_ENGINE_ID_EDMA_0] = DMA_CORE_ID_EDMA0, 1926 [GAUDI2_DCORE0_ENGINE_ID_EDMA_1] = DMA_CORE_ID_EDMA1, 1927 [GAUDI2_DCORE1_ENGINE_ID_EDMA_0] = DMA_CORE_ID_EDMA2, 1928 [GAUDI2_DCORE1_ENGINE_ID_EDMA_1] = DMA_CORE_ID_EDMA3, 1929 [GAUDI2_DCORE2_ENGINE_ID_EDMA_0] = DMA_CORE_ID_EDMA4, 1930 [GAUDI2_DCORE2_ENGINE_ID_EDMA_1] = DMA_CORE_ID_EDMA5, 1931 [GAUDI2_DCORE3_ENGINE_ID_EDMA_0] = DMA_CORE_ID_EDMA6, 1932 [GAUDI2_DCORE3_ENGINE_ID_EDMA_1] = DMA_CORE_ID_EDMA7, 1933 [GAUDI2_ENGINE_ID_KDMA] = DMA_CORE_ID_KDMA, 1934 }; 1935 1936 const u32 edma_stream_base[NUM_OF_EDMA_PER_DCORE * NUM_OF_DCORES] = { 1937 GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0, 1938 GAUDI2_QUEUE_ID_DCORE0_EDMA_1_0, 1939 GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0, 1940 GAUDI2_QUEUE_ID_DCORE1_EDMA_1_0, 1941 GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0, 1942 GAUDI2_QUEUE_ID_DCORE2_EDMA_1_0, 1943 GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0, 1944 GAUDI2_QUEUE_ID_DCORE3_EDMA_1_0, 1945 }; 1946 1947 static const char gaudi2_vdec_irq_name[GAUDI2_VDEC_MSIX_ENTRIES][GAUDI2_MAX_STRING_LEN] = { 1948 "gaudi2 vdec 0_0", "gaudi2 vdec 0_0 abnormal", 1949 "gaudi2 vdec 0_1", 
"gaudi2 vdec 0_1 abnormal", 1950 "gaudi2 vdec 1_0", "gaudi2 vdec 1_0 abnormal", 1951 "gaudi2 vdec 1_1", "gaudi2 vdec 1_1 abnormal", 1952 "gaudi2 vdec 2_0", "gaudi2 vdec 2_0 abnormal", 1953 "gaudi2 vdec 2_1", "gaudi2 vdec 2_1 abnormal", 1954 "gaudi2 vdec 3_0", "gaudi2 vdec 3_0 abnormal", 1955 "gaudi2 vdec 3_1", "gaudi2 vdec 3_1 abnormal", 1956 "gaudi2 vdec s_0", "gaudi2 vdec s_0 abnormal", 1957 "gaudi2 vdec s_1", "gaudi2 vdec s_1 abnormal" 1958 }; 1959 1960 enum rtr_id { 1961 DCORE0_RTR0, 1962 DCORE0_RTR1, 1963 DCORE0_RTR2, 1964 DCORE0_RTR3, 1965 DCORE0_RTR4, 1966 DCORE0_RTR5, 1967 DCORE0_RTR6, 1968 DCORE0_RTR7, 1969 DCORE1_RTR0, 1970 DCORE1_RTR1, 1971 DCORE1_RTR2, 1972 DCORE1_RTR3, 1973 DCORE1_RTR4, 1974 DCORE1_RTR5, 1975 DCORE1_RTR6, 1976 DCORE1_RTR7, 1977 DCORE2_RTR0, 1978 DCORE2_RTR1, 1979 DCORE2_RTR2, 1980 DCORE2_RTR3, 1981 DCORE2_RTR4, 1982 DCORE2_RTR5, 1983 DCORE2_RTR6, 1984 DCORE2_RTR7, 1985 DCORE3_RTR0, 1986 DCORE3_RTR1, 1987 DCORE3_RTR2, 1988 DCORE3_RTR3, 1989 DCORE3_RTR4, 1990 DCORE3_RTR5, 1991 DCORE3_RTR6, 1992 DCORE3_RTR7, 1993 }; 1994 1995 static const u32 gaudi2_tpc_initiator_hbw_rtr_id[NUM_OF_TPC_PER_DCORE * NUM_OF_DCORES + 1] = { 1996 DCORE0_RTR1, DCORE0_RTR1, DCORE0_RTR2, DCORE0_RTR2, DCORE0_RTR3, DCORE0_RTR3, 1997 DCORE1_RTR6, DCORE1_RTR6, DCORE1_RTR5, DCORE1_RTR5, DCORE1_RTR4, DCORE1_RTR4, 1998 DCORE2_RTR3, DCORE2_RTR3, DCORE2_RTR2, DCORE2_RTR2, DCORE2_RTR1, DCORE2_RTR1, 1999 DCORE3_RTR4, DCORE3_RTR4, DCORE3_RTR5, DCORE3_RTR5, DCORE3_RTR6, DCORE3_RTR6, 2000 DCORE0_RTR0 2001 }; 2002 2003 static const u32 gaudi2_tpc_initiator_lbw_rtr_id[NUM_OF_TPC_PER_DCORE * NUM_OF_DCORES + 1] = { 2004 DCORE0_RTR1, DCORE0_RTR1, DCORE0_RTR1, DCORE0_RTR1, DCORE0_RTR2, DCORE0_RTR2, 2005 DCORE1_RTR7, DCORE1_RTR7, DCORE1_RTR6, DCORE1_RTR6, DCORE1_RTR5, DCORE1_RTR5, 2006 DCORE2_RTR2, DCORE2_RTR2, DCORE2_RTR1, DCORE2_RTR1, DCORE2_RTR0, DCORE2_RTR0, 2007 DCORE3_RTR5, DCORE3_RTR5, DCORE3_RTR6, DCORE3_RTR6, DCORE3_RTR7, DCORE3_RTR7, 2008 DCORE0_RTR0 2009 }; 2010 2011 static const u32 gaudi2_dec_initiator_hbw_rtr_id[NUMBER_OF_DEC] = { 2012 DCORE0_RTR0, DCORE0_RTR0, DCORE1_RTR7, DCORE1_RTR7, DCORE2_RTR0, DCORE2_RTR0, 2013 DCORE3_RTR7, DCORE3_RTR7, DCORE0_RTR0, DCORE0_RTR0 2014 }; 2015 2016 static const u32 gaudi2_dec_initiator_lbw_rtr_id[NUMBER_OF_DEC] = { 2017 DCORE0_RTR1, DCORE0_RTR1, DCORE1_RTR6, DCORE1_RTR6, DCORE2_RTR1, DCORE2_RTR1, 2018 DCORE3_RTR6, DCORE3_RTR6, DCORE0_RTR0, DCORE0_RTR0 2019 }; 2020 2021 static const u32 gaudi2_nic_initiator_hbw_rtr_id[NIC_NUMBER_OF_MACROS] = { 2022 DCORE1_RTR7, DCORE1_RTR7, DCORE1_RTR7, DCORE1_RTR7, DCORE1_RTR7, DCORE2_RTR0, 2023 DCORE2_RTR0, DCORE2_RTR0, DCORE2_RTR0, DCORE3_RTR7, DCORE3_RTR7, DCORE3_RTR7 2024 }; 2025 2026 static const u32 gaudi2_nic_initiator_lbw_rtr_id[NIC_NUMBER_OF_MACROS] = { 2027 DCORE1_RTR7, DCORE1_RTR7, DCORE1_RTR7, DCORE1_RTR7, DCORE1_RTR7, DCORE2_RTR0, 2028 DCORE2_RTR0, DCORE2_RTR0, DCORE2_RTR0, DCORE3_RTR7, DCORE3_RTR7, DCORE3_RTR7 2029 }; 2030 2031 static const u32 gaudi2_edma_initiator_hbw_sft[NUM_OF_EDMA_PER_DCORE * NUM_OF_DCORES] = { 2032 mmSFT0_HBW_RTR_IF1_MSTR_IF_RR_SHRD_HBW_BASE, 2033 mmSFT0_HBW_RTR_IF0_MSTR_IF_RR_SHRD_HBW_BASE, 2034 mmSFT1_HBW_RTR_IF1_MSTR_IF_RR_SHRD_HBW_BASE, 2035 mmSFT1_HBW_RTR_IF0_MSTR_IF_RR_SHRD_HBW_BASE, 2036 mmSFT2_HBW_RTR_IF0_MSTR_IF_RR_SHRD_HBW_BASE, 2037 mmSFT2_HBW_RTR_IF1_MSTR_IF_RR_SHRD_HBW_BASE, 2038 mmSFT3_HBW_RTR_IF0_MSTR_IF_RR_SHRD_HBW_BASE, 2039 mmSFT3_HBW_RTR_IF1_MSTR_IF_RR_SHRD_HBW_BASE 2040 }; 2041 2042 static const u32 gaudi2_pdma_initiator_hbw_rtr_id[NUM_OF_PDMA] = { 2043 DCORE0_RTR0, 
DCORE0_RTR0
};

static const u32 gaudi2_pdma_initiator_lbw_rtr_id[NUM_OF_PDMA] = {
	DCORE0_RTR2, DCORE0_RTR2
};

static const u32 gaudi2_rot_initiator_hbw_rtr_id[NUM_OF_ROT] = {
	DCORE2_RTR0, DCORE3_RTR7
};

static const u32 gaudi2_rot_initiator_lbw_rtr_id[NUM_OF_ROT] = {
	DCORE2_RTR2, DCORE3_RTR5
};

struct mme_initiators_rtr_id {
	u32 wap0;
	u32 wap1;
	u32 write;
	u32 read;
	u32 sbte0;
	u32 sbte1;
	u32 sbte2;
	u32 sbte3;
	u32 sbte4;
};

enum mme_initiators {
	MME_WAP0 = 0,
	MME_WAP1,
	MME_WRITE,
	MME_READ,
	MME_SBTE0,
	MME_SBTE1,
	MME_SBTE2,
	MME_SBTE3,
	MME_SBTE4,
	MME_INITIATORS_MAX
};

static const struct mme_initiators_rtr_id
gaudi2_mme_initiator_rtr_id[NUM_OF_MME_PER_DCORE * NUM_OF_DCORES] = {
	{ .wap0 = 5, .wap1 = 7, .write = 6, .read = 7,
	.sbte0 = 7, .sbte1 = 4, .sbte2 = 4, .sbte3 = 5, .sbte4 = 6},
	{ .wap0 = 10, .wap1 = 8, .write = 9, .read = 8,
	.sbte0 = 11, .sbte1 = 11, .sbte2 = 10, .sbte3 = 9, .sbte4 = 8},
	{ .wap0 = 21, .wap1 = 23, .write = 22, .read = 23,
	.sbte0 = 20, .sbte1 = 20, .sbte2 = 21, .sbte3 = 22, .sbte4 = 23},
	{ .wap0 = 30, .wap1 = 28, .write = 29, .read = 30,
	.sbte0 = 31, .sbte1 = 31, .sbte2 = 30, .sbte3 = 29, .sbte4 = 28},
};

enum razwi_event_sources {
	RAZWI_TPC,
	RAZWI_MME,
	RAZWI_EDMA,
	RAZWI_PDMA,
	RAZWI_NIC,
	RAZWI_DEC,
	RAZWI_ROT,
	RAZWI_ARC_FARM
};

struct hbm_mc_error_causes {
	u32 mask;
	char cause[50];
};

static struct hl_special_block_info gaudi2_special_blocks[] = GAUDI2_SPECIAL_BLOCKS;

/* The special blocks iterator is currently used to configure the security protection bits
 * and to read global errors. Most HW blocks are addressable; those that aren't (N/A)
 * must be skipped. The following configurations are commonly used for both the PB config
 * and the global error reading, since they currently share the same settings.
 * Once that changes, we must remember to use a separate configuration for each.
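 * The gaudi2_iterator_skip_block_types[] and gaudi2_iterator_skip_block_ranges[] arrays
 * below hold, respectively, the block types and the PSOC/CPU address ranges that the
 * iterator must skip.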
2118 */ 2119 static int gaudi2_iterator_skip_block_types[] = { 2120 GAUDI2_BLOCK_TYPE_PLL, 2121 GAUDI2_BLOCK_TYPE_EU_BIST, 2122 GAUDI2_BLOCK_TYPE_HBM, 2123 GAUDI2_BLOCK_TYPE_XFT 2124 }; 2125 2126 static struct range gaudi2_iterator_skip_block_ranges[] = { 2127 /* Skip all PSOC blocks except for PSOC_GLOBAL_CONF */ 2128 {mmPSOC_I2C_M0_BASE, mmPSOC_EFUSE_BASE}, 2129 {mmPSOC_BTL_BASE, mmPSOC_MSTR_IF_RR_SHRD_HBW_BASE}, 2130 /* Skip all CPU blocks except for CPU_IF */ 2131 {mmCPU_CA53_CFG_BASE, mmCPU_CA53_CFG_BASE}, 2132 {mmCPU_TIMESTAMP_BASE, mmCPU_MSTR_IF_RR_SHRD_HBW_BASE} 2133 }; 2134 2135 static struct hbm_mc_error_causes hbm_mc_spi[GAUDI2_NUM_OF_HBM_MC_SPI_CAUSE] = { 2136 {HBM_MC_SPI_TEMP_PIN_CHG_MASK, "temperature pins changed"}, 2137 {HBM_MC_SPI_THR_ENG_MASK, "temperature-based throttling engaged"}, 2138 {HBM_MC_SPI_THR_DIS_ENG_MASK, "temperature-based throttling disengaged"}, 2139 {HBM_MC_SPI_IEEE1500_COMP_MASK, "IEEE1500 op comp"}, 2140 {HBM_MC_SPI_IEEE1500_PAUSED_MASK, "IEEE1500 op paused"}, 2141 }; 2142 2143 static const char * const hbm_mc_sei_cause[GAUDI2_NUM_OF_HBM_SEI_CAUSE] = { 2144 [HBM_SEI_CMD_PARITY_EVEN] = "SEI C/A parity even", 2145 [HBM_SEI_CMD_PARITY_ODD] = "SEI C/A parity odd", 2146 [HBM_SEI_READ_ERR] = "SEI read data error", 2147 [HBM_SEI_WRITE_DATA_PARITY_ERR] = "SEI write data parity error", 2148 [HBM_SEI_CATTRIP] = "SEI CATTRIP asserted", 2149 [HBM_SEI_MEM_BIST_FAIL] = "SEI memory BIST fail", 2150 [HBM_SEI_DFI] = "SEI DFI error", 2151 [HBM_SEI_INV_TEMP_READ_OUT] = "SEI invalid temp read", 2152 [HBM_SEI_BIST_FAIL] = "SEI BIST fail" 2153 }; 2154 2155 struct mmu_spi_sei_cause { 2156 char cause[50]; 2157 int clear_bit; 2158 }; 2159 2160 static const struct mmu_spi_sei_cause gaudi2_mmu_spi_sei[GAUDI2_NUM_OF_MMU_SPI_SEI_CAUSE] = { 2161 {"page fault", 1}, /* INTERRUPT_CLR[1] */ 2162 {"page access", 1}, /* INTERRUPT_CLR[1] */ 2163 {"bypass ddr", 2}, /* INTERRUPT_CLR[2] */ 2164 {"multi hit", 2}, /* INTERRUPT_CLR[2] */ 2165 {"mmu rei0", -1}, /* no clear register bit */ 2166 {"mmu rei1", -1}, /* no clear register bit */ 2167 {"stlb rei0", -1}, /* no clear register bit */ 2168 {"stlb rei1", -1}, /* no clear register bit */ 2169 {"rr privileged write hit", 2}, /* INTERRUPT_CLR[2] */ 2170 {"rr privileged read hit", 2}, /* INTERRUPT_CLR[2] */ 2171 {"rr secure write hit", 2}, /* INTERRUPT_CLR[2] */ 2172 {"rr secure read hit", 2}, /* INTERRUPT_CLR[2] */ 2173 {"bist_fail no use", 2}, /* INTERRUPT_CLR[2] */ 2174 {"bist_fail no use", 2}, /* INTERRUPT_CLR[2] */ 2175 {"bist_fail no use", 2}, /* INTERRUPT_CLR[2] */ 2176 {"bist_fail no use", 2}, /* INTERRUPT_CLR[2] */ 2177 {"slave error", 16}, /* INTERRUPT_CLR[16] */ 2178 {"dec error", 17}, /* INTERRUPT_CLR[17] */ 2179 {"burst fifo full", 2} /* INTERRUPT_CLR[2] */ 2180 }; 2181 2182 struct gaudi2_cache_invld_params { 2183 u64 start_va; 2184 u64 end_va; 2185 u32 inv_start_val; 2186 u32 flags; 2187 bool range_invalidation; 2188 }; 2189 2190 struct gaudi2_tpc_idle_data { 2191 struct engines_data *e; 2192 unsigned long *mask; 2193 bool *is_idle; 2194 const char *tpc_fmt; 2195 }; 2196 2197 struct gaudi2_tpc_mmu_data { 2198 u32 rw_asid; 2199 }; 2200 2201 static s64 gaudi2_state_dump_specs_props[SP_MAX] = {0}; 2202 2203 static int gaudi2_memset_device_memory(struct hl_device *hdev, u64 addr, u64 size, u64 val); 2204 static bool gaudi2_is_queue_enabled(struct hl_device *hdev, u32 hw_queue_id); 2205 static bool gaudi2_is_arc_enabled(struct hl_device *hdev, u64 arc_id); 2206 static void gaudi2_clr_arc_id_cap(struct hl_device *hdev, u64 arc_id); 2207 
static void gaudi2_set_arc_id_cap(struct hl_device *hdev, u64 arc_id); 2208 static void gaudi2_memset_device_lbw(struct hl_device *hdev, u32 addr, u32 size, u32 val); 2209 static int gaudi2_send_job_to_kdma(struct hl_device *hdev, u64 src_addr, u64 dst_addr, u32 size, 2210 bool is_memset); 2211 static bool gaudi2_get_tpc_idle_status(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 2212 struct engines_data *e); 2213 static bool gaudi2_get_mme_idle_status(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 2214 struct engines_data *e); 2215 static bool gaudi2_get_edma_idle_status(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 2216 struct engines_data *e); 2217 static u64 gaudi2_mmu_scramble_addr(struct hl_device *hdev, u64 raw_addr); 2218 static u64 gaudi2_mmu_descramble_addr(struct hl_device *hdev, u64 scrambled_addr); 2219 2220 static void gaudi2_init_scrambler_hbm(struct hl_device *hdev) 2221 { 2222 2223 } 2224 2225 static u32 gaudi2_get_signal_cb_size(struct hl_device *hdev) 2226 { 2227 return sizeof(struct packet_msg_short); 2228 } 2229 2230 static u32 gaudi2_get_wait_cb_size(struct hl_device *hdev) 2231 { 2232 return sizeof(struct packet_msg_short) * 4 + sizeof(struct packet_fence); 2233 } 2234 2235 void gaudi2_iterate_tpcs(struct hl_device *hdev, struct iterate_module_ctx *ctx) 2236 { 2237 struct asic_fixed_properties *prop = &hdev->asic_prop; 2238 int dcore, inst, tpc_seq; 2239 u32 offset; 2240 2241 /* init the return code */ 2242 ctx->rc = 0; 2243 2244 for (dcore = 0; dcore < NUM_OF_DCORES; dcore++) { 2245 for (inst = 0; inst < NUM_OF_TPC_PER_DCORE; inst++) { 2246 tpc_seq = dcore * NUM_OF_TPC_PER_DCORE + inst; 2247 2248 if (!(prop->tpc_enabled_mask & BIT(tpc_seq))) 2249 continue; 2250 2251 offset = (DCORE_OFFSET * dcore) + (DCORE_TPC_OFFSET * inst); 2252 2253 ctx->fn(hdev, dcore, inst, offset, ctx); 2254 if (ctx->rc) { 2255 dev_err(hdev->dev, "TPC iterator failed for DCORE%d TPC%d\n", 2256 dcore, inst); 2257 return; 2258 } 2259 } 2260 } 2261 2262 if (!(prop->tpc_enabled_mask & BIT(TPC_ID_DCORE0_TPC6))) 2263 return; 2264 2265 /* special check for PCI TPC (DCORE0_TPC6) */ 2266 offset = DCORE_TPC_OFFSET * (NUM_DCORE0_TPC - 1); 2267 ctx->fn(hdev, 0, NUM_DCORE0_TPC - 1, offset, ctx); 2268 if (ctx->rc) 2269 dev_err(hdev->dev, "TPC iterator failed for DCORE0 TPC6\n"); 2270 } 2271 2272 static bool gaudi2_host_phys_addr_valid(u64 addr) 2273 { 2274 if ((addr < HOST_PHYS_BASE_0 + HOST_PHYS_SIZE_0) || (addr >= HOST_PHYS_BASE_1)) 2275 return true; 2276 2277 return false; 2278 } 2279 2280 static int set_number_of_functional_hbms(struct hl_device *hdev) 2281 { 2282 struct asic_fixed_properties *prop = &hdev->asic_prop; 2283 u8 faulty_hbms = hweight64(hdev->dram_binning); 2284 2285 /* check if all HBMs should be used */ 2286 if (!faulty_hbms) { 2287 dev_dbg(hdev->dev, "All HBM are in use (no binning)\n"); 2288 prop->num_functional_hbms = GAUDI2_HBM_NUM; 2289 return 0; 2290 } 2291 2292 /* 2293 * check for error condition in which number of binning 2294 * candidates is higher than the maximum supported by the 2295 * driver (in which case binning mask shall be ignored and driver will 2296 * set the default) 2297 */ 2298 if (faulty_hbms > MAX_FAULTY_HBMS) { 2299 dev_err(hdev->dev, 2300 "HBM binning supports max of %d faulty HBMs, supplied mask 0x%llx.\n", 2301 MAX_FAULTY_HBMS, hdev->dram_binning); 2302 return -EINVAL; 2303 } 2304 2305 /* 2306 * by default, number of functional HBMs in Gaudi2 is always 2307 * GAUDI2_HBM_NUM - 1. 
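 * (we only reach this point when faulty_hbms is non-zero; assuming MAX_FAULTY_HBMS
 * is 1, like the other binning limits defined above, the subtraction below therefore
 * always yields GAUDI2_HBM_NUM - 1)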
 */
	prop->num_functional_hbms = GAUDI2_HBM_NUM - faulty_hbms;
	return 0;
}

static bool gaudi2_is_edma_queue_id(u32 queue_id)
{
	switch (queue_id) {
	case GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE0_EDMA_1_3:
	case GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE1_EDMA_1_3:
	case GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE2_EDMA_1_3:
	case GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE3_EDMA_1_3:
		return true;
	default:
		return false;
	}
}

static int gaudi2_set_dram_properties(struct hl_device *hdev)
{
	struct asic_fixed_properties *prop = &hdev->asic_prop;
	u64 hbm_drv_base_offset = 0, edma_pq_base_addr;
	u32 basic_hbm_page_size, edma_idx = 0;
	int rc, i;

	rc = set_number_of_functional_hbms(hdev);
	if (rc)
		return -EINVAL;

	/*
	 * Due to a HW bug in which the TLB size is 16x smaller than expected, we use a
	 * workaround in which we use a 16x bigger page size, so that the entire HBM
	 * mapping can still be populated in the TLB.
	 */
	basic_hbm_page_size = prop->num_functional_hbms * SZ_8M;
	prop->dram_page_size = GAUDI2_COMPENSATE_TLB_PAGE_SIZE_FACTOR * basic_hbm_page_size;
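	/* For example (assuming GAUDI2_HBM_NUM is 6 and all HBMs are functional):
	 * basic_hbm_page_size = 6 * 8MB = 48MB, and the compensated DRAM page size
	 * becomes 16 * 48MB = 768MB.
	 */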
	prop->device_mem_alloc_default_page_size = prop->dram_page_size;
	prop->dram_size = prop->num_functional_hbms * SZ_16G;
	prop->dram_base_address = DRAM_PHYS_BASE;
	prop->dram_end_address = prop->dram_base_address + prop->dram_size;
	prop->dram_supports_virtual_memory = true;

	prop->dram_user_base_address = DRAM_PHYS_BASE + prop->dram_page_size;
	prop->dram_hints_align_mask = ~GAUDI2_HBM_MMU_SCRM_ADDRESS_MASK;
	prop->hints_dram_reserved_va_range.start_addr = RESERVED_VA_RANGE_FOR_ARC_ON_HBM_START;
	prop->hints_dram_reserved_va_range.end_addr = RESERVED_VA_RANGE_FOR_ARC_ON_HBM_END;

	/* Since the DRAM page size differs from the DMMU page size, we need to allocate
	 * DRAM memory in units of dram_page_size and map this memory in units of the
	 * DMMU page size. We overcome this size mismatch using a scrambling routine
	 * which takes a DRAM page and converts it to a DMMU page.
	 * We therefore:
	 * 1. partition the virtual address space into DRAM-page (whole) pages.
	 *    (suppose we get n such pages)
	 * 2. limit the amount of virtual address space we got from 1 above to
	 *    a multiple of 64M, as we don't want the scrambled address to cross
	 *    the DRAM virtual address space.
	 *    ( m = (n * DRAM_page_size) / DMMU_page_size).
	 * 3. determine the end address accordingly:
	 *    end_addr = start_addr + m * 48M
	 *
	 * the DRAM address MSBs (63:48) are not part of the roundup calculation
	 */
	prop->dmmu.start_addr = prop->dram_base_address +
				(prop->dram_page_size *
				DIV_ROUND_UP_SECTOR_T(prop->dram_size, prop->dram_page_size));
	prop->dmmu.end_addr = prop->dmmu.start_addr + prop->dram_page_size *
			div_u64((VA_HBM_SPACE_END - prop->dmmu.start_addr), prop->dmmu.page_size);

	/*
	 * The driver can't share a (48MB) HBM page with the F/W, to prevent the F/W from
	 * blocking the driver part via a range register, so the driver part must start at
	 * the next (48MB) page.
	 */
	hbm_drv_base_offset = roundup(CPU_FW_IMAGE_SIZE, prop->num_functional_hbms * SZ_8M);

	/*
	 * The NIC driver section size and the HMMU page tables section in the HBM need
	 * to be the remaining size in the first DRAM page after taking into
	 * account the F/W image size.
	 */

	/* Reserve a region in the HBM for the HMMU page tables */
	prop->mmu_pgt_addr = DRAM_PHYS_BASE + hbm_drv_base_offset +
				((prop->dram_page_size - hbm_drv_base_offset) -
				(HMMU_PAGE_TABLES_SIZE + EDMA_PQS_SIZE + EDMA_SCRATCHPAD_SIZE));

	/* Set the EDMA PQs HBM addresses */
	edma_pq_base_addr = prop->mmu_pgt_addr + HMMU_PAGE_TABLES_SIZE;

	for (i = 0 ; i < GAUDI2_QUEUE_ID_CPU_PQ ; i++) {
		if (gaudi2_is_edma_queue_id(i)) {
			prop->hw_queues_props[i].q_dram_bd_address = edma_pq_base_addr +
							(edma_idx * HL_QUEUE_SIZE_IN_BYTES);
			edma_idx++;
		}
	}

	return 0;
}
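/*
 * Note: the DRAM properties setup above assigns per-queue DRAM BD addresses for the
 * EDMA queues, so the HW queue properties array must already be allocated and
 * initialized when set_dram_properties() is invoked below.
 */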
SRAM_SIZE; 2461 prop->sram_end_address = prop->sram_base_address + prop->sram_size; 2462 prop->sram_user_base_address = prop->sram_base_address + SRAM_USER_BASE_OFFSET; 2463 2464 prop->hints_range_reservation = true; 2465 2466 prop->rotator_enabled_mask = BIT(NUM_OF_ROT) - 1; 2467 2468 prop->max_asid = 2; 2469 2470 prop->dmmu.pgt_size = HMMU_PAGE_TABLES_SIZE; 2471 prop->mmu_pte_size = HL_PTE_SIZE; 2472 2473 prop->dmmu.hop_shifts[MMU_HOP0] = DHOP0_SHIFT; 2474 prop->dmmu.hop_shifts[MMU_HOP1] = DHOP1_SHIFT; 2475 prop->dmmu.hop_shifts[MMU_HOP2] = DHOP2_SHIFT; 2476 prop->dmmu.hop_shifts[MMU_HOP3] = DHOP3_SHIFT; 2477 prop->dmmu.hop_masks[MMU_HOP0] = DHOP0_MASK; 2478 prop->dmmu.hop_masks[MMU_HOP1] = DHOP1_MASK; 2479 prop->dmmu.hop_masks[MMU_HOP2] = DHOP2_MASK; 2480 prop->dmmu.hop_masks[MMU_HOP3] = DHOP3_MASK; 2481 prop->dmmu.page_size = PAGE_SIZE_1GB; 2482 prop->dmmu.num_hops = MMU_ARCH_4_HOPS; 2483 prop->dmmu.last_mask = LAST_MASK; 2484 prop->dmmu.host_resident = 0; 2485 prop->dmmu.hop_table_size = HOP_TABLE_SIZE_512_PTE; 2486 prop->dmmu.hop0_tables_total_size = HOP_TABLE_SIZE_512_PTE * prop->max_asid; 2487 2488 /* As we need to set the pgt address in dram for HMMU init so we cannot 2489 * wait to the fw cpucp info to set the dram props as mmu init comes before 2490 * hw init 2491 */ 2492 rc = hdev->asic_funcs->set_dram_properties(hdev); 2493 if (rc) 2494 goto free_qprops; 2495 2496 prop->mmu_pgt_size = PMMU_PAGE_TABLES_SIZE; 2497 2498 prop->pmmu.pgt_size = prop->mmu_pgt_size; 2499 hdev->pmmu_huge_range = true; 2500 prop->pmmu.host_resident = 1; 2501 prop->pmmu.num_hops = MMU_ARCH_6_HOPS; 2502 prop->pmmu.last_mask = LAST_MASK; 2503 prop->pmmu.hop_table_size = HOP_TABLE_SIZE_512_PTE; 2504 prop->pmmu.hop0_tables_total_size = HOP_TABLE_SIZE_512_PTE * prop->max_asid; 2505 2506 prop->hints_host_reserved_va_range.start_addr = RESERVED_VA_FOR_VIRTUAL_MSIX_DOORBELL_START; 2507 prop->hints_host_reserved_va_range.end_addr = RESERVED_VA_RANGE_FOR_ARC_ON_HOST_END; 2508 prop->hints_host_hpage_reserved_va_range.start_addr = 2509 RESERVED_VA_RANGE_FOR_ARC_ON_HOST_HPAGE_START; 2510 prop->hints_host_hpage_reserved_va_range.end_addr = 2511 RESERVED_VA_RANGE_FOR_ARC_ON_HOST_HPAGE_END; 2512 2513 if (PAGE_SIZE == SZ_64K) { 2514 prop->pmmu.hop_shifts[MMU_HOP0] = HOP0_SHIFT_64K; 2515 prop->pmmu.hop_shifts[MMU_HOP1] = HOP1_SHIFT_64K; 2516 prop->pmmu.hop_shifts[MMU_HOP2] = HOP2_SHIFT_64K; 2517 prop->pmmu.hop_shifts[MMU_HOP3] = HOP3_SHIFT_64K; 2518 prop->pmmu.hop_shifts[MMU_HOP4] = HOP4_SHIFT_64K; 2519 prop->pmmu.hop_shifts[MMU_HOP5] = HOP5_SHIFT_64K; 2520 prop->pmmu.hop_masks[MMU_HOP0] = HOP0_MASK_64K; 2521 prop->pmmu.hop_masks[MMU_HOP1] = HOP1_MASK_64K; 2522 prop->pmmu.hop_masks[MMU_HOP2] = HOP2_MASK_64K; 2523 prop->pmmu.hop_masks[MMU_HOP3] = HOP3_MASK_64K; 2524 prop->pmmu.hop_masks[MMU_HOP4] = HOP4_MASK_64K; 2525 prop->pmmu.hop_masks[MMU_HOP5] = HOP5_MASK_64K; 2526 prop->pmmu.start_addr = VA_HOST_SPACE_PAGE_START; 2527 prop->pmmu.end_addr = VA_HOST_SPACE_PAGE_END; 2528 prop->pmmu.page_size = PAGE_SIZE_64KB; 2529 2530 /* shifts and masks are the same in PMMU and HPMMU */ 2531 memcpy(&prop->pmmu_huge, &prop->pmmu, sizeof(prop->pmmu)); 2532 prop->pmmu_huge.page_size = PAGE_SIZE_16MB; 2533 prop->pmmu_huge.start_addr = VA_HOST_SPACE_HPAGE_START; 2534 prop->pmmu_huge.end_addr = VA_HOST_SPACE_HPAGE_END; 2535 } else { 2536 prop->pmmu.hop_shifts[MMU_HOP0] = HOP0_SHIFT_4K; 2537 prop->pmmu.hop_shifts[MMU_HOP1] = HOP1_SHIFT_4K; 2538 prop->pmmu.hop_shifts[MMU_HOP2] = HOP2_SHIFT_4K; 2539 prop->pmmu.hop_shifts[MMU_HOP3] = 
HOP3_SHIFT_4K; 2540 prop->pmmu.hop_shifts[MMU_HOP4] = HOP4_SHIFT_4K; 2541 prop->pmmu.hop_shifts[MMU_HOP5] = HOP5_SHIFT_4K; 2542 prop->pmmu.hop_masks[MMU_HOP0] = HOP0_MASK_4K; 2543 prop->pmmu.hop_masks[MMU_HOP1] = HOP1_MASK_4K; 2544 prop->pmmu.hop_masks[MMU_HOP2] = HOP2_MASK_4K; 2545 prop->pmmu.hop_masks[MMU_HOP3] = HOP3_MASK_4K; 2546 prop->pmmu.hop_masks[MMU_HOP4] = HOP4_MASK_4K; 2547 prop->pmmu.hop_masks[MMU_HOP5] = HOP5_MASK_4K; 2548 prop->pmmu.start_addr = VA_HOST_SPACE_PAGE_START; 2549 prop->pmmu.end_addr = VA_HOST_SPACE_PAGE_END; 2550 prop->pmmu.page_size = PAGE_SIZE_4KB; 2551 2552 /* shifts and masks are the same in PMMU and HPMMU */ 2553 memcpy(&prop->pmmu_huge, &prop->pmmu, sizeof(prop->pmmu)); 2554 prop->pmmu_huge.page_size = PAGE_SIZE_2MB; 2555 prop->pmmu_huge.start_addr = VA_HOST_SPACE_HPAGE_START; 2556 prop->pmmu_huge.end_addr = VA_HOST_SPACE_HPAGE_END; 2557 } 2558 2559 prop->max_num_of_engines = GAUDI2_ENGINE_ID_SIZE; 2560 prop->num_engine_cores = CPU_ID_MAX; 2561 prop->cfg_size = CFG_SIZE; 2562 prop->num_of_events = GAUDI2_EVENT_SIZE; 2563 2564 prop->supports_engine_modes = true; 2565 2566 prop->dc_power_default = DC_POWER_DEFAULT; 2567 2568 prop->cb_pool_cb_cnt = GAUDI2_CB_POOL_CB_CNT; 2569 prop->cb_pool_cb_size = GAUDI2_CB_POOL_CB_SIZE; 2570 prop->pcie_dbi_base_address = CFG_BASE + mmPCIE_DBI_BASE; 2571 prop->pcie_aux_dbi_reg_addr = CFG_BASE + mmPCIE_AUX_DBI; 2572 2573 strscpy_pad(prop->cpucp_info.card_name, GAUDI2_DEFAULT_CARD_NAME, CARD_NAME_MAX_LEN); 2574 2575 prop->mme_master_slave_mode = 1; 2576 2577 prop->first_available_user_sob[0] = GAUDI2_RESERVED_SOB_NUMBER + 2578 (num_sync_stream_queues * HL_RSVD_SOBS); 2579 2580 prop->first_available_user_mon[0] = GAUDI2_RESERVED_MON_NUMBER + 2581 (num_sync_stream_queues * HL_RSVD_MONS); 2582 2583 prop->first_available_user_interrupt = GAUDI2_IRQ_NUM_USER_FIRST; 2584 prop->tpc_interrupt_id = GAUDI2_IRQ_NUM_TPC_ASSERT; 2585 prop->eq_interrupt_id = GAUDI2_IRQ_NUM_EVENT_QUEUE; 2586 2587 prop->first_available_cq[0] = GAUDI2_RESERVED_CQ_NUMBER; 2588 2589 prop->fw_cpu_boot_dev_sts0_valid = false; 2590 prop->fw_cpu_boot_dev_sts1_valid = false; 2591 prop->hard_reset_done_by_fw = false; 2592 prop->gic_interrupts_enable = true; 2593 2594 prop->server_type = HL_SERVER_TYPE_UNKNOWN; 2595 2596 prop->max_dec = NUMBER_OF_DEC; 2597 2598 prop->clk_pll_index = HL_GAUDI2_MME_PLL; 2599 2600 prop->dma_mask = 64; 2601 2602 prop->hbw_flush_reg = mmPCIE_WRAP_SPECIAL_GLBL_SPARE_0; 2603 2604 return 0; 2605 2606 free_qprops: 2607 kfree(prop->hw_queues_props); 2608 return rc; 2609 } 2610 2611 static int gaudi2_pci_bars_map(struct hl_device *hdev) 2612 { 2613 static const char * const name[] = {"CFG_SRAM", "MSIX", "DRAM"}; 2614 bool is_wc[3] = {false, false, true}; 2615 int rc; 2616 2617 rc = hl_pci_bars_map(hdev, name, is_wc); 2618 if (rc) 2619 return rc; 2620 2621 hdev->rmmio = hdev->pcie_bar[SRAM_CFG_BAR_ID] + (CFG_BASE - STM_FLASH_BASE_ADDR); 2622 2623 return 0; 2624 } 2625 2626 static u64 gaudi2_set_hbm_bar_base(struct hl_device *hdev, u64 addr) 2627 { 2628 struct gaudi2_device *gaudi2 = hdev->asic_specific; 2629 struct hl_inbound_pci_region pci_region; 2630 u64 old_addr = addr; 2631 int rc; 2632 2633 if ((gaudi2) && (gaudi2->dram_bar_cur_addr == addr)) 2634 return old_addr; 2635 2636 if (hdev->asic_prop.iatu_done_by_fw) 2637 return U64_MAX; 2638 2639 /* Inbound Region 2 - Bar 4 - Point to DRAM */ 2640 pci_region.mode = PCI_BAR_MATCH_MODE; 2641 pci_region.bar = DRAM_BAR_ID; 2642 pci_region.addr = addr; 2643 rc = hl_pci_set_inbound_region(hdev, 2, 
&pci_region); 2644 if (rc) 2645 return U64_MAX; 2646 2647 if (gaudi2) { 2648 old_addr = gaudi2->dram_bar_cur_addr; 2649 gaudi2->dram_bar_cur_addr = addr; 2650 } 2651 2652 return old_addr; 2653 } 2654 2655 static int gaudi2_init_iatu(struct hl_device *hdev) 2656 { 2657 struct hl_inbound_pci_region inbound_region; 2658 struct hl_outbound_pci_region outbound_region; 2659 u32 bar_addr_low, bar_addr_high; 2660 int rc; 2661 2662 if (hdev->asic_prop.iatu_done_by_fw) 2663 return 0; 2664 2665 /* Temporary inbound Region 0 - Bar 0 - Point to CFG 2666 * We must map this region in BAR match mode in order to 2667 * fetch BAR physical base address 2668 */ 2669 inbound_region.mode = PCI_BAR_MATCH_MODE; 2670 inbound_region.bar = SRAM_CFG_BAR_ID; 2671 /* Base address must be aligned to Bar size which is 256 MB */ 2672 inbound_region.addr = STM_FLASH_BASE_ADDR - STM_FLASH_ALIGNED_OFF; 2673 rc = hl_pci_set_inbound_region(hdev, 0, &inbound_region); 2674 if (rc) 2675 return rc; 2676 2677 /* Fetch physical BAR address */ 2678 bar_addr_high = RREG32(mmPCIE_DBI_BAR1_REG + STM_FLASH_ALIGNED_OFF); 2679 bar_addr_low = RREG32(mmPCIE_DBI_BAR0_REG + STM_FLASH_ALIGNED_OFF) & ~0xF; 2680 2681 hdev->pcie_bar_phys[SRAM_CFG_BAR_ID] = (u64)bar_addr_high << 32 | bar_addr_low; 2682 2683 /* Inbound Region 0 - Bar 0 - Point to CFG */ 2684 inbound_region.mode = PCI_ADDRESS_MATCH_MODE; 2685 inbound_region.bar = SRAM_CFG_BAR_ID; 2686 inbound_region.offset_in_bar = 0; 2687 inbound_region.addr = STM_FLASH_BASE_ADDR; 2688 inbound_region.size = CFG_REGION_SIZE; 2689 rc = hl_pci_set_inbound_region(hdev, 0, &inbound_region); 2690 if (rc) 2691 return rc; 2692 2693 /* Inbound Region 1 - Bar 0 - Point to BAR0_RESERVED + SRAM */ 2694 inbound_region.mode = PCI_ADDRESS_MATCH_MODE; 2695 inbound_region.bar = SRAM_CFG_BAR_ID; 2696 inbound_region.offset_in_bar = CFG_REGION_SIZE; 2697 inbound_region.addr = BAR0_RSRVD_BASE_ADDR; 2698 inbound_region.size = BAR0_RSRVD_SIZE + SRAM_SIZE; 2699 rc = hl_pci_set_inbound_region(hdev, 1, &inbound_region); 2700 if (rc) 2701 return rc; 2702 2703 /* Inbound Region 2 - Bar 4 - Point to DRAM */ 2704 inbound_region.mode = PCI_BAR_MATCH_MODE; 2705 inbound_region.bar = DRAM_BAR_ID; 2706 inbound_region.addr = DRAM_PHYS_BASE; 2707 rc = hl_pci_set_inbound_region(hdev, 2, &inbound_region); 2708 if (rc) 2709 return rc; 2710 2711 /* Outbound Region 0 - Point to Host */ 2712 outbound_region.addr = HOST_PHYS_BASE_0; 2713 outbound_region.size = HOST_PHYS_SIZE_0; 2714 rc = hl_pci_set_outbound_region(hdev, &outbound_region); 2715 2716 return rc; 2717 } 2718 2719 static enum hl_device_hw_state gaudi2_get_hw_state(struct hl_device *hdev) 2720 { 2721 return RREG32(mmHW_STATE); 2722 } 2723 2724 static int gaudi2_tpc_binning_init_prop(struct hl_device *hdev) 2725 { 2726 struct asic_fixed_properties *prop = &hdev->asic_prop; 2727 2728 /* 2729 * check for error condition in which number of binning candidates 2730 * is higher than the maximum supported by the driver 2731 */ 2732 if (hweight64(hdev->tpc_binning) > MAX_CLUSTER_BINNING_FAULTY_TPCS) { 2733 dev_err(hdev->dev, "TPC binning is supported for max of %d faulty TPCs, provided mask 0x%llx\n", 2734 MAX_CLUSTER_BINNING_FAULTY_TPCS, 2735 hdev->tpc_binning); 2736 return -EINVAL; 2737 } 2738 2739 prop->tpc_binning_mask = hdev->tpc_binning; 2740 prop->tpc_enabled_mask = GAUDI2_TPC_FULL_MASK; 2741 2742 return 0; 2743 } 2744 2745 static int gaudi2_set_tpc_binning_masks(struct hl_device *hdev) 2746 { 2747 struct asic_fixed_properties *prop = &hdev->asic_prop; 2748 struct hw_queue_properties 
*q_props = prop->hw_queues_props;
	u64 tpc_binning_mask;
	u8 subst_idx = 0;
	int i, rc;

	rc = gaudi2_tpc_binning_init_prop(hdev);
	if (rc)
		return rc;

	tpc_binning_mask = prop->tpc_binning_mask;

	for (i = 0 ; i < MAX_FAULTY_TPCS ; i++) {
		u8 subst_seq, binned, qid_base;

		if (tpc_binning_mask == 0)
			break;

		if (subst_idx == 0) {
			subst_seq = TPC_ID_DCORE0_TPC6;
			qid_base = GAUDI2_QUEUE_ID_DCORE0_TPC_6_0;
		} else {
			subst_seq = TPC_ID_DCORE3_TPC5;
			qid_base = GAUDI2_QUEUE_ID_DCORE3_TPC_5_0;
		}

		/* clear bit from mask */
		binned = __ffs(tpc_binning_mask);
		/*
		 * Coverity complains about possible out-of-bound access in
		 * clear_bit
		 */
		if (binned >= TPC_ID_SIZE) {
			dev_err(hdev->dev,
				"Invalid binned TPC (binning mask: %llx)\n",
				tpc_binning_mask);
			return -EINVAL;
		}
		clear_bit(binned, (unsigned long *)&tpc_binning_mask);

		/* also clear replacing TPC bit from enabled mask */
		clear_bit(subst_seq, (unsigned long *)&prop->tpc_enabled_mask);

		/* bin substitute TPC's queues */
		q_props[qid_base].binned = 1;
		q_props[qid_base + 1].binned = 1;
		q_props[qid_base + 2].binned = 1;
		q_props[qid_base + 3].binned = 1;

		subst_idx++;
	}

	return 0;
}

static int gaudi2_set_dec_binning_masks(struct hl_device *hdev)
{
	struct asic_fixed_properties *prop = &hdev->asic_prop;
	u8 num_faulty;

	num_faulty = hweight32(hdev->decoder_binning);

	/*
	 * check for error condition in which number of binning candidates
	 * is higher than the maximum supported by the driver
	 */
	if (num_faulty > MAX_FAULTY_DECODERS) {
		dev_err(hdev->dev, "decoder binning is supported for max of single faulty decoder, provided mask 0x%x\n",
			hdev->decoder_binning);
		return -EINVAL;
	}

	prop->decoder_binning_mask = (hdev->decoder_binning & GAUDI2_DECODER_FULL_MASK);

	if (prop->decoder_binning_mask)
		prop->decoder_enabled_mask = (GAUDI2_DECODER_FULL_MASK & ~BIT(DEC_ID_PCIE_VDEC1));
	else
		prop->decoder_enabled_mask = GAUDI2_DECODER_FULL_MASK;

	return 0;
}

static void gaudi2_set_dram_binning_masks(struct hl_device *hdev)
{
	struct asic_fixed_properties *prop = &hdev->asic_prop;

	/* check if we should override default binning */
	if (!hdev->dram_binning) {
		prop->dram_binning_mask = 0;
		prop->dram_enabled_mask = GAUDI2_DRAM_FULL_MASK;
		return;
	}

	/* set DRAM binning constraints */
	prop->faulty_dram_cluster_map |= hdev->dram_binning;
	prop->dram_binning_mask = hdev->dram_binning;
	prop->dram_enabled_mask = GAUDI2_DRAM_FULL_MASK & ~BIT(HBM_ID5);
}

static int gaudi2_set_edma_binning_masks(struct hl_device *hdev)
{
	struct asic_fixed_properties *prop = &hdev->asic_prop;
	struct hw_queue_properties *q_props;
	u8 seq, num_faulty;

	num_faulty = hweight32(hdev->edma_binning);

	/*
	 * check for error condition in which number of binning candidates
	 * is higher than the maximum supported by the driver
	 */
	if (num_faulty > MAX_FAULTY_EDMAS) {
		dev_err(hdev->dev,
			"EDMA binning is supported for max of single faulty EDMA, provided mask 0x%x\n",
			hdev->edma_binning);
		return -EINVAL;
	}

	if (!hdev->edma_binning) {
		prop->edma_binning_mask = 0;
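		/* no EDMA binning was requested - keep all EDMA engines enabled */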
prop->edma_enabled_mask = GAUDI2_EDMA_FULL_MASK; 2869 return 0; 2870 } 2871 2872 seq = __ffs((unsigned long)hdev->edma_binning); 2873 2874 /* set binning constraints */ 2875 prop->faulty_dram_cluster_map |= BIT(edma_to_hbm_cluster[seq]); 2876 prop->edma_binning_mask = hdev->edma_binning; 2877 prop->edma_enabled_mask = GAUDI2_EDMA_FULL_MASK & ~BIT(EDMA_ID_DCORE3_INSTANCE1); 2878 2879 /* bin substitute EDMA's queue */ 2880 q_props = prop->hw_queues_props; 2881 q_props[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_0].binned = 1; 2882 q_props[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_1].binned = 1; 2883 q_props[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_2].binned = 1; 2884 q_props[GAUDI2_QUEUE_ID_DCORE3_EDMA_1_3].binned = 1; 2885 2886 return 0; 2887 } 2888 2889 static int gaudi2_set_xbar_edge_enable_mask(struct hl_device *hdev, u32 xbar_edge_iso_mask) 2890 { 2891 struct asic_fixed_properties *prop = &hdev->asic_prop; 2892 u8 num_faulty, seq; 2893 2894 /* check if we should override default binning */ 2895 if (!xbar_edge_iso_mask) { 2896 prop->xbar_edge_enabled_mask = GAUDI2_XBAR_EDGE_FULL_MASK; 2897 return 0; 2898 } 2899 2900 /* 2901 * note that it can be set to value other than 0 only after cpucp packet (i.e. 2902 * only the FW can set a redundancy value). for user it'll always be 0. 2903 */ 2904 num_faulty = hweight32(xbar_edge_iso_mask); 2905 2906 /* 2907 * check for error condition in which number of binning candidates 2908 * is higher than the maximum supported by the driver 2909 */ 2910 if (num_faulty > MAX_FAULTY_XBARS) { 2911 dev_err(hdev->dev, "we cannot have more than %d faulty XBAR EDGE\n", 2912 MAX_FAULTY_XBARS); 2913 return -EINVAL; 2914 } 2915 2916 seq = __ffs((unsigned long)xbar_edge_iso_mask); 2917 2918 /* set binning constraints */ 2919 prop->faulty_dram_cluster_map |= BIT(xbar_edge_to_hbm_cluster[seq]); 2920 prop->xbar_edge_enabled_mask = (~xbar_edge_iso_mask) & GAUDI2_XBAR_EDGE_FULL_MASK; 2921 2922 return 0; 2923 } 2924 2925 static int gaudi2_set_cluster_binning_masks_common(struct hl_device *hdev, u8 xbar_edge_iso_mask) 2926 { 2927 int rc; 2928 2929 /* 2930 * mark all clusters as good, each component will "fail" cluster 2931 * based on eFuse/user values. 
	 * If more than a single cluster is faulty, the chip is unusable
	 */
	hdev->asic_prop.faulty_dram_cluster_map = 0;

	gaudi2_set_dram_binning_masks(hdev);

	rc = gaudi2_set_edma_binning_masks(hdev);
	if (rc)
		return rc;

	rc = gaudi2_set_xbar_edge_enable_mask(hdev, xbar_edge_iso_mask);
	if (rc)
		return rc;

	/* always initially set to full mask */
	hdev->asic_prop.hmmu_hif_enabled_mask = GAUDI2_HIF_HMMU_FULL_MASK;

	return 0;
}

static int gaudi2_set_cluster_binning_masks(struct hl_device *hdev)
{
	struct asic_fixed_properties *prop = &hdev->asic_prop;
	int rc;

	rc = gaudi2_set_cluster_binning_masks_common(hdev, prop->cpucp_info.xbar_binning_mask);
	if (rc)
		return rc;

	/* if we have DRAM binning reported by FW we should perform cluster config */
	if (prop->faulty_dram_cluster_map) {
		u8 cluster_seq = __ffs((unsigned long)prop->faulty_dram_cluster_map);

		prop->hmmu_hif_enabled_mask = cluster_hmmu_hif_enabled_mask[cluster_seq];
	}

	return 0;
}

static int gaudi2_set_binning_masks(struct hl_device *hdev)
{
	int rc;

	rc = gaudi2_set_cluster_binning_masks(hdev);
	if (rc)
		return rc;

	rc = gaudi2_set_tpc_binning_masks(hdev);
	if (rc)
		return rc;

	rc = gaudi2_set_dec_binning_masks(hdev);
	if (rc)
		return rc;

	return 0;
}

static int gaudi2_cpucp_info_get(struct hl_device *hdev)
{
	struct gaudi2_device *gaudi2 = hdev->asic_specific;
	struct asic_fixed_properties *prop = &hdev->asic_prop;
	long max_power;
	u64 dram_size;
	int rc;

	if (!(gaudi2->hw_cap_initialized & HW_CAP_CPU_Q))
		return 0;

	/* No point in asking for this information again when not doing a hard reset, as the
	 * device CPU hasn't been reset
	 */
	if (hdev->reset_info.in_compute_reset)
		return 0;

	rc = hl_fw_cpucp_handshake(hdev, mmCPU_BOOT_DEV_STS0, mmCPU_BOOT_DEV_STS1, mmCPU_BOOT_ERR0,
					mmCPU_BOOT_ERR1);
	if (rc)
		return rc;

	dram_size = le64_to_cpu(prop->cpucp_info.dram_size);
	if (dram_size) {
		/* we can have either 5 or 6 HBMs. other values are invalid */

		if ((dram_size != ((GAUDI2_HBM_NUM - 1) * SZ_16G)) &&
				(dram_size != (GAUDI2_HBM_NUM * SZ_16G))) {
			dev_err(hdev->dev,
				"F/W reported invalid DRAM size %llu. 
Trying to use default size %llu\n", 3021 dram_size, prop->dram_size); 3022 dram_size = prop->dram_size; 3023 } 3024 3025 prop->dram_size = dram_size; 3026 prop->dram_end_address = prop->dram_base_address + dram_size; 3027 } 3028 3029 if (!strlen(prop->cpucp_info.card_name)) 3030 strscpy_pad(prop->cpucp_info.card_name, GAUDI2_DEFAULT_CARD_NAME, 3031 CARD_NAME_MAX_LEN); 3032 3033 /* Overwrite binning masks with the actual binning values from F/W */ 3034 hdev->dram_binning = prop->cpucp_info.dram_binning_mask; 3035 hdev->edma_binning = prop->cpucp_info.edma_binning_mask; 3036 hdev->tpc_binning = le64_to_cpu(prop->cpucp_info.tpc_binning_mask); 3037 hdev->decoder_binning = lower_32_bits(le64_to_cpu(prop->cpucp_info.decoder_binning_mask)); 3038 3039 dev_dbg(hdev->dev, "Read binning masks: tpc: 0x%llx, dram: 0x%llx, edma: 0x%x, dec: 0x%x\n", 3040 hdev->tpc_binning, hdev->dram_binning, hdev->edma_binning, 3041 hdev->decoder_binning); 3042 3043 /* 3044 * at this point the DRAM parameters need to be updated according to data obtained 3045 * from the FW 3046 */ 3047 rc = hdev->asic_funcs->set_dram_properties(hdev); 3048 if (rc) 3049 return rc; 3050 3051 rc = hdev->asic_funcs->set_binning_masks(hdev); 3052 if (rc) 3053 return rc; 3054 3055 max_power = hl_fw_get_max_power(hdev); 3056 if (max_power < 0) 3057 return max_power; 3058 3059 prop->max_power_default = (u64) max_power; 3060 3061 return 0; 3062 } 3063 3064 static int gaudi2_fetch_psoc_frequency(struct hl_device *hdev) 3065 { 3066 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3067 u16 pll_freq_arr[HL_PLL_NUM_OUTPUTS]; 3068 int rc; 3069 3070 if (!(gaudi2->hw_cap_initialized & HW_CAP_CPU_Q)) 3071 return 0; 3072 3073 rc = hl_fw_cpucp_pll_info_get(hdev, HL_GAUDI2_CPU_PLL, pll_freq_arr); 3074 if (rc) 3075 return rc; 3076 3077 hdev->asic_prop.psoc_timestamp_frequency = pll_freq_arr[3]; 3078 3079 return 0; 3080 } 3081 3082 static int gaudi2_mmu_clear_pgt_range(struct hl_device *hdev) 3083 { 3084 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3085 struct asic_fixed_properties *prop = &hdev->asic_prop; 3086 int rc; 3087 3088 if (!(gaudi2->hw_cap_initialized & HW_CAP_MMU_MASK)) 3089 return 0; 3090 3091 if (prop->dmmu.host_resident) 3092 return 0; 3093 3094 rc = gaudi2_memset_device_memory(hdev, prop->mmu_pgt_addr, prop->dmmu.pgt_size, 0); 3095 if (rc) 3096 dev_err(hdev->dev, "Failed to clear mmu pgt"); 3097 3098 return rc; 3099 } 3100 3101 static int gaudi2_early_init(struct hl_device *hdev) 3102 { 3103 struct asic_fixed_properties *prop = &hdev->asic_prop; 3104 struct pci_dev *pdev = hdev->pdev; 3105 resource_size_t pci_bar_size; 3106 int rc; 3107 3108 rc = gaudi2_set_fixed_properties(hdev); 3109 if (rc) 3110 return rc; 3111 3112 /* Check BAR sizes */ 3113 pci_bar_size = pci_resource_len(pdev, SRAM_CFG_BAR_ID); 3114 3115 if (pci_bar_size != CFG_BAR_SIZE) { 3116 dev_err(hdev->dev, "Not " HL_NAME "? BAR %d size %pa, expecting %llu\n", 3117 SRAM_CFG_BAR_ID, &pci_bar_size, CFG_BAR_SIZE); 3118 rc = -ENODEV; 3119 goto free_queue_props; 3120 } 3121 3122 pci_bar_size = pci_resource_len(pdev, MSIX_BAR_ID); 3123 if (pci_bar_size != MSIX_BAR_SIZE) { 3124 dev_err(hdev->dev, "Not " HL_NAME "? 
BAR %d size %pa, expecting %llu\n", 3125 MSIX_BAR_ID, &pci_bar_size, MSIX_BAR_SIZE); 3126 rc = -ENODEV; 3127 goto free_queue_props; 3128 } 3129 3130 prop->dram_pci_bar_size = pci_resource_len(pdev, DRAM_BAR_ID); 3131 hdev->dram_pci_bar_start = pci_resource_start(pdev, DRAM_BAR_ID); 3132 3133 /* 3134 * Only in pldm driver config iATU 3135 */ 3136 if (hdev->pldm) 3137 hdev->asic_prop.iatu_done_by_fw = false; 3138 else 3139 hdev->asic_prop.iatu_done_by_fw = true; 3140 3141 rc = hl_pci_init(hdev); 3142 if (rc) 3143 goto free_queue_props; 3144 3145 /* Before continuing in the initialization, we need to read the preboot 3146 * version to determine whether we run with a security-enabled firmware 3147 */ 3148 rc = hl_fw_read_preboot_status(hdev); 3149 if (rc) { 3150 if (hdev->reset_on_preboot_fail) 3151 /* we are already on failure flow, so don't check if hw_fini fails. */ 3152 hdev->asic_funcs->hw_fini(hdev, true, false); 3153 goto pci_fini; 3154 } 3155 3156 if (gaudi2_get_hw_state(hdev) == HL_DEVICE_HW_STATE_DIRTY) { 3157 dev_dbg(hdev->dev, "H/W state is dirty, must reset before initializing\n"); 3158 rc = hdev->asic_funcs->hw_fini(hdev, true, false); 3159 if (rc) { 3160 dev_err(hdev->dev, "failed to reset HW in dirty state (%d)\n", rc); 3161 goto pci_fini; 3162 } 3163 } 3164 3165 return 0; 3166 3167 pci_fini: 3168 hl_pci_fini(hdev); 3169 free_queue_props: 3170 kfree(hdev->asic_prop.hw_queues_props); 3171 return rc; 3172 } 3173 3174 static int gaudi2_early_fini(struct hl_device *hdev) 3175 { 3176 kfree(hdev->asic_prop.hw_queues_props); 3177 hl_pci_fini(hdev); 3178 3179 return 0; 3180 } 3181 3182 static bool gaudi2_is_arc_nic_owned(u64 arc_id) 3183 { 3184 switch (arc_id) { 3185 case CPU_ID_NIC_QMAN_ARC0...CPU_ID_NIC_QMAN_ARC23: 3186 return true; 3187 default: 3188 return false; 3189 } 3190 } 3191 3192 static bool gaudi2_is_arc_tpc_owned(u64 arc_id) 3193 { 3194 switch (arc_id) { 3195 case CPU_ID_TPC_QMAN_ARC0...CPU_ID_TPC_QMAN_ARC24: 3196 return true; 3197 default: 3198 return false; 3199 } 3200 } 3201 3202 static void gaudi2_init_arcs(struct hl_device *hdev) 3203 { 3204 struct cpu_dyn_regs *dyn_regs = &hdev->fw_loader.dynamic_loader.comm_desc.cpu_dyn_regs; 3205 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3206 u64 arc_id; 3207 u32 i; 3208 3209 for (i = CPU_ID_SCHED_ARC0 ; i <= CPU_ID_SCHED_ARC3 ; i++) { 3210 if (gaudi2_is_arc_enabled(hdev, i)) 3211 continue; 3212 3213 gaudi2_set_arc_id_cap(hdev, i); 3214 } 3215 3216 for (i = GAUDI2_QUEUE_ID_PDMA_0_0 ; i < GAUDI2_QUEUE_ID_CPU_PQ ; i += 4) { 3217 if (!gaudi2_is_queue_enabled(hdev, i)) 3218 continue; 3219 3220 arc_id = gaudi2_queue_id_to_arc_id[i]; 3221 if (gaudi2_is_arc_enabled(hdev, arc_id)) 3222 continue; 3223 3224 if (gaudi2_is_arc_nic_owned(arc_id) && 3225 !(hdev->nic_ports_mask & BIT_ULL(arc_id - CPU_ID_NIC_QMAN_ARC0))) 3226 continue; 3227 3228 if (gaudi2_is_arc_tpc_owned(arc_id) && !(gaudi2->tpc_hw_cap_initialized & 3229 BIT_ULL(arc_id - CPU_ID_TPC_QMAN_ARC0))) 3230 continue; 3231 3232 gaudi2_set_arc_id_cap(hdev, arc_id); 3233 } 3234 3235 /* Fetch ARC scratchpad address */ 3236 hdev->asic_prop.engine_core_interrupt_reg_addr = 3237 CFG_BASE + le32_to_cpu(dyn_regs->eng_arc_irq_ctrl); 3238 } 3239 3240 static int gaudi2_scrub_arc_dccm(struct hl_device *hdev, u32 cpu_id) 3241 { 3242 u32 reg_base, reg_val; 3243 int rc; 3244 3245 switch (cpu_id) { 3246 case CPU_ID_SCHED_ARC0 ... 
CPU_ID_SCHED_ARC3: 3247 /* Each ARC scheduler has 2 consecutive DCCM blocks */ 3248 rc = gaudi2_send_job_to_kdma(hdev, 0, CFG_BASE + gaudi2_arc_dccm_bases[cpu_id], 3249 ARC_DCCM_BLOCK_SIZE * 2, true); 3250 if (rc) 3251 return rc; 3252 break; 3253 case CPU_ID_SCHED_ARC4: 3254 case CPU_ID_SCHED_ARC5: 3255 case CPU_ID_MME_QMAN_ARC0: 3256 case CPU_ID_MME_QMAN_ARC1: 3257 reg_base = gaudi2_arc_blocks_bases[cpu_id]; 3258 3259 /* Scrub lower DCCM block */ 3260 rc = gaudi2_send_job_to_kdma(hdev, 0, CFG_BASE + gaudi2_arc_dccm_bases[cpu_id], 3261 ARC_DCCM_BLOCK_SIZE, true); 3262 if (rc) 3263 return rc; 3264 3265 /* Switch to upper DCCM block */ 3266 reg_val = FIELD_PREP(ARC_FARM_ARC0_AUX_MME_ARC_UPPER_DCCM_EN_VAL_MASK, 1); 3267 WREG32(reg_base + ARC_DCCM_UPPER_EN_OFFSET, reg_val); 3268 3269 /* Scrub upper DCCM block */ 3270 rc = gaudi2_send_job_to_kdma(hdev, 0, CFG_BASE + gaudi2_arc_dccm_bases[cpu_id], 3271 ARC_DCCM_BLOCK_SIZE, true); 3272 if (rc) 3273 return rc; 3274 3275 /* Switch to lower DCCM block */ 3276 reg_val = FIELD_PREP(ARC_FARM_ARC0_AUX_MME_ARC_UPPER_DCCM_EN_VAL_MASK, 0); 3277 WREG32(reg_base + ARC_DCCM_UPPER_EN_OFFSET, reg_val); 3278 break; 3279 default: 3280 rc = gaudi2_send_job_to_kdma(hdev, 0, CFG_BASE + gaudi2_arc_dccm_bases[cpu_id], 3281 ARC_DCCM_BLOCK_SIZE, true); 3282 if (rc) 3283 return rc; 3284 } 3285 3286 return 0; 3287 } 3288 3289 static int gaudi2_scrub_arcs_dccm(struct hl_device *hdev) 3290 { 3291 u16 arc_id; 3292 int rc; 3293 3294 for (arc_id = CPU_ID_SCHED_ARC0 ; arc_id < CPU_ID_MAX ; arc_id++) { 3295 if (!gaudi2_is_arc_enabled(hdev, arc_id)) 3296 continue; 3297 3298 rc = gaudi2_scrub_arc_dccm(hdev, arc_id); 3299 if (rc) 3300 return rc; 3301 } 3302 3303 return 0; 3304 } 3305 3306 static int gaudi2_late_init(struct hl_device *hdev) 3307 { 3308 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3309 int rc; 3310 3311 hdev->asic_prop.supports_advanced_cpucp_rc = true; 3312 3313 rc = hl_fw_send_pci_access_msg(hdev, CPUCP_PACKET_ENABLE_PCI_ACCESS, 3314 gaudi2->virt_msix_db_dma_addr); 3315 if (rc) { 3316 dev_err(hdev->dev, "Failed to enable PCI access from CPU\n"); 3317 return rc; 3318 } 3319 3320 rc = gaudi2_fetch_psoc_frequency(hdev); 3321 if (rc) { 3322 dev_err(hdev->dev, "Failed to fetch psoc frequency\n"); 3323 goto disable_pci_access; 3324 } 3325 3326 rc = gaudi2_mmu_clear_pgt_range(hdev); 3327 if (rc) { 3328 dev_err(hdev->dev, "Failed to clear MMU page tables range\n"); 3329 goto disable_pci_access; 3330 } 3331 3332 gaudi2_init_arcs(hdev); 3333 3334 rc = gaudi2_scrub_arcs_dccm(hdev); 3335 if (rc) { 3336 dev_err(hdev->dev, "Failed to scrub arcs DCCM\n"); 3337 goto disable_pci_access; 3338 } 3339 3340 gaudi2_init_security(hdev); 3341 3342 return 0; 3343 3344 disable_pci_access: 3345 hl_fw_send_pci_access_msg(hdev, CPUCP_PACKET_DISABLE_PCI_ACCESS, 0x0); 3346 3347 return rc; 3348 } 3349 3350 static void gaudi2_late_fini(struct hl_device *hdev) 3351 { 3352 hl_hwmon_release_resources(hdev); 3353 } 3354 3355 static void gaudi2_user_mapped_dec_init(struct gaudi2_device *gaudi2, u32 start_idx) 3356 { 3357 struct user_mapped_block *blocks = gaudi2->mapped_blocks; 3358 3359 HL_USR_MAPPED_BLK_INIT(&blocks[start_idx++], mmDCORE0_DEC0_CMD_BASE, HL_BLOCK_SIZE); 3360 HL_USR_MAPPED_BLK_INIT(&blocks[start_idx++], mmDCORE0_DEC1_CMD_BASE, HL_BLOCK_SIZE); 3361 HL_USR_MAPPED_BLK_INIT(&blocks[start_idx++], mmDCORE1_DEC0_CMD_BASE, HL_BLOCK_SIZE); 3362 HL_USR_MAPPED_BLK_INIT(&blocks[start_idx++], mmDCORE1_DEC1_CMD_BASE, HL_BLOCK_SIZE); 3363 HL_USR_MAPPED_BLK_INIT(&blocks[start_idx++], 
mmDCORE2_DEC0_CMD_BASE, HL_BLOCK_SIZE); 3364 HL_USR_MAPPED_BLK_INIT(&blocks[start_idx++], mmDCORE2_DEC1_CMD_BASE, HL_BLOCK_SIZE); 3365 HL_USR_MAPPED_BLK_INIT(&blocks[start_idx++], mmDCORE3_DEC0_CMD_BASE, HL_BLOCK_SIZE); 3366 HL_USR_MAPPED_BLK_INIT(&blocks[start_idx++], mmDCORE3_DEC1_CMD_BASE, HL_BLOCK_SIZE); 3367 HL_USR_MAPPED_BLK_INIT(&blocks[start_idx++], mmPCIE_DEC0_CMD_BASE, HL_BLOCK_SIZE); 3368 HL_USR_MAPPED_BLK_INIT(&blocks[start_idx], mmPCIE_DEC1_CMD_BASE, HL_BLOCK_SIZE); 3369 } 3370 3371 static void gaudi2_user_mapped_blocks_init(struct hl_device *hdev) 3372 { 3373 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3374 struct user_mapped_block *blocks = gaudi2->mapped_blocks; 3375 u32 block_size, umr_start_idx, num_umr_blocks; 3376 int i; 3377 3378 for (i = 0 ; i < NUM_ARC_CPUS ; i++) { 3379 if (i >= CPU_ID_SCHED_ARC0 && i <= CPU_ID_SCHED_ARC3) 3380 block_size = ARC_DCCM_BLOCK_SIZE * 2; 3381 else 3382 block_size = ARC_DCCM_BLOCK_SIZE; 3383 3384 blocks[i].address = gaudi2_arc_dccm_bases[i]; 3385 blocks[i].size = block_size; 3386 } 3387 3388 blocks[NUM_ARC_CPUS].address = mmARC_FARM_ARC0_ACP_ENG_BASE; 3389 blocks[NUM_ARC_CPUS].size = HL_BLOCK_SIZE; 3390 3391 blocks[NUM_ARC_CPUS + 1].address = mmARC_FARM_ARC1_ACP_ENG_BASE; 3392 blocks[NUM_ARC_CPUS + 1].size = HL_BLOCK_SIZE; 3393 3394 blocks[NUM_ARC_CPUS + 2].address = mmARC_FARM_ARC2_ACP_ENG_BASE; 3395 blocks[NUM_ARC_CPUS + 2].size = HL_BLOCK_SIZE; 3396 3397 blocks[NUM_ARC_CPUS + 3].address = mmARC_FARM_ARC3_ACP_ENG_BASE; 3398 blocks[NUM_ARC_CPUS + 3].size = HL_BLOCK_SIZE; 3399 3400 blocks[NUM_ARC_CPUS + 4].address = mmDCORE0_MME_QM_ARC_ACP_ENG_BASE; 3401 blocks[NUM_ARC_CPUS + 4].size = HL_BLOCK_SIZE; 3402 3403 blocks[NUM_ARC_CPUS + 5].address = mmDCORE1_MME_QM_ARC_ACP_ENG_BASE; 3404 blocks[NUM_ARC_CPUS + 5].size = HL_BLOCK_SIZE; 3405 3406 blocks[NUM_ARC_CPUS + 6].address = mmDCORE2_MME_QM_ARC_ACP_ENG_BASE; 3407 blocks[NUM_ARC_CPUS + 6].size = HL_BLOCK_SIZE; 3408 3409 blocks[NUM_ARC_CPUS + 7].address = mmDCORE3_MME_QM_ARC_ACP_ENG_BASE; 3410 blocks[NUM_ARC_CPUS + 7].size = HL_BLOCK_SIZE; 3411 3412 umr_start_idx = NUM_ARC_CPUS + NUM_OF_USER_ACP_BLOCKS; 3413 num_umr_blocks = NIC_NUMBER_OF_ENGINES * NUM_OF_USER_NIC_UMR_BLOCKS; 3414 for (i = 0 ; i < num_umr_blocks ; i++) { 3415 u8 nic_id, umr_block_id; 3416 3417 nic_id = i / NUM_OF_USER_NIC_UMR_BLOCKS; 3418 umr_block_id = i % NUM_OF_USER_NIC_UMR_BLOCKS; 3419 3420 blocks[umr_start_idx + i].address = 3421 mmNIC0_UMR0_0_UNSECURE_DOORBELL0_BASE + 3422 (nic_id / NIC_NUMBER_OF_QM_PER_MACRO) * NIC_OFFSET + 3423 (nic_id % NIC_NUMBER_OF_QM_PER_MACRO) * NIC_QM_OFFSET + 3424 umr_block_id * NIC_UMR_OFFSET; 3425 blocks[umr_start_idx + i].size = HL_BLOCK_SIZE; 3426 } 3427 3428 /* Expose decoder HW configuration block to user */ 3429 gaudi2_user_mapped_dec_init(gaudi2, USR_MAPPED_BLK_DEC_START_IDX); 3430 3431 for (i = 1; i < NUM_OF_DCORES; ++i) { 3432 blocks[USR_MAPPED_BLK_SM_START_IDX + 2 * (i - 1)].size = SM_OBJS_BLOCK_SIZE; 3433 blocks[USR_MAPPED_BLK_SM_START_IDX + 2 * (i - 1) + 1].size = HL_BLOCK_SIZE; 3434 3435 blocks[USR_MAPPED_BLK_SM_START_IDX + 2 * (i - 1)].address = 3436 mmDCORE0_SYNC_MNGR_OBJS_BASE + i * DCORE_OFFSET; 3437 3438 blocks[USR_MAPPED_BLK_SM_START_IDX + 2 * (i - 1) + 1].address = 3439 mmDCORE0_SYNC_MNGR_GLBL_BASE + i * DCORE_OFFSET; 3440 } 3441 } 3442 3443 static int gaudi2_alloc_cpu_accessible_dma_mem(struct hl_device *hdev) 3444 { 3445 dma_addr_t dma_addr_arr[GAUDI2_ALLOC_CPU_MEM_RETRY_CNT] = {}, end_addr; 3446 void *virt_addr_arr[GAUDI2_ALLOC_CPU_MEM_RETRY_CNT] = {}; 3447 int i, 
j, rc = 0;

	/* The device ARC works with 32-bit addresses, and because there is a single HW register
	 * that holds the extension bits (49..28), these bits must be identical throughout the
	 * allocated range.
	 */

	for (i = 0 ; i < GAUDI2_ALLOC_CPU_MEM_RETRY_CNT ; i++) {
		virt_addr_arr[i] = hl_asic_dma_alloc_coherent(hdev, HL_CPU_ACCESSIBLE_MEM_SIZE,
								&dma_addr_arr[i], GFP_KERNEL | __GFP_ZERO);
		if (!virt_addr_arr[i]) {
			rc = -ENOMEM;
			goto free_dma_mem_arr;
		}

		end_addr = dma_addr_arr[i] + HL_CPU_ACCESSIBLE_MEM_SIZE - 1;
		if (GAUDI2_ARC_PCI_MSB_ADDR(dma_addr_arr[i]) == GAUDI2_ARC_PCI_MSB_ADDR(end_addr))
			break;
	}

	if (i == GAUDI2_ALLOC_CPU_MEM_RETRY_CNT) {
		dev_err(hdev->dev,
			"MSB of ARC accessible DMA memory are not identical in all range\n");
		rc = -EFAULT;
		goto free_dma_mem_arr;
	}

	hdev->cpu_accessible_dma_mem = virt_addr_arr[i];
	hdev->cpu_accessible_dma_address = dma_addr_arr[i];

free_dma_mem_arr:
	for (j = 0 ; j < i ; j++)
		hl_asic_dma_free_coherent(hdev, HL_CPU_ACCESSIBLE_MEM_SIZE, virt_addr_arr[j],
						dma_addr_arr[j]);

	return rc;
}

static void gaudi2_set_pci_memory_regions(struct hl_device *hdev)
{
	struct asic_fixed_properties *prop = &hdev->asic_prop;
	struct pci_mem_region *region;

	/* CFG */
	region = &hdev->pci_mem_region[PCI_REGION_CFG];
	region->region_base = CFG_BASE;
	region->region_size = CFG_SIZE;
	region->offset_in_bar = CFG_BASE - STM_FLASH_BASE_ADDR;
	region->bar_size = CFG_BAR_SIZE;
	region->bar_id = SRAM_CFG_BAR_ID;
	region->used = 1;

	/* SRAM */
	region = &hdev->pci_mem_region[PCI_REGION_SRAM];
	region->region_base = SRAM_BASE_ADDR;
	region->region_size = SRAM_SIZE;
	region->offset_in_bar = CFG_REGION_SIZE + BAR0_RSRVD_SIZE;
	region->bar_size = CFG_BAR_SIZE;
	region->bar_id = SRAM_CFG_BAR_ID;
	region->used = 1;

	/* DRAM */
	region = &hdev->pci_mem_region[PCI_REGION_DRAM];
	region->region_base = DRAM_PHYS_BASE;
	region->region_size = hdev->asic_prop.dram_size;
	region->offset_in_bar = 0;
	region->bar_size = prop->dram_pci_bar_size;
	region->bar_id = DRAM_BAR_ID;
	region->used = 1;
}

static void gaudi2_user_interrupt_setup(struct hl_device *hdev)
{
	struct asic_fixed_properties *prop = &hdev->asic_prop;
	int i, j, k;

	/* Initialize TPC interrupt */
	HL_USR_INTR_STRUCT_INIT(hdev->tpc_interrupt, hdev, 0, HL_USR_INTERRUPT_TPC);

	/* Initialize unexpected error interrupt */
	HL_USR_INTR_STRUCT_INIT(hdev->unexpected_error_interrupt, hdev, 0,
					HL_USR_INTERRUPT_UNEXPECTED);

	/* Initialize common user CQ interrupt */
	HL_USR_INTR_STRUCT_INIT(hdev->common_user_cq_interrupt, hdev,
				HL_COMMON_USER_CQ_INTERRUPT_ID, HL_USR_INTERRUPT_CQ);

	/* Initialize common decoder interrupt */
	HL_USR_INTR_STRUCT_INIT(hdev->common_decoder_interrupt, hdev,
				HL_COMMON_DEC_INTERRUPT_ID, HL_USR_INTERRUPT_DECODER);

	/* User interrupts structure holds both decoder and user interrupts from various engines.
	 * We first initialize the decoder interrupts and then we add the user interrupts.
	 * The only limitation is that the last decoder interrupt id must be smaller
	 * than GAUDI2_IRQ_NUM_USER_FIRST. This is checked at compilation time.
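	 * Note (descriptive, per the two loops below): the decoder (normal) interrupts fill the
	 * first entries of hdev->user_interrupt[] and the user CQ interrupts are placed
	 * immediately after them.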
3542 */ 3543 3544 /* Initialize decoder interrupts, expose only normal interrupts, 3545 * error interrupts to be handled by driver 3546 */ 3547 for (i = GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM, j = 0 ; i <= GAUDI2_IRQ_NUM_SHARED_DEC1_NRM; 3548 i += 2, j++) 3549 HL_USR_INTR_STRUCT_INIT(hdev->user_interrupt[j], hdev, i, 3550 HL_USR_INTERRUPT_DECODER); 3551 3552 for (i = GAUDI2_IRQ_NUM_USER_FIRST, k = 0 ; k < prop->user_interrupt_count; i++, j++, k++) 3553 HL_USR_INTR_STRUCT_INIT(hdev->user_interrupt[j], hdev, i, HL_USR_INTERRUPT_CQ); 3554 } 3555 3556 static inline int gaudi2_get_non_zero_random_int(void) 3557 { 3558 int rand = get_random_u32(); 3559 3560 return rand ? rand : 1; 3561 } 3562 3563 static void gaudi2_special_blocks_free(struct hl_device *hdev) 3564 { 3565 struct asic_fixed_properties *prop = &hdev->asic_prop; 3566 struct hl_skip_blocks_cfg *skip_special_blocks_cfg = 3567 &prop->skip_special_blocks_cfg; 3568 3569 kfree(prop->special_blocks); 3570 kfree(skip_special_blocks_cfg->block_types); 3571 kfree(skip_special_blocks_cfg->block_ranges); 3572 } 3573 3574 static void gaudi2_special_blocks_iterator_free(struct hl_device *hdev) 3575 { 3576 gaudi2_special_blocks_free(hdev); 3577 } 3578 3579 static bool gaudi2_special_block_skip(struct hl_device *hdev, 3580 struct hl_special_blocks_cfg *special_blocks_cfg, 3581 u32 blk_idx, u32 major, u32 minor, u32 sub_minor) 3582 { 3583 return false; 3584 } 3585 3586 static int gaudi2_special_blocks_config(struct hl_device *hdev) 3587 { 3588 struct asic_fixed_properties *prop = &hdev->asic_prop; 3589 int i, rc; 3590 3591 /* Configure Special blocks */ 3592 prop->glbl_err_max_cause_num = GAUDI2_GLBL_ERR_MAX_CAUSE_NUM; 3593 prop->num_of_special_blocks = ARRAY_SIZE(gaudi2_special_blocks); 3594 prop->special_blocks = kmalloc_array(prop->num_of_special_blocks, 3595 sizeof(*prop->special_blocks), GFP_KERNEL); 3596 if (!prop->special_blocks) 3597 return -ENOMEM; 3598 3599 for (i = 0 ; i < prop->num_of_special_blocks ; i++) 3600 memcpy(&prop->special_blocks[i], &gaudi2_special_blocks[i], 3601 sizeof(*prop->special_blocks)); 3602 3603 /* Configure when to skip Special blocks */ 3604 memset(&prop->skip_special_blocks_cfg, 0, sizeof(prop->skip_special_blocks_cfg)); 3605 prop->skip_special_blocks_cfg.skip_block_hook = gaudi2_special_block_skip; 3606 3607 if (ARRAY_SIZE(gaudi2_iterator_skip_block_types)) { 3608 prop->skip_special_blocks_cfg.block_types = 3609 kmalloc_array(ARRAY_SIZE(gaudi2_iterator_skip_block_types), 3610 sizeof(gaudi2_iterator_skip_block_types[0]), GFP_KERNEL); 3611 if (!prop->skip_special_blocks_cfg.block_types) { 3612 rc = -ENOMEM; 3613 goto free_special_blocks; 3614 } 3615 3616 memcpy(prop->skip_special_blocks_cfg.block_types, gaudi2_iterator_skip_block_types, 3617 sizeof(gaudi2_iterator_skip_block_types)); 3618 3619 prop->skip_special_blocks_cfg.block_types_len = 3620 ARRAY_SIZE(gaudi2_iterator_skip_block_types); 3621 } 3622 3623 if (ARRAY_SIZE(gaudi2_iterator_skip_block_ranges)) { 3624 prop->skip_special_blocks_cfg.block_ranges = 3625 kmalloc_array(ARRAY_SIZE(gaudi2_iterator_skip_block_ranges), 3626 sizeof(gaudi2_iterator_skip_block_ranges[0]), GFP_KERNEL); 3627 if (!prop->skip_special_blocks_cfg.block_ranges) { 3628 rc = -ENOMEM; 3629 goto free_skip_special_blocks_types; 3630 } 3631 3632 for (i = 0 ; i < ARRAY_SIZE(gaudi2_iterator_skip_block_ranges) ; i++) 3633 memcpy(&prop->skip_special_blocks_cfg.block_ranges[i], 3634 &gaudi2_iterator_skip_block_ranges[i], 3635 sizeof(struct range)); 3636 3637 prop->skip_special_blocks_cfg.block_ranges_len = 
3638 ARRAY_SIZE(gaudi2_iterator_skip_block_ranges); 3639 } 3640 3641 return 0; 3642 3643 free_skip_special_blocks_types: 3644 kfree(prop->skip_special_blocks_cfg.block_types); 3645 free_special_blocks: 3646 kfree(prop->special_blocks); 3647 3648 return rc; 3649 } 3650 3651 static int gaudi2_special_blocks_iterator_config(struct hl_device *hdev) 3652 { 3653 return gaudi2_special_blocks_config(hdev); 3654 } 3655 3656 static void gaudi2_test_queues_msgs_free(struct hl_device *hdev) 3657 { 3658 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3659 struct gaudi2_queues_test_info *msg_info = gaudi2->queues_test_info; 3660 int i; 3661 3662 for (i = 0 ; i < GAUDI2_NUM_TESTED_QS ; i++) { 3663 /* bail-out if this is an allocation failure point */ 3664 if (!msg_info[i].kern_addr) 3665 break; 3666 3667 hl_asic_dma_pool_free(hdev, msg_info[i].kern_addr, msg_info[i].dma_addr); 3668 msg_info[i].kern_addr = NULL; 3669 } 3670 } 3671 3672 static int gaudi2_test_queues_msgs_alloc(struct hl_device *hdev) 3673 { 3674 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3675 struct gaudi2_queues_test_info *msg_info = gaudi2->queues_test_info; 3676 int i, rc; 3677 3678 /* allocate a message-short buf for each Q we intend to test */ 3679 for (i = 0 ; i < GAUDI2_NUM_TESTED_QS ; i++) { 3680 msg_info[i].kern_addr = 3681 (void *)hl_asic_dma_pool_zalloc(hdev, sizeof(struct packet_msg_short), 3682 GFP_KERNEL, &msg_info[i].dma_addr); 3683 if (!msg_info[i].kern_addr) { 3684 dev_err(hdev->dev, 3685 "Failed to allocate dma memory for H/W queue %d testing\n", i); 3686 rc = -ENOMEM; 3687 goto err_exit; 3688 } 3689 } 3690 3691 return 0; 3692 3693 err_exit: 3694 gaudi2_test_queues_msgs_free(hdev); 3695 return rc; 3696 } 3697 3698 static int gaudi2_sw_init(struct hl_device *hdev) 3699 { 3700 struct asic_fixed_properties *prop = &hdev->asic_prop; 3701 struct gaudi2_device *gaudi2; 3702 int i, rc; 3703 3704 /* Allocate device structure */ 3705 gaudi2 = kzalloc(sizeof(*gaudi2), GFP_KERNEL); 3706 if (!gaudi2) 3707 return -ENOMEM; 3708 3709 for (i = 0 ; i < ARRAY_SIZE(gaudi2_irq_map_table) ; i++) { 3710 if (gaudi2_irq_map_table[i].msg || !gaudi2_irq_map_table[i].valid) 3711 continue; 3712 3713 if (gaudi2->num_of_valid_hw_events == GAUDI2_EVENT_SIZE) { 3714 dev_err(hdev->dev, "H/W events array exceeds the limit of %u events\n", 3715 GAUDI2_EVENT_SIZE); 3716 rc = -EINVAL; 3717 goto free_gaudi2_device; 3718 } 3719 3720 gaudi2->hw_events[gaudi2->num_of_valid_hw_events++] = gaudi2_irq_map_table[i].fc_id; 3721 } 3722 3723 for (i = 0 ; i < MME_NUM_OF_LFSR_SEEDS ; i++) 3724 gaudi2->lfsr_rand_seeds[i] = gaudi2_get_non_zero_random_int(); 3725 3726 gaudi2->cpucp_info_get = gaudi2_cpucp_info_get; 3727 3728 hdev->asic_specific = gaudi2; 3729 3730 /* Create DMA pool for small allocations. 
3731 * Use DEVICE_CACHE_LINE_SIZE for alignment since the NIC memory-mapped 3732 * PI/CI registers allocated from this pool have this restriction 3733 */ 3734 hdev->dma_pool = dma_pool_create(dev_name(hdev->dev), &hdev->pdev->dev, 3735 GAUDI2_DMA_POOL_BLK_SIZE, DEVICE_CACHE_LINE_SIZE, 0); 3736 if (!hdev->dma_pool) { 3737 dev_err(hdev->dev, "failed to create DMA pool\n"); 3738 rc = -ENOMEM; 3739 goto free_gaudi2_device; 3740 } 3741 3742 rc = gaudi2_alloc_cpu_accessible_dma_mem(hdev); 3743 if (rc) 3744 goto free_dma_pool; 3745 3746 hdev->cpu_accessible_dma_pool = gen_pool_create(ilog2(32), -1); 3747 if (!hdev->cpu_accessible_dma_pool) { 3748 dev_err(hdev->dev, "Failed to create CPU accessible DMA pool\n"); 3749 rc = -ENOMEM; 3750 goto free_cpu_dma_mem; 3751 } 3752 3753 rc = gen_pool_add(hdev->cpu_accessible_dma_pool, (uintptr_t) hdev->cpu_accessible_dma_mem, 3754 HL_CPU_ACCESSIBLE_MEM_SIZE, -1); 3755 if (rc) { 3756 dev_err(hdev->dev, "Failed to add memory to CPU accessible DMA pool\n"); 3757 rc = -EFAULT; 3758 goto free_cpu_accessible_dma_pool; 3759 } 3760 3761 gaudi2->virt_msix_db_cpu_addr = hl_cpu_accessible_dma_pool_alloc(hdev, prop->pmmu.page_size, 3762 &gaudi2->virt_msix_db_dma_addr); 3763 if (!gaudi2->virt_msix_db_cpu_addr) { 3764 dev_err(hdev->dev, "Failed to allocate DMA memory for virtual MSI-X doorbell\n"); 3765 rc = -ENOMEM; 3766 goto free_cpu_accessible_dma_pool; 3767 } 3768 3769 spin_lock_init(&gaudi2->hw_queues_lock); 3770 3771 gaudi2->scratchpad_bus_address = prop->mmu_pgt_addr + HMMU_PAGE_TABLES_SIZE + EDMA_PQS_SIZE; 3772 3773 gaudi2_user_mapped_blocks_init(hdev); 3774 3775 /* Initialize user interrupts */ 3776 gaudi2_user_interrupt_setup(hdev); 3777 3778 hdev->supports_coresight = true; 3779 hdev->supports_sync_stream = true; 3780 hdev->supports_cb_mapping = true; 3781 hdev->supports_wait_for_multi_cs = false; 3782 3783 prop->supports_compute_reset = true; 3784 3785 /* Event queue sanity check added in FW version 1.11 */ 3786 if (hl_is_fw_sw_ver_below(hdev, 1, 11)) 3787 hdev->event_queue.check_eqe_index = false; 3788 else 3789 hdev->event_queue.check_eqe_index = true; 3790 3791 hdev->asic_funcs->set_pci_memory_regions(hdev); 3792 3793 rc = gaudi2_special_blocks_iterator_config(hdev); 3794 if (rc) 3795 goto free_virt_msix_db_mem; 3796 3797 rc = gaudi2_test_queues_msgs_alloc(hdev); 3798 if (rc) 3799 goto special_blocks_free; 3800 3801 return 0; 3802 3803 special_blocks_free: 3804 gaudi2_special_blocks_iterator_free(hdev); 3805 free_virt_msix_db_mem: 3806 hl_cpu_accessible_dma_pool_free(hdev, prop->pmmu.page_size, gaudi2->virt_msix_db_cpu_addr); 3807 free_cpu_accessible_dma_pool: 3808 gen_pool_destroy(hdev->cpu_accessible_dma_pool); 3809 free_cpu_dma_mem: 3810 hl_asic_dma_free_coherent(hdev, HL_CPU_ACCESSIBLE_MEM_SIZE, hdev->cpu_accessible_dma_mem, 3811 hdev->cpu_accessible_dma_address); 3812 free_dma_pool: 3813 dma_pool_destroy(hdev->dma_pool); 3814 free_gaudi2_device: 3815 kfree(gaudi2); 3816 return rc; 3817 } 3818 3819 static int gaudi2_sw_fini(struct hl_device *hdev) 3820 { 3821 struct asic_fixed_properties *prop = &hdev->asic_prop; 3822 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3823 3824 gaudi2_test_queues_msgs_free(hdev); 3825 3826 gaudi2_special_blocks_iterator_free(hdev); 3827 3828 hl_cpu_accessible_dma_pool_free(hdev, prop->pmmu.page_size, gaudi2->virt_msix_db_cpu_addr); 3829 3830 gen_pool_destroy(hdev->cpu_accessible_dma_pool); 3831 3832 hl_asic_dma_free_coherent(hdev, HL_CPU_ACCESSIBLE_MEM_SIZE, hdev->cpu_accessible_dma_mem, 3833 
hdev->cpu_accessible_dma_address);

	dma_pool_destroy(hdev->dma_pool);

	kfree(gaudi2);

	return 0;
}

static void gaudi2_stop_qman_common(struct hl_device *hdev, u32 reg_base)
{
	WREG32(reg_base + QM_GLBL_CFG1_OFFSET, QM_GLBL_CFG1_PQF_STOP |
						QM_GLBL_CFG1_CQF_STOP |
						QM_GLBL_CFG1_CP_STOP);

	/* stop also the ARC */
	WREG32(reg_base + QM_GLBL_CFG2_OFFSET, QM_GLBL_CFG2_ARC_CQF_STOP);
}

static void gaudi2_flush_qman_common(struct hl_device *hdev, u32 reg_base)
{
	WREG32(reg_base + QM_GLBL_CFG1_OFFSET, QM_GLBL_CFG1_PQF_FLUSH |
						QM_GLBL_CFG1_CQF_FLUSH |
						QM_GLBL_CFG1_CP_FLUSH);
}

static void gaudi2_flush_qman_arc_common(struct hl_device *hdev, u32 reg_base)
{
	WREG32(reg_base + QM_GLBL_CFG2_OFFSET, QM_GLBL_CFG2_ARC_CQF_FLUSH);
}

/**
 * gaudi2_clear_qm_fence_counters_common - clear QM's fence counters
 *
 * @hdev: pointer to the habanalabs device structure
 * @queue_id: queue whose fence counters should be cleared
 * @skip_fence: if true, set the maximum fence value in all fence counters to avoid
 *              getting stuck on any fence value. Otherwise set all fence
 *              counters to 0 (standard clear of fence counters)
 */
static void gaudi2_clear_qm_fence_counters_common(struct hl_device *hdev, u32 queue_id,
						bool skip_fence)
{
	u32 size, reg_base;
	u32 addr, val;

	reg_base = gaudi2_qm_blocks_bases[queue_id];

	addr = reg_base + QM_CP_FENCE0_CNT_0_OFFSET;
	size = mmPDMA0_QM_CP_BARRIER_CFG - mmPDMA0_QM_CP_FENCE0_CNT_0;

	/*
	 * In case we want to make sure that a QM which is stuck on a fence will
	 * be released, we should set the fence counter to a value higher than
	 * the value the QM is waiting for. To comply with a fence counter of
	 * any value, we set the maximum fence value in all counters.
	 */
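	/* U32_MAX cannot be smaller than any fence value a CP may be waiting on, while 0
	 * performs the standard clear described above.
	 */
	val = skip_fence ? 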
U32_MAX : 0; 3891 gaudi2_memset_device_lbw(hdev, addr, size, val); 3892 } 3893 3894 static void gaudi2_qman_manual_flush_common(struct hl_device *hdev, u32 queue_id) 3895 { 3896 u32 reg_base = gaudi2_qm_blocks_bases[queue_id]; 3897 3898 gaudi2_clear_qm_fence_counters_common(hdev, queue_id, true); 3899 gaudi2_flush_qman_common(hdev, reg_base); 3900 gaudi2_flush_qman_arc_common(hdev, reg_base); 3901 } 3902 3903 static void gaudi2_stop_dma_qmans(struct hl_device *hdev) 3904 { 3905 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3906 int dcore, inst; 3907 3908 if (!(gaudi2->hw_cap_initialized & HW_CAP_PDMA_MASK)) 3909 goto stop_edma_qmans; 3910 3911 /* Stop CPs of PDMA QMANs */ 3912 gaudi2_stop_qman_common(hdev, mmPDMA0_QM_BASE); 3913 gaudi2_stop_qman_common(hdev, mmPDMA1_QM_BASE); 3914 3915 stop_edma_qmans: 3916 if (!(gaudi2->hw_cap_initialized & HW_CAP_EDMA_MASK)) 3917 return; 3918 3919 for (dcore = 0 ; dcore < NUM_OF_DCORES ; dcore++) { 3920 for (inst = 0 ; inst < NUM_OF_EDMA_PER_DCORE ; inst++) { 3921 u8 seq = dcore * NUM_OF_EDMA_PER_DCORE + inst; 3922 u32 qm_base; 3923 3924 if (!(gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_EDMA_SHIFT + seq))) 3925 continue; 3926 3927 qm_base = mmDCORE0_EDMA0_QM_BASE + dcore * DCORE_OFFSET + 3928 inst * DCORE_EDMA_OFFSET; 3929 3930 /* Stop CPs of EDMA QMANs */ 3931 gaudi2_stop_qman_common(hdev, qm_base); 3932 } 3933 } 3934 } 3935 3936 static void gaudi2_stop_mme_qmans(struct hl_device *hdev) 3937 { 3938 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3939 u32 offset, i; 3940 3941 offset = mmDCORE1_MME_QM_BASE - mmDCORE0_MME_QM_BASE; 3942 3943 for (i = 0 ; i < NUM_OF_DCORES ; i++) { 3944 if (!(gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_MME_SHIFT + i))) 3945 continue; 3946 3947 gaudi2_stop_qman_common(hdev, mmDCORE0_MME_QM_BASE + (i * offset)); 3948 } 3949 } 3950 3951 static void gaudi2_stop_tpc_qmans(struct hl_device *hdev) 3952 { 3953 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3954 u32 reg_base; 3955 int i; 3956 3957 if (!(gaudi2->tpc_hw_cap_initialized & HW_CAP_TPC_MASK)) 3958 return; 3959 3960 for (i = 0 ; i < TPC_ID_SIZE ; i++) { 3961 if (!(gaudi2->tpc_hw_cap_initialized & BIT_ULL(HW_CAP_TPC_SHIFT + i))) 3962 continue; 3963 3964 reg_base = gaudi2_qm_blocks_bases[gaudi2_tpc_id_to_queue_id[i]]; 3965 gaudi2_stop_qman_common(hdev, reg_base); 3966 } 3967 } 3968 3969 static void gaudi2_stop_rot_qmans(struct hl_device *hdev) 3970 { 3971 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3972 u32 reg_base; 3973 int i; 3974 3975 if (!(gaudi2->hw_cap_initialized & HW_CAP_ROT_MASK)) 3976 return; 3977 3978 for (i = 0 ; i < ROTATOR_ID_SIZE ; i++) { 3979 if (!(gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_ROT_SHIFT + i))) 3980 continue; 3981 3982 reg_base = gaudi2_qm_blocks_bases[gaudi2_rot_id_to_queue_id[i]]; 3983 gaudi2_stop_qman_common(hdev, reg_base); 3984 } 3985 } 3986 3987 static void gaudi2_stop_nic_qmans(struct hl_device *hdev) 3988 { 3989 struct gaudi2_device *gaudi2 = hdev->asic_specific; 3990 u32 reg_base, queue_id; 3991 int i; 3992 3993 if (!(gaudi2->nic_hw_cap_initialized & HW_CAP_NIC_MASK)) 3994 return; 3995 3996 queue_id = GAUDI2_QUEUE_ID_NIC_0_0; 3997 3998 for (i = 0 ; i < NIC_NUMBER_OF_ENGINES ; i++, queue_id += NUM_OF_PQ_PER_QMAN) { 3999 if (!(hdev->nic_ports_mask & BIT(i))) 4000 continue; 4001 4002 reg_base = gaudi2_qm_blocks_bases[queue_id]; 4003 gaudi2_stop_qman_common(hdev, reg_base); 4004 } 4005 } 4006 4007 static void gaudi2_stall_dma_common(struct hl_device *hdev, u32 reg_base) 4008 { 4009 u32 reg_val; 4010 4011 reg_val = 
FIELD_PREP(PDMA0_CORE_CFG_1_HALT_MASK, 0x1); 4012 WREG32(reg_base + DMA_CORE_CFG_1_OFFSET, reg_val); 4013 } 4014 4015 static void gaudi2_dma_stall(struct hl_device *hdev) 4016 { 4017 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4018 int dcore, inst; 4019 4020 if (!(gaudi2->hw_cap_initialized & HW_CAP_PDMA_MASK)) 4021 goto stall_edma; 4022 4023 gaudi2_stall_dma_common(hdev, mmPDMA0_CORE_BASE); 4024 gaudi2_stall_dma_common(hdev, mmPDMA1_CORE_BASE); 4025 4026 stall_edma: 4027 if (!(gaudi2->hw_cap_initialized & HW_CAP_EDMA_MASK)) 4028 return; 4029 4030 for (dcore = 0 ; dcore < NUM_OF_DCORES ; dcore++) { 4031 for (inst = 0 ; inst < NUM_OF_EDMA_PER_DCORE ; inst++) { 4032 u8 seq = dcore * NUM_OF_EDMA_PER_DCORE + inst; 4033 u32 core_base; 4034 4035 if (!(gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_EDMA_SHIFT + seq))) 4036 continue; 4037 4038 core_base = mmDCORE0_EDMA0_CORE_BASE + dcore * DCORE_OFFSET + 4039 inst * DCORE_EDMA_OFFSET; 4040 4041 /* Stall CPs of EDMA QMANs */ 4042 gaudi2_stall_dma_common(hdev, core_base); 4043 } 4044 } 4045 } 4046 4047 static void gaudi2_mme_stall(struct hl_device *hdev) 4048 { 4049 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4050 u32 offset, i; 4051 4052 offset = mmDCORE1_MME_CTRL_LO_QM_STALL - mmDCORE0_MME_CTRL_LO_QM_STALL; 4053 4054 for (i = 0 ; i < NUM_OF_DCORES ; i++) 4055 if (gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_MME_SHIFT + i)) 4056 WREG32(mmDCORE0_MME_CTRL_LO_QM_STALL + (i * offset), 1); 4057 } 4058 4059 static void gaudi2_tpc_stall(struct hl_device *hdev) 4060 { 4061 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4062 u32 reg_base; 4063 int i; 4064 4065 if (!(gaudi2->tpc_hw_cap_initialized & HW_CAP_TPC_MASK)) 4066 return; 4067 4068 for (i = 0 ; i < TPC_ID_SIZE ; i++) { 4069 if (!(gaudi2->tpc_hw_cap_initialized & BIT_ULL(HW_CAP_TPC_SHIFT + i))) 4070 continue; 4071 4072 reg_base = gaudi2_tpc_cfg_blocks_bases[i]; 4073 WREG32(reg_base + TPC_CFG_STALL_OFFSET, 1); 4074 } 4075 } 4076 4077 static void gaudi2_rotator_stall(struct hl_device *hdev) 4078 { 4079 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4080 u32 reg_val; 4081 int i; 4082 4083 if (!(gaudi2->hw_cap_initialized & HW_CAP_ROT_MASK)) 4084 return; 4085 4086 reg_val = FIELD_PREP(ROT_MSS_HALT_WBC_MASK, 0x1) | 4087 FIELD_PREP(ROT_MSS_HALT_RSB_MASK, 0x1) | 4088 FIELD_PREP(ROT_MSS_HALT_MRSB_MASK, 0x1); 4089 4090 for (i = 0 ; i < ROTATOR_ID_SIZE ; i++) { 4091 if (!(gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_ROT_SHIFT + i))) 4092 continue; 4093 4094 WREG32(mmROT0_MSS_HALT + i * ROT_OFFSET, reg_val); 4095 } 4096 } 4097 4098 static void gaudi2_disable_qman_common(struct hl_device *hdev, u32 reg_base) 4099 { 4100 WREG32(reg_base + QM_GLBL_CFG0_OFFSET, 0); 4101 } 4102 4103 static void gaudi2_disable_dma_qmans(struct hl_device *hdev) 4104 { 4105 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4106 int dcore, inst; 4107 4108 if (!(gaudi2->hw_cap_initialized & HW_CAP_PDMA_MASK)) 4109 goto stop_edma_qmans; 4110 4111 gaudi2_disable_qman_common(hdev, mmPDMA0_QM_BASE); 4112 gaudi2_disable_qman_common(hdev, mmPDMA1_QM_BASE); 4113 4114 stop_edma_qmans: 4115 if (!(gaudi2->hw_cap_initialized & HW_CAP_EDMA_MASK)) 4116 return; 4117 4118 for (dcore = 0 ; dcore < NUM_OF_DCORES ; dcore++) { 4119 for (inst = 0 ; inst < NUM_OF_EDMA_PER_DCORE ; inst++) { 4120 u8 seq = dcore * NUM_OF_EDMA_PER_DCORE + inst; 4121 u32 qm_base; 4122 4123 if (!(gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_EDMA_SHIFT + seq))) 4124 continue; 4125 4126 qm_base = mmDCORE0_EDMA0_QM_BASE + dcore * DCORE_OFFSET + 4127 inst * 
DCORE_EDMA_OFFSET; 4128 4129 /* Disable CPs of EDMA QMANs */ 4130 gaudi2_disable_qman_common(hdev, qm_base); 4131 } 4132 } 4133 } 4134 4135 static void gaudi2_disable_mme_qmans(struct hl_device *hdev) 4136 { 4137 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4138 u32 offset, i; 4139 4140 offset = mmDCORE1_MME_QM_BASE - mmDCORE0_MME_QM_BASE; 4141 4142 for (i = 0 ; i < NUM_OF_DCORES ; i++) 4143 if (gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_MME_SHIFT + i)) 4144 gaudi2_disable_qman_common(hdev, mmDCORE0_MME_QM_BASE + (i * offset)); 4145 } 4146 4147 static void gaudi2_disable_tpc_qmans(struct hl_device *hdev) 4148 { 4149 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4150 u32 reg_base; 4151 int i; 4152 4153 if (!(gaudi2->tpc_hw_cap_initialized & HW_CAP_TPC_MASK)) 4154 return; 4155 4156 for (i = 0 ; i < TPC_ID_SIZE ; i++) { 4157 if (!(gaudi2->tpc_hw_cap_initialized & BIT_ULL(HW_CAP_TPC_SHIFT + i))) 4158 continue; 4159 4160 reg_base = gaudi2_qm_blocks_bases[gaudi2_tpc_id_to_queue_id[i]]; 4161 gaudi2_disable_qman_common(hdev, reg_base); 4162 } 4163 } 4164 4165 static void gaudi2_disable_rot_qmans(struct hl_device *hdev) 4166 { 4167 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4168 u32 reg_base; 4169 int i; 4170 4171 if (!(gaudi2->hw_cap_initialized & HW_CAP_ROT_MASK)) 4172 return; 4173 4174 for (i = 0 ; i < ROTATOR_ID_SIZE ; i++) { 4175 if (!(gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_ROT_SHIFT + i))) 4176 continue; 4177 4178 reg_base = gaudi2_qm_blocks_bases[gaudi2_rot_id_to_queue_id[i]]; 4179 gaudi2_disable_qman_common(hdev, reg_base); 4180 } 4181 } 4182 4183 static void gaudi2_disable_nic_qmans(struct hl_device *hdev) 4184 { 4185 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4186 u32 reg_base, queue_id; 4187 int i; 4188 4189 if (!(gaudi2->nic_hw_cap_initialized & HW_CAP_NIC_MASK)) 4190 return; 4191 4192 queue_id = GAUDI2_QUEUE_ID_NIC_0_0; 4193 4194 for (i = 0 ; i < NIC_NUMBER_OF_ENGINES ; i++, queue_id += NUM_OF_PQ_PER_QMAN) { 4195 if (!(hdev->nic_ports_mask & BIT(i))) 4196 continue; 4197 4198 reg_base = gaudi2_qm_blocks_bases[queue_id]; 4199 gaudi2_disable_qman_common(hdev, reg_base); 4200 } 4201 } 4202 4203 static void gaudi2_enable_timestamp(struct hl_device *hdev) 4204 { 4205 /* Disable the timestamp counter */ 4206 WREG32(mmPSOC_TIMESTAMP_BASE, 0); 4207 4208 /* Zero the lower/upper parts of the 64-bit counter */ 4209 WREG32(mmPSOC_TIMESTAMP_BASE + 0xC, 0); 4210 WREG32(mmPSOC_TIMESTAMP_BASE + 0x8, 0); 4211 4212 /* Enable the counter */ 4213 WREG32(mmPSOC_TIMESTAMP_BASE, 1); 4214 } 4215 4216 static void gaudi2_disable_timestamp(struct hl_device *hdev) 4217 { 4218 /* Disable the timestamp counter */ 4219 WREG32(mmPSOC_TIMESTAMP_BASE, 0); 4220 } 4221 4222 static const char *gaudi2_irq_name(u16 irq_number) 4223 { 4224 switch (irq_number) { 4225 case GAUDI2_IRQ_NUM_EVENT_QUEUE: 4226 return "gaudi2 cpu eq"; 4227 case GAUDI2_IRQ_NUM_COMPLETION: 4228 return "gaudi2 completion"; 4229 case GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM ... GAUDI2_IRQ_NUM_SHARED_DEC1_ABNRM: 4230 return gaudi2_vdec_irq_name[irq_number - GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM]; 4231 case GAUDI2_IRQ_NUM_TPC_ASSERT: 4232 return "gaudi2 tpc assert"; 4233 case GAUDI2_IRQ_NUM_UNEXPECTED_ERROR: 4234 return "gaudi2 unexpected error"; 4235 case GAUDI2_IRQ_NUM_USER_FIRST ... 
GAUDI2_IRQ_NUM_USER_LAST: 4236 return "gaudi2 user completion"; 4237 case GAUDI2_IRQ_NUM_EQ_ERROR: 4238 return "gaudi2 eq error"; 4239 default: 4240 return "invalid"; 4241 } 4242 } 4243 4244 static void gaudi2_dec_disable_msix(struct hl_device *hdev, u32 max_irq_num) 4245 { 4246 int i, irq, relative_idx; 4247 struct hl_dec *dec; 4248 4249 for (i = GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM ; i < max_irq_num ; i++) { 4250 irq = pci_irq_vector(hdev->pdev, i); 4251 relative_idx = i - GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM; 4252 4253 dec = hdev->dec + relative_idx / 2; 4254 4255 /* We pass different structures depending on the irq handler. For the abnormal 4256 * interrupt we pass hl_dec and for the regular interrupt we pass the relevant 4257 * user_interrupt entry 4258 */ 4259 free_irq(irq, ((relative_idx % 2) ? 4260 (void *) dec : 4261 (void *) &hdev->user_interrupt[dec->core_id])); 4262 } 4263 } 4264 4265 static int gaudi2_dec_enable_msix(struct hl_device *hdev) 4266 { 4267 int rc, i, irq_init_cnt, irq, relative_idx; 4268 struct hl_dec *dec; 4269 4270 for (i = GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM, irq_init_cnt = 0; 4271 i <= GAUDI2_IRQ_NUM_SHARED_DEC1_ABNRM; 4272 i++, irq_init_cnt++) { 4273 4274 irq = pci_irq_vector(hdev->pdev, i); 4275 relative_idx = i - GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM; 4276 4277 /* We pass different structures depending on the irq handler. For the abnormal 4278 * interrupt we pass hl_dec and for the regular interrupt we pass the relevant 4279 * user_interrupt entry 4280 * 4281 * TODO: change the dec abnrm to threaded irq 4282 */ 4283 4284 dec = hdev->dec + relative_idx / 2; 4285 if (relative_idx % 2) { 4286 rc = request_irq(irq, hl_irq_handler_dec_abnrm, 0, 4287 gaudi2_irq_name(i), (void *) dec); 4288 } else { 4289 rc = request_irq(irq, hl_irq_user_interrupt_handler, 0, gaudi2_irq_name(i), 4290 (void *) &hdev->user_interrupt[dec->core_id]); 4291 } 4292 4293 if (rc) { 4294 dev_err(hdev->dev, "Failed to request IRQ %d", irq); 4295 goto free_dec_irqs; 4296 } 4297 } 4298 4299 return 0; 4300 4301 free_dec_irqs: 4302 gaudi2_dec_disable_msix(hdev, (GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM + irq_init_cnt)); 4303 return rc; 4304 } 4305 4306 static int gaudi2_enable_msix(struct hl_device *hdev) 4307 { 4308 struct asic_fixed_properties *prop = &hdev->asic_prop; 4309 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4310 int rc, irq, i, j, user_irq_init_cnt; 4311 struct hl_cq *cq; 4312 4313 if (gaudi2->hw_cap_initialized & HW_CAP_MSIX) 4314 return 0; 4315 4316 hl_init_cpu_for_irq(hdev); 4317 4318 rc = pci_alloc_irq_vectors(hdev->pdev, GAUDI2_MSIX_ENTRIES, GAUDI2_MSIX_ENTRIES, 4319 PCI_IRQ_MSIX); 4320 if (rc < 0) { 4321 dev_err(hdev->dev, "MSI-X: Failed to enable support -- %d/%d\n", 4322 GAUDI2_MSIX_ENTRIES, rc); 4323 return rc; 4324 } 4325 4326 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_COMPLETION); 4327 cq = &hdev->completion_queue[GAUDI2_RESERVED_CQ_CS_COMPLETION]; 4328 rc = request_irq(irq, hl_irq_handler_cq, 0, gaudi2_irq_name(GAUDI2_IRQ_NUM_COMPLETION), cq); 4329 if (rc) { 4330 dev_err(hdev->dev, "Failed to request IRQ %d", irq); 4331 goto free_irq_vectors; 4332 } 4333 4334 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_EVENT_QUEUE); 4335 rc = request_irq(irq, hl_irq_handler_eq, 0, gaudi2_irq_name(GAUDI2_IRQ_NUM_EVENT_QUEUE), 4336 &hdev->event_queue); 4337 if (rc) { 4338 dev_err(hdev->dev, "Failed to request IRQ %d", irq); 4339 goto free_completion_irq; 4340 } 4341 4342 rc = gaudi2_dec_enable_msix(hdev); 4343 if (rc) { 4344 dev_err(hdev->dev, "Failed to enable decoder IRQ"); 4345 goto free_event_irq; 4346 
} 4347 4348 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_TPC_ASSERT); 4349 rc = request_threaded_irq(irq, NULL, hl_irq_user_interrupt_thread_handler, IRQF_ONESHOT, 4350 gaudi2_irq_name(GAUDI2_IRQ_NUM_TPC_ASSERT), 4351 &hdev->tpc_interrupt); 4352 if (rc) { 4353 dev_err(hdev->dev, "Failed to request IRQ %d", irq); 4354 goto free_dec_irq; 4355 } 4356 4357 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_UNEXPECTED_ERROR); 4358 rc = request_threaded_irq(irq, NULL, hl_irq_user_interrupt_thread_handler, IRQF_ONESHOT, 4359 gaudi2_irq_name(GAUDI2_IRQ_NUM_UNEXPECTED_ERROR), 4360 &hdev->unexpected_error_interrupt); 4361 if (rc) { 4362 dev_err(hdev->dev, "Failed to request IRQ %d", irq); 4363 goto free_tpc_irq; 4364 } 4365 4366 for (i = GAUDI2_IRQ_NUM_USER_FIRST, j = prop->user_dec_intr_count, user_irq_init_cnt = 0; 4367 user_irq_init_cnt < prop->user_interrupt_count; 4368 i++, j++, user_irq_init_cnt++) { 4369 4370 irq = pci_irq_vector(hdev->pdev, i); 4371 hl_set_irq_affinity(hdev, irq); 4372 rc = request_irq(irq, hl_irq_user_interrupt_handler, 0, gaudi2_irq_name(i), 4373 &hdev->user_interrupt[j]); 4374 if (rc) { 4375 dev_err(hdev->dev, "Failed to request IRQ %d", irq); 4376 goto free_user_irq; 4377 } 4378 } 4379 4380 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_EQ_ERROR); 4381 rc = request_threaded_irq(irq, NULL, hl_irq_eq_error_interrupt_thread_handler, 4382 IRQF_ONESHOT, gaudi2_irq_name(GAUDI2_IRQ_NUM_EQ_ERROR), 4383 hdev); 4384 if (rc) { 4385 dev_err(hdev->dev, "Failed to request IRQ %d", irq); 4386 goto free_user_irq; 4387 } 4388 4389 gaudi2->hw_cap_initialized |= HW_CAP_MSIX; 4390 4391 return 0; 4392 4393 free_user_irq: 4394 for (i = GAUDI2_IRQ_NUM_USER_FIRST, j = prop->user_dec_intr_count; 4395 i < GAUDI2_IRQ_NUM_USER_FIRST + user_irq_init_cnt ; i++, j++) { 4396 4397 irq = pci_irq_vector(hdev->pdev, i); 4398 irq_set_affinity_and_hint(irq, NULL); 4399 free_irq(irq, &hdev->user_interrupt[j]); 4400 } 4401 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_UNEXPECTED_ERROR); 4402 free_irq(irq, &hdev->unexpected_error_interrupt); 4403 free_tpc_irq: 4404 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_TPC_ASSERT); 4405 free_irq(irq, &hdev->tpc_interrupt); 4406 free_dec_irq: 4407 gaudi2_dec_disable_msix(hdev, GAUDI2_IRQ_NUM_DEC_LAST + 1); 4408 free_event_irq: 4409 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_EVENT_QUEUE); 4410 free_irq(irq, cq); 4411 4412 free_completion_irq: 4413 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_COMPLETION); 4414 free_irq(irq, cq); 4415 4416 free_irq_vectors: 4417 pci_free_irq_vectors(hdev->pdev); 4418 4419 return rc; 4420 } 4421 4422 static void gaudi2_sync_irqs(struct hl_device *hdev) 4423 { 4424 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4425 int i, j; 4426 int irq; 4427 4428 if (!(gaudi2->hw_cap_initialized & HW_CAP_MSIX)) 4429 return; 4430 4431 /* Wait for all pending IRQs to be finished */ 4432 synchronize_irq(pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_COMPLETION)); 4433 4434 for (i = GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM ; i <= GAUDI2_IRQ_NUM_SHARED_DEC1_ABNRM ; i++) { 4435 irq = pci_irq_vector(hdev->pdev, i); 4436 synchronize_irq(irq); 4437 } 4438 4439 synchronize_irq(pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_TPC_ASSERT)); 4440 synchronize_irq(pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_UNEXPECTED_ERROR)); 4441 4442 for (i = GAUDI2_IRQ_NUM_USER_FIRST, j = 0 ; j < hdev->asic_prop.user_interrupt_count; 4443 i++, j++) { 4444 irq = pci_irq_vector(hdev->pdev, i); 4445 synchronize_irq(irq); 4446 } 4447 4448 synchronize_irq(pci_irq_vector(hdev->pdev, 
GAUDI2_IRQ_NUM_EVENT_QUEUE)); 4449 synchronize_irq(pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_EQ_ERROR)); 4450 } 4451 4452 static void gaudi2_disable_msix(struct hl_device *hdev) 4453 { 4454 struct asic_fixed_properties *prop = &hdev->asic_prop; 4455 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4456 struct hl_cq *cq; 4457 int irq, i, j, k; 4458 4459 if (!(gaudi2->hw_cap_initialized & HW_CAP_MSIX)) 4460 return; 4461 4462 gaudi2_sync_irqs(hdev); 4463 4464 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_EVENT_QUEUE); 4465 free_irq(irq, &hdev->event_queue); 4466 4467 gaudi2_dec_disable_msix(hdev, GAUDI2_IRQ_NUM_SHARED_DEC1_ABNRM + 1); 4468 4469 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_TPC_ASSERT); 4470 free_irq(irq, &hdev->tpc_interrupt); 4471 4472 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_UNEXPECTED_ERROR); 4473 free_irq(irq, &hdev->unexpected_error_interrupt); 4474 4475 for (i = GAUDI2_IRQ_NUM_USER_FIRST, j = prop->user_dec_intr_count, k = 0; 4476 k < hdev->asic_prop.user_interrupt_count ; i++, j++, k++) { 4477 4478 irq = pci_irq_vector(hdev->pdev, i); 4479 irq_set_affinity_and_hint(irq, NULL); 4480 free_irq(irq, &hdev->user_interrupt[j]); 4481 } 4482 4483 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_COMPLETION); 4484 cq = &hdev->completion_queue[GAUDI2_RESERVED_CQ_CS_COMPLETION]; 4485 free_irq(irq, cq); 4486 4487 irq = pci_irq_vector(hdev->pdev, GAUDI2_IRQ_NUM_EQ_ERROR); 4488 free_irq(irq, hdev); 4489 4490 pci_free_irq_vectors(hdev->pdev); 4491 4492 gaudi2->hw_cap_initialized &= ~HW_CAP_MSIX; 4493 } 4494 4495 static void gaudi2_stop_dcore_dec(struct hl_device *hdev, int dcore_id) 4496 { 4497 u32 reg_val = FIELD_PREP(DCORE0_VDEC0_BRDG_CTRL_GRACEFUL_STOP_MASK, 0x1); 4498 u32 graceful_pend_mask = DCORE0_VDEC0_BRDG_CTRL_GRACEFUL_PEND_MASK; 4499 u32 timeout_usec, dec_id, dec_bit, offset, graceful; 4500 int rc; 4501 4502 if (hdev->pldm) 4503 timeout_usec = GAUDI2_PLDM_VDEC_TIMEOUT_USEC; 4504 else 4505 timeout_usec = GAUDI2_VDEC_TIMEOUT_USEC; 4506 4507 for (dec_id = 0 ; dec_id < NUM_OF_DEC_PER_DCORE ; dec_id++) { 4508 dec_bit = dcore_id * NUM_OF_DEC_PER_DCORE + dec_id; 4509 if (!(hdev->asic_prop.decoder_enabled_mask & BIT(dec_bit))) 4510 continue; 4511 4512 offset = dcore_id * DCORE_OFFSET + dec_id * DCORE_VDEC_OFFSET; 4513 4514 WREG32(mmDCORE0_DEC0_CMD_SWREG16 + offset, 0); 4515 4516 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_GRACEFUL + offset, reg_val); 4517 4518 /* Wait till all traffic from decoder stops 4519 * before apply core reset. 
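	 * This is done by polling the decoder bridge GRACEFUL register below
	 * until its PEND bit is set, i.e. until the graceful-stop request has
	 * taken effect.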
4520 */ 4521 rc = hl_poll_timeout( 4522 hdev, 4523 mmDCORE0_VDEC0_BRDG_CTRL_GRACEFUL + offset, 4524 graceful, 4525 (graceful & graceful_pend_mask), 4526 100, 4527 timeout_usec); 4528 if (rc) 4529 dev_err(hdev->dev, 4530 "Failed to stop traffic from DCORE%d Decoder %d\n", 4531 dcore_id, dec_id); 4532 } 4533 } 4534 4535 static void gaudi2_stop_pcie_dec(struct hl_device *hdev) 4536 { 4537 u32 reg_val = FIELD_PREP(DCORE0_VDEC0_BRDG_CTRL_GRACEFUL_STOP_MASK, 0x1); 4538 u32 graceful_pend_mask = PCIE_VDEC0_BRDG_CTRL_GRACEFUL_PEND_MASK; 4539 u32 timeout_usec, dec_id, dec_bit, offset, graceful; 4540 int rc; 4541 4542 if (hdev->pldm) 4543 timeout_usec = GAUDI2_PLDM_VDEC_TIMEOUT_USEC; 4544 else 4545 timeout_usec = GAUDI2_VDEC_TIMEOUT_USEC; 4546 4547 for (dec_id = 0 ; dec_id < NUM_OF_DEC_PER_DCORE ; dec_id++) { 4548 dec_bit = PCIE_DEC_SHIFT + dec_id; 4549 if (!(hdev->asic_prop.decoder_enabled_mask & BIT(dec_bit))) 4550 continue; 4551 4552 offset = dec_id * PCIE_VDEC_OFFSET; 4553 4554 WREG32(mmPCIE_DEC0_CMD_SWREG16 + offset, 0); 4555 4556 WREG32(mmPCIE_VDEC0_BRDG_CTRL_GRACEFUL + offset, reg_val); 4557 4558 /* Wait till all traffic from decoder stops 4559 * before apply core reset. 4560 */ 4561 rc = hl_poll_timeout( 4562 hdev, 4563 mmPCIE_VDEC0_BRDG_CTRL_GRACEFUL + offset, 4564 graceful, 4565 (graceful & graceful_pend_mask), 4566 100, 4567 timeout_usec); 4568 if (rc) 4569 dev_err(hdev->dev, 4570 "Failed to stop traffic from PCIe Decoder %d\n", 4571 dec_id); 4572 } 4573 } 4574 4575 static void gaudi2_stop_dec(struct hl_device *hdev) 4576 { 4577 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4578 int dcore_id; 4579 4580 if ((gaudi2->dec_hw_cap_initialized & HW_CAP_DEC_MASK) == 0) 4581 return; 4582 4583 for (dcore_id = 0 ; dcore_id < NUM_OF_DCORES ; dcore_id++) 4584 gaudi2_stop_dcore_dec(hdev, dcore_id); 4585 4586 gaudi2_stop_pcie_dec(hdev); 4587 } 4588 4589 static void gaudi2_set_arc_running_mode(struct hl_device *hdev, u32 cpu_id, u32 run_mode) 4590 { 4591 u32 reg_base, reg_val; 4592 4593 reg_base = gaudi2_arc_blocks_bases[cpu_id]; 4594 if (run_mode == HL_ENGINE_CORE_RUN) 4595 reg_val = FIELD_PREP(ARC_FARM_ARC0_AUX_RUN_HALT_REQ_RUN_REQ_MASK, 1); 4596 else 4597 reg_val = FIELD_PREP(ARC_FARM_ARC0_AUX_RUN_HALT_REQ_HALT_REQ_MASK, 1); 4598 4599 WREG32(reg_base + ARC_HALT_REQ_OFFSET, reg_val); 4600 } 4601 4602 static void gaudi2_halt_arcs(struct hl_device *hdev) 4603 { 4604 u16 arc_id; 4605 4606 for (arc_id = CPU_ID_SCHED_ARC0; arc_id < CPU_ID_MAX; arc_id++) { 4607 if (gaudi2_is_arc_enabled(hdev, arc_id)) 4608 gaudi2_set_arc_running_mode(hdev, arc_id, HL_ENGINE_CORE_HALT); 4609 } 4610 } 4611 4612 static int gaudi2_verify_arc_running_mode(struct hl_device *hdev, u32 cpu_id, u32 run_mode) 4613 { 4614 int rc; 4615 u32 reg_base, val, ack_mask, timeout_usec = 100000; 4616 4617 if (hdev->pldm) 4618 timeout_usec *= 100; 4619 4620 reg_base = gaudi2_arc_blocks_bases[cpu_id]; 4621 if (run_mode == HL_ENGINE_CORE_RUN) 4622 ack_mask = ARC_FARM_ARC0_AUX_RUN_HALT_ACK_RUN_ACK_MASK; 4623 else 4624 ack_mask = ARC_FARM_ARC0_AUX_RUN_HALT_ACK_HALT_ACK_MASK; 4625 4626 rc = hl_poll_timeout(hdev, reg_base + ARC_HALT_ACK_OFFSET, 4627 val, ((val & ack_mask) == ack_mask), 4628 1000, timeout_usec); 4629 4630 if (!rc) { 4631 /* Clear */ 4632 val = FIELD_PREP(ARC_FARM_ARC0_AUX_RUN_HALT_REQ_RUN_REQ_MASK, 0); 4633 WREG32(reg_base + ARC_HALT_REQ_OFFSET, val); 4634 } 4635 4636 return rc; 4637 } 4638 4639 static void gaudi2_reset_arcs(struct hl_device *hdev) 4640 { 4641 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4642 u16 arc_id; 
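	/* As part of the reset flow, clear the driver-side capability bit of
	 * every currently enabled ARC (gaudi2_clr_arc_id_cap() below), so the
	 * ARCs are treated as uninitialized from this point on.
	 */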
4643 4644 if (!gaudi2) 4645 return; 4646 4647 for (arc_id = CPU_ID_SCHED_ARC0; arc_id < CPU_ID_MAX; arc_id++) 4648 if (gaudi2_is_arc_enabled(hdev, arc_id)) 4649 gaudi2_clr_arc_id_cap(hdev, arc_id); 4650 } 4651 4652 static void gaudi2_nic_qmans_manual_flush(struct hl_device *hdev) 4653 { 4654 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4655 u32 queue_id; 4656 int i; 4657 4658 if (!(gaudi2->nic_hw_cap_initialized & HW_CAP_NIC_MASK)) 4659 return; 4660 4661 queue_id = GAUDI2_QUEUE_ID_NIC_0_0; 4662 4663 for (i = 0 ; i < NIC_NUMBER_OF_ENGINES ; i++, queue_id += NUM_OF_PQ_PER_QMAN) { 4664 if (!(hdev->nic_ports_mask & BIT(i))) 4665 continue; 4666 4667 gaudi2_qman_manual_flush_common(hdev, queue_id); 4668 } 4669 } 4670 4671 static int gaudi2_set_engine_cores(struct hl_device *hdev, u32 *core_ids, 4672 u32 num_cores, u32 core_command) 4673 { 4674 int i, rc; 4675 4676 for (i = 0 ; i < num_cores ; i++) { 4677 if (gaudi2_is_arc_enabled(hdev, core_ids[i])) 4678 gaudi2_set_arc_running_mode(hdev, core_ids[i], core_command); 4679 } 4680 4681 for (i = 0 ; i < num_cores ; i++) { 4682 if (gaudi2_is_arc_enabled(hdev, core_ids[i])) { 4683 rc = gaudi2_verify_arc_running_mode(hdev, core_ids[i], core_command); 4684 4685 if (rc) { 4686 dev_err(hdev->dev, "failed to %s arc: %d\n", 4687 (core_command == HL_ENGINE_CORE_HALT) ? 4688 "HALT" : "RUN", core_ids[i]); 4689 return -1; 4690 } 4691 } 4692 } 4693 4694 return 0; 4695 } 4696 4697 static int gaudi2_set_tpc_engine_mode(struct hl_device *hdev, u32 engine_id, u32 engine_command) 4698 { 4699 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4700 u32 reg_base, reg_addr, reg_val, tpc_id; 4701 4702 if (!(gaudi2->tpc_hw_cap_initialized & HW_CAP_TPC_MASK)) 4703 return 0; 4704 4705 tpc_id = gaudi2_tpc_engine_id_to_tpc_id[engine_id]; 4706 if (!(gaudi2->tpc_hw_cap_initialized & BIT_ULL(HW_CAP_TPC_SHIFT + tpc_id))) 4707 return 0; 4708 4709 reg_base = gaudi2_tpc_cfg_blocks_bases[tpc_id]; 4710 reg_addr = reg_base + TPC_CFG_STALL_OFFSET; 4711 reg_val = FIELD_PREP(DCORE0_TPC0_CFG_TPC_STALL_V_MASK, 4712 (engine_command == HL_ENGINE_STALL) ? 1 : 0); 4713 WREG32(reg_addr, reg_val); 4714 4715 if (engine_command == HL_ENGINE_RESUME) { 4716 reg_base = gaudi2_tpc_eml_cfg_blocks_bases[tpc_id]; 4717 reg_addr = reg_base + TPC_EML_CFG_DBG_CNT_OFFSET; 4718 RMWREG32(reg_addr, 0x1, DCORE0_TPC0_EML_CFG_DBG_CNT_DBG_EXIT_MASK); 4719 } 4720 4721 return 0; 4722 } 4723 4724 static int gaudi2_set_mme_engine_mode(struct hl_device *hdev, u32 engine_id, u32 engine_command) 4725 { 4726 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4727 u32 reg_base, reg_addr, reg_val, mme_id; 4728 4729 mme_id = gaudi2_mme_engine_id_to_mme_id[engine_id]; 4730 if (!(gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_MME_SHIFT + mme_id))) 4731 return 0; 4732 4733 reg_base = gaudi2_mme_ctrl_lo_blocks_bases[mme_id]; 4734 reg_addr = reg_base + MME_CTRL_LO_QM_STALL_OFFSET; 4735 reg_val = FIELD_PREP(DCORE0_MME_CTRL_LO_QM_STALL_V_MASK, 4736 (engine_command == HL_ENGINE_STALL) ? 
1 : 0); 4737 WREG32(reg_addr, reg_val); 4738 4739 return 0; 4740 } 4741 4742 static int gaudi2_set_edma_engine_mode(struct hl_device *hdev, u32 engine_id, u32 engine_command) 4743 { 4744 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4745 u32 reg_base, reg_addr, reg_val, edma_id; 4746 4747 if (!(gaudi2->hw_cap_initialized & HW_CAP_EDMA_MASK)) 4748 return 0; 4749 4750 edma_id = gaudi2_edma_engine_id_to_edma_id[engine_id]; 4751 if (!(gaudi2->hw_cap_initialized & BIT_ULL(HW_CAP_EDMA_SHIFT + edma_id))) 4752 return 0; 4753 4754 reg_base = gaudi2_dma_core_blocks_bases[edma_id]; 4755 reg_addr = reg_base + EDMA_CORE_CFG_STALL_OFFSET; 4756 reg_val = FIELD_PREP(DCORE0_EDMA0_CORE_CFG_1_HALT_MASK, 4757 (engine_command == HL_ENGINE_STALL) ? 1 : 0); 4758 WREG32(reg_addr, reg_val); 4759 4760 if (engine_command == HL_ENGINE_STALL) { 4761 reg_val = FIELD_PREP(DCORE0_EDMA0_CORE_CFG_1_HALT_MASK, 0x1) | 4762 FIELD_PREP(DCORE0_EDMA0_CORE_CFG_1_FLUSH_MASK, 0x1); 4763 WREG32(reg_addr, reg_val); 4764 } 4765 4766 return 0; 4767 } 4768 4769 static int gaudi2_set_engine_modes(struct hl_device *hdev, 4770 u32 *engine_ids, u32 num_engines, u32 engine_command) 4771 { 4772 int i, rc; 4773 4774 for (i = 0 ; i < num_engines ; ++i) { 4775 switch (engine_ids[i]) { 4776 case GAUDI2_DCORE0_ENGINE_ID_TPC_0 ... GAUDI2_DCORE0_ENGINE_ID_TPC_5: 4777 case GAUDI2_DCORE1_ENGINE_ID_TPC_0 ... GAUDI2_DCORE1_ENGINE_ID_TPC_5: 4778 case GAUDI2_DCORE2_ENGINE_ID_TPC_0 ... GAUDI2_DCORE2_ENGINE_ID_TPC_5: 4779 case GAUDI2_DCORE3_ENGINE_ID_TPC_0 ... GAUDI2_DCORE3_ENGINE_ID_TPC_5: 4780 rc = gaudi2_set_tpc_engine_mode(hdev, engine_ids[i], engine_command); 4781 if (rc) 4782 return rc; 4783 4784 break; 4785 case GAUDI2_DCORE0_ENGINE_ID_MME: 4786 case GAUDI2_DCORE1_ENGINE_ID_MME: 4787 case GAUDI2_DCORE2_ENGINE_ID_MME: 4788 case GAUDI2_DCORE3_ENGINE_ID_MME: 4789 rc = gaudi2_set_mme_engine_mode(hdev, engine_ids[i], engine_command); 4790 if (rc) 4791 return rc; 4792 4793 break; 4794 case GAUDI2_DCORE0_ENGINE_ID_EDMA_0 ... GAUDI2_DCORE0_ENGINE_ID_EDMA_1: 4795 case GAUDI2_DCORE1_ENGINE_ID_EDMA_0 ... GAUDI2_DCORE1_ENGINE_ID_EDMA_1: 4796 case GAUDI2_DCORE2_ENGINE_ID_EDMA_0 ... GAUDI2_DCORE2_ENGINE_ID_EDMA_1: 4797 case GAUDI2_DCORE3_ENGINE_ID_EDMA_0 ... 
GAUDI2_DCORE3_ENGINE_ID_EDMA_1: 4798 rc = gaudi2_set_edma_engine_mode(hdev, engine_ids[i], engine_command); 4799 if (rc) 4800 return rc; 4801 4802 break; 4803 default: 4804 dev_err(hdev->dev, "Invalid engine ID %u\n", engine_ids[i]); 4805 return -EINVAL; 4806 } 4807 } 4808 4809 return 0; 4810 } 4811 4812 static int gaudi2_set_engines(struct hl_device *hdev, u32 *engine_ids, 4813 u32 num_engines, u32 engine_command) 4814 { 4815 switch (engine_command) { 4816 case HL_ENGINE_CORE_HALT: 4817 case HL_ENGINE_CORE_RUN: 4818 return gaudi2_set_engine_cores(hdev, engine_ids, num_engines, engine_command); 4819 4820 case HL_ENGINE_STALL: 4821 case HL_ENGINE_RESUME: 4822 return gaudi2_set_engine_modes(hdev, engine_ids, num_engines, engine_command); 4823 4824 default: 4825 dev_err(hdev->dev, "failed to execute command id %u\n", engine_command); 4826 return -EINVAL; 4827 } 4828 } 4829 4830 static void gaudi2_halt_engines(struct hl_device *hdev, bool hard_reset, bool fw_reset) 4831 { 4832 u32 wait_timeout_ms; 4833 4834 if (hdev->pldm) 4835 wait_timeout_ms = GAUDI2_PLDM_RESET_WAIT_MSEC; 4836 else 4837 wait_timeout_ms = GAUDI2_RESET_WAIT_MSEC; 4838 4839 if (fw_reset) 4840 goto skip_engines; 4841 4842 gaudi2_stop_dma_qmans(hdev); 4843 gaudi2_stop_mme_qmans(hdev); 4844 gaudi2_stop_tpc_qmans(hdev); 4845 gaudi2_stop_rot_qmans(hdev); 4846 gaudi2_stop_nic_qmans(hdev); 4847 msleep(wait_timeout_ms); 4848 4849 gaudi2_halt_arcs(hdev); 4850 gaudi2_dma_stall(hdev); 4851 gaudi2_mme_stall(hdev); 4852 gaudi2_tpc_stall(hdev); 4853 gaudi2_rotator_stall(hdev); 4854 4855 msleep(wait_timeout_ms); 4856 4857 gaudi2_stop_dec(hdev); 4858 4859 /* 4860 * In case of soft reset, do a manual flush for QMANs (currently called 4861 * only for NIC QMANs) 4862 */ 4863 if (!hard_reset) 4864 gaudi2_nic_qmans_manual_flush(hdev); 4865 4866 gaudi2_disable_dma_qmans(hdev); 4867 gaudi2_disable_mme_qmans(hdev); 4868 gaudi2_disable_tpc_qmans(hdev); 4869 gaudi2_disable_rot_qmans(hdev); 4870 gaudi2_disable_nic_qmans(hdev); 4871 gaudi2_disable_timestamp(hdev); 4872 4873 skip_engines: 4874 if (hard_reset) { 4875 gaudi2_disable_msix(hdev); 4876 return; 4877 } 4878 4879 gaudi2_sync_irqs(hdev); 4880 } 4881 4882 static void gaudi2_init_firmware_preload_params(struct hl_device *hdev) 4883 { 4884 struct pre_fw_load_props *pre_fw_load = &hdev->fw_loader.pre_fw_load; 4885 4886 pre_fw_load->cpu_boot_status_reg = mmPSOC_GLOBAL_CONF_CPU_BOOT_STATUS; 4887 pre_fw_load->sts_boot_dev_sts0_reg = mmCPU_BOOT_DEV_STS0; 4888 pre_fw_load->sts_boot_dev_sts1_reg = mmCPU_BOOT_DEV_STS1; 4889 pre_fw_load->boot_err0_reg = mmCPU_BOOT_ERR0; 4890 pre_fw_load->boot_err1_reg = mmCPU_BOOT_ERR1; 4891 pre_fw_load->wait_for_preboot_timeout = GAUDI2_PREBOOT_REQ_TIMEOUT_USEC; 4892 pre_fw_load->wait_for_preboot_extended_timeout = 4893 GAUDI2_PREBOOT_EXTENDED_REQ_TIMEOUT_USEC; 4894 } 4895 4896 static void gaudi2_init_firmware_loader(struct hl_device *hdev) 4897 { 4898 struct fw_load_mgr *fw_loader = &hdev->fw_loader; 4899 struct dynamic_fw_load_mgr *dynamic_loader; 4900 struct cpu_dyn_regs *dyn_regs; 4901 4902 /* fill common fields */ 4903 fw_loader->fw_comp_loaded = FW_TYPE_NONE; 4904 fw_loader->boot_fit_img.image_name = GAUDI2_BOOT_FIT_FILE; 4905 fw_loader->linux_img.image_name = GAUDI2_LINUX_FW_FILE; 4906 fw_loader->boot_fit_timeout = GAUDI2_BOOT_FIT_REQ_TIMEOUT_USEC; 4907 fw_loader->skip_bmc = false; 4908 fw_loader->sram_bar_id = SRAM_CFG_BAR_ID; 4909 fw_loader->dram_bar_id = DRAM_BAR_ID; 4910 fw_loader->cpu_timeout = GAUDI2_CPU_TIMEOUT_USEC; 4911 4912 /* here we update initial values for 
a few specific dynamic regs (as 4913 * before reading the first descriptor from FW those values have to be 4914 * hard-coded). In later stages of the protocol those values will be 4915 * updated automatically by reading the FW descriptor so data there 4916 * will always be up-to-date 4917 */ 4918 dynamic_loader = &hdev->fw_loader.dynamic_loader; 4919 dyn_regs = &dynamic_loader->comm_desc.cpu_dyn_regs; 4920 dyn_regs->kmd_msg_to_cpu = cpu_to_le32(mmPSOC_GLOBAL_CONF_KMD_MSG_TO_CPU); 4921 dyn_regs->cpu_cmd_status_to_host = cpu_to_le32(mmCPU_CMD_STATUS_TO_HOST); 4922 dynamic_loader->wait_for_bl_timeout = GAUDI2_WAIT_FOR_BL_TIMEOUT_USEC; 4923 } 4924 4925 static int gaudi2_init_cpu(struct hl_device *hdev) 4926 { 4927 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4928 int rc; 4929 4930 if (!(hdev->fw_components & FW_TYPE_PREBOOT_CPU)) 4931 return 0; 4932 4933 if (gaudi2->hw_cap_initialized & HW_CAP_CPU) 4934 return 0; 4935 4936 rc = hl_fw_init_cpu(hdev); 4937 if (rc) 4938 return rc; 4939 4940 gaudi2->hw_cap_initialized |= HW_CAP_CPU; 4941 4942 return 0; 4943 } 4944 4945 static int gaudi2_init_cpu_queues(struct hl_device *hdev, u32 cpu_timeout) 4946 { 4947 struct hl_hw_queue *cpu_pq = &hdev->kernel_queues[GAUDI2_QUEUE_ID_CPU_PQ]; 4948 struct asic_fixed_properties *prop = &hdev->asic_prop; 4949 struct gaudi2_device *gaudi2 = hdev->asic_specific; 4950 struct cpu_dyn_regs *dyn_regs; 4951 struct hl_eq *eq; 4952 u32 status; 4953 int err; 4954 4955 if (!hdev->cpu_queues_enable) 4956 return 0; 4957 4958 if (gaudi2->hw_cap_initialized & HW_CAP_CPU_Q) 4959 return 0; 4960 4961 eq = &hdev->event_queue; 4962 4963 dyn_regs = &hdev->fw_loader.dynamic_loader.comm_desc.cpu_dyn_regs; 4964 4965 WREG32(mmCPU_IF_PQ_BASE_ADDR_LOW, lower_32_bits(cpu_pq->bus_address)); 4966 WREG32(mmCPU_IF_PQ_BASE_ADDR_HIGH, upper_32_bits(cpu_pq->bus_address)); 4967 4968 WREG32(mmCPU_IF_EQ_BASE_ADDR_LOW, lower_32_bits(eq->bus_address)); 4969 WREG32(mmCPU_IF_EQ_BASE_ADDR_HIGH, upper_32_bits(eq->bus_address)); 4970 4971 WREG32(mmCPU_IF_CQ_BASE_ADDR_LOW, lower_32_bits(hdev->cpu_accessible_dma_address)); 4972 WREG32(mmCPU_IF_CQ_BASE_ADDR_HIGH, upper_32_bits(hdev->cpu_accessible_dma_address)); 4973 4974 WREG32(mmCPU_IF_PQ_LENGTH, HL_QUEUE_SIZE_IN_BYTES); 4975 WREG32(mmCPU_IF_EQ_LENGTH, HL_EQ_SIZE_IN_BYTES); 4976 WREG32(mmCPU_IF_CQ_LENGTH, HL_CPU_ACCESSIBLE_MEM_SIZE); 4977 4978 /* Used for EQ CI */ 4979 WREG32(mmCPU_IF_EQ_RD_OFFS, 0); 4980 4981 WREG32(mmCPU_IF_PF_PQ_PI, 0); 4982 4983 WREG32(mmCPU_IF_QUEUE_INIT, PQ_INIT_STATUS_READY_FOR_CP); 4984 4985 /* Let the ARC know we are ready as it is now handling those queues */ 4986 4987 WREG32(le32_to_cpu(dyn_regs->gic_host_pi_upd_irq), 4988 gaudi2_irq_map_table[GAUDI2_EVENT_CPU_PI_UPDATE].cpu_id); 4989 4990 err = hl_poll_timeout( 4991 hdev, 4992 mmCPU_IF_QUEUE_INIT, 4993 status, 4994 (status == PQ_INIT_STATUS_READY_FOR_HOST), 4995 1000, 4996 cpu_timeout); 4997 4998 if (err) { 4999 dev_err(hdev->dev, "Failed to communicate with device CPU (timeout)\n"); 5000 return -EIO; 5001 } 5002 5003 /* update FW application security bits */ 5004 if (prop->fw_cpu_boot_dev_sts0_valid) 5005 prop->fw_app_cpu_boot_dev_sts0 = RREG32(mmCPU_BOOT_DEV_STS0); 5006 5007 if (prop->fw_cpu_boot_dev_sts1_valid) 5008 prop->fw_app_cpu_boot_dev_sts1 = RREG32(mmCPU_BOOT_DEV_STS1); 5009 5010 gaudi2->hw_cap_initialized |= HW_CAP_CPU_Q; 5011 return 0; 5012 } 5013 5014 static void gaudi2_init_qman_pq(struct hl_device *hdev, u32 reg_base, 5015 u32 queue_id_base) 5016 { 5017 struct hl_hw_queue *q; 5018 u32 pq_id, pq_offset; 5019 5020 
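	/* For each physical queue of this QMAN, program the PQ base address
	 * (the DRAM address when the queue is DRAM-resident (q->dram_bd),
	 * otherwise the host bus address), the PQ size as log2 of the queue
	 * length, and reset the PI/CI pointers.
	 */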
for (pq_id = 0 ; pq_id < NUM_OF_PQ_PER_QMAN ; pq_id++) { 5021 q = &hdev->kernel_queues[queue_id_base + pq_id]; 5022 pq_offset = pq_id * 4; 5023 5024 if (q->dram_bd) { 5025 WREG32(reg_base + QM_PQ_BASE_LO_0_OFFSET + pq_offset, 5026 lower_32_bits(q->pq_dram_address)); 5027 WREG32(reg_base + QM_PQ_BASE_HI_0_OFFSET + pq_offset, 5028 upper_32_bits(q->pq_dram_address)); 5029 } else { 5030 WREG32(reg_base + QM_PQ_BASE_LO_0_OFFSET + pq_offset, 5031 lower_32_bits(q->bus_address)); 5032 WREG32(reg_base + QM_PQ_BASE_HI_0_OFFSET + pq_offset, 5033 upper_32_bits(q->bus_address)); 5034 } 5035 WREG32(reg_base + QM_PQ_SIZE_0_OFFSET + pq_offset, ilog2(HL_QUEUE_LENGTH)); 5036 WREG32(reg_base + QM_PQ_PI_0_OFFSET + pq_offset, 0); 5037 WREG32(reg_base + QM_PQ_CI_0_OFFSET + pq_offset, 0); 5038 } 5039 } 5040 5041 static void gaudi2_init_qman_cp(struct hl_device *hdev, u32 reg_base) 5042 { 5043 u32 cp_id, cp_offset, mtr_base_lo, mtr_base_hi, so_base_lo, so_base_hi; 5044 5045 mtr_base_lo = lower_32_bits(CFG_BASE + mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRL_0); 5046 mtr_base_hi = upper_32_bits(CFG_BASE + mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRL_0); 5047 so_base_lo = lower_32_bits(CFG_BASE + mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0); 5048 so_base_hi = upper_32_bits(CFG_BASE + mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0); 5049 5050 for (cp_id = 0 ; cp_id < NUM_OF_CP_PER_QMAN; cp_id++) { 5051 cp_offset = cp_id * 4; 5052 5053 WREG32(reg_base + QM_CP_MSG_BASE0_ADDR_LO_0_OFFSET + cp_offset, mtr_base_lo); 5054 WREG32(reg_base + QM_CP_MSG_BASE0_ADDR_HI_0_OFFSET + cp_offset, mtr_base_hi); 5055 WREG32(reg_base + QM_CP_MSG_BASE1_ADDR_LO_0_OFFSET + cp_offset, so_base_lo); 5056 WREG32(reg_base + QM_CP_MSG_BASE1_ADDR_HI_0_OFFSET + cp_offset, so_base_hi); 5057 } 5058 5059 /* allow QMANs to accept work from ARC CQF */ 5060 WREG32(reg_base + QM_CP_CFG_OFFSET, FIELD_PREP(PDMA0_QM_CP_CFG_SWITCH_EN_MASK, 0x1)); 5061 } 5062 5063 static void gaudi2_init_qman_pqc(struct hl_device *hdev, u32 reg_base, 5064 u32 queue_id_base) 5065 { 5066 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5067 u32 pq_id, pq_offset, so_base_lo, so_base_hi; 5068 5069 so_base_lo = lower_32_bits(CFG_BASE + mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0); 5070 so_base_hi = upper_32_bits(CFG_BASE + mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0); 5071 5072 for (pq_id = 0 ; pq_id < NUM_OF_PQ_PER_QMAN ; pq_id++) { 5073 pq_offset = pq_id * 4; 5074 5075 /* Configure QMAN HBW to scratchpad as it is not needed */ 5076 WREG32(reg_base + QM_PQC_HBW_BASE_LO_0_OFFSET + pq_offset, 5077 lower_32_bits(gaudi2->scratchpad_bus_address)); 5078 WREG32(reg_base + QM_PQC_HBW_BASE_HI_0_OFFSET + pq_offset, 5079 upper_32_bits(gaudi2->scratchpad_bus_address)); 5080 WREG32(reg_base + QM_PQC_SIZE_0_OFFSET + pq_offset, 5081 ilog2(PAGE_SIZE / sizeof(struct hl_cq_entry))); 5082 5083 WREG32(reg_base + QM_PQC_PI_0_OFFSET + pq_offset, 0); 5084 WREG32(reg_base + QM_PQC_LBW_WDATA_0_OFFSET + pq_offset, QM_PQC_LBW_WDATA); 5085 WREG32(reg_base + QM_PQC_LBW_BASE_LO_0_OFFSET + pq_offset, so_base_lo); 5086 WREG32(reg_base + QM_PQC_LBW_BASE_HI_0_OFFSET + pq_offset, so_base_hi); 5087 } 5088 5089 /* Enable QMAN H/W completion */ 5090 WREG32(reg_base + QM_PQC_CFG_OFFSET, 1 << PDMA0_QM_PQC_CFG_EN_SHIFT); 5091 } 5092 5093 static u32 gaudi2_get_dyn_sp_reg(struct hl_device *hdev, u32 queue_id_base) 5094 { 5095 struct cpu_dyn_regs *dyn_regs = &hdev->fw_loader.dynamic_loader.comm_desc.cpu_dyn_regs; 5096 u32 sp_reg_addr; 5097 5098 switch (queue_id_base) { 5099 case GAUDI2_QUEUE_ID_PDMA_0_0...GAUDI2_QUEUE_ID_PDMA_1_3: 5100 fallthrough; 5101 case 
GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE0_EDMA_1_3: 5102 fallthrough; 5103 case GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE1_EDMA_1_3: 5104 fallthrough; 5105 case GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE2_EDMA_1_3: 5106 fallthrough; 5107 case GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE3_EDMA_1_3: 5108 sp_reg_addr = le32_to_cpu(dyn_regs->gic_dma_qm_irq_ctrl); 5109 break; 5110 case GAUDI2_QUEUE_ID_DCORE0_MME_0_0...GAUDI2_QUEUE_ID_DCORE0_MME_0_3: 5111 fallthrough; 5112 case GAUDI2_QUEUE_ID_DCORE1_MME_0_0...GAUDI2_QUEUE_ID_DCORE1_MME_0_3: 5113 fallthrough; 5114 case GAUDI2_QUEUE_ID_DCORE2_MME_0_0...GAUDI2_QUEUE_ID_DCORE2_MME_0_3: 5115 fallthrough; 5116 case GAUDI2_QUEUE_ID_DCORE3_MME_0_0...GAUDI2_QUEUE_ID_DCORE3_MME_0_3: 5117 sp_reg_addr = le32_to_cpu(dyn_regs->gic_mme_qm_irq_ctrl); 5118 break; 5119 case GAUDI2_QUEUE_ID_DCORE0_TPC_0_0 ... GAUDI2_QUEUE_ID_DCORE0_TPC_6_3: 5120 fallthrough; 5121 case GAUDI2_QUEUE_ID_DCORE1_TPC_0_0 ... GAUDI2_QUEUE_ID_DCORE1_TPC_5_3: 5122 fallthrough; 5123 case GAUDI2_QUEUE_ID_DCORE2_TPC_0_0 ... GAUDI2_QUEUE_ID_DCORE2_TPC_5_3: 5124 fallthrough; 5125 case GAUDI2_QUEUE_ID_DCORE3_TPC_0_0 ... GAUDI2_QUEUE_ID_DCORE3_TPC_5_3: 5126 sp_reg_addr = le32_to_cpu(dyn_regs->gic_tpc_qm_irq_ctrl); 5127 break; 5128 case GAUDI2_QUEUE_ID_ROT_0_0...GAUDI2_QUEUE_ID_ROT_1_3: 5129 sp_reg_addr = le32_to_cpu(dyn_regs->gic_rot_qm_irq_ctrl); 5130 break; 5131 case GAUDI2_QUEUE_ID_NIC_0_0...GAUDI2_QUEUE_ID_NIC_23_3: 5132 sp_reg_addr = le32_to_cpu(dyn_regs->gic_nic_qm_irq_ctrl); 5133 break; 5134 default: 5135 dev_err(hdev->dev, "Unexpected h/w queue %d\n", queue_id_base); 5136 return 0; 5137 } 5138 5139 return sp_reg_addr; 5140 } 5141 5142 static void gaudi2_init_qman_common(struct hl_device *hdev, u32 reg_base, 5143 u32 queue_id_base) 5144 { 5145 u32 glbl_prot = QMAN_MAKE_TRUSTED, irq_handler_offset; 5146 int map_table_entry; 5147 5148 WREG32(reg_base + QM_GLBL_PROT_OFFSET, glbl_prot); 5149 5150 irq_handler_offset = gaudi2_get_dyn_sp_reg(hdev, queue_id_base); 5151 WREG32(reg_base + QM_GLBL_ERR_ADDR_LO_OFFSET, lower_32_bits(CFG_BASE + irq_handler_offset)); 5152 WREG32(reg_base + QM_GLBL_ERR_ADDR_HI_OFFSET, upper_32_bits(CFG_BASE + irq_handler_offset)); 5153 5154 map_table_entry = gaudi2_qman_async_event_id[queue_id_base]; 5155 WREG32(reg_base + QM_GLBL_ERR_WDATA_OFFSET, 5156 gaudi2_irq_map_table[map_table_entry].cpu_id); 5157 5158 WREG32(reg_base + QM_ARB_ERR_MSG_EN_OFFSET, QM_ARB_ERR_MSG_EN_MASK); 5159 5160 WREG32(reg_base + QM_ARB_SLV_CHOISE_WDT_OFFSET, GAUDI2_ARB_WDT_TIMEOUT); 5161 WREG32(reg_base + QM_GLBL_CFG1_OFFSET, 0); 5162 WREG32(reg_base + QM_GLBL_CFG2_OFFSET, 0); 5163 5164 /* Enable the QMAN channel. 5165 * PDMA QMAN configuration is different, as we do not allow user to 5166 * access some of the CPs. 5167 * PDMA0: CP2/3 are reserved for the ARC usage. 5168 * PDMA1: CP1/2/3 are reserved for the ARC usage. 
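	 * Hence, below, PDMA0/PDMA1 are enabled with their dedicated
	 * PDMA0_QMAN_ENABLE/PDMA1_QMAN_ENABLE masks rather than the generic
	 * QMAN_ENABLE mask.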
5169 */ 5170 if (reg_base == gaudi2_qm_blocks_bases[GAUDI2_QUEUE_ID_PDMA_1_0]) 5171 WREG32(reg_base + QM_GLBL_CFG0_OFFSET, PDMA1_QMAN_ENABLE); 5172 else if (reg_base == gaudi2_qm_blocks_bases[GAUDI2_QUEUE_ID_PDMA_0_0]) 5173 WREG32(reg_base + QM_GLBL_CFG0_OFFSET, PDMA0_QMAN_ENABLE); 5174 else 5175 WREG32(reg_base + QM_GLBL_CFG0_OFFSET, QMAN_ENABLE); 5176 } 5177 5178 static void gaudi2_init_qman(struct hl_device *hdev, u32 reg_base, 5179 u32 queue_id_base) 5180 { 5181 u32 pq_id; 5182 5183 for (pq_id = 0 ; pq_id < NUM_OF_PQ_PER_QMAN ; pq_id++) 5184 hdev->kernel_queues[queue_id_base + pq_id].cq_id = GAUDI2_RESERVED_CQ_CS_COMPLETION; 5185 5186 gaudi2_init_qman_pq(hdev, reg_base, queue_id_base); 5187 gaudi2_init_qman_cp(hdev, reg_base); 5188 gaudi2_init_qman_pqc(hdev, reg_base, queue_id_base); 5189 gaudi2_init_qman_common(hdev, reg_base, queue_id_base); 5190 } 5191 5192 static void gaudi2_init_dma_core(struct hl_device *hdev, u32 reg_base, 5193 u32 dma_core_id, bool is_secure) 5194 { 5195 u32 prot, irq_handler_offset; 5196 struct cpu_dyn_regs *dyn_regs; 5197 int map_table_entry; 5198 5199 prot = 1 << ARC_FARM_KDMA_PROT_ERR_VAL_SHIFT; 5200 if (is_secure) 5201 prot |= 1 << ARC_FARM_KDMA_PROT_VAL_SHIFT; 5202 5203 WREG32(reg_base + DMA_CORE_PROT_OFFSET, prot); 5204 5205 dyn_regs = &hdev->fw_loader.dynamic_loader.comm_desc.cpu_dyn_regs; 5206 irq_handler_offset = le32_to_cpu(dyn_regs->gic_dma_core_irq_ctrl); 5207 5208 WREG32(reg_base + DMA_CORE_ERRMSG_ADDR_LO_OFFSET, 5209 lower_32_bits(CFG_BASE + irq_handler_offset)); 5210 5211 WREG32(reg_base + DMA_CORE_ERRMSG_ADDR_HI_OFFSET, 5212 upper_32_bits(CFG_BASE + irq_handler_offset)); 5213 5214 map_table_entry = gaudi2_dma_core_async_event_id[dma_core_id]; 5215 WREG32(reg_base + DMA_CORE_ERRMSG_WDATA_OFFSET, 5216 gaudi2_irq_map_table[map_table_entry].cpu_id); 5217 5218 /* Enable the DMA channel */ 5219 WREG32(reg_base + DMA_CORE_CFG_0_OFFSET, 1 << ARC_FARM_KDMA_CFG_0_EN_SHIFT); 5220 } 5221 5222 static void gaudi2_init_kdma(struct hl_device *hdev) 5223 { 5224 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5225 u32 reg_base; 5226 5227 if ((gaudi2->hw_cap_initialized & HW_CAP_KDMA) == HW_CAP_KDMA) 5228 return; 5229 5230 reg_base = gaudi2_dma_core_blocks_bases[DMA_CORE_ID_KDMA]; 5231 5232 gaudi2_init_dma_core(hdev, reg_base, DMA_CORE_ID_KDMA, true); 5233 5234 gaudi2->hw_cap_initialized |= HW_CAP_KDMA; 5235 } 5236 5237 static void gaudi2_init_pdma(struct hl_device *hdev) 5238 { 5239 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5240 u32 reg_base; 5241 5242 if ((gaudi2->hw_cap_initialized & HW_CAP_PDMA_MASK) == HW_CAP_PDMA_MASK) 5243 return; 5244 5245 reg_base = gaudi2_dma_core_blocks_bases[DMA_CORE_ID_PDMA0]; 5246 gaudi2_init_dma_core(hdev, reg_base, DMA_CORE_ID_PDMA0, false); 5247 5248 reg_base = gaudi2_qm_blocks_bases[GAUDI2_QUEUE_ID_PDMA_0_0]; 5249 gaudi2_init_qman(hdev, reg_base, GAUDI2_QUEUE_ID_PDMA_0_0); 5250 5251 reg_base = gaudi2_dma_core_blocks_bases[DMA_CORE_ID_PDMA1]; 5252 gaudi2_init_dma_core(hdev, reg_base, DMA_CORE_ID_PDMA1, false); 5253 5254 reg_base = gaudi2_qm_blocks_bases[GAUDI2_QUEUE_ID_PDMA_1_0]; 5255 gaudi2_init_qman(hdev, reg_base, GAUDI2_QUEUE_ID_PDMA_1_0); 5256 5257 gaudi2->hw_cap_initialized |= HW_CAP_PDMA_MASK; 5258 } 5259 5260 static void gaudi2_init_edma_instance(struct hl_device *hdev, u8 seq) 5261 { 5262 u32 reg_base, base_edma_core_id, base_edma_qman_id; 5263 5264 base_edma_core_id = DMA_CORE_ID_EDMA0 + seq; 5265 base_edma_qman_id = edma_stream_base[seq]; 5266 5267 reg_base = 
gaudi2_dma_core_blocks_bases[base_edma_core_id]; 5268 gaudi2_init_dma_core(hdev, reg_base, base_edma_core_id, false); 5269 5270 reg_base = gaudi2_qm_blocks_bases[base_edma_qman_id]; 5271 gaudi2_init_qman(hdev, reg_base, base_edma_qman_id); 5272 } 5273 5274 static void gaudi2_init_edma(struct hl_device *hdev) 5275 { 5276 struct asic_fixed_properties *prop = &hdev->asic_prop; 5277 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5278 int dcore, inst; 5279 5280 if ((gaudi2->hw_cap_initialized & HW_CAP_EDMA_MASK) == HW_CAP_EDMA_MASK) 5281 return; 5282 5283 for (dcore = 0 ; dcore < NUM_OF_DCORES ; dcore++) { 5284 for (inst = 0 ; inst < NUM_OF_EDMA_PER_DCORE ; inst++) { 5285 u8 seq = dcore * NUM_OF_EDMA_PER_DCORE + inst; 5286 5287 if (!(prop->edma_enabled_mask & BIT(seq))) 5288 continue; 5289 5290 gaudi2_init_edma_instance(hdev, seq); 5291 5292 gaudi2->hw_cap_initialized |= BIT_ULL(HW_CAP_EDMA_SHIFT + seq); 5293 } 5294 } 5295 } 5296 5297 /* 5298 * gaudi2_arm_monitors_for_virt_msix_db() - Arm monitors for writing to the virtual MSI-X doorbell. 5299 * @hdev: pointer to habanalabs device structure. 5300 * @sob_id: sync object ID. 5301 * @first_mon_id: ID of first monitor out of 3 consecutive monitors. 5302 * @interrupt_id: interrupt ID. 5303 * 5304 * Some initiators cannot have HBW address in their completion address registers, and thus cannot 5305 * write directly to the HBW host memory of the virtual MSI-X doorbell. 5306 * Instead, they are configured to LBW write to a sync object, and a monitor will do the HBW write. 5307 * 5308 * The mechanism in the sync manager block is composed of a master monitor with 3 messages. 5309 * In addition to the HBW write, the other 2 messages are for preparing the monitor to next 5310 * completion, by decrementing the sync object value and re-arming the monitor. 5311 */ 5312 static void gaudi2_arm_monitors_for_virt_msix_db(struct hl_device *hdev, u32 sob_id, 5313 u32 first_mon_id, u32 interrupt_id) 5314 { 5315 u32 sob_offset, first_mon_offset, mon_offset, payload, sob_group, mode, arm, config; 5316 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5317 u64 addr; 5318 u8 mask; 5319 5320 /* Reset the SOB value */ 5321 sob_offset = sob_id * sizeof(u32); 5322 WREG32(mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + sob_offset, 0); 5323 5324 /* Configure 3 monitors: 5325 * 1. Write interrupt ID to the virtual MSI-X doorbell (master monitor) 5326 * 2. Decrement SOB value by 1. 5327 * 3. Re-arm the master monitor. 
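	 * The master monitor is armed in "greater than or equal" mode with a
	 * mask that selects only this SOB out of its group of 8, so it triggers
	 * once the initiator's LBW write raises the SOB value to 1.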
5328 */ 5329 5330 first_mon_offset = first_mon_id * sizeof(u32); 5331 5332 /* 2nd monitor: Decrement SOB value by 1 */ 5333 mon_offset = first_mon_offset + sizeof(u32); 5334 5335 addr = CFG_BASE + mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + sob_offset; 5336 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRL_0 + mon_offset, lower_32_bits(addr)); 5337 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRH_0 + mon_offset, upper_32_bits(addr)); 5338 5339 payload = FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_SOB_OBJ_VAL_MASK, 0x7FFF) | /* "-1" */ 5340 FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_SOB_OBJ_SIGN_MASK, 1) | 5341 FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_SOB_OBJ_INC_MASK, 1); 5342 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_DATA_0 + mon_offset, payload); 5343 5344 /* 3rd monitor: Re-arm the master monitor */ 5345 mon_offset = first_mon_offset + 2 * sizeof(u32); 5346 5347 addr = CFG_BASE + mmDCORE0_SYNC_MNGR_OBJS_MON_ARM_0 + first_mon_offset; 5348 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRL_0 + mon_offset, lower_32_bits(addr)); 5349 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRH_0 + mon_offset, upper_32_bits(addr)); 5350 5351 sob_group = sob_id / 8; 5352 mask = ~BIT(sob_id & 0x7); 5353 mode = 0; /* comparison mode is "greater than or equal to" */ 5354 arm = FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_ARM_SID_MASK, sob_group) | 5355 FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_ARM_MASK_MASK, mask) | 5356 FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_ARM_SOP_MASK, mode) | 5357 FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_ARM_SOD_MASK, 1); 5358 5359 payload = arm; 5360 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_DATA_0 + mon_offset, payload); 5361 5362 /* 1st monitor (master): Write interrupt ID to the virtual MSI-X doorbell */ 5363 mon_offset = first_mon_offset; 5364 5365 config = FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_CONFIG_WR_NUM_MASK, 2); /* "2": 3 writes */ 5366 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_CONFIG_0 + mon_offset, config); 5367 5368 addr = gaudi2->virt_msix_db_dma_addr; 5369 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRL_0 + mon_offset, lower_32_bits(addr)); 5370 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRH_0 + mon_offset, upper_32_bits(addr)); 5371 5372 payload = interrupt_id; 5373 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_DATA_0 + mon_offset, payload); 5374 5375 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_ARM_0 + mon_offset, arm); 5376 } 5377 5378 static void gaudi2_prepare_sm_for_virt_msix_db(struct hl_device *hdev) 5379 { 5380 u32 decoder_id, sob_id, first_mon_id, interrupt_id; 5381 struct asic_fixed_properties *prop = &hdev->asic_prop; 5382 5383 /* Decoder normal/abnormal interrupts */ 5384 for (decoder_id = 0 ; decoder_id < NUMBER_OF_DEC ; ++decoder_id) { 5385 if (!(prop->decoder_enabled_mask & BIT(decoder_id))) 5386 continue; 5387 5388 sob_id = GAUDI2_RESERVED_SOB_DEC_NRM_FIRST + decoder_id; 5389 first_mon_id = GAUDI2_RESERVED_MON_DEC_NRM_FIRST + 3 * decoder_id; 5390 interrupt_id = GAUDI2_IRQ_NUM_DCORE0_DEC0_NRM + 2 * decoder_id; 5391 gaudi2_arm_monitors_for_virt_msix_db(hdev, sob_id, first_mon_id, interrupt_id); 5392 5393 sob_id = GAUDI2_RESERVED_SOB_DEC_ABNRM_FIRST + decoder_id; 5394 first_mon_id = GAUDI2_RESERVED_MON_DEC_ABNRM_FIRST + 3 * decoder_id; 5395 interrupt_id += 1; 5396 gaudi2_arm_monitors_for_virt_msix_db(hdev, sob_id, first_mon_id, interrupt_id); 5397 } 5398 } 5399 5400 static void gaudi2_init_sm(struct hl_device *hdev) 5401 { 5402 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5403 u64 cq_address; 5404 u32 reg_val; 5405 int i; 5406 5407 /* Enable HBW/LBW CQ for completion monitors */ 5408 reg_val = FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_CONFIG_CQ_EN_MASK, 1); 5409 
reg_val |= FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_CONFIG_LBW_EN_MASK, 1); 5410 5411 for (i = 0 ; i < GAUDI2_MAX_PENDING_CS ; i++) 5412 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_CONFIG_0 + (4 * i), reg_val); 5413 5414 /* Enable only HBW CQ for KDMA completion monitor */ 5415 reg_val = FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_CONFIG_CQ_EN_MASK, 1); 5416 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_CONFIG_0 + (4 * i), reg_val); 5417 5418 /* Init CQ0 DB - configure the monitor to trigger MSI-X interrupt */ 5419 WREG32(mmDCORE0_SYNC_MNGR_GLBL_LBW_ADDR_L_0, lower_32_bits(gaudi2->virt_msix_db_dma_addr)); 5420 WREG32(mmDCORE0_SYNC_MNGR_GLBL_LBW_ADDR_H_0, upper_32_bits(gaudi2->virt_msix_db_dma_addr)); 5421 WREG32(mmDCORE0_SYNC_MNGR_GLBL_LBW_DATA_0, GAUDI2_IRQ_NUM_COMPLETION); 5422 5423 for (i = 0 ; i < GAUDI2_RESERVED_CQ_NUMBER ; i++) { 5424 cq_address = 5425 hdev->completion_queue[i].bus_address; 5426 5427 WREG32(mmDCORE0_SYNC_MNGR_GLBL_CQ_BASE_ADDR_L_0 + (4 * i), 5428 lower_32_bits(cq_address)); 5429 WREG32(mmDCORE0_SYNC_MNGR_GLBL_CQ_BASE_ADDR_H_0 + (4 * i), 5430 upper_32_bits(cq_address)); 5431 WREG32(mmDCORE0_SYNC_MNGR_GLBL_CQ_SIZE_LOG2_0 + (4 * i), 5432 ilog2(HL_CQ_SIZE_IN_BYTES)); 5433 } 5434 5435 /* Configure kernel ASID and MMU BP*/ 5436 WREG32(mmDCORE0_SYNC_MNGR_GLBL_ASID_SEC, 0x10000); 5437 WREG32(mmDCORE0_SYNC_MNGR_GLBL_ASID_NONE_SEC_PRIV, 0); 5438 5439 /* Initialize sync objects and monitors which are used for the virtual MSI-X doorbell */ 5440 gaudi2_prepare_sm_for_virt_msix_db(hdev); 5441 } 5442 5443 static void gaudi2_init_mme_acc(struct hl_device *hdev, u32 reg_base) 5444 { 5445 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5446 u32 reg_val; 5447 int i; 5448 5449 reg_val = FIELD_PREP(MME_ACC_INTR_MASK_WBC_ERR_RESP_MASK, 0); 5450 reg_val |= FIELD_PREP(MME_ACC_INTR_MASK_AP_SRC_POS_INF_MASK, 1); 5451 reg_val |= FIELD_PREP(MME_ACC_INTR_MASK_AP_SRC_NEG_INF_MASK, 1); 5452 reg_val |= FIELD_PREP(MME_ACC_INTR_MASK_AP_SRC_NAN_MASK, 1); 5453 reg_val |= FIELD_PREP(MME_ACC_INTR_MASK_AP_RESULT_POS_INF_MASK, 1); 5454 reg_val |= FIELD_PREP(MME_ACC_INTR_MASK_AP_RESULT_NEG_INF_MASK, 1); 5455 5456 WREG32(reg_base + MME_ACC_INTR_MASK_OFFSET, reg_val); 5457 WREG32(reg_base + MME_ACC_AP_LFSR_POLY_OFFSET, 0x80DEADAF); 5458 5459 for (i = 0 ; i < MME_NUM_OF_LFSR_SEEDS ; i++) { 5460 WREG32(reg_base + MME_ACC_AP_LFSR_SEED_SEL_OFFSET, i); 5461 WREG32(reg_base + MME_ACC_AP_LFSR_SEED_WDATA_OFFSET, gaudi2->lfsr_rand_seeds[i]); 5462 } 5463 } 5464 5465 static void gaudi2_init_dcore_mme(struct hl_device *hdev, int dcore_id, 5466 bool config_qman_only) 5467 { 5468 u32 queue_id_base, reg_base; 5469 5470 switch (dcore_id) { 5471 case 0: 5472 queue_id_base = GAUDI2_QUEUE_ID_DCORE0_MME_0_0; 5473 break; 5474 case 1: 5475 queue_id_base = GAUDI2_QUEUE_ID_DCORE1_MME_0_0; 5476 break; 5477 case 2: 5478 queue_id_base = GAUDI2_QUEUE_ID_DCORE2_MME_0_0; 5479 break; 5480 case 3: 5481 queue_id_base = GAUDI2_QUEUE_ID_DCORE3_MME_0_0; 5482 break; 5483 default: 5484 dev_err(hdev->dev, "Invalid dcore id %u\n", dcore_id); 5485 return; 5486 } 5487 5488 if (!config_qman_only) { 5489 reg_base = gaudi2_mme_acc_blocks_bases[dcore_id]; 5490 gaudi2_init_mme_acc(hdev, reg_base); 5491 } 5492 5493 reg_base = gaudi2_qm_blocks_bases[queue_id_base]; 5494 gaudi2_init_qman(hdev, reg_base, queue_id_base); 5495 } 5496 5497 static void gaudi2_init_mme(struct hl_device *hdev) 5498 { 5499 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5500 int i; 5501 5502 if ((gaudi2->hw_cap_initialized & HW_CAP_MME_MASK) == HW_CAP_MME_MASK) 5503 return; 5504 5505 for (i = 0 ; i < 
NUM_OF_DCORES ; i++) { 5506 gaudi2_init_dcore_mme(hdev, i, false); 5507 5508 gaudi2->hw_cap_initialized |= BIT_ULL(HW_CAP_MME_SHIFT + i); 5509 } 5510 } 5511 5512 static void gaudi2_init_tpc_cfg(struct hl_device *hdev, u32 reg_base) 5513 { 5514 /* Mask arithmetic and QM interrupts in TPC */ 5515 WREG32(reg_base + TPC_CFG_TPC_INTR_MASK_OFFSET, 0x23FFFE); 5516 5517 /* Set 16 cache lines */ 5518 WREG32(reg_base + TPC_CFG_MSS_CONFIG_OFFSET, 5519 2 << DCORE0_TPC0_CFG_MSS_CONFIG_ICACHE_FETCH_LINE_NUM_SHIFT); 5520 } 5521 5522 struct gaudi2_tpc_init_cfg_data { 5523 enum gaudi2_queue_id dcore_tpc_qid_base[NUM_OF_DCORES]; 5524 }; 5525 5526 static void gaudi2_init_tpc_config(struct hl_device *hdev, int dcore, int inst, 5527 u32 offset, struct iterate_module_ctx *ctx) 5528 { 5529 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5530 struct gaudi2_tpc_init_cfg_data *cfg_data = ctx->data; 5531 u32 queue_id_base; 5532 u8 seq; 5533 5534 queue_id_base = cfg_data->dcore_tpc_qid_base[dcore] + (inst * NUM_OF_PQ_PER_QMAN); 5535 5536 if (dcore == 0 && inst == (NUM_DCORE0_TPC - 1)) 5537 /* gets last sequence number */ 5538 seq = NUM_OF_DCORES * NUM_OF_TPC_PER_DCORE; 5539 else 5540 seq = dcore * NUM_OF_TPC_PER_DCORE + inst; 5541 5542 gaudi2_init_tpc_cfg(hdev, mmDCORE0_TPC0_CFG_BASE + offset); 5543 gaudi2_init_qman(hdev, mmDCORE0_TPC0_QM_BASE + offset, queue_id_base); 5544 5545 gaudi2->tpc_hw_cap_initialized |= BIT_ULL(HW_CAP_TPC_SHIFT + seq); 5546 } 5547 5548 static void gaudi2_init_tpc(struct hl_device *hdev) 5549 { 5550 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5551 struct gaudi2_tpc_init_cfg_data init_cfg_data; 5552 struct iterate_module_ctx tpc_iter; 5553 5554 if (!hdev->asic_prop.tpc_enabled_mask) 5555 return; 5556 5557 if ((gaudi2->tpc_hw_cap_initialized & HW_CAP_TPC_MASK) == HW_CAP_TPC_MASK) 5558 return; 5559 5560 init_cfg_data.dcore_tpc_qid_base[0] = GAUDI2_QUEUE_ID_DCORE0_TPC_0_0; 5561 init_cfg_data.dcore_tpc_qid_base[1] = GAUDI2_QUEUE_ID_DCORE1_TPC_0_0; 5562 init_cfg_data.dcore_tpc_qid_base[2] = GAUDI2_QUEUE_ID_DCORE2_TPC_0_0; 5563 init_cfg_data.dcore_tpc_qid_base[3] = GAUDI2_QUEUE_ID_DCORE3_TPC_0_0; 5564 tpc_iter.fn = &gaudi2_init_tpc_config; 5565 tpc_iter.data = &init_cfg_data; 5566 gaudi2_iterate_tpcs(hdev, &tpc_iter); 5567 } 5568 5569 static void gaudi2_init_rotator(struct hl_device *hdev) 5570 { 5571 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5572 u32 i, reg_base, queue_id; 5573 5574 queue_id = GAUDI2_QUEUE_ID_ROT_0_0; 5575 5576 for (i = 0 ; i < NUM_OF_ROT ; i++, queue_id += NUM_OF_PQ_PER_QMAN) { 5577 reg_base = gaudi2_qm_blocks_bases[queue_id]; 5578 gaudi2_init_qman(hdev, reg_base, queue_id); 5579 5580 gaudi2->hw_cap_initialized |= BIT_ULL(HW_CAP_ROT_SHIFT + i); 5581 } 5582 } 5583 5584 static void gaudi2_init_vdec_brdg_ctrl(struct hl_device *hdev, u64 base_addr, u32 decoder_id) 5585 { 5586 u32 sob_id; 5587 5588 /* VCMD normal interrupt */ 5589 sob_id = GAUDI2_RESERVED_SOB_DEC_NRM_FIRST + decoder_id; 5590 WREG32(base_addr + BRDG_CTRL_NRM_MSIX_LBW_AWADDR, 5591 mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + sob_id * sizeof(u32)); 5592 WREG32(base_addr + BRDG_CTRL_NRM_MSIX_LBW_WDATA, GAUDI2_SOB_INCREMENT_BY_ONE); 5593 5594 /* VCMD abnormal interrupt */ 5595 sob_id = GAUDI2_RESERVED_SOB_DEC_ABNRM_FIRST + decoder_id; 5596 WREG32(base_addr + BRDG_CTRL_ABNRM_MSIX_LBW_AWADDR, 5597 mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + sob_id * sizeof(u32)); 5598 WREG32(base_addr + BRDG_CTRL_ABNRM_MSIX_LBW_WDATA, GAUDI2_SOB_INCREMENT_BY_ONE); 5599 } 5600 5601 static void gaudi2_init_dec(struct hl_device *hdev) 5602 
{ 5603 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5604 u32 dcore_id, dec_id, dec_bit; 5605 u64 base_addr; 5606 5607 if (!hdev->asic_prop.decoder_enabled_mask) 5608 return; 5609 5610 if ((gaudi2->dec_hw_cap_initialized & HW_CAP_DEC_MASK) == HW_CAP_DEC_MASK) 5611 return; 5612 5613 for (dcore_id = 0 ; dcore_id < NUM_OF_DCORES ; dcore_id++) 5614 for (dec_id = 0 ; dec_id < NUM_OF_DEC_PER_DCORE ; dec_id++) { 5615 dec_bit = dcore_id * NUM_OF_DEC_PER_DCORE + dec_id; 5616 5617 if (!(hdev->asic_prop.decoder_enabled_mask & BIT(dec_bit))) 5618 continue; 5619 5620 base_addr = mmDCORE0_DEC0_CMD_BASE + 5621 BRDG_CTRL_BLOCK_OFFSET + 5622 dcore_id * DCORE_OFFSET + 5623 dec_id * DCORE_VDEC_OFFSET; 5624 5625 gaudi2_init_vdec_brdg_ctrl(hdev, base_addr, dec_bit); 5626 5627 gaudi2->dec_hw_cap_initialized |= BIT_ULL(HW_CAP_DEC_SHIFT + dec_bit); 5628 } 5629 5630 for (dec_id = 0 ; dec_id < NUM_OF_PCIE_VDEC ; dec_id++) { 5631 dec_bit = PCIE_DEC_SHIFT + dec_id; 5632 if (!(hdev->asic_prop.decoder_enabled_mask & BIT(dec_bit))) 5633 continue; 5634 5635 base_addr = mmPCIE_DEC0_CMD_BASE + BRDG_CTRL_BLOCK_OFFSET + 5636 dec_id * DCORE_VDEC_OFFSET; 5637 5638 gaudi2_init_vdec_brdg_ctrl(hdev, base_addr, dec_bit); 5639 5640 gaudi2->dec_hw_cap_initialized |= BIT_ULL(HW_CAP_DEC_SHIFT + dec_bit); 5641 } 5642 } 5643 5644 static int gaudi2_mmu_update_asid_hop0_addr(struct hl_device *hdev, 5645 u32 stlb_base, u32 asid, u64 phys_addr) 5646 { 5647 u32 status, timeout_usec; 5648 int rc; 5649 5650 if (hdev->pldm || !hdev->pdev) 5651 timeout_usec = GAUDI2_PLDM_MMU_TIMEOUT_USEC; 5652 else 5653 timeout_usec = MMU_CONFIG_TIMEOUT_USEC; 5654 5655 WREG32(stlb_base + STLB_ASID_OFFSET, asid); 5656 WREG32(stlb_base + STLB_HOP0_PA43_12_OFFSET, phys_addr >> MMU_HOP0_PA43_12_SHIFT); 5657 WREG32(stlb_base + STLB_HOP0_PA63_44_OFFSET, phys_addr >> MMU_HOP0_PA63_44_SHIFT); 5658 WREG32(stlb_base + STLB_BUSY_OFFSET, 0x80000000); 5659 5660 rc = hl_poll_timeout( 5661 hdev, 5662 stlb_base + STLB_BUSY_OFFSET, 5663 status, 5664 !(status & 0x80000000), 5665 1000, 5666 timeout_usec); 5667 5668 if (rc) { 5669 dev_err(hdev->dev, "Timeout during MMU hop0 config of asid %d\n", asid); 5670 return rc; 5671 } 5672 5673 return 0; 5674 } 5675 5676 static void gaudi2_mmu_send_invalidate_cache_cmd(struct hl_device *hdev, u32 stlb_base, 5677 u32 start_offset, u32 inv_start_val, 5678 u32 flags) 5679 { 5680 /* clear PMMU mem line cache (only needed in mmu range invalidation) */ 5681 if (flags & MMU_OP_CLEAR_MEMCACHE) 5682 WREG32(mmPMMU_HBW_STLB_MEM_CACHE_INVALIDATION, 0x1); 5683 5684 if (flags & MMU_OP_SKIP_LOW_CACHE_INV) 5685 return; 5686 5687 WREG32(stlb_base + start_offset, inv_start_val); 5688 } 5689 5690 static int gaudi2_mmu_invalidate_cache_status_poll(struct hl_device *hdev, u32 stlb_base, 5691 struct gaudi2_cache_invld_params *inv_params) 5692 { 5693 u32 status, timeout_usec, start_offset; 5694 int rc; 5695 5696 timeout_usec = (hdev->pldm) ? 
GAUDI2_PLDM_MMU_TIMEOUT_USEC : 5697 GAUDI2_MMU_CACHE_INV_TIMEOUT_USEC; 5698 5699 /* poll PMMU mem line cache (only needed in mmu range invalidation) */ 5700 if (inv_params->flags & MMU_OP_CLEAR_MEMCACHE) { 5701 rc = hl_poll_timeout( 5702 hdev, 5703 mmPMMU_HBW_STLB_MEM_CACHE_INV_STATUS, 5704 status, 5705 status & 0x1, 5706 1000, 5707 timeout_usec); 5708 5709 if (rc) 5710 return rc; 5711 5712 /* Need to manually reset the status to 0 */ 5713 WREG32(mmPMMU_HBW_STLB_MEM_CACHE_INV_STATUS, 0x0); 5714 } 5715 5716 /* Lower cache does not work with cache lines, hence we can skip its 5717 * invalidation upon map and invalidate only upon unmap 5718 */ 5719 if (inv_params->flags & MMU_OP_SKIP_LOW_CACHE_INV) 5720 return 0; 5721 5722 start_offset = inv_params->range_invalidation ? 5723 STLB_RANGE_CACHE_INVALIDATION_OFFSET : STLB_INV_ALL_START_OFFSET; 5724 5725 rc = hl_poll_timeout( 5726 hdev, 5727 stlb_base + start_offset, 5728 status, 5729 !(status & 0x1), 5730 1000, 5731 timeout_usec); 5732 5733 return rc; 5734 } 5735 5736 bool gaudi2_is_hmmu_enabled(struct hl_device *hdev, int dcore_id, int hmmu_id) 5737 { 5738 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5739 u32 hw_cap; 5740 5741 hw_cap = HW_CAP_DCORE0_DMMU0 << (NUM_OF_HMMU_PER_DCORE * dcore_id + hmmu_id); 5742 5743 if (gaudi2->hw_cap_initialized & hw_cap) 5744 return true; 5745 5746 return false; 5747 } 5748 5749 /* this function shall be called only for HMMUs whose capability bit is set */ 5750 static inline u32 get_hmmu_stlb_base(int dcore_id, int hmmu_id) 5751 { 5752 u32 offset; 5753 5754 offset = (u32) (dcore_id * DCORE_OFFSET + hmmu_id * DCORE_HMMU_OFFSET); 5755 return (u32)(mmDCORE0_HMMU0_STLB_BASE + offset); 5756 } 5757 5758 static void gaudi2_mmu_invalidate_cache_trigger(struct hl_device *hdev, u32 stlb_base, 5759 struct gaudi2_cache_invld_params *inv_params) 5760 { 5761 u32 start_offset; 5762 5763 if (inv_params->range_invalidation) { 5764 /* Set the address range. 5765 * Note that the start address written to the register is, by design, 5766 * not included in the invalidation range. 5767 * That is why we program an address lower than the first address we 5768 * actually want included in the range invalidation. 
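	 * (hence the "inv_params->start_va - 1" that is programmed just below)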
5769 */ 5770 u64 start = inv_params->start_va - 1; 5771 5772 start_offset = STLB_RANGE_CACHE_INVALIDATION_OFFSET; 5773 5774 WREG32(stlb_base + STLB_RANGE_INV_START_LSB_OFFSET, 5775 start >> MMU_RANGE_INV_VA_LSB_SHIFT); 5776 5777 WREG32(stlb_base + STLB_RANGE_INV_START_MSB_OFFSET, 5778 start >> MMU_RANGE_INV_VA_MSB_SHIFT); 5779 5780 WREG32(stlb_base + STLB_RANGE_INV_END_LSB_OFFSET, 5781 inv_params->end_va >> MMU_RANGE_INV_VA_LSB_SHIFT); 5782 5783 WREG32(stlb_base + STLB_RANGE_INV_END_MSB_OFFSET, 5784 inv_params->end_va >> MMU_RANGE_INV_VA_MSB_SHIFT); 5785 } else { 5786 start_offset = STLB_INV_ALL_START_OFFSET; 5787 } 5788 5789 gaudi2_mmu_send_invalidate_cache_cmd(hdev, stlb_base, start_offset, 5790 inv_params->inv_start_val, inv_params->flags); 5791 } 5792 5793 static inline void gaudi2_hmmu_invalidate_cache_trigger(struct hl_device *hdev, 5794 int dcore_id, int hmmu_id, 5795 struct gaudi2_cache_invld_params *inv_params) 5796 { 5797 u32 stlb_base = get_hmmu_stlb_base(dcore_id, hmmu_id); 5798 5799 gaudi2_mmu_invalidate_cache_trigger(hdev, stlb_base, inv_params); 5800 } 5801 5802 static inline int gaudi2_hmmu_invalidate_cache_status_poll(struct hl_device *hdev, 5803 int dcore_id, int hmmu_id, 5804 struct gaudi2_cache_invld_params *inv_params) 5805 { 5806 u32 stlb_base = get_hmmu_stlb_base(dcore_id, hmmu_id); 5807 5808 return gaudi2_mmu_invalidate_cache_status_poll(hdev, stlb_base, inv_params); 5809 } 5810 5811 static int gaudi2_hmmus_invalidate_cache(struct hl_device *hdev, 5812 struct gaudi2_cache_invld_params *inv_params) 5813 { 5814 int dcore_id, hmmu_id; 5815 5816 /* first send all invalidation commands */ 5817 for (dcore_id = 0 ; dcore_id < NUM_OF_DCORES ; dcore_id++) { 5818 for (hmmu_id = 0 ; hmmu_id < NUM_OF_HMMU_PER_DCORE ; hmmu_id++) { 5819 if (!gaudi2_is_hmmu_enabled(hdev, dcore_id, hmmu_id)) 5820 continue; 5821 5822 gaudi2_hmmu_invalidate_cache_trigger(hdev, dcore_id, hmmu_id, inv_params); 5823 } 5824 } 5825 5826 /* next, poll all invalidations status */ 5827 for (dcore_id = 0 ; dcore_id < NUM_OF_DCORES ; dcore_id++) { 5828 for (hmmu_id = 0 ; hmmu_id < NUM_OF_HMMU_PER_DCORE ; hmmu_id++) { 5829 int rc; 5830 5831 if (!gaudi2_is_hmmu_enabled(hdev, dcore_id, hmmu_id)) 5832 continue; 5833 5834 rc = gaudi2_hmmu_invalidate_cache_status_poll(hdev, dcore_id, hmmu_id, 5835 inv_params); 5836 if (rc) 5837 return rc; 5838 } 5839 } 5840 5841 return 0; 5842 } 5843 5844 static int gaudi2_mmu_invalidate_cache(struct hl_device *hdev, bool is_hard, u32 flags) 5845 { 5846 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5847 struct gaudi2_cache_invld_params invld_params; 5848 int rc = 0; 5849 5850 if (hdev->reset_info.hard_reset_pending) 5851 return rc; 5852 5853 invld_params.range_invalidation = false; 5854 invld_params.inv_start_val = 1; 5855 5856 if ((flags & MMU_OP_USERPTR) && (gaudi2->hw_cap_initialized & HW_CAP_PMMU)) { 5857 invld_params.flags = flags; 5858 gaudi2_mmu_invalidate_cache_trigger(hdev, mmPMMU_HBW_STLB_BASE, &invld_params); 5859 rc = gaudi2_mmu_invalidate_cache_status_poll(hdev, mmPMMU_HBW_STLB_BASE, 5860 &invld_params); 5861 } else if (flags & MMU_OP_PHYS_PACK) { 5862 invld_params.flags = 0; 5863 rc = gaudi2_hmmus_invalidate_cache(hdev, &invld_params); 5864 } 5865 5866 return rc; 5867 } 5868 5869 static int gaudi2_mmu_invalidate_cache_range(struct hl_device *hdev, bool is_hard, 5870 u32 flags, u32 asid, u64 va, u64 size) 5871 { 5872 struct gaudi2_cache_invld_params invld_params = {0}; 5873 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5874 u64 start_va, end_va; 5875 u32 
inv_start_val; 5876 int rc = 0; 5877 5878 if (hdev->reset_info.hard_reset_pending) 5879 return 0; 5880 5881 inv_start_val = (1 << MMU_RANGE_INV_EN_SHIFT | 5882 1 << MMU_RANGE_INV_ASID_EN_SHIFT | 5883 asid << MMU_RANGE_INV_ASID_SHIFT); 5884 start_va = va; 5885 end_va = start_va + size; 5886 5887 if ((flags & MMU_OP_USERPTR) && (gaudi2->hw_cap_initialized & HW_CAP_PMMU)) { 5888 /* As range invalidation does not support zero address we will 5889 * do full invalidation in this case 5890 */ 5891 if (start_va) { 5892 invld_params.range_invalidation = true; 5893 invld_params.start_va = start_va; 5894 invld_params.end_va = end_va; 5895 invld_params.inv_start_val = inv_start_val; 5896 invld_params.flags = flags | MMU_OP_CLEAR_MEMCACHE; 5897 } else { 5898 invld_params.range_invalidation = false; 5899 invld_params.inv_start_val = 1; 5900 invld_params.flags = flags; 5901 } 5902 5903 5904 gaudi2_mmu_invalidate_cache_trigger(hdev, mmPMMU_HBW_STLB_BASE, &invld_params); 5905 rc = gaudi2_mmu_invalidate_cache_status_poll(hdev, mmPMMU_HBW_STLB_BASE, 5906 &invld_params); 5907 if (rc) 5908 return rc; 5909 5910 } else if (flags & MMU_OP_PHYS_PACK) { 5911 invld_params.start_va = gaudi2_mmu_scramble_addr(hdev, start_va); 5912 invld_params.end_va = gaudi2_mmu_scramble_addr(hdev, end_va); 5913 invld_params.inv_start_val = inv_start_val; 5914 invld_params.flags = flags; 5915 rc = gaudi2_hmmus_invalidate_cache(hdev, &invld_params); 5916 } 5917 5918 return rc; 5919 } 5920 5921 static int gaudi2_mmu_update_hop0_addr(struct hl_device *hdev, u32 stlb_base, 5922 bool host_resident_pgt) 5923 { 5924 struct asic_fixed_properties *prop = &hdev->asic_prop; 5925 u64 hop0_addr; 5926 u32 asid, max_asid = prop->max_asid; 5927 int rc; 5928 5929 /* it takes too much time to init all of the ASIDs on palladium */ 5930 if (hdev->pldm) 5931 max_asid = min((u32) 8, max_asid); 5932 5933 for (asid = 0 ; asid < max_asid ; asid++) { 5934 if (host_resident_pgt) 5935 hop0_addr = hdev->mmu_priv.hr.mmu_asid_hop0[asid].phys_addr; 5936 else 5937 hop0_addr = prop->mmu_pgt_addr + (asid * prop->dmmu.hop_table_size); 5938 5939 rc = gaudi2_mmu_update_asid_hop0_addr(hdev, stlb_base, asid, hop0_addr); 5940 if (rc) { 5941 dev_err(hdev->dev, "failed to set hop0 addr for asid %d\n", asid); 5942 return rc; 5943 } 5944 } 5945 5946 return 0; 5947 } 5948 5949 static int gaudi2_mmu_init_common(struct hl_device *hdev, u32 mmu_base, u32 stlb_base, 5950 bool host_resident_pgt) 5951 { 5952 u32 status, timeout_usec; 5953 int rc; 5954 5955 if (hdev->pldm || !hdev->pdev) 5956 timeout_usec = GAUDI2_PLDM_MMU_TIMEOUT_USEC; 5957 else 5958 timeout_usec = GAUDI2_MMU_CACHE_INV_TIMEOUT_USEC; 5959 5960 WREG32(stlb_base + STLB_INV_ALL_START_OFFSET, 1); 5961 5962 rc = hl_poll_timeout( 5963 hdev, 5964 stlb_base + STLB_SRAM_INIT_OFFSET, 5965 status, 5966 !status, 5967 1000, 5968 timeout_usec); 5969 5970 if (rc) 5971 dev_notice_ratelimited(hdev->dev, "Timeout when waiting for MMU SRAM init\n"); 5972 5973 rc = gaudi2_mmu_update_hop0_addr(hdev, stlb_base, host_resident_pgt); 5974 if (rc) 5975 return rc; 5976 5977 WREG32(mmu_base + MMU_BYPASS_OFFSET, 0); 5978 5979 rc = hl_poll_timeout( 5980 hdev, 5981 stlb_base + STLB_INV_ALL_START_OFFSET, 5982 status, 5983 !status, 5984 1000, 5985 timeout_usec); 5986 5987 if (rc) 5988 dev_notice_ratelimited(hdev->dev, "Timeout when waiting for MMU invalidate all\n"); 5989 5990 WREG32(mmu_base + MMU_ENABLE_OFFSET, 1); 5991 5992 return rc; 5993 } 5994 5995 static int gaudi2_pci_mmu_init(struct hl_device *hdev) 5996 { 5997 struct asic_fixed_properties 
*prop = &hdev->asic_prop; 5998 struct gaudi2_device *gaudi2 = hdev->asic_specific; 5999 u32 mmu_base, stlb_base; 6000 int rc; 6001 6002 if (gaudi2->hw_cap_initialized & HW_CAP_PMMU) 6003 return 0; 6004 6005 mmu_base = mmPMMU_HBW_MMU_BASE; 6006 stlb_base = mmPMMU_HBW_STLB_BASE; 6007 6008 RMWREG32_SHIFTED(stlb_base + STLB_HOP_CONFIGURATION_OFFSET, 6009 (0 << PMMU_HBW_STLB_HOP_CONFIGURATION_FIRST_HOP_SHIFT) | 6010 (5 << PMMU_HBW_STLB_HOP_CONFIGURATION_FIRST_LOOKUP_HOP_SMALL_P_SHIFT) | 6011 (4 << PMMU_HBW_STLB_HOP_CONFIGURATION_FIRST_LOOKUP_HOP_LARGE_P_SHIFT) | 6012 (5 << PMMU_HBW_STLB_HOP_CONFIGURATION_LAST_HOP_SHIFT) | 6013 (5 << PMMU_HBW_STLB_HOP_CONFIGURATION_FOLLOWER_HOP_SHIFT), 6014 PMMU_HBW_STLB_HOP_CONFIGURATION_FIRST_HOP_MASK | 6015 PMMU_HBW_STLB_HOP_CONFIGURATION_FIRST_LOOKUP_HOP_SMALL_P_MASK | 6016 PMMU_HBW_STLB_HOP_CONFIGURATION_FIRST_LOOKUP_HOP_LARGE_P_MASK | 6017 PMMU_HBW_STLB_HOP_CONFIGURATION_LAST_HOP_MASK | 6018 PMMU_HBW_STLB_HOP_CONFIGURATION_FOLLOWER_HOP_MASK); 6019 6020 WREG32(stlb_base + STLB_LL_LOOKUP_MASK_63_32_OFFSET, 0); 6021 6022 if (PAGE_SIZE == SZ_64K) { 6023 /* Set page sizes to 64K on hop5 and 16M on hop4 + enable 8 bit hops */ 6024 RMWREG32_SHIFTED(mmu_base + MMU_STATIC_MULTI_PAGE_SIZE_OFFSET, 6025 FIELD_PREP(DCORE0_HMMU0_MMU_STATIC_MULTI_PAGE_SIZE_HOP5_PAGE_SIZE_MASK, 4) | 6026 FIELD_PREP(DCORE0_HMMU0_MMU_STATIC_MULTI_PAGE_SIZE_HOP4_PAGE_SIZE_MASK, 3) | 6027 FIELD_PREP( 6028 DCORE0_HMMU0_MMU_STATIC_MULTI_PAGE_SIZE_CFG_8_BITS_HOP_MODE_EN_MASK, 6029 1), 6030 DCORE0_HMMU0_MMU_STATIC_MULTI_PAGE_SIZE_HOP5_PAGE_SIZE_MASK | 6031 DCORE0_HMMU0_MMU_STATIC_MULTI_PAGE_SIZE_HOP4_PAGE_SIZE_MASK | 6032 DCORE0_HMMU0_MMU_STATIC_MULTI_PAGE_SIZE_CFG_8_BITS_HOP_MODE_EN_MASK); 6033 } 6034 6035 WREG32(mmu_base + MMU_SPI_SEI_MASK_OFFSET, GAUDI2_PMMU_SPI_SEI_ENABLE_MASK); 6036 6037 rc = gaudi2_mmu_init_common(hdev, mmu_base, stlb_base, prop->pmmu.host_resident); 6038 if (rc) 6039 return rc; 6040 6041 gaudi2->hw_cap_initialized |= HW_CAP_PMMU; 6042 6043 return 0; 6044 } 6045 6046 static int gaudi2_dcore_hmmu_init(struct hl_device *hdev, int dcore_id, 6047 int hmmu_id) 6048 { 6049 struct asic_fixed_properties *prop = &hdev->asic_prop; 6050 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6051 u32 offset, mmu_base, stlb_base, hw_cap; 6052 u8 dmmu_seq; 6053 int rc; 6054 6055 dmmu_seq = NUM_OF_HMMU_PER_DCORE * dcore_id + hmmu_id; 6056 hw_cap = HW_CAP_DCORE0_DMMU0 << dmmu_seq; 6057 6058 /* 6059 * return if DMMU is already initialized or if it's not out of 6060 * isolation (due to cluster binning) 6061 */ 6062 if ((gaudi2->hw_cap_initialized & hw_cap) || !(prop->hmmu_hif_enabled_mask & BIT(dmmu_seq))) 6063 return 0; 6064 6065 offset = (u32) (dcore_id * DCORE_OFFSET + hmmu_id * DCORE_HMMU_OFFSET); 6066 mmu_base = mmDCORE0_HMMU0_MMU_BASE + offset; 6067 stlb_base = mmDCORE0_HMMU0_STLB_BASE + offset; 6068 6069 RMWREG32(mmu_base + MMU_STATIC_MULTI_PAGE_SIZE_OFFSET, 5 /* 64MB */, 6070 MMU_STATIC_MULTI_PAGE_SIZE_HOP4_PAGE_SIZE_MASK); 6071 6072 RMWREG32_SHIFTED(stlb_base + STLB_HOP_CONFIGURATION_OFFSET, 6073 FIELD_PREP(DCORE0_HMMU0_STLB_HOP_CONFIGURATION_FIRST_HOP_MASK, 0) | 6074 FIELD_PREP(DCORE0_HMMU0_STLB_HOP_CONFIGURATION_FIRST_LOOKUP_HOP_SMALL_P_MASK, 3) | 6075 FIELD_PREP(DCORE0_HMMU0_STLB_HOP_CONFIGURATION_FIRST_LOOKUP_HOP_LARGE_P_MASK, 3) | 6076 FIELD_PREP(DCORE0_HMMU0_STLB_HOP_CONFIGURATION_LAST_HOP_MASK, 3) | 6077 FIELD_PREP(DCORE0_HMMU0_STLB_HOP_CONFIGURATION_FOLLOWER_HOP_MASK, 3), 6078 DCORE0_HMMU0_STLB_HOP_CONFIGURATION_FIRST_HOP_MASK | 6079 
DCORE0_HMMU0_STLB_HOP_CONFIGURATION_FIRST_LOOKUP_HOP_SMALL_P_MASK | 6080 DCORE0_HMMU0_STLB_HOP_CONFIGURATION_FIRST_LOOKUP_HOP_LARGE_P_MASK | 6081 DCORE0_HMMU0_STLB_HOP_CONFIGURATION_LAST_HOP_MASK | 6082 DCORE0_HMMU0_STLB_HOP_CONFIGURATION_FOLLOWER_HOP_MASK); 6083 6084 RMWREG32(stlb_base + STLB_HOP_CONFIGURATION_OFFSET, 1, 6085 STLB_HOP_CONFIGURATION_ONLY_LARGE_PAGE_MASK); 6086 6087 WREG32(mmu_base + MMU_SPI_SEI_MASK_OFFSET, GAUDI2_HMMU_SPI_SEI_ENABLE_MASK); 6088 6089 rc = gaudi2_mmu_init_common(hdev, mmu_base, stlb_base, prop->dmmu.host_resident); 6090 if (rc) 6091 return rc; 6092 6093 gaudi2->hw_cap_initialized |= hw_cap; 6094 6095 return 0; 6096 } 6097 6098 static int gaudi2_hbm_mmu_init(struct hl_device *hdev) 6099 { 6100 int rc, dcore_id, hmmu_id; 6101 6102 for (dcore_id = 0 ; dcore_id < NUM_OF_DCORES ; dcore_id++) 6103 for (hmmu_id = 0 ; hmmu_id < NUM_OF_HMMU_PER_DCORE; hmmu_id++) { 6104 rc = gaudi2_dcore_hmmu_init(hdev, dcore_id, hmmu_id); 6105 if (rc) 6106 return rc; 6107 } 6108 6109 return 0; 6110 } 6111 6112 static int gaudi2_mmu_init(struct hl_device *hdev) 6113 { 6114 int rc; 6115 6116 rc = gaudi2_pci_mmu_init(hdev); 6117 if (rc) 6118 return rc; 6119 6120 rc = gaudi2_hbm_mmu_init(hdev); 6121 if (rc) 6122 return rc; 6123 6124 return 0; 6125 } 6126 6127 static int gaudi2_hw_init(struct hl_device *hdev) 6128 { 6129 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6130 int rc; 6131 6132 /* Let's mark in the H/W that we have reached this point. We check 6133 * this value in the reset_before_init function to understand whether 6134 * we need to reset the chip before doing H/W init. This register is 6135 * cleared by the H/W upon H/W reset 6136 */ 6137 WREG32(mmHW_STATE, HL_DEVICE_HW_STATE_DIRTY); 6138 6139 /* Perform read from the device to make sure device is up */ 6140 RREG32(mmHW_STATE); 6141 6142 /* If iATU is done by FW, the HBM bar ALWAYS points to DRAM_PHYS_BASE. 
6143 * So we set it here and if anyone tries to move it later to 6144 * a different address, there will be an error 6145 */ 6146 if (hdev->asic_prop.iatu_done_by_fw) 6147 gaudi2->dram_bar_cur_addr = DRAM_PHYS_BASE; 6148 6149 /* 6150 * Before pushing u-boot/linux to device, need to set the hbm bar to 6151 * base address of dram 6152 */ 6153 if (gaudi2_set_hbm_bar_base(hdev, DRAM_PHYS_BASE) == U64_MAX) { 6154 dev_err(hdev->dev, "failed to map HBM bar to DRAM base address\n"); 6155 return -EIO; 6156 } 6157 6158 rc = gaudi2_init_cpu(hdev); 6159 if (rc) { 6160 dev_err(hdev->dev, "failed to initialize CPU\n"); 6161 return rc; 6162 } 6163 6164 gaudi2_init_scrambler_hbm(hdev); 6165 gaudi2_init_kdma(hdev); 6166 6167 rc = gaudi2_init_cpu_queues(hdev, GAUDI2_CPU_TIMEOUT_USEC); 6168 if (rc) { 6169 dev_err(hdev->dev, "failed to initialize CPU H/W queues %d\n", rc); 6170 return rc; 6171 } 6172 6173 rc = gaudi2->cpucp_info_get(hdev); 6174 if (rc) { 6175 dev_err(hdev->dev, "Failed to get cpucp info\n"); 6176 return rc; 6177 } 6178 6179 rc = gaudi2_mmu_init(hdev); 6180 if (rc) 6181 return rc; 6182 6183 gaudi2_init_pdma(hdev); 6184 gaudi2_init_edma(hdev); 6185 gaudi2_init_sm(hdev); 6186 gaudi2_init_tpc(hdev); 6187 gaudi2_init_mme(hdev); 6188 gaudi2_init_rotator(hdev); 6189 gaudi2_init_dec(hdev); 6190 gaudi2_enable_timestamp(hdev); 6191 6192 rc = gaudi2_coresight_init(hdev); 6193 if (rc) 6194 goto disable_queues; 6195 6196 rc = gaudi2_enable_msix(hdev); 6197 if (rc) 6198 goto disable_queues; 6199 6200 /* Perform read from the device to flush all configuration */ 6201 RREG32(mmHW_STATE); 6202 6203 return 0; 6204 6205 disable_queues: 6206 gaudi2_disable_dma_qmans(hdev); 6207 gaudi2_disable_mme_qmans(hdev); 6208 gaudi2_disable_tpc_qmans(hdev); 6209 gaudi2_disable_rot_qmans(hdev); 6210 gaudi2_disable_nic_qmans(hdev); 6211 6212 gaudi2_disable_timestamp(hdev); 6213 6214 return rc; 6215 } 6216 6217 /** 6218 * gaudi2_send_hard_reset_cmd - common function to handle reset 6219 * 6220 * @hdev: pointer to the habanalabs device structure 6221 * 6222 * This function handles the various possible scenarios for reset. 6223 * It considers if reset is handled by driver\FW and what FW components are loaded 6224 */ 6225 static void gaudi2_send_hard_reset_cmd(struct hl_device *hdev) 6226 { 6227 struct cpu_dyn_regs *dyn_regs = &hdev->fw_loader.dynamic_loader.comm_desc.cpu_dyn_regs; 6228 bool heartbeat_reset, preboot_only, cpu_initialized = false; 6229 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6230 u32 cpu_boot_status; 6231 6232 preboot_only = (hdev->fw_loader.fw_comp_loaded == FW_TYPE_PREBOOT_CPU); 6233 heartbeat_reset = (hdev->reset_info.curr_reset_cause == HL_RESET_CAUSE_HEARTBEAT); 6234 6235 /* 6236 * Handle corner case where failure was at cpu management app load, 6237 * and driver didn't detect any failure while loading the FW, 6238 * then at such scenario driver will send only HALT_MACHINE 6239 * and no one will respond to this request since FW already back to preboot 6240 * and it cannot handle such cmd. 6241 * In this case next time the management app loads it'll check on events register 6242 * which will still have the halt indication, and will reboot the device. 6243 * The solution is to let preboot clear all relevant registers before next boot 6244 * once driver send COMMS_RST_DEV. 
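 *
 * To summarize the flow implemented below (a recap of the code, not an
 * additional requirement): when Linux/boot-fit is loaded and the CPU is
 * initialized, HALT_MACHINE is signalled through the GIC and the driver
 * waits GAUDI2_CPU_RESET_WAIT_MSEC; when running with preboot only, when
 * the CPU never reached SRAM_AVAIL, or on a heartbeat-triggered reset,
 * the COMMS path is used instead (hard reset or halt, depending on
 * whether the FW performs the hard reset). For a heartbeat reset with an
 * initialized CPU both steps may run.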
6245 */ 6246 cpu_boot_status = RREG32(mmPSOC_GLOBAL_CONF_CPU_BOOT_STATUS); 6247 6248 if (gaudi2 && (gaudi2->hw_cap_initialized & HW_CAP_CPU) && 6249 (cpu_boot_status == CPU_BOOT_STATUS_SRAM_AVAIL)) 6250 cpu_initialized = true; 6251 6252 /* 6253 * when Linux/Bootfit exist this write to the SP can be interpreted in 2 ways: 6254 * 1. FW reset: FW initiate the reset sequence 6255 * 2. driver reset: FW will start HALT sequence (the preparations for the 6256 * reset but not the reset itself as it is not implemented 6257 * on their part) and LKD will wait to let FW complete the 6258 * sequence before issuing the reset 6259 */ 6260 if (!preboot_only && cpu_initialized) { 6261 WREG32(le32_to_cpu(dyn_regs->gic_host_halt_irq), 6262 gaudi2_irq_map_table[GAUDI2_EVENT_CPU_HALT_MACHINE].cpu_id); 6263 6264 msleep(GAUDI2_CPU_RESET_WAIT_MSEC); 6265 } 6266 6267 /* 6268 * When working with preboot (without Linux/Boot fit) we can 6269 * communicate only using the COMMS commands to issue halt/reset. 6270 * 6271 * For the case in which we are working with Linux/Bootfit this is a hail-mary 6272 * attempt to revive the card in the small chance that the f/w has 6273 * experienced a watchdog event, which caused it to return back to preboot. 6274 * In that case, triggering reset through GIC won't help. We need to 6275 * trigger the reset as if Linux wasn't loaded. 6276 * 6277 * We do it only if the reset cause was HB, because that would be the 6278 * indication of such an event. 6279 * 6280 * In case watchdog hasn't expired but we still got HB, then this won't 6281 * do any damage. 6282 */ 6283 6284 if (heartbeat_reset || preboot_only || !cpu_initialized) { 6285 if (hdev->asic_prop.hard_reset_done_by_fw) 6286 hl_fw_ask_hard_reset_without_linux(hdev); 6287 else 6288 hl_fw_ask_halt_machine_without_linux(hdev); 6289 } 6290 } 6291 6292 /** 6293 * gaudi2_execute_hard_reset - execute hard reset by driver/FW 6294 * 6295 * @hdev: pointer to the habanalabs device structure 6296 * 6297 * This function executes hard reset based on if driver/FW should do the reset 6298 */ 6299 static void gaudi2_execute_hard_reset(struct hl_device *hdev) 6300 { 6301 if (hdev->asic_prop.hard_reset_done_by_fw) { 6302 gaudi2_send_hard_reset_cmd(hdev); 6303 return; 6304 } 6305 6306 /* Set device to handle FLR by H/W as we will put the device 6307 * CPU to halt mode 6308 */ 6309 WREG32(mmPCIE_AUX_FLR_CTRL, 6310 (PCIE_AUX_FLR_CTRL_HW_CTRL_MASK | PCIE_AUX_FLR_CTRL_INT_MASK_MASK)); 6311 6312 gaudi2_send_hard_reset_cmd(hdev); 6313 6314 WREG32(mmPSOC_RESET_CONF_SW_ALL_RST, 1); 6315 } 6316 6317 static int gaudi2_get_soft_rst_done_indication(struct hl_device *hdev, u32 poll_timeout_us) 6318 { 6319 int i, rc = 0; 6320 u32 reg_val; 6321 6322 for (i = 0 ; i < GAUDI2_RESET_POLL_CNT ; i++) 6323 rc = hl_poll_timeout( 6324 hdev, 6325 mmCPU_RST_STATUS_TO_HOST, 6326 reg_val, 6327 reg_val == CPU_RST_STATUS_SOFT_RST_DONE, 6328 1000, 6329 poll_timeout_us); 6330 6331 if (rc) 6332 dev_err(hdev->dev, "Timeout while waiting for FW to complete soft reset (0x%x)\n", 6333 reg_val); 6334 return rc; 6335 } 6336 6337 /** 6338 * gaudi2_execute_soft_reset - execute soft reset by driver/FW 6339 * 6340 * @hdev: pointer to the habanalabs device structure 6341 * @driver_performs_reset: true if driver should perform reset instead of f/w. 6342 * @poll_timeout_us: time to wait for response from f/w. 
6343 * 6344 * This function executes soft reset based on if driver/FW should do the reset 6345 */ 6346 static int gaudi2_execute_soft_reset(struct hl_device *hdev, bool driver_performs_reset, 6347 u32 poll_timeout_us) 6348 { 6349 int rc; 6350 6351 if (!driver_performs_reset) { 6352 if (hl_is_fw_sw_ver_below(hdev, 1, 10)) { 6353 /* set SP to indicate reset request sent to FW */ 6354 WREG32(mmCPU_RST_STATUS_TO_HOST, CPU_RST_STATUS_NA); 6355 6356 WREG32(mmGIC_HOST_SOFT_RST_IRQ_POLL_REG, 6357 gaudi2_irq_map_table[GAUDI2_EVENT_CPU_SOFT_RESET].cpu_id); 6358 6359 /* wait for f/w response */ 6360 rc = gaudi2_get_soft_rst_done_indication(hdev, poll_timeout_us); 6361 } else { 6362 rc = hl_fw_send_soft_reset(hdev); 6363 } 6364 return rc; 6365 } 6366 6367 /* Block access to engines, QMANs and SM during reset, these 6368 * RRs will be reconfigured after soft reset. 6369 * PCIE_MSIX is left unsecured to allow NIC packets processing during the reset. 6370 */ 6371 gaudi2_write_rr_to_all_lbw_rtrs(hdev, RR_TYPE_LONG, NUM_LONG_LBW_RR - 1, 6372 mmDCORE0_TPC0_QM_DCCM_BASE, mmPCIE_MSIX_BASE); 6373 6374 gaudi2_write_rr_to_all_lbw_rtrs(hdev, RR_TYPE_LONG, NUM_LONG_LBW_RR - 2, 6375 mmPCIE_MSIX_BASE + HL_BLOCK_SIZE, 6376 mmPCIE_VDEC1_MSTR_IF_RR_SHRD_HBW_BASE + HL_BLOCK_SIZE); 6377 6378 WREG32(mmPSOC_RESET_CONF_SOFT_RST, 1); 6379 return 0; 6380 } 6381 6382 static void gaudi2_poll_btm_indication(struct hl_device *hdev, u32 poll_timeout_us) 6383 { 6384 int i, rc = 0; 6385 u32 reg_val; 6386 6387 /* We poll the BTM done indication multiple times after reset due to 6388 * a HW errata 'GAUDI2_0300' 6389 */ 6390 for (i = 0 ; i < GAUDI2_RESET_POLL_CNT ; i++) 6391 rc = hl_poll_timeout( 6392 hdev, 6393 mmPSOC_GLOBAL_CONF_BTM_FSM, 6394 reg_val, 6395 reg_val == 0, 6396 1000, 6397 poll_timeout_us); 6398 6399 if (rc) 6400 dev_err(hdev->dev, "Timeout while waiting for device to reset 0x%x\n", reg_val); 6401 } 6402 6403 static int gaudi2_hw_fini(struct hl_device *hdev, bool hard_reset, bool fw_reset) 6404 { 6405 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6406 u32 poll_timeout_us, reset_sleep_ms; 6407 bool driver_performs_reset = false; 6408 int rc; 6409 6410 if (hdev->pldm) { 6411 reset_sleep_ms = hard_reset ? GAUDI2_PLDM_HRESET_TIMEOUT_MSEC : 6412 GAUDI2_PLDM_SRESET_TIMEOUT_MSEC; 6413 poll_timeout_us = GAUDI2_PLDM_RESET_POLL_TIMEOUT_USEC; 6414 } else { 6415 reset_sleep_ms = GAUDI2_RESET_TIMEOUT_MSEC; 6416 poll_timeout_us = GAUDI2_RESET_POLL_TIMEOUT_USEC; 6417 } 6418 6419 if (fw_reset) 6420 goto skip_reset; 6421 6422 gaudi2_reset_arcs(hdev); 6423 6424 if (hard_reset) { 6425 driver_performs_reset = !hdev->asic_prop.hard_reset_done_by_fw; 6426 gaudi2_execute_hard_reset(hdev); 6427 } else { 6428 /* 6429 * As we have to support also work with preboot only (which does not supports 6430 * soft reset) we have to make sure that security is disabled before letting driver 6431 * do the reset. user shall control the BFE flags to avoid asking soft reset in 6432 * secured device with preboot only. 6433 */ 6434 driver_performs_reset = (hdev->fw_components == FW_TYPE_PREBOOT_CPU && 6435 !hdev->asic_prop.fw_security_enabled); 6436 rc = gaudi2_execute_soft_reset(hdev, driver_performs_reset, poll_timeout_us); 6437 if (rc) 6438 return rc; 6439 } 6440 6441 skip_reset: 6442 if (driver_performs_reset || hard_reset) { 6443 /* 6444 * Instead of waiting for BTM indication we should wait for preboot ready: 6445 * Consider the below scenario: 6446 * 1. FW update is being triggered 6447 * - setting the dirty bit 6448 * 2. 
hard reset will be triggered due to the dirty bit 6449 * 3. FW initiates the reset: 6450 * - dirty bit cleared 6451 * - BTM indication cleared 6452 * - preboot ready indication cleared 6453 * 4. during hard reset: 6454 * - BTM indication will be set 6455 * - BIST test performed and another reset triggered 6456 * 5. only after this reset the preboot will set the preboot ready 6457 * 6458 * when polling on BTM indication alone we can lose sync with FW while trying to 6459 * communicate with FW that is during reset. 6460 * to overcome this we will always wait to preboot ready indication 6461 */ 6462 6463 /* without this sleep reset will not work */ 6464 msleep(reset_sleep_ms); 6465 6466 if (hdev->fw_components & FW_TYPE_PREBOOT_CPU) 6467 hl_fw_wait_preboot_ready(hdev); 6468 else 6469 gaudi2_poll_btm_indication(hdev, poll_timeout_us); 6470 } 6471 6472 if (!gaudi2) 6473 return 0; 6474 6475 gaudi2->dec_hw_cap_initialized &= ~(HW_CAP_DEC_MASK); 6476 gaudi2->tpc_hw_cap_initialized &= ~(HW_CAP_TPC_MASK); 6477 6478 /* 6479 * Clear NIC capability mask in order for driver to re-configure 6480 * NIC QMANs. NIC ports will not be re-configured during soft 6481 * reset as we call gaudi2_nic_init only during hard reset 6482 */ 6483 gaudi2->nic_hw_cap_initialized &= ~(HW_CAP_NIC_MASK); 6484 6485 if (hard_reset) { 6486 gaudi2->hw_cap_initialized &= 6487 ~(HW_CAP_DRAM | HW_CAP_CLK_GATE | HW_CAP_HBM_SCRAMBLER_MASK | 6488 HW_CAP_PMMU | HW_CAP_CPU | HW_CAP_CPU_Q | 6489 HW_CAP_SRAM_SCRAMBLER | HW_CAP_DMMU_MASK | 6490 HW_CAP_PDMA_MASK | HW_CAP_EDMA_MASK | HW_CAP_KDMA | 6491 HW_CAP_MME_MASK | HW_CAP_ROT_MASK); 6492 6493 memset(gaudi2->events_stat, 0, sizeof(gaudi2->events_stat)); 6494 } else { 6495 gaudi2->hw_cap_initialized &= 6496 ~(HW_CAP_CLK_GATE | HW_CAP_HBM_SCRAMBLER_SW_RESET | 6497 HW_CAP_PDMA_MASK | HW_CAP_EDMA_MASK | HW_CAP_MME_MASK | 6498 HW_CAP_ROT_MASK); 6499 } 6500 return 0; 6501 } 6502 6503 static int gaudi2_suspend(struct hl_device *hdev) 6504 { 6505 int rc; 6506 6507 rc = hl_fw_send_pci_access_msg(hdev, CPUCP_PACKET_DISABLE_PCI_ACCESS, 0x0); 6508 if (rc) 6509 dev_err(hdev->dev, "Failed to disable PCI access from CPU\n"); 6510 6511 return rc; 6512 } 6513 6514 static int gaudi2_resume(struct hl_device *hdev) 6515 { 6516 return gaudi2_init_iatu(hdev); 6517 } 6518 6519 static int gaudi2_mmap(struct hl_device *hdev, struct vm_area_struct *vma, 6520 void *cpu_addr, dma_addr_t dma_addr, size_t size) 6521 { 6522 int rc; 6523 6524 vm_flags_set(vma, VM_IO | VM_PFNMAP | VM_DONTEXPAND | VM_DONTDUMP | 6525 VM_DONTCOPY | VM_NORESERVE); 6526 6527 #ifdef _HAS_DMA_MMAP_COHERENT 6528 6529 rc = dma_mmap_coherent(hdev->dev, vma, cpu_addr, dma_addr, size); 6530 if (rc) 6531 dev_err(hdev->dev, "dma_mmap_coherent error %d", rc); 6532 6533 #else 6534 6535 rc = remap_pfn_range(vma, vma->vm_start, 6536 virt_to_phys(cpu_addr) >> PAGE_SHIFT, 6537 size, vma->vm_page_prot); 6538 if (rc) 6539 dev_err(hdev->dev, "remap_pfn_range error %d", rc); 6540 6541 #endif 6542 6543 return rc; 6544 } 6545 6546 static bool gaudi2_is_queue_enabled(struct hl_device *hdev, u32 hw_queue_id) 6547 { 6548 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6549 u64 hw_cap_mask = 0; 6550 u64 hw_tpc_cap_bit = 0; 6551 u64 hw_nic_cap_bit = 0; 6552 u64 hw_test_cap_bit = 0; 6553 6554 switch (hw_queue_id) { 6555 case GAUDI2_QUEUE_ID_PDMA_0_0: 6556 case GAUDI2_QUEUE_ID_PDMA_0_1: 6557 case GAUDI2_QUEUE_ID_PDMA_1_0: 6558 hw_cap_mask = HW_CAP_PDMA_MASK; 6559 break; 6560 case GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE0_EDMA_1_3: 6561 hw_test_cap_bit 
= HW_CAP_EDMA_SHIFT + 6562 ((hw_queue_id - GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0) >> 2); 6563 break; 6564 case GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE1_EDMA_1_3: 6565 hw_test_cap_bit = HW_CAP_EDMA_SHIFT + NUM_OF_EDMA_PER_DCORE + 6566 ((hw_queue_id - GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0) >> 2); 6567 break; 6568 case GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE2_EDMA_1_3: 6569 hw_test_cap_bit = HW_CAP_EDMA_SHIFT + 2 * NUM_OF_EDMA_PER_DCORE + 6570 ((hw_queue_id - GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0) >> 2); 6571 break; 6572 case GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0...GAUDI2_QUEUE_ID_DCORE3_EDMA_1_3: 6573 hw_test_cap_bit = HW_CAP_EDMA_SHIFT + 3 * NUM_OF_EDMA_PER_DCORE + 6574 ((hw_queue_id - GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0) >> 2); 6575 break; 6576 6577 case GAUDI2_QUEUE_ID_DCORE0_MME_0_0 ... GAUDI2_QUEUE_ID_DCORE0_MME_0_3: 6578 hw_test_cap_bit = HW_CAP_MME_SHIFT; 6579 break; 6580 6581 case GAUDI2_QUEUE_ID_DCORE1_MME_0_0 ... GAUDI2_QUEUE_ID_DCORE1_MME_0_3: 6582 hw_test_cap_bit = HW_CAP_MME_SHIFT + 1; 6583 break; 6584 6585 case GAUDI2_QUEUE_ID_DCORE2_MME_0_0 ... GAUDI2_QUEUE_ID_DCORE2_MME_0_3: 6586 hw_test_cap_bit = HW_CAP_MME_SHIFT + 2; 6587 break; 6588 6589 case GAUDI2_QUEUE_ID_DCORE3_MME_0_0 ... GAUDI2_QUEUE_ID_DCORE3_MME_0_3: 6590 hw_test_cap_bit = HW_CAP_MME_SHIFT + 3; 6591 break; 6592 6593 case GAUDI2_QUEUE_ID_DCORE0_TPC_0_0 ... GAUDI2_QUEUE_ID_DCORE0_TPC_5_3: 6594 hw_tpc_cap_bit = HW_CAP_TPC_SHIFT + 6595 ((hw_queue_id - GAUDI2_QUEUE_ID_DCORE0_TPC_0_0) >> 2); 6596 6597 /* special case where cap bit refers to the first queue id */ 6598 if (!hw_tpc_cap_bit) 6599 return !!(gaudi2->tpc_hw_cap_initialized & BIT_ULL(0)); 6600 break; 6601 6602 case GAUDI2_QUEUE_ID_DCORE1_TPC_0_0 ... GAUDI2_QUEUE_ID_DCORE1_TPC_5_3: 6603 hw_tpc_cap_bit = HW_CAP_TPC_SHIFT + NUM_OF_TPC_PER_DCORE + 6604 ((hw_queue_id - GAUDI2_QUEUE_ID_DCORE1_TPC_0_0) >> 2); 6605 break; 6606 6607 case GAUDI2_QUEUE_ID_DCORE2_TPC_0_0 ... GAUDI2_QUEUE_ID_DCORE2_TPC_5_3: 6608 hw_tpc_cap_bit = HW_CAP_TPC_SHIFT + (2 * NUM_OF_TPC_PER_DCORE) + 6609 ((hw_queue_id - GAUDI2_QUEUE_ID_DCORE2_TPC_0_0) >> 2); 6610 break; 6611 6612 case GAUDI2_QUEUE_ID_DCORE3_TPC_0_0 ... GAUDI2_QUEUE_ID_DCORE3_TPC_5_3: 6613 hw_tpc_cap_bit = HW_CAP_TPC_SHIFT + (3 * NUM_OF_TPC_PER_DCORE) + 6614 ((hw_queue_id - GAUDI2_QUEUE_ID_DCORE3_TPC_0_0) >> 2); 6615 break; 6616 6617 case GAUDI2_QUEUE_ID_DCORE0_TPC_6_0 ... GAUDI2_QUEUE_ID_DCORE0_TPC_6_3: 6618 hw_tpc_cap_bit = HW_CAP_TPC_SHIFT + (4 * NUM_OF_TPC_PER_DCORE); 6619 break; 6620 6621 case GAUDI2_QUEUE_ID_ROT_0_0 ... GAUDI2_QUEUE_ID_ROT_1_3: 6622 hw_test_cap_bit = HW_CAP_ROT_SHIFT + ((hw_queue_id - GAUDI2_QUEUE_ID_ROT_0_0) >> 2); 6623 break; 6624 6625 case GAUDI2_QUEUE_ID_NIC_0_0 ... 
GAUDI2_QUEUE_ID_NIC_23_3: 6626 hw_nic_cap_bit = HW_CAP_NIC_SHIFT + ((hw_queue_id - GAUDI2_QUEUE_ID_NIC_0_0) >> 2); 6627 6628 /* special case where cap bit refers to the first queue id */ 6629 if (!hw_nic_cap_bit) 6630 return !!(gaudi2->nic_hw_cap_initialized & BIT_ULL(0)); 6631 break; 6632 6633 case GAUDI2_QUEUE_ID_CPU_PQ: 6634 return !!(gaudi2->hw_cap_initialized & HW_CAP_CPU_Q); 6635 6636 default: 6637 return false; 6638 } 6639 6640 if (hw_tpc_cap_bit) 6641 return !!(gaudi2->tpc_hw_cap_initialized & BIT_ULL(hw_tpc_cap_bit)); 6642 6643 if (hw_nic_cap_bit) 6644 return !!(gaudi2->nic_hw_cap_initialized & BIT_ULL(hw_nic_cap_bit)); 6645 6646 if (hw_test_cap_bit) 6647 hw_cap_mask = BIT_ULL(hw_test_cap_bit); 6648 6649 return !!(gaudi2->hw_cap_initialized & hw_cap_mask); 6650 } 6651 6652 static bool gaudi2_is_arc_enabled(struct hl_device *hdev, u64 arc_id) 6653 { 6654 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6655 6656 switch (arc_id) { 6657 case CPU_ID_SCHED_ARC0 ... CPU_ID_SCHED_ARC5: 6658 case CPU_ID_MME_QMAN_ARC0...CPU_ID_ROT_QMAN_ARC1: 6659 return !!(gaudi2->active_hw_arc & BIT_ULL(arc_id)); 6660 6661 case CPU_ID_TPC_QMAN_ARC0...CPU_ID_TPC_QMAN_ARC24: 6662 return !!(gaudi2->active_tpc_arc & BIT_ULL(arc_id - CPU_ID_TPC_QMAN_ARC0)); 6663 6664 case CPU_ID_NIC_QMAN_ARC0...CPU_ID_NIC_QMAN_ARC23: 6665 return !!(gaudi2->active_nic_arc & BIT_ULL(arc_id - CPU_ID_NIC_QMAN_ARC0)); 6666 6667 default: 6668 return false; 6669 } 6670 } 6671 6672 static void gaudi2_clr_arc_id_cap(struct hl_device *hdev, u64 arc_id) 6673 { 6674 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6675 6676 switch (arc_id) { 6677 case CPU_ID_SCHED_ARC0 ... CPU_ID_SCHED_ARC5: 6678 case CPU_ID_MME_QMAN_ARC0...CPU_ID_ROT_QMAN_ARC1: 6679 gaudi2->active_hw_arc &= ~(BIT_ULL(arc_id)); 6680 break; 6681 6682 case CPU_ID_TPC_QMAN_ARC0...CPU_ID_TPC_QMAN_ARC24: 6683 gaudi2->active_tpc_arc &= ~(BIT_ULL(arc_id - CPU_ID_TPC_QMAN_ARC0)); 6684 break; 6685 6686 case CPU_ID_NIC_QMAN_ARC0...CPU_ID_NIC_QMAN_ARC23: 6687 gaudi2->active_nic_arc &= ~(BIT_ULL(arc_id - CPU_ID_NIC_QMAN_ARC0)); 6688 break; 6689 6690 default: 6691 return; 6692 } 6693 } 6694 6695 static void gaudi2_set_arc_id_cap(struct hl_device *hdev, u64 arc_id) 6696 { 6697 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6698 6699 switch (arc_id) { 6700 case CPU_ID_SCHED_ARC0 ... CPU_ID_SCHED_ARC5: 6701 case CPU_ID_MME_QMAN_ARC0...CPU_ID_ROT_QMAN_ARC1: 6702 gaudi2->active_hw_arc |= BIT_ULL(arc_id); 6703 break; 6704 6705 case CPU_ID_TPC_QMAN_ARC0...CPU_ID_TPC_QMAN_ARC24: 6706 gaudi2->active_tpc_arc |= BIT_ULL(arc_id - CPU_ID_TPC_QMAN_ARC0); 6707 break; 6708 6709 case CPU_ID_NIC_QMAN_ARC0...CPU_ID_NIC_QMAN_ARC23: 6710 gaudi2->active_nic_arc |= BIT_ULL(arc_id - CPU_ID_NIC_QMAN_ARC0); 6711 break; 6712 6713 default: 6714 return; 6715 } 6716 } 6717 6718 static void gaudi2_ring_doorbell(struct hl_device *hdev, u32 hw_queue_id, u32 pi) 6719 { 6720 struct cpu_dyn_regs *dyn_regs = &hdev->fw_loader.dynamic_loader.comm_desc.cpu_dyn_regs; 6721 u32 pq_offset, reg_base, db_reg_offset, db_value; 6722 6723 if (hw_queue_id != GAUDI2_QUEUE_ID_CPU_PQ) { 6724 /* 6725 * QMAN has 4 successive PQ_PI registers, 1 for each of the QMAN PQs. 6726 * Masking the H/W queue ID with 0x3 extracts the QMAN internal PQ 6727 * number. 
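 *
 * For example (illustrative): a queue whose internal PQ number is 2
 * gives pq_offset = 2 * 4 = 8, so the doorbell below is written to
 * reg_base + QM_PQ_PI_0_OFFSET + 8, i.e. the third PQ_PI register of
 * that QMAN.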
6728 */ 6729 pq_offset = (hw_queue_id & 0x3) * 4; 6730 reg_base = gaudi2_qm_blocks_bases[hw_queue_id]; 6731 db_reg_offset = reg_base + QM_PQ_PI_0_OFFSET + pq_offset; 6732 } else { 6733 db_reg_offset = mmCPU_IF_PF_PQ_PI; 6734 } 6735 6736 db_value = pi; 6737 6738 /* ring the doorbell */ 6739 WREG32(db_reg_offset, db_value); 6740 6741 if (hw_queue_id == GAUDI2_QUEUE_ID_CPU_PQ) { 6742 /* make sure device CPU will read latest data from host */ 6743 mb(); 6744 WREG32(le32_to_cpu(dyn_regs->gic_host_pi_upd_irq), 6745 gaudi2_irq_map_table[GAUDI2_EVENT_CPU_PI_UPDATE].cpu_id); 6746 } 6747 } 6748 6749 static void gaudi2_pqe_write(struct hl_device *hdev, __le64 *pqe, struct hl_bd *bd) 6750 { 6751 __le64 *pbd = (__le64 *) bd; 6752 6753 /* The QMANs are on the host memory so a simple copy suffice */ 6754 pqe[0] = pbd[0]; 6755 pqe[1] = pbd[1]; 6756 } 6757 6758 static void *gaudi2_dma_alloc_coherent(struct hl_device *hdev, size_t size, 6759 dma_addr_t *dma_handle, gfp_t flags) 6760 { 6761 return dma_alloc_coherent(&hdev->pdev->dev, size, dma_handle, flags); 6762 } 6763 6764 static void gaudi2_dma_free_coherent(struct hl_device *hdev, size_t size, 6765 void *cpu_addr, dma_addr_t dma_handle) 6766 { 6767 dma_free_coherent(&hdev->pdev->dev, size, cpu_addr, dma_handle); 6768 } 6769 6770 static int gaudi2_send_cpu_message(struct hl_device *hdev, u32 *msg, u16 len, 6771 u32 timeout, u64 *result) 6772 { 6773 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6774 6775 if (!(gaudi2->hw_cap_initialized & HW_CAP_CPU_Q)) { 6776 if (result) 6777 *result = 0; 6778 return 0; 6779 } 6780 6781 if (!timeout) 6782 timeout = GAUDI2_MSG_TO_CPU_TIMEOUT_USEC; 6783 6784 return hl_fw_send_cpu_message(hdev, GAUDI2_QUEUE_ID_CPU_PQ, msg, len, timeout, result); 6785 } 6786 6787 static void *gaudi2_dma_pool_zalloc(struct hl_device *hdev, size_t size, 6788 gfp_t mem_flags, dma_addr_t *dma_handle) 6789 { 6790 if (size > GAUDI2_DMA_POOL_BLK_SIZE) 6791 return NULL; 6792 6793 return dma_pool_zalloc(hdev->dma_pool, mem_flags, dma_handle); 6794 } 6795 6796 static void gaudi2_dma_pool_free(struct hl_device *hdev, void *vaddr, dma_addr_t dma_addr) 6797 { 6798 dma_pool_free(hdev->dma_pool, vaddr, dma_addr); 6799 } 6800 6801 static void *gaudi2_cpu_accessible_dma_pool_alloc(struct hl_device *hdev, size_t size, 6802 dma_addr_t *dma_handle) 6803 { 6804 return hl_fw_cpu_accessible_dma_pool_alloc(hdev, size, dma_handle); 6805 } 6806 6807 static void gaudi2_cpu_accessible_dma_pool_free(struct hl_device *hdev, size_t size, void *vaddr) 6808 { 6809 hl_fw_cpu_accessible_dma_pool_free(hdev, size, vaddr); 6810 } 6811 6812 static int gaudi2_validate_cb_address(struct hl_device *hdev, struct hl_cs_parser *parser) 6813 { 6814 struct asic_fixed_properties *asic_prop = &hdev->asic_prop; 6815 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6816 6817 if (!gaudi2_is_queue_enabled(hdev, parser->hw_queue_id)) { 6818 dev_err(hdev->dev, "h/w queue %d is disabled\n", parser->hw_queue_id); 6819 return -EINVAL; 6820 } 6821 6822 /* Just check if CB address is valid */ 6823 6824 if (hl_mem_area_inside_range((u64) (uintptr_t) parser->user_cb, 6825 parser->user_cb_size, 6826 asic_prop->sram_user_base_address, 6827 asic_prop->sram_end_address)) 6828 return 0; 6829 6830 if (hl_mem_area_inside_range((u64) (uintptr_t) parser->user_cb, 6831 parser->user_cb_size, 6832 asic_prop->dram_user_base_address, 6833 asic_prop->dram_end_address)) 6834 return 0; 6835 6836 if ((gaudi2->hw_cap_initialized & HW_CAP_DMMU_MASK) && 6837 hl_mem_area_inside_range((u64) (uintptr_t) 
parser->user_cb, 6838 parser->user_cb_size, 6839 asic_prop->dmmu.start_addr, 6840 asic_prop->dmmu.end_addr)) 6841 return 0; 6842 6843 if (gaudi2->hw_cap_initialized & HW_CAP_PMMU) { 6844 if (hl_mem_area_inside_range((u64) (uintptr_t) parser->user_cb, 6845 parser->user_cb_size, 6846 asic_prop->pmmu.start_addr, 6847 asic_prop->pmmu.end_addr) || 6848 hl_mem_area_inside_range( 6849 (u64) (uintptr_t) parser->user_cb, 6850 parser->user_cb_size, 6851 asic_prop->pmmu_huge.start_addr, 6852 asic_prop->pmmu_huge.end_addr)) 6853 return 0; 6854 6855 } else if (gaudi2_host_phys_addr_valid((u64) (uintptr_t) parser->user_cb)) { 6856 if (!hdev->pdev) 6857 return 0; 6858 6859 if (!device_iommu_mapped(&hdev->pdev->dev)) 6860 return 0; 6861 } 6862 6863 dev_err(hdev->dev, "CB address %p + 0x%x for internal QMAN is not valid\n", 6864 parser->user_cb, parser->user_cb_size); 6865 6866 return -EFAULT; 6867 } 6868 6869 static int gaudi2_cs_parser(struct hl_device *hdev, struct hl_cs_parser *parser) 6870 { 6871 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6872 6873 if (!parser->is_kernel_allocated_cb) 6874 return gaudi2_validate_cb_address(hdev, parser); 6875 6876 if (!(gaudi2->hw_cap_initialized & HW_CAP_PMMU)) { 6877 dev_err(hdev->dev, "PMMU not initialized - Unsupported mode in Gaudi2\n"); 6878 return -EINVAL; 6879 } 6880 6881 return 0; 6882 } 6883 6884 static int gaudi2_send_heartbeat(struct hl_device *hdev) 6885 { 6886 struct gaudi2_device *gaudi2 = hdev->asic_specific; 6887 6888 if (!(gaudi2->hw_cap_initialized & HW_CAP_CPU_Q)) 6889 return 0; 6890 6891 return hl_fw_send_heartbeat(hdev); 6892 } 6893 6894 /* This is an internal helper function, used to update the KDMA mmu props. 6895 * Should be called with a proper kdma lock. 6896 */ 6897 static void gaudi2_kdma_set_mmbp_asid(struct hl_device *hdev, 6898 bool mmu_bypass, u32 asid) 6899 { 6900 u32 rw_asid, rw_mmu_bp; 6901 6902 rw_asid = (asid << ARC_FARM_KDMA_CTX_AXUSER_HB_ASID_RD_SHIFT) | 6903 (asid << ARC_FARM_KDMA_CTX_AXUSER_HB_ASID_WR_SHIFT); 6904 6905 rw_mmu_bp = (!!mmu_bypass << ARC_FARM_KDMA_CTX_AXUSER_HB_MMU_BP_RD_SHIFT) | 6906 (!!mmu_bypass << ARC_FARM_KDMA_CTX_AXUSER_HB_MMU_BP_WR_SHIFT); 6907 6908 WREG32(mmARC_FARM_KDMA_CTX_AXUSER_HB_ASID, rw_asid); 6909 WREG32(mmARC_FARM_KDMA_CTX_AXUSER_HB_MMU_BP, rw_mmu_bp); 6910 } 6911 6912 static void gaudi2_arm_cq_monitor(struct hl_device *hdev, u32 sob_id, u32 mon_id, u32 cq_id, 6913 u32 mon_payload, u32 sync_value) 6914 { 6915 u32 sob_offset, mon_offset, sync_group_id, mode, mon_arm; 6916 u8 mask; 6917 6918 sob_offset = sob_id * 4; 6919 mon_offset = mon_id * 4; 6920 6921 /* Reset the SOB value */ 6922 WREG32(mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + sob_offset, 0); 6923 6924 /* Configure this address with CQ_ID 0 because CQ_EN is set */ 6925 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRL_0 + mon_offset, cq_id); 6926 6927 /* Configure this address with CS index because CQ_EN is set */ 6928 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_DATA_0 + mon_offset, mon_payload); 6929 6930 sync_group_id = sob_id / 8; 6931 mask = ~(1 << (sob_id & 0x7)); 6932 mode = 1; /* comparison mode is "equal to" */ 6933 6934 mon_arm = FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_ARM_SOD_MASK, sync_value); 6935 mon_arm |= FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_ARM_SOP_MASK, mode); 6936 mon_arm |= FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_ARM_MASK_MASK, mask); 6937 mon_arm |= FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_MON_ARM_SID_MASK, sync_group_id); 6938 WREG32(mmDCORE0_SYNC_MNGR_OBJS_MON_ARM_0 + mon_offset, mon_arm); 6939 } 6940 6941 /* This is an internal helper 
function used by gaudi2_send_job_to_kdma only */ 6942 static int gaudi2_send_job_to_kdma(struct hl_device *hdev, 6943 u64 src_addr, u64 dst_addr, 6944 u32 size, bool is_memset) 6945 { 6946 u32 comp_val, commit_mask, *polling_addr, timeout, status = 0; 6947 struct hl_cq_entry *cq_base; 6948 struct hl_cq *cq; 6949 u64 comp_addr; 6950 int rc; 6951 6952 gaudi2_arm_cq_monitor(hdev, GAUDI2_RESERVED_SOB_KDMA_COMPLETION, 6953 GAUDI2_RESERVED_MON_KDMA_COMPLETION, 6954 GAUDI2_RESERVED_CQ_KDMA_COMPLETION, 1, 1); 6955 6956 comp_addr = CFG_BASE + mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + 6957 (GAUDI2_RESERVED_SOB_KDMA_COMPLETION * sizeof(u32)); 6958 6959 comp_val = FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_SOB_OBJ_INC_MASK, 1) | 6960 FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_SOB_OBJ_VAL_MASK, 1); 6961 6962 WREG32(mmARC_FARM_KDMA_CTX_SRC_BASE_LO, lower_32_bits(src_addr)); 6963 WREG32(mmARC_FARM_KDMA_CTX_SRC_BASE_HI, upper_32_bits(src_addr)); 6964 WREG32(mmARC_FARM_KDMA_CTX_DST_BASE_LO, lower_32_bits(dst_addr)); 6965 WREG32(mmARC_FARM_KDMA_CTX_DST_BASE_HI, upper_32_bits(dst_addr)); 6966 WREG32(mmARC_FARM_KDMA_CTX_WR_COMP_ADDR_LO, lower_32_bits(comp_addr)); 6967 WREG32(mmARC_FARM_KDMA_CTX_WR_COMP_ADDR_HI, upper_32_bits(comp_addr)); 6968 WREG32(mmARC_FARM_KDMA_CTX_WR_COMP_WDATA, comp_val); 6969 WREG32(mmARC_FARM_KDMA_CTX_DST_TSIZE_0, size); 6970 6971 commit_mask = FIELD_PREP(ARC_FARM_KDMA_CTX_COMMIT_LIN_MASK, 1) | 6972 FIELD_PREP(ARC_FARM_KDMA_CTX_COMMIT_WR_COMP_EN_MASK, 1); 6973 6974 if (is_memset) 6975 commit_mask |= FIELD_PREP(ARC_FARM_KDMA_CTX_COMMIT_MEM_SET_MASK, 1); 6976 6977 WREG32(mmARC_FARM_KDMA_CTX_COMMIT, commit_mask); 6978 6979 /* Wait for completion */ 6980 cq = &hdev->completion_queue[GAUDI2_RESERVED_CQ_KDMA_COMPLETION]; 6981 cq_base = cq->kernel_address; 6982 polling_addr = (u32 *)&cq_base[cq->ci]; 6983 6984 if (hdev->pldm) 6985 /* for each 1MB 20 second of timeout */ 6986 timeout = ((size / SZ_1M) + 1) * USEC_PER_SEC * 20; 6987 else 6988 timeout = KDMA_TIMEOUT_USEC; 6989 6990 /* Polling */ 6991 rc = hl_poll_timeout_memory( 6992 hdev, 6993 polling_addr, 6994 status, 6995 (status == 1), 6996 1000, 6997 timeout, 6998 true); 6999 7000 *polling_addr = 0; 7001 7002 if (rc) { 7003 dev_err(hdev->dev, "Timeout while waiting for KDMA to be idle\n"); 7004 WREG32(mmARC_FARM_KDMA_CFG_1, 1 << ARC_FARM_KDMA_CFG_1_HALT_SHIFT); 7005 return rc; 7006 } 7007 7008 cq->ci = hl_cq_inc_ptr(cq->ci); 7009 7010 return 0; 7011 } 7012 7013 static void gaudi2_memset_device_lbw(struct hl_device *hdev, u32 addr, u32 size, u32 val) 7014 { 7015 u32 i; 7016 7017 for (i = 0 ; i < size ; i += sizeof(u32)) 7018 WREG32(addr + i, val); 7019 } 7020 7021 static void gaudi2_qman_set_test_mode(struct hl_device *hdev, u32 hw_queue_id, bool enable) 7022 { 7023 u32 reg_base = gaudi2_qm_blocks_bases[hw_queue_id]; 7024 7025 if (enable) { 7026 WREG32(reg_base + QM_GLBL_PROT_OFFSET, QMAN_MAKE_TRUSTED_TEST_MODE); 7027 WREG32(reg_base + QM_PQC_CFG_OFFSET, 0); 7028 } else { 7029 WREG32(reg_base + QM_GLBL_PROT_OFFSET, QMAN_MAKE_TRUSTED); 7030 WREG32(reg_base + QM_PQC_CFG_OFFSET, 1 << PDMA0_QM_PQC_CFG_EN_SHIFT); 7031 } 7032 } 7033 7034 static inline u32 gaudi2_test_queue_hw_queue_id_to_sob_id(struct hl_device *hdev, u32 hw_queue_id) 7035 { 7036 return hdev->asic_prop.first_available_user_sob[0] + 7037 hw_queue_id - GAUDI2_QUEUE_ID_PDMA_0_0; 7038 } 7039 7040 static void gaudi2_test_queue_clear(struct hl_device *hdev, u32 hw_queue_id) 7041 { 7042 u32 sob_offset = gaudi2_test_queue_hw_queue_id_to_sob_id(hdev, hw_queue_id) * 4; 7043 u32 sob_addr = 
mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + sob_offset; 7044 7045 /* Reset the SOB value */ 7046 WREG32(sob_addr, 0); 7047 } 7048 7049 static int gaudi2_test_queue_send_msg_short(struct hl_device *hdev, u32 hw_queue_id, u32 sob_val, 7050 struct gaudi2_queues_test_info *msg_info) 7051 { 7052 u32 sob_offset = gaudi2_test_queue_hw_queue_id_to_sob_id(hdev, hw_queue_id) * 4; 7053 u32 tmp, sob_base = 1; 7054 struct packet_msg_short *msg_short_pkt = msg_info->kern_addr; 7055 size_t pkt_size = sizeof(struct packet_msg_short); 7056 int rc; 7057 7058 tmp = (PACKET_MSG_SHORT << GAUDI2_PKT_CTL_OPCODE_SHIFT) | 7059 (1 << GAUDI2_PKT_CTL_EB_SHIFT) | 7060 (1 << GAUDI2_PKT_CTL_MB_SHIFT) | 7061 (sob_base << GAUDI2_PKT_SHORT_CTL_BASE_SHIFT) | 7062 (sob_offset << GAUDI2_PKT_SHORT_CTL_ADDR_SHIFT); 7063 7064 msg_short_pkt->value = cpu_to_le32(sob_val); 7065 msg_short_pkt->ctl = cpu_to_le32(tmp); 7066 7067 rc = hl_hw_queue_send_cb_no_cmpl(hdev, hw_queue_id, pkt_size, msg_info->dma_addr); 7068 if (rc) 7069 dev_err(hdev->dev, 7070 "Failed to send msg_short packet to H/W queue %d\n", hw_queue_id); 7071 7072 return rc; 7073 } 7074 7075 static int gaudi2_test_queue_wait_completion(struct hl_device *hdev, u32 hw_queue_id, u32 sob_val) 7076 { 7077 u32 sob_offset = gaudi2_test_queue_hw_queue_id_to_sob_id(hdev, hw_queue_id) * 4; 7078 u32 sob_addr = mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + sob_offset; 7079 u32 timeout_usec, tmp; 7080 int rc; 7081 7082 if (hdev->pldm) 7083 timeout_usec = GAUDI2_PLDM_TEST_QUEUE_WAIT_USEC; 7084 else 7085 timeout_usec = GAUDI2_TEST_QUEUE_WAIT_USEC; 7086 7087 rc = hl_poll_timeout( 7088 hdev, 7089 sob_addr, 7090 tmp, 7091 (tmp == sob_val), 7092 1000, 7093 timeout_usec); 7094 7095 if (rc == -ETIMEDOUT) { 7096 dev_err(hdev->dev, "H/W queue %d test failed (SOB_OBJ_0 == 0x%x)\n", 7097 hw_queue_id, tmp); 7098 rc = -EIO; 7099 } 7100 7101 return rc; 7102 } 7103 7104 static int gaudi2_test_cpu_queue(struct hl_device *hdev) 7105 { 7106 struct gaudi2_device *gaudi2 = hdev->asic_specific; 7107 7108 /* 7109 * check capability here as send_cpu_message() won't update the result 7110 * value if no capability 7111 */ 7112 if (!(gaudi2->hw_cap_initialized & HW_CAP_CPU_Q)) 7113 return 0; 7114 7115 return hl_fw_test_cpu_queue(hdev); 7116 } 7117 7118 static int gaudi2_test_queues(struct hl_device *hdev) 7119 { 7120 struct gaudi2_device *gaudi2 = hdev->asic_specific; 7121 struct gaudi2_queues_test_info *msg_info; 7122 u32 sob_val = 0x5a5a; 7123 int i, rc; 7124 7125 /* send test message on all enabled Qs */ 7126 for (i = GAUDI2_QUEUE_ID_PDMA_0_0 ; i < GAUDI2_QUEUE_ID_CPU_PQ; i++) { 7127 if (!gaudi2_is_queue_enabled(hdev, i) || gaudi2_is_edma_queue_id(i)) 7128 continue; 7129 7130 msg_info = &gaudi2->queues_test_info[i - GAUDI2_QUEUE_ID_PDMA_0_0]; 7131 gaudi2_qman_set_test_mode(hdev, i, true); 7132 gaudi2_test_queue_clear(hdev, i); 7133 rc = gaudi2_test_queue_send_msg_short(hdev, i, sob_val, msg_info); 7134 if (rc) 7135 goto done; 7136 } 7137 7138 rc = gaudi2_test_cpu_queue(hdev); 7139 if (rc) 7140 goto done; 7141 7142 /* verify that all messages were processed */ 7143 for (i = GAUDI2_QUEUE_ID_PDMA_0_0 ; i < GAUDI2_QUEUE_ID_CPU_PQ; i++) { 7144 if (!gaudi2_is_queue_enabled(hdev, i) || gaudi2_is_edma_queue_id(i)) 7145 continue; 7146 7147 rc = gaudi2_test_queue_wait_completion(hdev, i, sob_val); 7148 if (rc) 7149 /* chip is not usable, no need for cleanups, just bail-out with error */ 7150 goto done; 7151 7152 gaudi2_test_queue_clear(hdev, i); 7153 gaudi2_qman_set_test_mode(hdev, i, false); 7154 } 7155 7156 done: 7157 return rc; 7158 
} 7159 7160 static int gaudi2_compute_reset_late_init(struct hl_device *hdev) 7161 { 7162 struct gaudi2_device *gaudi2 = hdev->asic_specific; 7163 size_t irq_arr_size; 7164 int rc; 7165 7166 gaudi2_init_arcs(hdev); 7167 7168 rc = gaudi2_scrub_arcs_dccm(hdev); 7169 if (rc) { 7170 dev_err(hdev->dev, "Failed to scrub arcs DCCM\n"); 7171 return rc; 7172 } 7173 7174 gaudi2_init_security(hdev); 7175 7176 /* Unmask all IRQs since some could have been received during the soft reset */ 7177 irq_arr_size = gaudi2->num_of_valid_hw_events * sizeof(gaudi2->hw_events[0]); 7178 return hl_fw_unmask_irq_arr(hdev, gaudi2->hw_events, irq_arr_size); 7179 } 7180 7181 static bool gaudi2_get_edma_idle_status(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 7182 struct engines_data *e) 7183 { 7184 u32 qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts, dma_core_sts0, dma_core_sts1; 7185 struct asic_fixed_properties *prop = &hdev->asic_prop; 7186 unsigned long *mask = (unsigned long *) mask_arr; 7187 const char *edma_fmt = "%-6d%-6d%-9s%#-14x%#-15x%#x\n"; 7188 bool is_idle = true, is_eng_idle; 7189 int engine_idx, i, j; 7190 u64 offset; 7191 7192 if (e) 7193 hl_engine_data_sprintf(e, 7194 "\nCORE EDMA is_idle QM_GLBL_STS0 DMA_CORE_STS0 DMA_CORE_STS1\n" 7195 "---- ---- ------- ------------ ------------- -------------\n"); 7196 7197 for (i = 0; i < NUM_OF_DCORES; i++) { 7198 for (j = 0 ; j < NUM_OF_EDMA_PER_DCORE ; j++) { 7199 int seq = i * NUM_OF_EDMA_PER_DCORE + j; 7200 7201 if (!(prop->edma_enabled_mask & BIT(seq))) 7202 continue; 7203 7204 engine_idx = GAUDI2_DCORE0_ENGINE_ID_EDMA_0 + 7205 i * GAUDI2_ENGINE_ID_DCORE_OFFSET + j; 7206 offset = i * DCORE_OFFSET + j * DCORE_EDMA_OFFSET; 7207 7208 dma_core_sts0 = RREG32(mmDCORE0_EDMA0_CORE_STS0 + offset); 7209 dma_core_sts1 = RREG32(mmDCORE0_EDMA0_CORE_STS1 + offset); 7210 7211 qm_glbl_sts0 = RREG32(mmDCORE0_EDMA0_QM_GLBL_STS0 + offset); 7212 qm_glbl_sts1 = RREG32(mmDCORE0_EDMA0_QM_GLBL_STS1 + offset); 7213 qm_cgm_sts = RREG32(mmDCORE0_EDMA0_QM_CGM_STS + offset); 7214 7215 is_eng_idle = IS_QM_IDLE(qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts) && 7216 IS_DMA_IDLE(dma_core_sts0) && !IS_DMA_HALTED(dma_core_sts1); 7217 is_idle &= is_eng_idle; 7218 7219 if (mask && !is_eng_idle) 7220 set_bit(engine_idx, mask); 7221 7222 if (e) 7223 hl_engine_data_sprintf(e, edma_fmt, i, j, is_eng_idle ? 
"Y" : "N", 7224 qm_glbl_sts0, dma_core_sts0, dma_core_sts1); 7225 } 7226 } 7227 7228 return is_idle; 7229 } 7230 7231 static bool gaudi2_get_pdma_idle_status(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 7232 struct engines_data *e) 7233 { 7234 u32 qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts, dma_core_sts0, dma_core_sts1; 7235 unsigned long *mask = (unsigned long *) mask_arr; 7236 const char *pdma_fmt = "%-6d%-9s%#-14x%#-15x%#x\n"; 7237 bool is_idle = true, is_eng_idle; 7238 int engine_idx, i; 7239 u64 offset; 7240 7241 if (e) 7242 hl_engine_data_sprintf(e, 7243 "\nPDMA is_idle QM_GLBL_STS0 DMA_CORE_STS0 DMA_CORE_STS1\n" 7244 "---- ------- ------------ ------------- -------------\n"); 7245 7246 for (i = 0 ; i < NUM_OF_PDMA ; i++) { 7247 engine_idx = GAUDI2_ENGINE_ID_PDMA_0 + i; 7248 offset = i * PDMA_OFFSET; 7249 dma_core_sts0 = RREG32(mmPDMA0_CORE_STS0 + offset); 7250 dma_core_sts1 = RREG32(mmPDMA0_CORE_STS1 + offset); 7251 7252 qm_glbl_sts0 = RREG32(mmPDMA0_QM_GLBL_STS0 + offset); 7253 qm_glbl_sts1 = RREG32(mmPDMA0_QM_GLBL_STS1 + offset); 7254 qm_cgm_sts = RREG32(mmPDMA0_QM_CGM_STS + offset); 7255 7256 is_eng_idle = IS_QM_IDLE(qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts) && 7257 IS_DMA_IDLE(dma_core_sts0) && !IS_DMA_HALTED(dma_core_sts1); 7258 is_idle &= is_eng_idle; 7259 7260 if (mask && !is_eng_idle) 7261 set_bit(engine_idx, mask); 7262 7263 if (e) 7264 hl_engine_data_sprintf(e, pdma_fmt, i, is_eng_idle ? "Y" : "N", 7265 qm_glbl_sts0, dma_core_sts0, dma_core_sts1); 7266 } 7267 7268 return is_idle; 7269 } 7270 7271 static bool gaudi2_get_nic_idle_status(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 7272 struct engines_data *e) 7273 { 7274 unsigned long *mask = (unsigned long *) mask_arr; 7275 const char *nic_fmt = "%-5d%-9s%#-14x%#-12x\n"; 7276 u32 qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts; 7277 bool is_idle = true, is_eng_idle; 7278 int engine_idx, i; 7279 u64 offset = 0; 7280 7281 /* NIC, twelve macros in Full chip */ 7282 if (e && hdev->nic_ports_mask) 7283 hl_engine_data_sprintf(e, 7284 "\nNIC is_idle QM_GLBL_STS0 QM_CGM_STS\n" 7285 "--- ------- ------------ ----------\n"); 7286 7287 for (i = 0 ; i < NIC_NUMBER_OF_ENGINES ; i++) { 7288 if (!(i & 1)) 7289 offset = i / 2 * NIC_OFFSET; 7290 else 7291 offset += NIC_QM_OFFSET; 7292 7293 if (!(hdev->nic_ports_mask & BIT(i))) 7294 continue; 7295 7296 engine_idx = GAUDI2_ENGINE_ID_NIC0_0 + i; 7297 7298 7299 qm_glbl_sts0 = RREG32(mmNIC0_QM0_GLBL_STS0 + offset); 7300 qm_glbl_sts1 = RREG32(mmNIC0_QM0_GLBL_STS1 + offset); 7301 qm_cgm_sts = RREG32(mmNIC0_QM0_CGM_STS + offset); 7302 7303 is_eng_idle = IS_QM_IDLE(qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts); 7304 is_idle &= is_eng_idle; 7305 7306 if (mask && !is_eng_idle) 7307 set_bit(engine_idx, mask); 7308 7309 if (e) 7310 hl_engine_data_sprintf(e, nic_fmt, i, is_eng_idle ? 
"Y" : "N", 7311 qm_glbl_sts0, qm_cgm_sts); 7312 } 7313 7314 return is_idle; 7315 } 7316 7317 static bool gaudi2_get_mme_idle_status(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 7318 struct engines_data *e) 7319 { 7320 u32 qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts, mme_arch_sts; 7321 unsigned long *mask = (unsigned long *) mask_arr; 7322 const char *mme_fmt = "%-5d%-6s%-9s%#-14x%#x\n"; 7323 bool is_idle = true, is_eng_idle; 7324 int engine_idx, i; 7325 u64 offset; 7326 7327 if (e) 7328 hl_engine_data_sprintf(e, 7329 "\nMME Stub is_idle QM_GLBL_STS0 MME_ARCH_STATUS\n" 7330 "--- ---- ------- ------------ ---------------\n"); 7331 /* MME, one per Dcore */ 7332 for (i = 0 ; i < NUM_OF_DCORES ; i++) { 7333 engine_idx = GAUDI2_DCORE0_ENGINE_ID_MME + i * GAUDI2_ENGINE_ID_DCORE_OFFSET; 7334 offset = i * DCORE_OFFSET; 7335 7336 qm_glbl_sts0 = RREG32(mmDCORE0_MME_QM_GLBL_STS0 + offset); 7337 qm_glbl_sts1 = RREG32(mmDCORE0_MME_QM_GLBL_STS1 + offset); 7338 qm_cgm_sts = RREG32(mmDCORE0_MME_QM_CGM_STS + offset); 7339 7340 is_eng_idle = IS_QM_IDLE(qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts); 7341 is_idle &= is_eng_idle; 7342 7343 mme_arch_sts = RREG32(mmDCORE0_MME_CTRL_LO_ARCH_STATUS + offset); 7344 is_eng_idle &= IS_MME_IDLE(mme_arch_sts); 7345 is_idle &= is_eng_idle; 7346 7347 if (e) 7348 hl_engine_data_sprintf(e, mme_fmt, i, "N", 7349 is_eng_idle ? "Y" : "N", 7350 qm_glbl_sts0, 7351 mme_arch_sts); 7352 7353 if (mask && !is_eng_idle) 7354 set_bit(engine_idx, mask); 7355 } 7356 7357 return is_idle; 7358 } 7359 7360 static void gaudi2_is_tpc_engine_idle(struct hl_device *hdev, int dcore, int inst, u32 offset, 7361 struct iterate_module_ctx *ctx) 7362 { 7363 struct gaudi2_tpc_idle_data *idle_data = ctx->data; 7364 u32 tpc_cfg_sts, qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts; 7365 bool is_eng_idle; 7366 int engine_idx; 7367 7368 if ((dcore == 0) && (inst == (NUM_DCORE0_TPC - 1))) 7369 engine_idx = GAUDI2_DCORE0_ENGINE_ID_TPC_6; 7370 else 7371 engine_idx = GAUDI2_DCORE0_ENGINE_ID_TPC_0 + 7372 dcore * GAUDI2_ENGINE_ID_DCORE_OFFSET + inst; 7373 7374 tpc_cfg_sts = RREG32(mmDCORE0_TPC0_CFG_STATUS + offset); 7375 qm_glbl_sts0 = RREG32(mmDCORE0_TPC0_QM_GLBL_STS0 + offset); 7376 qm_glbl_sts1 = RREG32(mmDCORE0_TPC0_QM_GLBL_STS1 + offset); 7377 qm_cgm_sts = RREG32(mmDCORE0_TPC0_QM_CGM_STS + offset); 7378 7379 is_eng_idle = IS_QM_IDLE(qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts) && 7380 IS_TPC_IDLE(tpc_cfg_sts); 7381 *(idle_data->is_idle) &= is_eng_idle; 7382 7383 if (idle_data->mask && !is_eng_idle) 7384 set_bit(engine_idx, idle_data->mask); 7385 7386 if (idle_data->e) 7387 hl_engine_data_sprintf(idle_data->e, 7388 idle_data->tpc_fmt, dcore, inst, 7389 is_eng_idle ? 
"Y" : "N", 7390 qm_glbl_sts0, qm_cgm_sts, tpc_cfg_sts); 7391 } 7392 7393 static bool gaudi2_get_tpc_idle_status(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 7394 struct engines_data *e) 7395 { 7396 struct asic_fixed_properties *prop = &hdev->asic_prop; 7397 unsigned long *mask = (unsigned long *) mask_arr; 7398 bool is_idle = true; 7399 7400 struct gaudi2_tpc_idle_data tpc_idle_data = { 7401 .tpc_fmt = "%-6d%-5d%-9s%#-14x%#-12x%#x\n", 7402 .e = e, 7403 .mask = mask, 7404 .is_idle = &is_idle, 7405 }; 7406 struct iterate_module_ctx tpc_iter = { 7407 .fn = &gaudi2_is_tpc_engine_idle, 7408 .data = &tpc_idle_data, 7409 }; 7410 7411 if (e && prop->tpc_enabled_mask) 7412 hl_engine_data_sprintf(e, 7413 "\nCORE TPC is_idle QM_GLBL_STS0 QM_CGM_STS STATUS\n" 7414 "---- --- ------- ------------ ---------- ------\n"); 7415 7416 gaudi2_iterate_tpcs(hdev, &tpc_iter); 7417 7418 return *tpc_idle_data.is_idle; 7419 } 7420 7421 static bool gaudi2_get_decoder_idle_status(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 7422 struct engines_data *e) 7423 { 7424 struct asic_fixed_properties *prop = &hdev->asic_prop; 7425 unsigned long *mask = (unsigned long *) mask_arr; 7426 const char *pcie_dec_fmt = "%-10d%-9s%#x\n"; 7427 const char *dec_fmt = "%-6d%-5d%-9s%#x\n"; 7428 bool is_idle = true, is_eng_idle; 7429 u32 dec_swreg15, dec_enabled_bit; 7430 int engine_idx, i, j; 7431 u64 offset; 7432 7433 /* Decoders, two each Dcore and two shared PCIe decoders */ 7434 if (e && (prop->decoder_enabled_mask & (~PCIE_DEC_EN_MASK))) 7435 hl_engine_data_sprintf(e, 7436 "\nCORE DEC is_idle VSI_CMD_SWREG15\n" 7437 "---- --- ------- ---------------\n"); 7438 7439 for (i = 0 ; i < NUM_OF_DCORES ; i++) { 7440 for (j = 0 ; j < NUM_OF_DEC_PER_DCORE ; j++) { 7441 dec_enabled_bit = 1 << (i * NUM_OF_DEC_PER_DCORE + j); 7442 if (!(prop->decoder_enabled_mask & dec_enabled_bit)) 7443 continue; 7444 7445 engine_idx = GAUDI2_DCORE0_ENGINE_ID_DEC_0 + 7446 i * GAUDI2_ENGINE_ID_DCORE_OFFSET + j; 7447 offset = i * DCORE_OFFSET + j * DCORE_DEC_OFFSET; 7448 7449 dec_swreg15 = RREG32(mmDCORE0_DEC0_CMD_SWREG15 + offset); 7450 is_eng_idle = IS_DEC_IDLE(dec_swreg15); 7451 is_idle &= is_eng_idle; 7452 7453 if (mask && !is_eng_idle) 7454 set_bit(engine_idx, mask); 7455 7456 if (e) 7457 hl_engine_data_sprintf(e, dec_fmt, i, j, 7458 is_eng_idle ? "Y" : "N", dec_swreg15); 7459 } 7460 } 7461 7462 if (e && (prop->decoder_enabled_mask & PCIE_DEC_EN_MASK)) 7463 hl_engine_data_sprintf(e, 7464 "\nPCIe DEC is_idle VSI_CMD_SWREG15\n" 7465 "-------- ------- ---------------\n"); 7466 7467 /* Check shared(PCIe) decoders */ 7468 for (i = 0 ; i < NUM_OF_DEC_PER_DCORE ; i++) { 7469 dec_enabled_bit = PCIE_DEC_SHIFT + i; 7470 if (!(prop->decoder_enabled_mask & BIT(dec_enabled_bit))) 7471 continue; 7472 7473 engine_idx = GAUDI2_PCIE_ENGINE_ID_DEC_0 + i; 7474 offset = i * DCORE_DEC_OFFSET; 7475 dec_swreg15 = RREG32(mmPCIE_DEC0_CMD_SWREG15 + offset); 7476 is_eng_idle = IS_DEC_IDLE(dec_swreg15); 7477 is_idle &= is_eng_idle; 7478 7479 if (mask && !is_eng_idle) 7480 set_bit(engine_idx, mask); 7481 7482 if (e) 7483 hl_engine_data_sprintf(e, pcie_dec_fmt, i, 7484 is_eng_idle ? 
"Y" : "N", dec_swreg15); 7485 } 7486 7487 return is_idle; 7488 } 7489 7490 static bool gaudi2_get_rotator_idle_status(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 7491 struct engines_data *e) 7492 { 7493 const char *rot_fmt = "%-6d%-5d%-9s%#-14x%#-14x%#x\n"; 7494 unsigned long *mask = (unsigned long *) mask_arr; 7495 u32 qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts; 7496 bool is_idle = true, is_eng_idle; 7497 int engine_idx, i; 7498 u64 offset; 7499 7500 if (e) 7501 hl_engine_data_sprintf(e, 7502 "\nCORE ROT is_idle QM_GLBL_STS0 QM_GLBL_STS1 QM_CGM_STS\n" 7503 "---- --- ------- ------------ ------------ ----------\n"); 7504 7505 for (i = 0 ; i < NUM_OF_ROT ; i++) { 7506 engine_idx = GAUDI2_ENGINE_ID_ROT_0 + i; 7507 7508 offset = i * ROT_OFFSET; 7509 7510 qm_glbl_sts0 = RREG32(mmROT0_QM_GLBL_STS0 + offset); 7511 qm_glbl_sts1 = RREG32(mmROT0_QM_GLBL_STS1 + offset); 7512 qm_cgm_sts = RREG32(mmROT0_QM_CGM_STS + offset); 7513 7514 is_eng_idle = IS_QM_IDLE(qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts); 7515 is_idle &= is_eng_idle; 7516 7517 if (mask && !is_eng_idle) 7518 set_bit(engine_idx, mask); 7519 7520 if (e) 7521 hl_engine_data_sprintf(e, rot_fmt, i, 0, is_eng_idle ? "Y" : "N", 7522 qm_glbl_sts0, qm_glbl_sts1, qm_cgm_sts); 7523 } 7524 7525 return is_idle; 7526 } 7527 7528 static bool gaudi2_is_device_idle(struct hl_device *hdev, u64 *mask_arr, u8 mask_len, 7529 struct engines_data *e) 7530 { 7531 bool is_idle = true; 7532 7533 is_idle &= gaudi2_get_edma_idle_status(hdev, mask_arr, mask_len, e); 7534 is_idle &= gaudi2_get_pdma_idle_status(hdev, mask_arr, mask_len, e); 7535 is_idle &= gaudi2_get_nic_idle_status(hdev, mask_arr, mask_len, e); 7536 is_idle &= gaudi2_get_mme_idle_status(hdev, mask_arr, mask_len, e); 7537 is_idle &= gaudi2_get_tpc_idle_status(hdev, mask_arr, mask_len, e); 7538 is_idle &= gaudi2_get_decoder_idle_status(hdev, mask_arr, mask_len, e); 7539 is_idle &= gaudi2_get_rotator_idle_status(hdev, mask_arr, mask_len, e); 7540 7541 return is_idle; 7542 } 7543 7544 static void gaudi2_hw_queues_lock(struct hl_device *hdev) 7545 __acquires(&gaudi2->hw_queues_lock) 7546 { 7547 struct gaudi2_device *gaudi2 = hdev->asic_specific; 7548 7549 spin_lock(&gaudi2->hw_queues_lock); 7550 } 7551 7552 static void gaudi2_hw_queues_unlock(struct hl_device *hdev) 7553 __releases(&gaudi2->hw_queues_lock) 7554 { 7555 struct gaudi2_device *gaudi2 = hdev->asic_specific; 7556 7557 spin_unlock(&gaudi2->hw_queues_lock); 7558 } 7559 7560 static u32 gaudi2_get_pci_id(struct hl_device *hdev) 7561 { 7562 return hdev->pdev->device; 7563 } 7564 7565 static int gaudi2_get_eeprom_data(struct hl_device *hdev, void *data, size_t max_size) 7566 { 7567 struct gaudi2_device *gaudi2 = hdev->asic_specific; 7568 7569 if (!(gaudi2->hw_cap_initialized & HW_CAP_CPU_Q)) 7570 return 0; 7571 7572 return hl_fw_get_eeprom_data(hdev, data, max_size); 7573 } 7574 7575 static void gaudi2_update_eq_ci(struct hl_device *hdev, u32 val) 7576 { 7577 WREG32(mmCPU_IF_EQ_RD_OFFS, val); 7578 } 7579 7580 static void *gaudi2_get_events_stat(struct hl_device *hdev, bool aggregate, u32 *size) 7581 { 7582 struct gaudi2_device *gaudi2 = hdev->asic_specific; 7583 7584 if (aggregate) { 7585 *size = (u32) sizeof(gaudi2->events_stat_aggregate); 7586 return gaudi2->events_stat_aggregate; 7587 } 7588 7589 *size = (u32) sizeof(gaudi2->events_stat); 7590 return gaudi2->events_stat; 7591 } 7592 7593 static void gaudi2_mmu_vdec_dcore_prepare(struct hl_device *hdev, int dcore_id, 7594 int dcore_vdec_id, u32 rw_asid, u32 rw_mmu_bp) 7595 { 7596 u32 offset = 
(mmDCORE0_VDEC1_BRDG_CTRL_BASE - mmDCORE0_VDEC0_BRDG_CTRL_BASE) * 7597 dcore_vdec_id + DCORE_OFFSET * dcore_id; 7598 7599 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_AXUSER_DEC_HB_MMU_BP + offset, rw_mmu_bp); 7600 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_AXUSER_DEC_HB_ASID + offset, rw_asid); 7601 7602 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_AXUSER_MSIX_ABNRM_HB_MMU_BP + offset, rw_mmu_bp); 7603 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_AXUSER_MSIX_ABNRM_HB_ASID + offset, rw_asid); 7604 7605 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_AXUSER_MSIX_L2C_HB_MMU_BP + offset, rw_mmu_bp); 7606 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_AXUSER_MSIX_L2C_HB_ASID + offset, rw_asid); 7607 7608 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_AXUSER_MSIX_NRM_HB_MMU_BP + offset, rw_mmu_bp); 7609 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_AXUSER_MSIX_NRM_HB_ASID + offset, rw_asid); 7610 7611 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_AXUSER_MSIX_VCD_HB_MMU_BP + offset, rw_mmu_bp); 7612 WREG32(mmDCORE0_VDEC0_BRDG_CTRL_AXUSER_MSIX_VCD_HB_ASID + offset, rw_asid); 7613 } 7614 7615 static void gaudi2_mmu_dcore_prepare(struct hl_device *hdev, int dcore_id, u32 asid) 7616 { 7617 u32 rw_asid = (asid << ARC_FARM_KDMA_CTX_AXUSER_HB_ASID_RD_SHIFT) | 7618 (asid << ARC_FARM_KDMA_CTX_AXUSER_HB_ASID_WR_SHIFT); 7619 struct asic_fixed_properties *prop = &hdev->asic_prop; 7620 u32 dcore_offset = dcore_id * DCORE_OFFSET; 7621 u32 vdec_id, i, ports_offset, reg_val; 7622 u8 edma_seq_base; 7623 7624 /* EDMA */ 7625 edma_seq_base = dcore_id * NUM_OF_EDMA_PER_DCORE; 7626 if (prop->edma_enabled_mask & BIT(edma_seq_base)) { 7627 WREG32(mmDCORE0_EDMA0_QM_AXUSER_NONSECURED_HB_MMU_BP + dcore_offset, 0); 7628 WREG32(mmDCORE0_EDMA0_QM_AXUSER_NONSECURED_HB_ASID + dcore_offset, rw_asid); 7629 WREG32(mmDCORE0_EDMA0_CORE_CTX_AXUSER_HB_MMU_BP + dcore_offset, 0); 7630 WREG32(mmDCORE0_EDMA0_CORE_CTX_AXUSER_HB_ASID + dcore_offset, rw_asid); 7631 } 7632 7633 if (prop->edma_enabled_mask & BIT(edma_seq_base + 1)) { 7634 WREG32(mmDCORE0_EDMA1_QM_AXUSER_NONSECURED_HB_MMU_BP + dcore_offset, 0); 7635 WREG32(mmDCORE0_EDMA1_QM_AXUSER_NONSECURED_HB_ASID + dcore_offset, rw_asid); 7636 WREG32(mmDCORE0_EDMA1_CORE_CTX_AXUSER_HB_ASID + dcore_offset, rw_asid); 7637 WREG32(mmDCORE0_EDMA1_CORE_CTX_AXUSER_HB_MMU_BP + dcore_offset, 0); 7638 } 7639 7640 /* Sync Mngr */ 7641 WREG32(mmDCORE0_SYNC_MNGR_GLBL_ASID_NONE_SEC_PRIV + dcore_offset, asid); 7642 /* 7643 * Sync Mngrs on dcores 1 - 3 are exposed to user, so must use user ASID 7644 * for any access type 7645 */ 7646 if (dcore_id > 0) { 7647 reg_val = (asid << DCORE0_SYNC_MNGR_MSTR_IF_AXUSER_HB_ASID_RD_SHIFT) | 7648 (asid << DCORE0_SYNC_MNGR_MSTR_IF_AXUSER_HB_ASID_WR_SHIFT); 7649 WREG32(mmDCORE0_SYNC_MNGR_MSTR_IF_AXUSER_HB_ASID + dcore_offset, reg_val); 7650 WREG32(mmDCORE0_SYNC_MNGR_MSTR_IF_AXUSER_HB_MMU_BP + dcore_offset, 0); 7651 } 7652 7653 WREG32(mmDCORE0_MME_CTRL_LO_MME_AXUSER_HB_MMU_BP + dcore_offset, 0); 7654 WREG32(mmDCORE0_MME_CTRL_LO_MME_AXUSER_HB_ASID + dcore_offset, rw_asid); 7655 7656 for (i = 0 ; i < NUM_OF_MME_SBTE_PORTS ; i++) { 7657 ports_offset = i * DCORE_MME_SBTE_OFFSET; 7658 WREG32(mmDCORE0_MME_SBTE0_MSTR_IF_AXUSER_HB_MMU_BP + 7659 dcore_offset + ports_offset, 0); 7660 WREG32(mmDCORE0_MME_SBTE0_MSTR_IF_AXUSER_HB_ASID + 7661 dcore_offset + ports_offset, rw_asid); 7662 } 7663 7664 for (i = 0 ; i < NUM_OF_MME_WB_PORTS ; i++) { 7665 ports_offset = i * DCORE_MME_WB_OFFSET; 7666 WREG32(mmDCORE0_MME_WB0_MSTR_IF_AXUSER_HB_MMU_BP + 7667 dcore_offset + ports_offset, 0); 7668 WREG32(mmDCORE0_MME_WB0_MSTR_IF_AXUSER_HB_ASID + 7669 dcore_offset + ports_offset, rw_asid); 7670 } 7671 7672 
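	/*
	 * MME QM: as with the SBTE and WB master interfaces configured above,
	 * zero the MMU bypass (MMUBP) and set the read/write ASID on the QM's
	 * non-secured AXUSER so its traffic is translated for this context.
	 */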
WREG32(mmDCORE0_MME_QM_AXUSER_NONSECURED_HB_MMU_BP + dcore_offset, 0); 7673 WREG32(mmDCORE0_MME_QM_AXUSER_NONSECURED_HB_ASID + dcore_offset, rw_asid); 7674 7675 /* 7676 * Decoders 7677 */ 7678 for (vdec_id = 0 ; vdec_id < NUM_OF_DEC_PER_DCORE ; vdec_id++) { 7679 if (prop->decoder_enabled_mask & BIT(dcore_id * NUM_OF_DEC_PER_DCORE + vdec_id)) 7680 gaudi2_mmu_vdec_dcore_prepare(hdev, dcore_id, vdec_id, rw_asid, 0); 7681 } 7682 } 7683 7684 static void gudi2_mmu_vdec_shared_prepare(struct hl_device *hdev, 7685 int shared_vdec_id, u32 rw_asid, u32 rw_mmu_bp) 7686 { 7687 u32 offset = (mmPCIE_VDEC1_BRDG_CTRL_BASE - mmPCIE_VDEC0_BRDG_CTRL_BASE) * shared_vdec_id; 7688 7689 WREG32(mmPCIE_VDEC0_BRDG_CTRL_AXUSER_DEC_HB_MMU_BP + offset, rw_mmu_bp); 7690 WREG32(mmPCIE_VDEC0_BRDG_CTRL_AXUSER_DEC_HB_ASID + offset, rw_asid); 7691 7692 WREG32(mmPCIE_VDEC0_BRDG_CTRL_AXUSER_MSIX_ABNRM_HB_MMU_BP + offset, rw_mmu_bp); 7693 WREG32(mmPCIE_VDEC0_BRDG_CTRL_AXUSER_MSIX_ABNRM_HB_ASID + offset, rw_asid); 7694 7695 WREG32(mmPCIE_VDEC0_BRDG_CTRL_AXUSER_MSIX_L2C_HB_MMU_BP + offset, rw_mmu_bp); 7696 WREG32(mmPCIE_VDEC0_BRDG_CTRL_AXUSER_MSIX_L2C_HB_ASID + offset, rw_asid); 7697 7698 WREG32(mmPCIE_VDEC0_BRDG_CTRL_AXUSER_MSIX_NRM_HB_MMU_BP + offset, rw_mmu_bp); 7699 WREG32(mmPCIE_VDEC0_BRDG_CTRL_AXUSER_MSIX_NRM_HB_ASID + offset, rw_asid); 7700 7701 WREG32(mmPCIE_VDEC0_BRDG_CTRL_AXUSER_MSIX_VCD_HB_MMU_BP + offset, rw_mmu_bp); 7702 WREG32(mmPCIE_VDEC0_BRDG_CTRL_AXUSER_MSIX_VCD_HB_ASID + offset, rw_asid); 7703 } 7704 7705 static void gudi2_mmu_arc_farm_arc_dup_eng_prepare(struct hl_device *hdev, int arc_farm_id, 7706 u32 rw_asid, u32 rw_mmu_bp) 7707 { 7708 u32 offset = (mmARC_FARM_ARC1_DUP_ENG_BASE - mmARC_FARM_ARC0_DUP_ENG_BASE) * arc_farm_id; 7709 7710 WREG32(mmARC_FARM_ARC0_DUP_ENG_AXUSER_HB_MMU_BP + offset, rw_mmu_bp); 7711 WREG32(mmARC_FARM_ARC0_DUP_ENG_AXUSER_HB_ASID + offset, rw_asid); 7712 } 7713 7714 static void gaudi2_arc_mmu_prepare(struct hl_device *hdev, u32 cpu_id, u32 asid) 7715 { 7716 u32 reg_base, reg_offset, reg_val = 0; 7717 7718 reg_base = gaudi2_arc_blocks_bases[cpu_id]; 7719 7720 /* Enable MMU and configure asid for all relevant ARC regions */ 7721 reg_val = FIELD_PREP(ARC_FARM_ARC0_AUX_ARC_REGION_CFG_MMU_BP_MASK, 0); 7722 reg_val |= FIELD_PREP(ARC_FARM_ARC0_AUX_ARC_REGION_CFG_0_ASID_MASK, asid); 7723 7724 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION3_GENERAL); 7725 WREG32(reg_base + reg_offset, reg_val); 7726 7727 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION4_HBM0_FW); 7728 WREG32(reg_base + reg_offset, reg_val); 7729 7730 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION5_HBM1_GC_DATA); 7731 WREG32(reg_base + reg_offset, reg_val); 7732 7733 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION6_HBM2_GC_DATA); 7734 WREG32(reg_base + reg_offset, reg_val); 7735 7736 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION7_HBM3_GC_DATA); 7737 WREG32(reg_base + reg_offset, reg_val); 7738 7739 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION9_PCIE); 7740 WREG32(reg_base + reg_offset, reg_val); 7741 7742 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION10_GENERAL); 7743 WREG32(reg_base + reg_offset, reg_val); 7744 7745 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION11_GENERAL); 7746 WREG32(reg_base + reg_offset, reg_val); 7747 7748 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION12_GENERAL); 7749 WREG32(reg_base + reg_offset, reg_val); 7750 7751 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION13_GENERAL); 7752 WREG32(reg_base + reg_offset, reg_val); 7753 7754 reg_offset = ARC_REGION_CFG_OFFSET(ARC_REGION14_GENERAL); 7755 WREG32(reg_base + 
reg_offset, reg_val); 7756 } 7757 7758 static int gaudi2_arc_mmu_prepare_all(struct hl_device *hdev, u32 asid) 7759 { 7760 int i; 7761 7762 if (hdev->fw_components & FW_TYPE_BOOT_CPU) 7763 return hl_fw_cpucp_engine_core_asid_set(hdev, asid); 7764 7765 for (i = CPU_ID_SCHED_ARC0 ; i < NUM_OF_ARC_FARMS_ARC ; i++) 7766 gaudi2_arc_mmu_prepare(hdev, i, asid); 7767 7768 for (i = GAUDI2_QUEUE_ID_PDMA_0_0 ; i < GAUDI2_QUEUE_ID_CPU_PQ ; i += 4) { 7769 if (!gaudi2_is_queue_enabled(hdev, i)) 7770 continue; 7771 7772 gaudi2_arc_mmu_prepare(hdev, gaudi2_queue_id_to_arc_id[i], asid); 7773 } 7774 7775 return 0; 7776 } 7777 7778 static int gaudi2_mmu_shared_prepare(struct hl_device *hdev, u32 asid) 7779 { 7780 struct asic_fixed_properties *prop = &hdev->asic_prop; 7781 u32 rw_asid, offset; 7782 int rc, i; 7783 7784 rw_asid = FIELD_PREP(ARC_FARM_KDMA_CTX_AXUSER_HB_ASID_RD_MASK, asid) | 7785 FIELD_PREP(ARC_FARM_KDMA_CTX_AXUSER_HB_ASID_WR_MASK, asid); 7786 7787 WREG32(mmPDMA0_QM_AXUSER_NONSECURED_HB_ASID, rw_asid); 7788 WREG32(mmPDMA0_QM_AXUSER_NONSECURED_HB_MMU_BP, 0); 7789 WREG32(mmPDMA0_CORE_CTX_AXUSER_HB_ASID, rw_asid); 7790 WREG32(mmPDMA0_CORE_CTX_AXUSER_HB_MMU_BP, 0); 7791 7792 WREG32(mmPDMA1_QM_AXUSER_NONSECURED_HB_ASID, rw_asid); 7793 WREG32(mmPDMA1_QM_AXUSER_NONSECURED_HB_MMU_BP, 0); 7794 WREG32(mmPDMA1_CORE_CTX_AXUSER_HB_ASID, rw_asid); 7795 WREG32(mmPDMA1_CORE_CTX_AXUSER_HB_MMU_BP, 0); 7796 7797 /* ROT */ 7798 for (i = 0 ; i < NUM_OF_ROT ; i++) { 7799 offset = i * ROT_OFFSET; 7800 WREG32(mmROT0_QM_AXUSER_NONSECURED_HB_ASID + offset, rw_asid); 7801 WREG32(mmROT0_QM_AXUSER_NONSECURED_HB_MMU_BP + offset, 0); 7802 RMWREG32(mmROT0_CPL_QUEUE_AWUSER + offset, asid, MMUBP_ASID_MASK); 7803 RMWREG32(mmROT0_DESC_HBW_ARUSER_LO + offset, asid, MMUBP_ASID_MASK); 7804 RMWREG32(mmROT0_DESC_HBW_AWUSER_LO + offset, asid, MMUBP_ASID_MASK); 7805 } 7806 7807 /* Shared Decoders are the last bits in the decoders mask */ 7808 if (prop->decoder_enabled_mask & BIT(NUM_OF_DCORES * NUM_OF_DEC_PER_DCORE + 0)) 7809 gudi2_mmu_vdec_shared_prepare(hdev, 0, rw_asid, 0); 7810 7811 if (prop->decoder_enabled_mask & BIT(NUM_OF_DCORES * NUM_OF_DEC_PER_DCORE + 1)) 7812 gudi2_mmu_vdec_shared_prepare(hdev, 1, rw_asid, 0); 7813 7814 /* arc farm arc dup eng */ 7815 for (i = 0 ; i < NUM_OF_ARC_FARMS_ARC ; i++) 7816 gudi2_mmu_arc_farm_arc_dup_eng_prepare(hdev, i, rw_asid, 0); 7817 7818 rc = gaudi2_arc_mmu_prepare_all(hdev, asid); 7819 if (rc) 7820 return rc; 7821 7822 return 0; 7823 } 7824 7825 static void gaudi2_tpc_mmu_prepare(struct hl_device *hdev, int dcore, int inst, u32 offset, 7826 struct iterate_module_ctx *ctx) 7827 { 7828 struct gaudi2_tpc_mmu_data *mmu_data = ctx->data; 7829 7830 WREG32(mmDCORE0_TPC0_CFG_AXUSER_HB_MMU_BP + offset, 0); 7831 WREG32(mmDCORE0_TPC0_CFG_AXUSER_HB_ASID + offset, mmu_data->rw_asid); 7832 WREG32(mmDCORE0_TPC0_QM_AXUSER_NONSECURED_HB_MMU_BP + offset, 0); 7833 WREG32(mmDCORE0_TPC0_QM_AXUSER_NONSECURED_HB_ASID + offset, mmu_data->rw_asid); 7834 } 7835 7836 /* zero the MMUBP and set the ASID */ 7837 static int gaudi2_mmu_prepare(struct hl_device *hdev, u32 asid) 7838 { 7839 struct gaudi2_device *gaudi2 = hdev->asic_specific; 7840 struct gaudi2_tpc_mmu_data tpc_mmu_data; 7841 struct iterate_module_ctx tpc_iter = { 7842 .fn = &gaudi2_tpc_mmu_prepare, 7843 .data = &tpc_mmu_data, 7844 }; 7845 int rc, i; 7846 7847 if (asid & ~DCORE0_HMMU0_STLB_ASID_ASID_MASK) { 7848 dev_crit(hdev->dev, "asid %u is too big\n", asid); 7849 return -EINVAL; 7850 } 7851 7852 if (!(gaudi2->hw_cap_initialized & HW_CAP_MMU_MASK)) 7853 
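		/* MMU capability is not initialized - no ASID configuration to do */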
return 0; 7854 7855 rc = gaudi2_mmu_shared_prepare(hdev, asid); 7856 if (rc) 7857 return rc; 7858 7859 /* configure DCORE MMUs */ 7860 tpc_mmu_data.rw_asid = (asid << ARC_FARM_KDMA_CTX_AXUSER_HB_ASID_RD_SHIFT) | 7861 (asid << ARC_FARM_KDMA_CTX_AXUSER_HB_ASID_WR_SHIFT); 7862 gaudi2_iterate_tpcs(hdev, &tpc_iter); 7863 for (i = 0 ; i < NUM_OF_DCORES ; i++) 7864 gaudi2_mmu_dcore_prepare(hdev, i, asid); 7865 7866 return 0; 7867 } 7868 7869 static inline bool is_info_event(u32 event) 7870 { 7871 switch (event) { 7872 case GAUDI2_EVENT_CPU_CPLD_SHUTDOWN_CAUSE: 7873 case GAUDI2_EVENT_CPU_FIX_POWER_ENV_S ... GAUDI2_EVENT_CPU_FIX_THERMAL_ENV_E: 7874 case GAUDI2_EVENT_ARC_PWR_BRK_ENTRY ... GAUDI2_EVENT_ARC_PWR_RD_MODE3: 7875 7876 /* return in case of NIC status event - these events are received periodically and not as 7877 * an indication to an error. 7878 */ 7879 case GAUDI2_EVENT_CPU0_STATUS_NIC0_ENG0 ... GAUDI2_EVENT_CPU11_STATUS_NIC11_ENG1: 7880 case GAUDI2_EVENT_ARC_EQ_HEARTBEAT: 7881 return true; 7882 default: 7883 return false; 7884 } 7885 } 7886 7887 static void gaudi2_print_event(struct hl_device *hdev, u16 event_type, 7888 bool ratelimited, const char *fmt, ...) 7889 { 7890 struct va_format vaf; 7891 va_list args; 7892 7893 va_start(args, fmt); 7894 vaf.fmt = fmt; 7895 vaf.va = &args; 7896 7897 if (ratelimited) 7898 dev_err_ratelimited(hdev->dev, "%s: %pV\n", 7899 gaudi2_irq_map_table[event_type].valid ? 7900 gaudi2_irq_map_table[event_type].name : "N/A Event", &vaf); 7901 else 7902 dev_err(hdev->dev, "%s: %pV\n", 7903 gaudi2_irq_map_table[event_type].valid ? 7904 gaudi2_irq_map_table[event_type].name : "N/A Event", &vaf); 7905 7906 va_end(args); 7907 } 7908 7909 static bool gaudi2_handle_ecc_event(struct hl_device *hdev, u16 event_type, 7910 struct hl_eq_ecc_data *ecc_data) 7911 { 7912 u64 ecc_address = 0, ecc_syndrome = 0; 7913 u8 memory_wrapper_idx = 0; 7914 bool has_block_id = false; 7915 u16 block_id; 7916 7917 if (!hl_is_fw_sw_ver_below(hdev, 1, 12)) 7918 has_block_id = true; 7919 7920 ecc_address = le64_to_cpu(ecc_data->ecc_address); 7921 ecc_syndrome = le64_to_cpu(ecc_data->ecc_syndrom); 7922 memory_wrapper_idx = ecc_data->memory_wrapper_idx; 7923 7924 if (has_block_id) { 7925 block_id = le16_to_cpu(ecc_data->block_id); 7926 gaudi2_print_event(hdev, event_type, !ecc_data->is_critical, 7927 "ECC error detected. address: %#llx. Syndrome: %#llx. wrapper id %u. block id %#x. critical %u.", 7928 ecc_address, ecc_syndrome, memory_wrapper_idx, block_id, 7929 ecc_data->is_critical); 7930 } else { 7931 gaudi2_print_event(hdev, event_type, !ecc_data->is_critical, 7932 "ECC error detected. address: %#llx. Syndrome: %#llx. wrapper id %u. 
critical %u.", 7933 ecc_address, ecc_syndrome, memory_wrapper_idx, ecc_data->is_critical); 7934 } 7935 7936 return !!ecc_data->is_critical; 7937 } 7938 7939 static void handle_lower_qman_data_on_err(struct hl_device *hdev, u64 qman_base, u32 engine_id) 7940 { 7941 struct undefined_opcode_info *undef_opcode = &hdev->captured_err_info.undef_opcode; 7942 u64 cq_ptr, cp_current_inst; 7943 u32 lo, hi, cq_size, cp_sts; 7944 bool is_arc_cq; 7945 7946 cp_sts = RREG32(qman_base + QM_CP_STS_4_OFFSET); 7947 is_arc_cq = FIELD_GET(PDMA0_QM_CP_STS_CUR_CQ_MASK, cp_sts); /* 0 - legacy CQ, 1 - ARC_CQ */ 7948 7949 if (is_arc_cq) { 7950 lo = RREG32(qman_base + QM_ARC_CQ_PTR_LO_STS_OFFSET); 7951 hi = RREG32(qman_base + QM_ARC_CQ_PTR_HI_STS_OFFSET); 7952 cq_ptr = ((u64) hi) << 32 | lo; 7953 cq_size = RREG32(qman_base + QM_ARC_CQ_TSIZE_STS_OFFSET); 7954 } else { 7955 lo = RREG32(qman_base + QM_CQ_PTR_LO_STS_4_OFFSET); 7956 hi = RREG32(qman_base + QM_CQ_PTR_HI_STS_4_OFFSET); 7957 cq_ptr = ((u64) hi) << 32 | lo; 7958 cq_size = RREG32(qman_base + QM_CQ_TSIZE_STS_4_OFFSET); 7959 } 7960 7961 lo = RREG32(qman_base + QM_CP_CURRENT_INST_LO_4_OFFSET); 7962 hi = RREG32(qman_base + QM_CP_CURRENT_INST_HI_4_OFFSET); 7963 cp_current_inst = ((u64) hi) << 32 | lo; 7964 7965 dev_info(hdev->dev, 7966 "LowerQM. %sCQ: {ptr %#llx, size %u}, CP: {instruction %#018llx}\n", 7967 is_arc_cq ? "ARC_" : "", cq_ptr, cq_size, cp_current_inst); 7968 7969 if (undef_opcode->write_enable) { 7970 memset(undef_opcode, 0, sizeof(*undef_opcode)); 7971 undef_opcode->timestamp = ktime_get(); 7972 undef_opcode->cq_addr = cq_ptr; 7973 undef_opcode->cq_size = cq_size; 7974 undef_opcode->engine_id = engine_id; 7975 undef_opcode->stream_id = QMAN_STREAMS; 7976 undef_opcode->write_enable = 0; 7977 } 7978 } 7979 7980 static int gaudi2_handle_qman_err_generic(struct hl_device *hdev, u16 event_type, 7981 u64 qman_base, u32 qid_base, u64 *event_mask) 7982 { 7983 u32 i, j, glbl_sts_val, arb_err_val, num_error_causes, error_count = 0; 7984 u64 glbl_sts_addr, arb_err_addr; 7985 char reg_desc[32]; 7986 7987 glbl_sts_addr = qman_base + (mmDCORE0_TPC0_QM_GLBL_ERR_STS_0 - mmDCORE0_TPC0_QM_BASE); 7988 arb_err_addr = qman_base + (mmDCORE0_TPC0_QM_ARB_ERR_CAUSE - mmDCORE0_TPC0_QM_BASE); 7989 7990 /* Iterate through all stream GLBL_ERR_STS registers + Lower CP */ 7991 for (i = 0 ; i < QMAN_STREAMS + 1 ; i++) { 7992 glbl_sts_val = RREG32(glbl_sts_addr + 4 * i); 7993 7994 if (!glbl_sts_val) 7995 continue; 7996 7997 if (i == QMAN_STREAMS) { 7998 snprintf(reg_desc, ARRAY_SIZE(reg_desc), "LowerQM"); 7999 num_error_causes = GAUDI2_NUM_OF_LOWER_QM_ERR_CAUSE; 8000 } else { 8001 snprintf(reg_desc, ARRAY_SIZE(reg_desc), "stream%u", i); 8002 num_error_causes = GAUDI2_NUM_OF_QM_ERR_CAUSE; 8003 } 8004 8005 for (j = 0 ; j < num_error_causes ; j++) 8006 if (glbl_sts_val & BIT(j)) { 8007 gaudi2_print_event(hdev, event_type, true, 8008 "%s. err cause: %s", reg_desc, 8009 i == QMAN_STREAMS ? 
8010 gaudi2_lower_qman_error_cause[j] : 8011 gaudi2_qman_error_cause[j]); 8012 error_count++; 8013 } 8014 8015 /* Check for undefined opcode error in lower QM */ 8016 if ((i == QMAN_STREAMS) && 8017 (glbl_sts_val & PDMA0_QM_GLBL_ERR_STS_CP_UNDEF_CMD_ERR_MASK)) { 8018 handle_lower_qman_data_on_err(hdev, qman_base, 8019 gaudi2_queue_id_to_engine_id[qid_base]); 8020 *event_mask |= HL_NOTIFIER_EVENT_UNDEFINED_OPCODE; 8021 } 8022 } 8023 8024 arb_err_val = RREG32(arb_err_addr); 8025 8026 if (!arb_err_val) 8027 goto out; 8028 8029 for (j = 0 ; j < GAUDI2_NUM_OF_QM_ARB_ERR_CAUSE ; j++) { 8030 if (arb_err_val & BIT(j)) { 8031 gaudi2_print_event(hdev, event_type, true, 8032 "ARB_ERR. err cause: %s", 8033 gaudi2_qman_arb_error_cause[j]); 8034 error_count++; 8035 } 8036 } 8037 8038 out: 8039 return error_count; 8040 } 8041 8042 static void gaudi2_razwi_rr_hbw_shared_printf_info(struct hl_device *hdev, 8043 u64 rtr_mstr_if_base_addr, bool is_write, char *name, 8044 enum gaudi2_engine_id id, u64 *event_mask) 8045 { 8046 u32 razwi_hi, razwi_lo, razwi_xy; 8047 u16 eng_id = id; 8048 u8 rd_wr_flag; 8049 8050 if (is_write) { 8051 razwi_hi = RREG32(rtr_mstr_if_base_addr + RR_SHRD_HBW_AW_RAZWI_HI); 8052 razwi_lo = RREG32(rtr_mstr_if_base_addr + RR_SHRD_HBW_AW_RAZWI_LO); 8053 razwi_xy = RREG32(rtr_mstr_if_base_addr + RR_SHRD_HBW_AW_RAZWI_XY); 8054 rd_wr_flag = HL_RAZWI_WRITE; 8055 } else { 8056 razwi_hi = RREG32(rtr_mstr_if_base_addr + RR_SHRD_HBW_AR_RAZWI_HI); 8057 razwi_lo = RREG32(rtr_mstr_if_base_addr + RR_SHRD_HBW_AR_RAZWI_LO); 8058 razwi_xy = RREG32(rtr_mstr_if_base_addr + RR_SHRD_HBW_AR_RAZWI_XY); 8059 rd_wr_flag = HL_RAZWI_READ; 8060 } 8061 8062 hl_handle_razwi(hdev, (u64)razwi_hi << 32 | razwi_lo, &eng_id, 1, 8063 rd_wr_flag | HL_RAZWI_HBW, event_mask); 8064 8065 dev_err_ratelimited(hdev->dev, 8066 "%s-RAZWI SHARED RR HBW %s error, address %#llx, Initiator coordinates 0x%x\n", 8067 name, is_write ? "WR" : "RD", (u64)razwi_hi << 32 | razwi_lo, razwi_xy); 8068 } 8069 8070 static void gaudi2_razwi_rr_lbw_shared_printf_info(struct hl_device *hdev, 8071 u64 rtr_mstr_if_base_addr, bool is_write, char *name, 8072 enum gaudi2_engine_id id, u64 *event_mask) 8073 { 8074 u64 razwi_addr = CFG_BASE; 8075 u32 razwi_xy; 8076 u16 eng_id = id; 8077 u8 rd_wr_flag; 8078 8079 if (is_write) { 8080 razwi_addr += RREG32(rtr_mstr_if_base_addr + RR_SHRD_LBW_AW_RAZWI); 8081 razwi_xy = RREG32(rtr_mstr_if_base_addr + RR_SHRD_LBW_AW_RAZWI_XY); 8082 rd_wr_flag = HL_RAZWI_WRITE; 8083 } else { 8084 razwi_addr += RREG32(rtr_mstr_if_base_addr + RR_SHRD_LBW_AR_RAZWI); 8085 razwi_xy = RREG32(rtr_mstr_if_base_addr + RR_SHRD_LBW_AR_RAZWI_XY); 8086 rd_wr_flag = HL_RAZWI_READ; 8087 } 8088 8089 hl_handle_razwi(hdev, razwi_addr, &eng_id, 1, rd_wr_flag | HL_RAZWI_LBW, event_mask); 8090 dev_err_ratelimited(hdev->dev, 8091 "%s-RAZWI SHARED RR LBW %s error, mstr_if 0x%llx, captured address 0x%llX Initiator coordinates 0x%x\n", 8092 name, is_write ? 
"WR" : "RD", rtr_mstr_if_base_addr, razwi_addr, 8093 razwi_xy); 8094 } 8095 8096 static enum gaudi2_engine_id gaudi2_razwi_calc_engine_id(struct hl_device *hdev, 8097 enum razwi_event_sources module, u8 module_idx) 8098 { 8099 switch (module) { 8100 case RAZWI_TPC: 8101 if (module_idx == (NUM_OF_TPC_PER_DCORE * NUM_OF_DCORES)) 8102 return GAUDI2_DCORE0_ENGINE_ID_TPC_6; 8103 return (((module_idx / NUM_OF_TPC_PER_DCORE) * ENGINE_ID_DCORE_OFFSET) + 8104 (module_idx % NUM_OF_TPC_PER_DCORE) + 8105 (GAUDI2_DCORE0_ENGINE_ID_TPC_0 - GAUDI2_DCORE0_ENGINE_ID_EDMA_0)); 8106 8107 case RAZWI_MME: 8108 return ((GAUDI2_DCORE0_ENGINE_ID_MME - GAUDI2_DCORE0_ENGINE_ID_EDMA_0) + 8109 (module_idx * ENGINE_ID_DCORE_OFFSET)); 8110 8111 case RAZWI_EDMA: 8112 return (((module_idx / NUM_OF_EDMA_PER_DCORE) * ENGINE_ID_DCORE_OFFSET) + 8113 (module_idx % NUM_OF_EDMA_PER_DCORE)); 8114 8115 case RAZWI_PDMA: 8116 return (GAUDI2_ENGINE_ID_PDMA_0 + module_idx); 8117 8118 case RAZWI_NIC: 8119 return (GAUDI2_ENGINE_ID_NIC0_0 + (NIC_NUMBER_OF_QM_PER_MACRO * module_idx)); 8120 8121 case RAZWI_DEC: 8122 if (module_idx == 8) 8123 return GAUDI2_PCIE_ENGINE_ID_DEC_0; 8124 8125 if (module_idx == 9) 8126 return GAUDI2_PCIE_ENGINE_ID_DEC_1; 8127 ; 8128 return (((module_idx / NUM_OF_DEC_PER_DCORE) * ENGINE_ID_DCORE_OFFSET) + 8129 (module_idx % NUM_OF_DEC_PER_DCORE) + 8130 (GAUDI2_DCORE0_ENGINE_ID_DEC_0 - GAUDI2_DCORE0_ENGINE_ID_EDMA_0)); 8131 8132 case RAZWI_ROT: 8133 return GAUDI2_ENGINE_ID_ROT_0 + module_idx; 8134 8135 case RAZWI_ARC_FARM: 8136 return GAUDI2_ENGINE_ID_ARC_FARM; 8137 8138 default: 8139 return GAUDI2_ENGINE_ID_SIZE; 8140 } 8141 } 8142 8143 /* 8144 * This function handles RR(Range register) hit events. 8145 * raised be initiators not PSOC RAZWI. 8146 */ 8147 static void gaudi2_ack_module_razwi_event_handler(struct hl_device *hdev, 8148 enum razwi_event_sources module, u8 module_idx, 8149 u8 module_sub_idx, u64 *event_mask) 8150 { 8151 bool via_sft = false; 8152 u32 hbw_rtr_id, lbw_rtr_id, dcore_id, dcore_rtr_id, eng_id, binned_idx; 8153 u64 hbw_rtr_mstr_if_base_addr, lbw_rtr_mstr_if_base_addr; 8154 u32 hbw_shrd_aw = 0, hbw_shrd_ar = 0; 8155 u32 lbw_shrd_aw = 0, lbw_shrd_ar = 0; 8156 char initiator_name[64]; 8157 8158 switch (module) { 8159 case RAZWI_TPC: 8160 sprintf(initiator_name, "TPC_%u", module_idx); 8161 if (hdev->tpc_binning) { 8162 binned_idx = __ffs(hdev->tpc_binning); 8163 if (binned_idx == module_idx) 8164 module_idx = TPC_ID_DCORE0_TPC6; 8165 } 8166 8167 hbw_rtr_id = gaudi2_tpc_initiator_hbw_rtr_id[module_idx]; 8168 8169 if (hl_is_fw_sw_ver_below(hdev, 1, 9) && 8170 !hdev->asic_prop.fw_security_enabled && 8171 ((module_idx == 0) || (module_idx == 1))) 8172 lbw_rtr_id = DCORE0_RTR0; 8173 else 8174 lbw_rtr_id = gaudi2_tpc_initiator_lbw_rtr_id[module_idx]; 8175 break; 8176 case RAZWI_MME: 8177 sprintf(initiator_name, "MME_%u", module_idx); 8178 switch (module_sub_idx) { 8179 case MME_WAP0: 8180 hbw_rtr_id = gaudi2_mme_initiator_rtr_id[module_idx].wap0; 8181 break; 8182 case MME_WAP1: 8183 hbw_rtr_id = gaudi2_mme_initiator_rtr_id[module_idx].wap1; 8184 break; 8185 case MME_WRITE: 8186 hbw_rtr_id = gaudi2_mme_initiator_rtr_id[module_idx].write; 8187 break; 8188 case MME_READ: 8189 hbw_rtr_id = gaudi2_mme_initiator_rtr_id[module_idx].read; 8190 break; 8191 case MME_SBTE0: 8192 hbw_rtr_id = gaudi2_mme_initiator_rtr_id[module_idx].sbte0; 8193 break; 8194 case MME_SBTE1: 8195 hbw_rtr_id = gaudi2_mme_initiator_rtr_id[module_idx].sbte1; 8196 break; 8197 case MME_SBTE2: 8198 hbw_rtr_id = 
gaudi2_mme_initiator_rtr_id[module_idx].sbte2; 8199 break; 8200 case MME_SBTE3: 8201 hbw_rtr_id = gaudi2_mme_initiator_rtr_id[module_idx].sbte3; 8202 break; 8203 case MME_SBTE4: 8204 hbw_rtr_id = gaudi2_mme_initiator_rtr_id[module_idx].sbte4; 8205 break; 8206 default: 8207 return; 8208 } 8209 lbw_rtr_id = hbw_rtr_id; 8210 break; 8211 case RAZWI_EDMA: 8212 hbw_rtr_mstr_if_base_addr = gaudi2_edma_initiator_hbw_sft[module_idx]; 8213 dcore_id = module_idx / NUM_OF_EDMA_PER_DCORE; 8214 /* SFT has separate MSTR_IF for LBW, only there we can 8215 * read the LBW razwi related registers 8216 */ 8217 lbw_rtr_mstr_if_base_addr = mmSFT0_LBW_RTR_IF_MSTR_IF_RR_SHRD_HBW_BASE + 8218 dcore_id * SFT_DCORE_OFFSET; 8219 via_sft = true; 8220 sprintf(initiator_name, "EDMA_%u", module_idx); 8221 break; 8222 case RAZWI_PDMA: 8223 hbw_rtr_id = gaudi2_pdma_initiator_hbw_rtr_id[module_idx]; 8224 lbw_rtr_id = gaudi2_pdma_initiator_lbw_rtr_id[module_idx]; 8225 sprintf(initiator_name, "PDMA_%u", module_idx); 8226 break; 8227 case RAZWI_NIC: 8228 hbw_rtr_id = gaudi2_nic_initiator_hbw_rtr_id[module_idx]; 8229 lbw_rtr_id = gaudi2_nic_initiator_lbw_rtr_id[module_idx]; 8230 sprintf(initiator_name, "NIC_%u", module_idx); 8231 break; 8232 case RAZWI_DEC: 8233 sprintf(initiator_name, "DEC_%u", module_idx); 8234 if (hdev->decoder_binning) { 8235 binned_idx = __ffs(hdev->decoder_binning); 8236 if (binned_idx == module_idx) 8237 module_idx = DEC_ID_PCIE_VDEC1; 8238 } 8239 hbw_rtr_id = gaudi2_dec_initiator_hbw_rtr_id[module_idx]; 8240 lbw_rtr_id = gaudi2_dec_initiator_lbw_rtr_id[module_idx]; 8241 break; 8242 case RAZWI_ROT: 8243 hbw_rtr_id = gaudi2_rot_initiator_hbw_rtr_id[module_idx]; 8244 lbw_rtr_id = gaudi2_rot_initiator_lbw_rtr_id[module_idx]; 8245 sprintf(initiator_name, "ROT_%u", module_idx); 8246 break; 8247 case RAZWI_ARC_FARM: 8248 lbw_rtr_id = DCORE1_RTR5; 8249 hbw_rtr_id = DCORE1_RTR7; 8250 sprintf(initiator_name, "ARC_FARM_%u", module_idx); 8251 break; 8252 default: 8253 return; 8254 } 8255 8256 /* Find router mstr_if register base */ 8257 if (!via_sft) { 8258 dcore_id = hbw_rtr_id / NUM_OF_RTR_PER_DCORE; 8259 dcore_rtr_id = hbw_rtr_id % NUM_OF_RTR_PER_DCORE; 8260 hbw_rtr_mstr_if_base_addr = mmDCORE0_RTR0_CTRL_BASE + 8261 dcore_id * DCORE_OFFSET + 8262 dcore_rtr_id * DCORE_RTR_OFFSET + 8263 RTR_MSTR_IF_OFFSET; 8264 lbw_rtr_mstr_if_base_addr = hbw_rtr_mstr_if_base_addr + 8265 (((s32)lbw_rtr_id - hbw_rtr_id) * DCORE_RTR_OFFSET); 8266 } 8267 8268 /* Find out event cause by reading "RAZWI_HAPPENED" registers */ 8269 hbw_shrd_aw = RREG32(hbw_rtr_mstr_if_base_addr + RR_SHRD_HBW_AW_RAZWI_HAPPENED); 8270 hbw_shrd_ar = RREG32(hbw_rtr_mstr_if_base_addr + RR_SHRD_HBW_AR_RAZWI_HAPPENED); 8271 lbw_shrd_aw = RREG32(lbw_rtr_mstr_if_base_addr + RR_SHRD_LBW_AW_RAZWI_HAPPENED); 8272 lbw_shrd_ar = RREG32(lbw_rtr_mstr_if_base_addr + RR_SHRD_LBW_AR_RAZWI_HAPPENED); 8273 8274 eng_id = gaudi2_razwi_calc_engine_id(hdev, module, module_idx); 8275 if (hbw_shrd_aw) { 8276 gaudi2_razwi_rr_hbw_shared_printf_info(hdev, hbw_rtr_mstr_if_base_addr, true, 8277 initiator_name, eng_id, event_mask); 8278 8279 /* Clear event indication */ 8280 WREG32(hbw_rtr_mstr_if_base_addr + RR_SHRD_HBW_AW_RAZWI_HAPPENED, hbw_shrd_aw); 8281 } 8282 8283 if (hbw_shrd_ar) { 8284 gaudi2_razwi_rr_hbw_shared_printf_info(hdev, hbw_rtr_mstr_if_base_addr, false, 8285 initiator_name, eng_id, event_mask); 8286 8287 /* Clear event indication */ 8288 WREG32(hbw_rtr_mstr_if_base_addr + RR_SHRD_HBW_AR_RAZWI_HAPPENED, hbw_shrd_ar); 8289 } 8290 8291 if (lbw_shrd_aw) { 8292 
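		/*
		 * An LBW write RAZWI was captured for this initiator: log the
		 * captured address and notify, then clear the sticky
		 * RAZWI_HAPPENED indication by writing the read value back.
		 */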
gaudi2_razwi_rr_lbw_shared_printf_info(hdev, lbw_rtr_mstr_if_base_addr, true, 8293 initiator_name, eng_id, event_mask); 8294 8295 /* Clear event indication */ 8296 WREG32(lbw_rtr_mstr_if_base_addr + RR_SHRD_LBW_AW_RAZWI_HAPPENED, lbw_shrd_aw); 8297 } 8298 8299 if (lbw_shrd_ar) { 8300 gaudi2_razwi_rr_lbw_shared_printf_info(hdev, lbw_rtr_mstr_if_base_addr, false, 8301 initiator_name, eng_id, event_mask); 8302 8303 /* Clear event indication */ 8304 WREG32(lbw_rtr_mstr_if_base_addr + RR_SHRD_LBW_AR_RAZWI_HAPPENED, lbw_shrd_ar); 8305 } 8306 } 8307 8308 static void gaudi2_check_if_razwi_happened(struct hl_device *hdev) 8309 { 8310 struct asic_fixed_properties *prop = &hdev->asic_prop; 8311 u8 mod_idx, sub_mod; 8312 8313 /* check all TPCs */ 8314 for (mod_idx = 0 ; mod_idx < (NUM_OF_TPC_PER_DCORE * NUM_OF_DCORES + 1) ; mod_idx++) { 8315 if (prop->tpc_enabled_mask & BIT(mod_idx)) 8316 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_TPC, mod_idx, 0, NULL); 8317 } 8318 8319 /* check all MMEs */ 8320 for (mod_idx = 0 ; mod_idx < (NUM_OF_MME_PER_DCORE * NUM_OF_DCORES) ; mod_idx++) 8321 for (sub_mod = MME_WAP0 ; sub_mod < MME_INITIATORS_MAX ; sub_mod++) 8322 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_MME, mod_idx, 8323 sub_mod, NULL); 8324 8325 /* check all EDMAs */ 8326 for (mod_idx = 0 ; mod_idx < (NUM_OF_EDMA_PER_DCORE * NUM_OF_DCORES) ; mod_idx++) 8327 if (prop->edma_enabled_mask & BIT(mod_idx)) 8328 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_EDMA, mod_idx, 0, NULL); 8329 8330 /* check all PDMAs */ 8331 for (mod_idx = 0 ; mod_idx < NUM_OF_PDMA ; mod_idx++) 8332 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_PDMA, mod_idx, 0, NULL); 8333 8334 /* check all NICs */ 8335 for (mod_idx = 0 ; mod_idx < NIC_NUMBER_OF_PORTS ; mod_idx++) 8336 if (hdev->nic_ports_mask & BIT(mod_idx)) 8337 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_NIC, mod_idx >> 1, 0, 8338 NULL); 8339 8340 /* check all DECs */ 8341 for (mod_idx = 0 ; mod_idx < NUMBER_OF_DEC ; mod_idx++) 8342 if (prop->decoder_enabled_mask & BIT(mod_idx)) 8343 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_DEC, mod_idx, 0, NULL); 8344 8345 /* check all ROTs */ 8346 for (mod_idx = 0 ; mod_idx < NUM_OF_ROT ; mod_idx++) 8347 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_ROT, mod_idx, 0, NULL); 8348 } 8349 8350 static int gaudi2_psoc_razwi_get_engines(struct gaudi2_razwi_info *razwi_info, u32 array_size, 8351 u32 axuser_xy, u32 *base, u16 *eng_id, 8352 char *eng_name) 8353 { 8354 8355 int i, num_of_eng = 0; 8356 u16 str_size = 0; 8357 8358 for (i = 0 ; i < array_size ; i++) { 8359 if (axuser_xy != razwi_info[i].axuser_xy) 8360 continue; 8361 8362 eng_id[num_of_eng] = razwi_info[i].eng_id; 8363 base[num_of_eng] = razwi_info[i].rtr_ctrl; 8364 if (!num_of_eng) 8365 str_size += scnprintf(eng_name + str_size, 8366 PSOC_RAZWI_ENG_STR_SIZE - str_size, "%s", 8367 razwi_info[i].eng_name); 8368 else 8369 str_size += scnprintf(eng_name + str_size, 8370 PSOC_RAZWI_ENG_STR_SIZE - str_size, " or %s", 8371 razwi_info[i].eng_name); 8372 num_of_eng++; 8373 } 8374 8375 return num_of_eng; 8376 } 8377 8378 static bool gaudi2_handle_psoc_razwi_happened(struct hl_device *hdev, u32 razwi_reg, 8379 u64 *event_mask) 8380 { 8381 u32 axuser_xy = RAZWI_GET_AXUSER_XY(razwi_reg), addr_hi = 0, addr_lo = 0; 8382 u32 base[PSOC_RAZWI_MAX_ENG_PER_RTR]; 8383 u16 num_of_eng, eng_id[PSOC_RAZWI_MAX_ENG_PER_RTR]; 8384 char eng_name_str[PSOC_RAZWI_ENG_STR_SIZE]; 8385 bool razwi_happened = false; 8386 u64 addr; 8387 int i; 8388 8389 num_of_eng = 
gaudi2_psoc_razwi_get_engines(common_razwi_info, ARRAY_SIZE(common_razwi_info), 8390 axuser_xy, base, eng_id, eng_name_str); 8391 8392 /* If no match for XY coordinates, try to find it in MME razwi table */ 8393 if (!num_of_eng) { 8394 axuser_xy = RAZWI_GET_AXUSER_LOW_XY(razwi_reg); 8395 num_of_eng = gaudi2_psoc_razwi_get_engines(mme_razwi_info, 8396 ARRAY_SIZE(mme_razwi_info), 8397 axuser_xy, base, eng_id, 8398 eng_name_str); 8399 } 8400 8401 for (i = 0 ; i < num_of_eng ; i++) { 8402 if (RREG32(base[i] + DEC_RAZWI_HBW_AW_SET)) { 8403 addr_hi = RREG32(base[i] + DEC_RAZWI_HBW_AW_ADDR_HI); 8404 addr_lo = RREG32(base[i] + DEC_RAZWI_HBW_AW_ADDR_LO); 8405 addr = ((u64)addr_hi << 32) + addr_lo; 8406 if (addr) { 8407 dev_err(hdev->dev, 8408 "PSOC HBW AW RAZWI: %s, address (aligned to 128 byte): 0x%llX\n", 8409 eng_name_str, addr); 8410 hl_handle_razwi(hdev, addr, &eng_id[0], 8411 num_of_eng, HL_RAZWI_HBW | HL_RAZWI_WRITE, event_mask); 8412 razwi_happened = true; 8413 } 8414 } 8415 8416 if (RREG32(base[i] + DEC_RAZWI_HBW_AR_SET)) { 8417 addr_hi = RREG32(base[i] + DEC_RAZWI_HBW_AR_ADDR_HI); 8418 addr_lo = RREG32(base[i] + DEC_RAZWI_HBW_AR_ADDR_LO); 8419 addr = ((u64)addr_hi << 32) + addr_lo; 8420 if (addr) { 8421 dev_err(hdev->dev, 8422 "PSOC HBW AR RAZWI: %s, address (aligned to 128 byte): 0x%llX\n", 8423 eng_name_str, addr); 8424 hl_handle_razwi(hdev, addr, &eng_id[0], 8425 num_of_eng, HL_RAZWI_HBW | HL_RAZWI_READ, event_mask); 8426 razwi_happened = true; 8427 } 8428 } 8429 8430 if (RREG32(base[i] + DEC_RAZWI_LBW_AW_SET)) { 8431 addr_lo = RREG32(base[i] + DEC_RAZWI_LBW_AW_ADDR); 8432 if (addr_lo) { 8433 dev_err(hdev->dev, 8434 "PSOC LBW AW RAZWI: %s, address (aligned to 128 byte): 0x%X\n", 8435 eng_name_str, addr_lo); 8436 hl_handle_razwi(hdev, addr_lo, &eng_id[0], 8437 num_of_eng, HL_RAZWI_LBW | HL_RAZWI_WRITE, event_mask); 8438 razwi_happened = true; 8439 } 8440 } 8441 8442 if (RREG32(base[i] + DEC_RAZWI_LBW_AR_SET)) { 8443 addr_lo = RREG32(base[i] + DEC_RAZWI_LBW_AR_ADDR); 8444 if (addr_lo) { 8445 dev_err(hdev->dev, 8446 "PSOC LBW AR RAZWI: %s, address (aligned to 128 byte): 0x%X\n", 8447 eng_name_str, addr_lo); 8448 hl_handle_razwi(hdev, addr_lo, &eng_id[0], 8449 num_of_eng, HL_RAZWI_LBW | HL_RAZWI_READ, event_mask); 8450 razwi_happened = true; 8451 } 8452 } 8453 /* In common case the loop will break, when there is only one engine id, or 8454 * several engines with the same router. The exceptional case is with psoc razwi 8455 * from EDMA, where it's possible to get axuser id which fits 2 routers (2 8456 * interfaces of sft router). In this case, maybe the first router won't hold info 8457 * and we will need to iterate on the other router. 
8458 */ 8459 if (razwi_happened) 8460 break; 8461 } 8462 8463 return razwi_happened; 8464 } 8465 8466 /* PSOC RAZWI interrupt occurs only when trying to access a bad address */ 8467 static int gaudi2_ack_psoc_razwi_event_handler(struct hl_device *hdev, u64 *event_mask) 8468 { 8469 u32 razwi_mask_info, razwi_intr = 0, error_count = 0; 8470 8471 if (hdev->pldm || !(hdev->fw_components & FW_TYPE_LINUX)) { 8472 razwi_intr = RREG32(mmPSOC_GLOBAL_CONF_RAZWI_INTERRUPT); 8473 if (!razwi_intr) 8474 return 0; 8475 } 8476 8477 razwi_mask_info = RREG32(mmPSOC_GLOBAL_CONF_RAZWI_MASK_INFO); 8478 8479 dev_err_ratelimited(hdev->dev, 8480 "PSOC RAZWI interrupt: Mask %d, AR %d, AW %d, AXUSER_L 0x%x AXUSER_H 0x%x\n", 8481 FIELD_GET(PSOC_GLOBAL_CONF_RAZWI_MASK_INFO_MASK_MASK, razwi_mask_info), 8482 FIELD_GET(PSOC_GLOBAL_CONF_RAZWI_MASK_INFO_WAS_AR_MASK, razwi_mask_info), 8483 FIELD_GET(PSOC_GLOBAL_CONF_RAZWI_MASK_INFO_WAS_AW_MASK, razwi_mask_info), 8484 FIELD_GET(PSOC_GLOBAL_CONF_RAZWI_MASK_INFO_AXUSER_L_MASK, razwi_mask_info), 8485 FIELD_GET(PSOC_GLOBAL_CONF_RAZWI_MASK_INFO_AXUSER_H_MASK, razwi_mask_info)); 8486 8487 if (gaudi2_handle_psoc_razwi_happened(hdev, razwi_mask_info, event_mask)) 8488 error_count++; 8489 else 8490 dev_err_ratelimited(hdev->dev, 8491 "PSOC RAZWI interrupt: invalid razwi info (0x%x)\n", 8492 razwi_mask_info); 8493 8494 /* Clear Interrupts only on pldm or if f/w doesn't handle interrupts */ 8495 if (hdev->pldm || !(hdev->fw_components & FW_TYPE_LINUX)) 8496 WREG32(mmPSOC_GLOBAL_CONF_RAZWI_INTERRUPT, razwi_intr); 8497 8498 return error_count; 8499 } 8500 8501 static int _gaudi2_handle_qm_sei_err(struct hl_device *hdev, u64 qman_base, u16 event_type) 8502 { 8503 u32 i, sts_val, sts_clr_val = 0, error_count = 0; 8504 8505 sts_val = RREG32(qman_base + QM_SEI_STATUS_OFFSET); 8506 8507 for (i = 0 ; i < GAUDI2_NUM_OF_QM_SEI_ERR_CAUSE ; i++) { 8508 if (sts_val & BIT(i)) { 8509 gaudi2_print_event(hdev, event_type, true, 8510 "err cause: %s", gaudi2_qm_sei_error_cause[i]); 8511 sts_clr_val |= BIT(i); 8512 error_count++; 8513 } 8514 } 8515 8516 WREG32(qman_base + QM_SEI_STATUS_OFFSET, sts_clr_val); 8517 8518 return error_count; 8519 } 8520 8521 static int gaudi2_handle_qm_sei_err(struct hl_device *hdev, u16 event_type, 8522 bool extended_err_check, u64 *event_mask) 8523 { 8524 enum razwi_event_sources module; 8525 u32 error_count = 0; 8526 u64 qman_base; 8527 u8 index; 8528 8529 switch (event_type) { 8530 case GAUDI2_EVENT_TPC0_AXI_ERR_RSP ... 
GAUDI2_EVENT_TPC23_AXI_ERR_RSP: 8531 index = event_type - GAUDI2_EVENT_TPC0_AXI_ERR_RSP; 8532 qman_base = mmDCORE0_TPC0_QM_BASE + 8533 (index / NUM_OF_TPC_PER_DCORE) * DCORE_OFFSET + 8534 (index % NUM_OF_TPC_PER_DCORE) * DCORE_TPC_OFFSET; 8535 module = RAZWI_TPC; 8536 break; 8537 case GAUDI2_EVENT_TPC24_AXI_ERR_RSP: 8538 qman_base = mmDCORE0_TPC6_QM_BASE; 8539 module = RAZWI_TPC; 8540 break; 8541 case GAUDI2_EVENT_MME0_CTRL_AXI_ERROR_RESPONSE: 8542 case GAUDI2_EVENT_MME1_CTRL_AXI_ERROR_RESPONSE: 8543 case GAUDI2_EVENT_MME2_CTRL_AXI_ERROR_RESPONSE: 8544 case GAUDI2_EVENT_MME3_CTRL_AXI_ERROR_RESPONSE: 8545 index = (event_type - GAUDI2_EVENT_MME0_CTRL_AXI_ERROR_RESPONSE) / 8546 (GAUDI2_EVENT_MME1_CTRL_AXI_ERROR_RESPONSE - 8547 GAUDI2_EVENT_MME0_CTRL_AXI_ERROR_RESPONSE); 8548 qman_base = mmDCORE0_MME_QM_BASE + index * DCORE_OFFSET; 8549 module = RAZWI_MME; 8550 break; 8551 case GAUDI2_EVENT_PDMA_CH0_AXI_ERR_RSP: 8552 case GAUDI2_EVENT_PDMA_CH1_AXI_ERR_RSP: 8553 index = event_type - GAUDI2_EVENT_PDMA_CH0_AXI_ERR_RSP; 8554 qman_base = mmPDMA0_QM_BASE + index * PDMA_OFFSET; 8555 module = RAZWI_PDMA; 8556 break; 8557 case GAUDI2_EVENT_ROTATOR0_AXI_ERROR_RESPONSE: 8558 case GAUDI2_EVENT_ROTATOR1_AXI_ERROR_RESPONSE: 8559 index = event_type - GAUDI2_EVENT_ROTATOR0_AXI_ERROR_RESPONSE; 8560 qman_base = mmROT0_QM_BASE + index * ROT_OFFSET; 8561 module = RAZWI_ROT; 8562 break; 8563 default: 8564 return 0; 8565 } 8566 8567 error_count = _gaudi2_handle_qm_sei_err(hdev, qman_base, event_type); 8568 8569 /* There is a single event per NIC macro, so should check its both QMAN blocks */ 8570 if (event_type >= GAUDI2_EVENT_NIC0_AXI_ERROR_RESPONSE && 8571 event_type <= GAUDI2_EVENT_NIC11_AXI_ERROR_RESPONSE) 8572 error_count += _gaudi2_handle_qm_sei_err(hdev, 8573 qman_base + NIC_QM_OFFSET, event_type); 8574 8575 if (extended_err_check) { 8576 /* check if RAZWI happened */ 8577 gaudi2_ack_module_razwi_event_handler(hdev, module, 0, 0, event_mask); 8578 hl_check_for_glbl_errors(hdev); 8579 } 8580 8581 return error_count; 8582 } 8583 8584 static int gaudi2_handle_qman_err(struct hl_device *hdev, u16 event_type, u64 *event_mask) 8585 { 8586 u32 qid_base, error_count = 0; 8587 u64 qman_base; 8588 u8 index = 0; 8589 8590 switch (event_type) { 8591 case GAUDI2_EVENT_TPC0_QM ... GAUDI2_EVENT_TPC5_QM: 8592 index = event_type - GAUDI2_EVENT_TPC0_QM; 8593 qid_base = GAUDI2_QUEUE_ID_DCORE0_TPC_0_0 + index * QMAN_STREAMS; 8594 qman_base = mmDCORE0_TPC0_QM_BASE + index * DCORE_TPC_OFFSET; 8595 break; 8596 case GAUDI2_EVENT_TPC6_QM ... GAUDI2_EVENT_TPC11_QM: 8597 index = event_type - GAUDI2_EVENT_TPC6_QM; 8598 qid_base = GAUDI2_QUEUE_ID_DCORE1_TPC_0_0 + index * QMAN_STREAMS; 8599 qman_base = mmDCORE1_TPC0_QM_BASE + index * DCORE_TPC_OFFSET; 8600 break; 8601 case GAUDI2_EVENT_TPC12_QM ... GAUDI2_EVENT_TPC17_QM: 8602 index = event_type - GAUDI2_EVENT_TPC12_QM; 8603 qid_base = GAUDI2_QUEUE_ID_DCORE2_TPC_0_0 + index * QMAN_STREAMS; 8604 qman_base = mmDCORE2_TPC0_QM_BASE + index * DCORE_TPC_OFFSET; 8605 break; 8606 case GAUDI2_EVENT_TPC18_QM ... 
GAUDI2_EVENT_TPC23_QM: 8607 index = event_type - GAUDI2_EVENT_TPC18_QM; 8608 qid_base = GAUDI2_QUEUE_ID_DCORE3_TPC_0_0 + index * QMAN_STREAMS; 8609 qman_base = mmDCORE3_TPC0_QM_BASE + index * DCORE_TPC_OFFSET; 8610 break; 8611 case GAUDI2_EVENT_TPC24_QM: 8612 qid_base = GAUDI2_QUEUE_ID_DCORE0_TPC_6_0; 8613 qman_base = mmDCORE0_TPC6_QM_BASE; 8614 break; 8615 case GAUDI2_EVENT_MME0_QM: 8616 qid_base = GAUDI2_QUEUE_ID_DCORE0_MME_0_0; 8617 qman_base = mmDCORE0_MME_QM_BASE; 8618 break; 8619 case GAUDI2_EVENT_MME1_QM: 8620 qid_base = GAUDI2_QUEUE_ID_DCORE1_MME_0_0; 8621 qman_base = mmDCORE1_MME_QM_BASE; 8622 break; 8623 case GAUDI2_EVENT_MME2_QM: 8624 qid_base = GAUDI2_QUEUE_ID_DCORE2_MME_0_0; 8625 qman_base = mmDCORE2_MME_QM_BASE; 8626 break; 8627 case GAUDI2_EVENT_MME3_QM: 8628 qid_base = GAUDI2_QUEUE_ID_DCORE3_MME_0_0; 8629 qman_base = mmDCORE3_MME_QM_BASE; 8630 break; 8631 case GAUDI2_EVENT_HDMA0_QM: 8632 index = 0; 8633 qid_base = GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0; 8634 qman_base = mmDCORE0_EDMA0_QM_BASE; 8635 break; 8636 case GAUDI2_EVENT_HDMA1_QM: 8637 index = 1; 8638 qid_base = GAUDI2_QUEUE_ID_DCORE0_EDMA_1_0; 8639 qman_base = mmDCORE0_EDMA1_QM_BASE; 8640 break; 8641 case GAUDI2_EVENT_HDMA2_QM: 8642 index = 2; 8643 qid_base = GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0; 8644 qman_base = mmDCORE1_EDMA0_QM_BASE; 8645 break; 8646 case GAUDI2_EVENT_HDMA3_QM: 8647 index = 3; 8648 qid_base = GAUDI2_QUEUE_ID_DCORE1_EDMA_1_0; 8649 qman_base = mmDCORE1_EDMA1_QM_BASE; 8650 break; 8651 case GAUDI2_EVENT_HDMA4_QM: 8652 index = 4; 8653 qid_base = GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0; 8654 qman_base = mmDCORE2_EDMA0_QM_BASE; 8655 break; 8656 case GAUDI2_EVENT_HDMA5_QM: 8657 index = 5; 8658 qid_base = GAUDI2_QUEUE_ID_DCORE2_EDMA_1_0; 8659 qman_base = mmDCORE2_EDMA1_QM_BASE; 8660 break; 8661 case GAUDI2_EVENT_HDMA6_QM: 8662 index = 6; 8663 qid_base = GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0; 8664 qman_base = mmDCORE3_EDMA0_QM_BASE; 8665 break; 8666 case GAUDI2_EVENT_HDMA7_QM: 8667 index = 7; 8668 qid_base = GAUDI2_QUEUE_ID_DCORE3_EDMA_1_0; 8669 qman_base = mmDCORE3_EDMA1_QM_BASE; 8670 break; 8671 case GAUDI2_EVENT_PDMA0_QM: 8672 qid_base = GAUDI2_QUEUE_ID_PDMA_0_0; 8673 qman_base = mmPDMA0_QM_BASE; 8674 break; 8675 case GAUDI2_EVENT_PDMA1_QM: 8676 qid_base = GAUDI2_QUEUE_ID_PDMA_1_0; 8677 qman_base = mmPDMA1_QM_BASE; 8678 break; 8679 case GAUDI2_EVENT_ROTATOR0_ROT0_QM: 8680 qid_base = GAUDI2_QUEUE_ID_ROT_0_0; 8681 qman_base = mmROT0_QM_BASE; 8682 break; 8683 case GAUDI2_EVENT_ROTATOR1_ROT1_QM: 8684 qid_base = GAUDI2_QUEUE_ID_ROT_1_0; 8685 qman_base = mmROT1_QM_BASE; 8686 break; 8687 default: 8688 return 0; 8689 } 8690 8691 error_count = gaudi2_handle_qman_err_generic(hdev, event_type, qman_base, 8692 qid_base, event_mask); 8693 8694 /* Handle EDMA QM SEI here because there is no AXI error response event for EDMA */ 8695 if (event_type >= GAUDI2_EVENT_HDMA2_QM && event_type <= GAUDI2_EVENT_HDMA5_QM) { 8696 error_count += _gaudi2_handle_qm_sei_err(hdev, qman_base, event_type); 8697 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_EDMA, index, 0, event_mask); 8698 } 8699 8700 hl_check_for_glbl_errors(hdev); 8701 8702 return error_count; 8703 } 8704 8705 static int gaudi2_handle_arc_farm_sei_err(struct hl_device *hdev, u16 event_type, u64 *event_mask) 8706 { 8707 u32 i, sts_val, sts_clr_val, error_count = 0, arc_farm; 8708 8709 for (arc_farm = 0 ; arc_farm < NUM_OF_ARC_FARMS_ARC ; arc_farm++) { 8710 sts_clr_val = 0; 8711 sts_val = RREG32(mmARC_FARM_ARC0_AUX_ARC_SEI_INTR_STS + 8712 (arc_farm * ARC_FARM_OFFSET)); 8713 8714 for (i = 0 ; 
i < GAUDI2_NUM_OF_ARC_SEI_ERR_CAUSE ; i++) { 8715 if (sts_val & BIT(i)) { 8716 gaudi2_print_event(hdev, event_type, true, 8717 "ARC FARM ARC %u err cause: %s", 8718 arc_farm, gaudi2_arc_sei_error_cause[i]); 8719 sts_clr_val |= BIT(i); 8720 error_count++; 8721 } 8722 } 8723 WREG32(mmARC_FARM_ARC0_AUX_ARC_SEI_INTR_CLR + (arc_farm * ARC_FARM_OFFSET), 8724 sts_clr_val); 8725 } 8726 8727 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_ARC_FARM, 0, 0, event_mask); 8728 hl_check_for_glbl_errors(hdev); 8729 8730 return error_count; 8731 } 8732 8733 static int gaudi2_handle_cpu_sei_err(struct hl_device *hdev, u16 event_type) 8734 { 8735 u32 i, sts_val, sts_clr_val = 0, error_count = 0; 8736 8737 sts_val = RREG32(mmCPU_IF_CPU_SEI_INTR_STS); 8738 8739 for (i = 0 ; i < GAUDI2_NUM_OF_CPU_SEI_ERR_CAUSE ; i++) { 8740 if (sts_val & BIT(i)) { 8741 gaudi2_print_event(hdev, event_type, true, 8742 "err cause: %s", gaudi2_cpu_sei_error_cause[i]); 8743 sts_clr_val |= BIT(i); 8744 error_count++; 8745 } 8746 } 8747 8748 hl_check_for_glbl_errors(hdev); 8749 8750 WREG32(mmCPU_IF_CPU_SEI_INTR_CLR, sts_clr_val); 8751 8752 return error_count; 8753 } 8754 8755 static int gaudi2_handle_rot_err(struct hl_device *hdev, u8 rot_index, u16 event_type, 8756 struct hl_eq_razwi_with_intr_cause *razwi_with_intr_cause, 8757 u64 *event_mask) 8758 { 8759 u64 intr_cause_data = le64_to_cpu(razwi_with_intr_cause->intr_cause.intr_cause_data); 8760 u32 error_count = 0; 8761 int i; 8762 8763 for (i = 0 ; i < GAUDI2_NUM_OF_ROT_ERR_CAUSE ; i++) 8764 if (intr_cause_data & BIT(i)) { 8765 gaudi2_print_event(hdev, event_type, true, 8766 "err cause: %s", guadi2_rot_error_cause[i]); 8767 error_count++; 8768 } 8769 8770 /* check if RAZWI happened */ 8771 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_ROT, rot_index, 0, event_mask); 8772 hl_check_for_glbl_errors(hdev); 8773 8774 return error_count; 8775 } 8776 8777 static int gaudi2_tpc_ack_interrupts(struct hl_device *hdev, u8 tpc_index, u16 event_type, 8778 struct hl_eq_razwi_with_intr_cause *razwi_with_intr_cause, 8779 u64 *event_mask) 8780 { 8781 u64 intr_cause_data = le64_to_cpu(razwi_with_intr_cause->intr_cause.intr_cause_data); 8782 u32 error_count = 0; 8783 int i; 8784 8785 for (i = 0 ; i < GAUDI2_NUM_OF_TPC_INTR_CAUSE ; i++) 8786 if (intr_cause_data & BIT(i)) { 8787 gaudi2_print_event(hdev, event_type, true, 8788 "interrupt cause: %s", gaudi2_tpc_interrupts_cause[i]); 8789 error_count++; 8790 } 8791 8792 /* check if RAZWI happened */ 8793 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_TPC, tpc_index, 0, event_mask); 8794 hl_check_for_glbl_errors(hdev); 8795 8796 return error_count; 8797 } 8798 8799 static int gaudi2_handle_dec_err(struct hl_device *hdev, u8 dec_index, u16 event_type, 8800 u64 *event_mask) 8801 { 8802 u32 sts_addr, sts_val, sts_clr_val = 0, error_count = 0; 8803 int i; 8804 8805 if (dec_index < NUM_OF_VDEC_PER_DCORE * NUM_OF_DCORES) 8806 /* DCORE DEC */ 8807 sts_addr = mmDCORE0_VDEC0_BRDG_CTRL_CAUSE_INTR + 8808 DCORE_OFFSET * (dec_index / NUM_OF_DEC_PER_DCORE) + 8809 DCORE_VDEC_OFFSET * (dec_index % NUM_OF_DEC_PER_DCORE); 8810 else 8811 /* PCIE DEC */ 8812 sts_addr = mmPCIE_VDEC0_BRDG_CTRL_CAUSE_INTR + PCIE_VDEC_OFFSET * 8813 (dec_index - NUM_OF_VDEC_PER_DCORE * NUM_OF_DCORES); 8814 8815 sts_val = RREG32(sts_addr); 8816 8817 for (i = 0 ; i < GAUDI2_NUM_OF_DEC_ERR_CAUSE ; i++) { 8818 if (sts_val & BIT(i)) { 8819 gaudi2_print_event(hdev, event_type, true, 8820 "err cause: %s", gaudi2_dec_error_cause[i]); 8821 sts_clr_val |= BIT(i); 8822 error_count++; 8823 } 8824 } 
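	/*
	 * sts_clr_val now has a bit set for every reported cause; it is
	 * written back to the cause register further down, which is
	 * write-1-to-clear.
	 */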
8825 8826 /* check if RAZWI happened */ 8827 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_DEC, dec_index, 0, event_mask); 8828 hl_check_for_glbl_errors(hdev); 8829 8830 /* Write 1 clear errors */ 8831 WREG32(sts_addr, sts_clr_val); 8832 8833 return error_count; 8834 } 8835 8836 static int gaudi2_handle_mme_err(struct hl_device *hdev, u8 mme_index, u16 event_type, 8837 u64 *event_mask) 8838 { 8839 u32 sts_addr, sts_val, sts_clr_addr, sts_clr_val = 0, error_count = 0; 8840 int i; 8841 8842 sts_addr = mmDCORE0_MME_CTRL_LO_INTR_CAUSE + DCORE_OFFSET * mme_index; 8843 sts_clr_addr = mmDCORE0_MME_CTRL_LO_INTR_CLEAR + DCORE_OFFSET * mme_index; 8844 8845 sts_val = RREG32(sts_addr); 8846 8847 for (i = 0 ; i < GAUDI2_NUM_OF_MME_ERR_CAUSE ; i++) { 8848 if (sts_val & BIT(i)) { 8849 gaudi2_print_event(hdev, event_type, true, 8850 "err cause: %s", guadi2_mme_error_cause[i]); 8851 sts_clr_val |= BIT(i); 8852 error_count++; 8853 } 8854 } 8855 8856 /* check if RAZWI happened */ 8857 for (i = MME_WRITE ; i < MME_INITIATORS_MAX ; i++) 8858 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_MME, mme_index, i, event_mask); 8859 8860 hl_check_for_glbl_errors(hdev); 8861 8862 WREG32(sts_clr_addr, sts_clr_val); 8863 8864 return error_count; 8865 } 8866 8867 static int gaudi2_handle_mme_sbte_err(struct hl_device *hdev, u16 event_type) 8868 { 8869 /* 8870 * We have a single error cause here but the report mechanism is 8871 * buggy. Hence there is no good reason to fetch the cause so we 8872 * just check for glbl_errors and exit. 8873 */ 8874 hl_check_for_glbl_errors(hdev); 8875 8876 return GAUDI2_NA_EVENT_CAUSE; 8877 } 8878 8879 static int gaudi2_handle_mme_wap_err(struct hl_device *hdev, u8 mme_index, u16 event_type, 8880 u64 *event_mask) 8881 { 8882 u32 sts_addr, sts_val, sts_clr_addr, sts_clr_val = 0, error_count = 0; 8883 int i; 8884 8885 sts_addr = mmDCORE0_MME_ACC_INTR_CAUSE + DCORE_OFFSET * mme_index; 8886 sts_clr_addr = mmDCORE0_MME_ACC_INTR_CLEAR + DCORE_OFFSET * mme_index; 8887 8888 sts_val = RREG32(sts_addr); 8889 8890 for (i = 0 ; i < GAUDI2_NUM_OF_MME_WAP_ERR_CAUSE ; i++) { 8891 if (sts_val & BIT(i)) { 8892 gaudi2_print_event(hdev, event_type, true, 8893 "err cause: %s", guadi2_mme_wap_error_cause[i]); 8894 sts_clr_val |= BIT(i); 8895 error_count++; 8896 } 8897 } 8898 8899 /* check if RAZWI happened on WAP0/1 */ 8900 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_MME, mme_index, MME_WAP0, event_mask); 8901 gaudi2_ack_module_razwi_event_handler(hdev, RAZWI_MME, mme_index, MME_WAP1, event_mask); 8902 hl_check_for_glbl_errors(hdev); 8903 8904 WREG32(sts_clr_addr, sts_clr_val); 8905 8906 return error_count; 8907 } 8908 8909 static int gaudi2_handle_kdma_core_event(struct hl_device *hdev, u16 event_type, 8910 u64 intr_cause_data) 8911 { 8912 u32 error_count = 0; 8913 int i; 8914 8915 /* If an AXI read or write error is received, an error is reported and 8916 * interrupt message is sent. Due to an HW errata, when reading the cause 8917 * register of the KDMA engine, the reported error is always HBW even if 8918 * the actual error caused by a LBW KDMA transaction. 
8919 */ 8920 for (i = 0 ; i < GAUDI2_NUM_OF_DMA_CORE_INTR_CAUSE ; i++) 8921 if (intr_cause_data & BIT(i)) { 8922 gaudi2_print_event(hdev, event_type, true, 8923 "err cause: %s", gaudi2_kdma_core_interrupts_cause[i]); 8924 error_count++; 8925 } 8926 8927 hl_check_for_glbl_errors(hdev); 8928 8929 return error_count; 8930 } 8931 8932 static int gaudi2_handle_dma_core_event(struct hl_device *hdev, u16 event_type, u64 intr_cause) 8933 { 8934 u32 error_count = 0; 8935 int i; 8936 8937 for (i = 0 ; i < GAUDI2_NUM_OF_DMA_CORE_INTR_CAUSE ; i++) 8938 if (intr_cause & BIT(i)) { 8939 gaudi2_print_event(hdev, event_type, true, 8940 "err cause: %s", gaudi2_dma_core_interrupts_cause[i]); 8941 error_count++; 8942 } 8943 8944 hl_check_for_glbl_errors(hdev); 8945 8946 return error_count; 8947 } 8948 8949 static void gaudi2_print_pcie_mstr_rr_mstr_if_razwi_info(struct hl_device *hdev, u64 *event_mask) 8950 { 8951 u32 mstr_if_base_addr = mmPCIE_MSTR_RR_MSTR_IF_RR_SHRD_HBW_BASE, razwi_happened_addr; 8952 8953 razwi_happened_addr = mstr_if_base_addr + RR_SHRD_HBW_AW_RAZWI_HAPPENED; 8954 if (RREG32(razwi_happened_addr)) { 8955 gaudi2_razwi_rr_hbw_shared_printf_info(hdev, mstr_if_base_addr, true, "PCIE", 8956 GAUDI2_ENGINE_ID_PCIE, event_mask); 8957 WREG32(razwi_happened_addr, 0x1); 8958 } 8959 8960 razwi_happened_addr = mstr_if_base_addr + RR_SHRD_HBW_AR_RAZWI_HAPPENED; 8961 if (RREG32(razwi_happened_addr)) { 8962 gaudi2_razwi_rr_hbw_shared_printf_info(hdev, mstr_if_base_addr, false, "PCIE", 8963 GAUDI2_ENGINE_ID_PCIE, event_mask); 8964 WREG32(razwi_happened_addr, 0x1); 8965 } 8966 8967 razwi_happened_addr = mstr_if_base_addr + RR_SHRD_LBW_AW_RAZWI_HAPPENED; 8968 if (RREG32(razwi_happened_addr)) { 8969 gaudi2_razwi_rr_lbw_shared_printf_info(hdev, mstr_if_base_addr, true, "PCIE", 8970 GAUDI2_ENGINE_ID_PCIE, event_mask); 8971 WREG32(razwi_happened_addr, 0x1); 8972 } 8973 8974 razwi_happened_addr = mstr_if_base_addr + RR_SHRD_LBW_AR_RAZWI_HAPPENED; 8975 if (RREG32(razwi_happened_addr)) { 8976 gaudi2_razwi_rr_lbw_shared_printf_info(hdev, mstr_if_base_addr, false, "PCIE", 8977 GAUDI2_ENGINE_ID_PCIE, event_mask); 8978 WREG32(razwi_happened_addr, 0x1); 8979 } 8980 } 8981 8982 static int gaudi2_print_pcie_addr_dec_info(struct hl_device *hdev, u16 event_type, 8983 u64 intr_cause_data, u64 *event_mask) 8984 { 8985 u32 error_count = 0; 8986 int i; 8987 8988 for (i = 0 ; i < GAUDI2_NUM_OF_PCIE_ADDR_DEC_ERR_CAUSE ; i++) { 8989 if (!(intr_cause_data & BIT_ULL(i))) 8990 continue; 8991 8992 gaudi2_print_event(hdev, event_type, true, 8993 "err cause: %s", gaudi2_pcie_addr_dec_error_cause[i]); 8994 error_count++; 8995 8996 switch (intr_cause_data & BIT_ULL(i)) { 8997 case PCIE_WRAP_PCIE_IC_SEI_INTR_IND_AXI_LBW_ERR_INTR_MASK: 8998 hl_check_for_glbl_errors(hdev); 8999 break; 9000 case PCIE_WRAP_PCIE_IC_SEI_INTR_IND_BAD_ACCESS_INTR_MASK: 9001 gaudi2_print_pcie_mstr_rr_mstr_if_razwi_info(hdev, event_mask); 9002 break; 9003 } 9004 } 9005 9006 return error_count; 9007 } 9008 9009 static int gaudi2_handle_pif_fatal(struct hl_device *hdev, u16 event_type, 9010 u64 intr_cause_data) 9011 9012 { 9013 u32 error_count = 0; 9014 int i; 9015 9016 for (i = 0 ; i < GAUDI2_NUM_OF_PMMU_FATAL_ERR_CAUSE ; i++) { 9017 if (intr_cause_data & BIT_ULL(i)) { 9018 gaudi2_print_event(hdev, event_type, true, 9019 "err cause: %s", gaudi2_pmmu_fatal_interrupts_cause[i]); 9020 error_count++; 9021 } 9022 } 9023 9024 return error_count; 9025 } 9026 9027 static int gaudi2_handle_hif_fatal(struct hl_device *hdev, u16 event_type, u64 intr_cause_data) 9028 { 9029 u32 
error_count = 0; 9030 int i; 9031 9032 for (i = 0 ; i < GAUDI2_NUM_OF_HIF_FATAL_ERR_CAUSE ; i++) { 9033 if (intr_cause_data & BIT_ULL(i)) { 9034 gaudi2_print_event(hdev, event_type, true, 9035 "err cause: %s", gaudi2_hif_fatal_interrupts_cause[i]); 9036 error_count++; 9037 } 9038 } 9039 9040 return error_count; 9041 } 9042 9043 static void gaudi2_handle_page_error(struct hl_device *hdev, u64 mmu_base, bool is_pmmu, 9044 u64 *event_mask) 9045 { 9046 u32 valid, val; 9047 u64 addr; 9048 9049 valid = RREG32(mmu_base + MMU_OFFSET(mmDCORE0_HMMU0_MMU_ACCESS_PAGE_ERROR_VALID)); 9050 9051 if (!(valid & DCORE0_HMMU0_MMU_ACCESS_PAGE_ERROR_VALID_PAGE_ERR_VALID_ENTRY_MASK)) 9052 return; 9053 9054 val = RREG32(mmu_base + MMU_OFFSET(mmDCORE0_HMMU0_MMU_PAGE_ERROR_CAPTURE)); 9055 addr = val & DCORE0_HMMU0_MMU_PAGE_ERROR_CAPTURE_VA_63_32_MASK; 9056 addr <<= 32; 9057 addr |= RREG32(mmu_base + MMU_OFFSET(mmDCORE0_HMMU0_MMU_PAGE_ERROR_CAPTURE_VA)); 9058 9059 if (is_pmmu) { 9060 dev_err_ratelimited(hdev->dev, "PMMU page fault on va 0x%llx\n", addr); 9061 } else { 9062 addr = gaudi2_mmu_descramble_addr(hdev, addr); 9063 addr &= HW_UNSCRAMBLED_BITS_MASK; 9064 dev_err_ratelimited(hdev->dev, "HMMU page fault on va range 0x%llx - 0x%llx\n", 9065 addr, addr + ~HW_UNSCRAMBLED_BITS_MASK); 9066 } 9067 9068 hl_handle_page_fault(hdev, addr, 0, is_pmmu, event_mask); 9069 9070 WREG32(mmu_base + MMU_OFFSET(mmDCORE0_HMMU0_MMU_ACCESS_PAGE_ERROR_VALID), 0); 9071 } 9072 9073 static void gaudi2_handle_access_error(struct hl_device *hdev, u64 mmu_base, bool is_pmmu) 9074 { 9075 u32 valid, val; 9076 u64 addr; 9077 9078 valid = RREG32(mmu_base + MMU_OFFSET(mmDCORE0_HMMU0_MMU_ACCESS_PAGE_ERROR_VALID)); 9079 9080 if (!(valid & DCORE0_HMMU0_MMU_ACCESS_PAGE_ERROR_VALID_ACCESS_ERR_VALID_ENTRY_MASK)) 9081 return; 9082 9083 val = RREG32(mmu_base + MMU_OFFSET(mmDCORE0_HMMU0_MMU_ACCESS_ERROR_CAPTURE)); 9084 addr = val & DCORE0_HMMU0_MMU_ACCESS_ERROR_CAPTURE_VA_63_32_MASK; 9085 addr <<= 32; 9086 addr |= RREG32(mmu_base + MMU_OFFSET(mmDCORE0_HMMU0_MMU_ACCESS_ERROR_CAPTURE_VA)); 9087 9088 if (!is_pmmu) 9089 addr = gaudi2_mmu_descramble_addr(hdev, addr); 9090 9091 dev_err_ratelimited(hdev->dev, "%s access error on va 0x%llx\n", 9092 is_pmmu ? 
"PMMU" : "HMMU", addr); 9093 WREG32(mmu_base + MMU_OFFSET(mmDCORE0_HMMU0_MMU_ACCESS_PAGE_ERROR_VALID), 0); 9094 } 9095 9096 static int gaudi2_handle_mmu_spi_sei_generic(struct hl_device *hdev, u16 event_type, 9097 u64 mmu_base, bool is_pmmu, u64 *event_mask) 9098 { 9099 u32 spi_sei_cause, interrupt_clr = 0x0, error_count = 0; 9100 int i; 9101 9102 spi_sei_cause = RREG32(mmu_base + MMU_SPI_SEI_CAUSE_OFFSET); 9103 9104 for (i = 0 ; i < GAUDI2_NUM_OF_MMU_SPI_SEI_CAUSE ; i++) { 9105 if (spi_sei_cause & BIT(i)) { 9106 gaudi2_print_event(hdev, event_type, true, 9107 "err cause: %s", gaudi2_mmu_spi_sei[i].cause); 9108 9109 if (i == 0) 9110 gaudi2_handle_page_error(hdev, mmu_base, is_pmmu, event_mask); 9111 else if (i == 1) 9112 gaudi2_handle_access_error(hdev, mmu_base, is_pmmu); 9113 9114 if (gaudi2_mmu_spi_sei[i].clear_bit >= 0) 9115 interrupt_clr |= BIT(gaudi2_mmu_spi_sei[i].clear_bit); 9116 9117 error_count++; 9118 } 9119 } 9120 9121 /* Clear cause */ 9122 WREG32_AND(mmu_base + MMU_SPI_SEI_CAUSE_OFFSET, ~spi_sei_cause); 9123 9124 /* Clear interrupt */ 9125 WREG32(mmu_base + MMU_INTERRUPT_CLR_OFFSET, interrupt_clr); 9126 9127 return error_count; 9128 } 9129 9130 static int gaudi2_handle_sm_err(struct hl_device *hdev, u16 event_type, u8 sm_index) 9131 { 9132 u32 sei_cause_addr, sei_cause_val, sei_cause_cause, sei_cause_log, 9133 cq_intr_addr, cq_intr_val, cq_intr_queue_index, error_count = 0; 9134 int i; 9135 9136 sei_cause_addr = mmDCORE0_SYNC_MNGR_GLBL_SM_SEI_CAUSE + DCORE_OFFSET * sm_index; 9137 cq_intr_addr = mmDCORE0_SYNC_MNGR_GLBL_CQ_INTR + DCORE_OFFSET * sm_index; 9138 9139 sei_cause_val = RREG32(sei_cause_addr); 9140 sei_cause_cause = FIELD_GET(DCORE0_SYNC_MNGR_GLBL_SM_SEI_CAUSE_CAUSE_MASK, sei_cause_val); 9141 cq_intr_val = RREG32(cq_intr_addr); 9142 9143 /* SEI interrupt */ 9144 if (sei_cause_cause) { 9145 /* There are corresponding SEI_CAUSE_log bits for every SEI_CAUSE_cause bit */ 9146 sei_cause_log = FIELD_GET(DCORE0_SYNC_MNGR_GLBL_SM_SEI_CAUSE_LOG_MASK, 9147 sei_cause_val); 9148 9149 for (i = 0 ; i < GAUDI2_NUM_OF_SM_SEI_ERR_CAUSE ; i++) { 9150 if (!(sei_cause_cause & BIT(i))) 9151 continue; 9152 9153 gaudi2_print_event(hdev, event_type, true, 9154 "err cause: %s. %s: 0x%X", 9155 gaudi2_sm_sei_cause[i].cause_name, 9156 gaudi2_sm_sei_cause[i].log_name, 9157 sei_cause_log); 9158 error_count++; 9159 break; 9160 } 9161 9162 /* Clear SM_SEI_CAUSE */ 9163 WREG32(sei_cause_addr, 0); 9164 } 9165 9166 /* CQ interrupt */ 9167 if (cq_intr_val & DCORE0_SYNC_MNGR_GLBL_CQ_INTR_CQ_SEC_INTR_MASK) { 9168 cq_intr_queue_index = 9169 FIELD_GET(DCORE0_SYNC_MNGR_GLBL_CQ_INTR_CQ_INTR_QUEUE_INDEX_MASK, 9170 cq_intr_val); 9171 9172 dev_err_ratelimited(hdev->dev, "SM%u err. err cause: CQ_INTR. queue index: %u\n", 9173 sm_index, cq_intr_queue_index); 9174 error_count++; 9175 9176 /* Clear CQ_INTR */ 9177 WREG32(cq_intr_addr, 0); 9178 } 9179 9180 hl_check_for_glbl_errors(hdev); 9181 9182 return error_count; 9183 } 9184 9185 static u64 get_hmmu_base(u16 event_type) 9186 { 9187 u8 dcore, index_in_dcore; 9188 9189 switch (event_type) { 9190 case GAUDI2_EVENT_HMMU_0_AXI_ERR_RSP: 9191 case GAUDI2_EVENT_HMMU0_SPI_BASE ... GAUDI2_EVENT_HMMU0_SECURITY_ERROR: 9192 dcore = 0; 9193 index_in_dcore = 0; 9194 break; 9195 case GAUDI2_EVENT_HMMU_1_AXI_ERR_RSP: 9196 case GAUDI2_EVENT_HMMU1_SPI_BASE ... GAUDI2_EVENT_HMMU1_SECURITY_ERROR: 9197 dcore = 1; 9198 index_in_dcore = 0; 9199 break; 9200 case GAUDI2_EVENT_HMMU_2_AXI_ERR_RSP: 9201 case GAUDI2_EVENT_HMMU2_SPI_BASE ... 
GAUDI2_EVENT_HMMU2_SECURITY_ERROR: 9202 dcore = 0; 9203 index_in_dcore = 1; 9204 break; 9205 case GAUDI2_EVENT_HMMU_3_AXI_ERR_RSP: 9206 case GAUDI2_EVENT_HMMU3_SPI_BASE ... GAUDI2_EVENT_HMMU3_SECURITY_ERROR: 9207 dcore = 1; 9208 index_in_dcore = 1; 9209 break; 9210 case GAUDI2_EVENT_HMMU_4_AXI_ERR_RSP: 9211 case GAUDI2_EVENT_HMMU4_SPI_BASE ... GAUDI2_EVENT_HMMU4_SECURITY_ERROR: 9212 dcore = 3; 9213 index_in_dcore = 2; 9214 break; 9215 case GAUDI2_EVENT_HMMU_5_AXI_ERR_RSP: 9216 case GAUDI2_EVENT_HMMU5_SPI_BASE ... GAUDI2_EVENT_HMMU5_SECURITY_ERROR: 9217 dcore = 2; 9218 index_in_dcore = 2; 9219 break; 9220 case GAUDI2_EVENT_HMMU_6_AXI_ERR_RSP: 9221 case GAUDI2_EVENT_HMMU6_SPI_BASE ... GAUDI2_EVENT_HMMU6_SECURITY_ERROR: 9222 dcore = 3; 9223 index_in_dcore = 3; 9224 break; 9225 case GAUDI2_EVENT_HMMU_7_AXI_ERR_RSP: 9226 case GAUDI2_EVENT_HMMU7_SPI_BASE ... GAUDI2_EVENT_HMMU7_SECURITY_ERROR: 9227 dcore = 2; 9228 index_in_dcore = 3; 9229 break; 9230 case GAUDI2_EVENT_HMMU_8_AXI_ERR_RSP: 9231 case GAUDI2_EVENT_HMMU8_SPI_BASE ... GAUDI2_EVENT_HMMU8_SECURITY_ERROR: 9232 dcore = 0; 9233 index_in_dcore = 2; 9234 break; 9235 case GAUDI2_EVENT_HMMU_9_AXI_ERR_RSP: 9236 case GAUDI2_EVENT_HMMU9_SPI_BASE ... GAUDI2_EVENT_HMMU9_SECURITY_ERROR: 9237 dcore = 1; 9238 index_in_dcore = 2; 9239 break; 9240 case GAUDI2_EVENT_HMMU_10_AXI_ERR_RSP: 9241 case GAUDI2_EVENT_HMMU10_SPI_BASE ... GAUDI2_EVENT_HMMU10_SECURITY_ERROR: 9242 dcore = 0; 9243 index_in_dcore = 3; 9244 break; 9245 case GAUDI2_EVENT_HMMU_11_AXI_ERR_RSP: 9246 case GAUDI2_EVENT_HMMU11_SPI_BASE ... GAUDI2_EVENT_HMMU11_SECURITY_ERROR: 9247 dcore = 1; 9248 index_in_dcore = 3; 9249 break; 9250 case GAUDI2_EVENT_HMMU_12_AXI_ERR_RSP: 9251 case GAUDI2_EVENT_HMMU12_SPI_BASE ... GAUDI2_EVENT_HMMU12_SECURITY_ERROR: 9252 dcore = 3; 9253 index_in_dcore = 0; 9254 break; 9255 case GAUDI2_EVENT_HMMU_13_AXI_ERR_RSP: 9256 case GAUDI2_EVENT_HMMU13_SPI_BASE ... GAUDI2_EVENT_HMMU13_SECURITY_ERROR: 9257 dcore = 2; 9258 index_in_dcore = 0; 9259 break; 9260 case GAUDI2_EVENT_HMMU_14_AXI_ERR_RSP: 9261 case GAUDI2_EVENT_HMMU14_SPI_BASE ... GAUDI2_EVENT_HMMU14_SECURITY_ERROR: 9262 dcore = 3; 9263 index_in_dcore = 1; 9264 break; 9265 case GAUDI2_EVENT_HMMU_15_AXI_ERR_RSP: 9266 case GAUDI2_EVENT_HMMU15_SPI_BASE ... GAUDI2_EVENT_HMMU15_SECURITY_ERROR: 9267 dcore = 2; 9268 index_in_dcore = 1; 9269 break; 9270 default: 9271 return ULONG_MAX; 9272 } 9273 9274 return mmDCORE0_HMMU0_MMU_BASE + dcore * DCORE_OFFSET + index_in_dcore * DCORE_HMMU_OFFSET; 9275 } 9276 9277 static int gaudi2_handle_mmu_spi_sei_err(struct hl_device *hdev, u16 event_type, u64 *event_mask) 9278 { 9279 bool is_pmmu = false; 9280 u32 error_count = 0; 9281 u64 mmu_base; 9282 9283 switch (event_type) { 9284 case GAUDI2_EVENT_HMMU_0_AXI_ERR_RSP ... GAUDI2_EVENT_HMMU_12_AXI_ERR_RSP: 9285 case GAUDI2_EVENT_HMMU0_SPI_BASE ... GAUDI2_EVENT_HMMU12_SECURITY_ERROR: 9286 mmu_base = get_hmmu_base(event_type); 9287 break; 9288 9289 case GAUDI2_EVENT_PMMU0_PAGE_FAULT_WR_PERM ... 
GAUDI2_EVENT_PMMU0_SECURITY_ERROR: 9290 case GAUDI2_EVENT_PMMU_AXI_ERR_RSP_0: 9291 is_pmmu = true; 9292 mmu_base = mmPMMU_HBW_MMU_BASE; 9293 break; 9294 default: 9295 return 0; 9296 } 9297 9298 if (mmu_base == ULONG_MAX) 9299 return 0; 9300 9301 error_count = gaudi2_handle_mmu_spi_sei_generic(hdev, event_type, mmu_base, 9302 is_pmmu, event_mask); 9303 hl_check_for_glbl_errors(hdev); 9304 9305 return error_count; 9306 } 9307 9308 9309 /* returns true if hard reset is required (ECC DERR or Read parity), false otherwise (ECC SERR) */ 9310 static bool gaudi2_hbm_sei_handle_read_err(struct hl_device *hdev, 9311 struct hl_eq_hbm_sei_read_err_intr_info *rd_err_data, u32 err_cnt) 9312 { 9313 u32 addr, beat, beat_shift; 9314 bool rc = false; 9315 9316 dev_err_ratelimited(hdev->dev, 9317 "READ ERROR count: ECC SERR: %d, ECC DERR: %d, RD_PARITY: %d\n", 9318 FIELD_GET(HBM_ECC_SERR_CNTR_MASK, err_cnt), 9319 FIELD_GET(HBM_ECC_DERR_CNTR_MASK, err_cnt), 9320 FIELD_GET(HBM_RD_PARITY_CNTR_MASK, err_cnt)); 9321 9322 addr = le32_to_cpu(rd_err_data->dbg_rd_err_addr.rd_addr_val); 9323 dev_err_ratelimited(hdev->dev, 9324 "READ ERROR address: sid(%u), bg(%u), ba(%u), col(%u), row(%u)\n", 9325 FIELD_GET(HBM_RD_ADDR_SID_MASK, addr), 9326 FIELD_GET(HBM_RD_ADDR_BG_MASK, addr), 9327 FIELD_GET(HBM_RD_ADDR_BA_MASK, addr), 9328 FIELD_GET(HBM_RD_ADDR_COL_MASK, addr), 9329 FIELD_GET(HBM_RD_ADDR_ROW_MASK, addr)); 9330 9331 /* For each beat (RDQS edge), look for possible errors and print relevant info */ 9332 for (beat = 0 ; beat < 4 ; beat++) { 9333 if (le32_to_cpu(rd_err_data->dbg_rd_err_misc) & 9334 (HBM_RD_ERR_SERR_BEAT0_MASK << beat)) 9335 dev_err_ratelimited(hdev->dev, "Beat%d ECC SERR: DM: %#x, Syndrome: %#x\n", 9336 beat, 9337 le32_to_cpu(rd_err_data->dbg_rd_err_dm), 9338 le32_to_cpu(rd_err_data->dbg_rd_err_syndrome)); 9339 9340 if (le32_to_cpu(rd_err_data->dbg_rd_err_misc) & 9341 (HBM_RD_ERR_DERR_BEAT0_MASK << beat)) { 9342 dev_err_ratelimited(hdev->dev, "Beat%d ECC DERR: DM: %#x, Syndrome: %#x\n", 9343 beat, 9344 le32_to_cpu(rd_err_data->dbg_rd_err_dm), 9345 le32_to_cpu(rd_err_data->dbg_rd_err_syndrome)); 9346 rc |= true; 9347 } 9348 9349 beat_shift = beat * HBM_RD_ERR_BEAT_SHIFT; 9350 if (le32_to_cpu(rd_err_data->dbg_rd_err_misc) & 9351 (HBM_RD_ERR_PAR_ERR_BEAT0_MASK << beat_shift)) { 9352 dev_err_ratelimited(hdev->dev, 9353 "Beat%d read PARITY: DM: %#x, PAR data: %#x\n", 9354 beat, 9355 le32_to_cpu(rd_err_data->dbg_rd_err_dm), 9356 (le32_to_cpu(rd_err_data->dbg_rd_err_misc) & 9357 (HBM_RD_ERR_PAR_DATA_BEAT0_MASK << beat_shift)) >> 9358 (HBM_RD_ERR_PAR_DATA_BEAT0_SHIFT + beat_shift)); 9359 rc |= true; 9360 } 9361 9362 dev_err_ratelimited(hdev->dev, "Beat%d DQ data:\n", beat); 9363 dev_err_ratelimited(hdev->dev, "\t0x%08x\n", 9364 le32_to_cpu(rd_err_data->dbg_rd_err_data[beat * 2])); 9365 dev_err_ratelimited(hdev->dev, "\t0x%08x\n", 9366 le32_to_cpu(rd_err_data->dbg_rd_err_data[beat * 2 + 1])); 9367 } 9368 9369 return rc; 9370 } 9371 9372 static void gaudi2_hbm_sei_print_wr_par_info(struct hl_device *hdev, 9373 struct hl_eq_hbm_sei_wr_par_intr_info *wr_par_err_data, u32 err_cnt) 9374 { 9375 struct hbm_sei_wr_cmd_address *wr_cmd_addr = wr_par_err_data->dbg_last_wr_cmds; 9376 u32 i, curr_addr, derr = wr_par_err_data->dbg_derr; 9377 9378 dev_err_ratelimited(hdev->dev, "WRITE PARITY ERROR count: %d\n", err_cnt); 9379 9380 dev_err_ratelimited(hdev->dev, "CK-0 DERR: 0x%02x, CK-1 DERR: 0x%02x\n", 9381 derr & 0x3, derr & 0xc); 9382 9383 /* JIRA H6-3286 - the following prints may not be valid */ 9384 
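	/* The MC keeps a short LIFO (HBM_WR_PAR_CMD_LIFO_LEN entries) of the most recent
	 * write commands; dump whatever was captured.
	 */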
dev_err_ratelimited(hdev->dev, "Last latched write commands addresses:\n"); 9385 for (i = 0 ; i < HBM_WR_PAR_CMD_LIFO_LEN ; i++) { 9386 curr_addr = le32_to_cpu(wr_cmd_addr[i].dbg_wr_cmd_addr); 9387 dev_err_ratelimited(hdev->dev, 9388 "\twrite cmd[%u]: Address: SID(%u) BG(%u) BA(%u) COL(%u).\n", 9389 i, 9390 FIELD_GET(WR_PAR_LAST_CMD_SID_MASK, curr_addr), 9391 FIELD_GET(WR_PAR_LAST_CMD_BG_MASK, curr_addr), 9392 FIELD_GET(WR_PAR_LAST_CMD_BA_MASK, curr_addr), 9393 FIELD_GET(WR_PAR_LAST_CMD_COL_MASK, curr_addr)); 9394 } 9395 } 9396 9397 static void gaudi2_hbm_sei_print_ca_par_info(struct hl_device *hdev, 9398 struct hl_eq_hbm_sei_ca_par_intr_info *ca_par_err_data, u32 err_cnt) 9399 { 9400 __le32 *col_cmd = ca_par_err_data->dbg_col; 9401 __le16 *row_cmd = ca_par_err_data->dbg_row; 9402 u32 i; 9403 9404 dev_err_ratelimited(hdev->dev, "CA ERROR count: %d\n", err_cnt); 9405 9406 dev_err_ratelimited(hdev->dev, "Last latched C&R bus commands:\n"); 9407 for (i = 0 ; i < HBM_CA_ERR_CMD_LIFO_LEN ; i++) 9408 dev_err_ratelimited(hdev->dev, "cmd%u: ROW(0x%04x) COL(0x%05x)\n", i, 9409 le16_to_cpu(row_cmd[i]) & (u16)GENMASK(13, 0), 9410 le32_to_cpu(col_cmd[i]) & (u32)GENMASK(17, 0)); 9411 } 9412 9413 /* Returns true if hard reset is needed or false otherwise */ 9414 static bool gaudi2_handle_hbm_mc_sei_err(struct hl_device *hdev, u16 event_type, 9415 struct hl_eq_hbm_sei_data *sei_data) 9416 { 9417 bool require_hard_reset = false; 9418 u32 hbm_id, mc_id, cause_idx; 9419 9420 hbm_id = (event_type - GAUDI2_EVENT_HBM0_MC0_SEI_SEVERE) / 4; 9421 mc_id = ((event_type - GAUDI2_EVENT_HBM0_MC0_SEI_SEVERE) / 2) % 2; 9422 9423 cause_idx = sei_data->hdr.sei_cause; 9424 if (cause_idx > GAUDI2_NUM_OF_HBM_SEI_CAUSE - 1) { 9425 gaudi2_print_event(hdev, event_type, true, 9426 "err cause: %s", 9427 "Invalid HBM SEI event cause (%d) provided by FW", cause_idx); 9428 return true; 9429 } 9430 9431 gaudi2_print_event(hdev, event_type, !sei_data->hdr.is_critical, 9432 "System %s Error Interrupt - HBM(%u) MC(%u) MC_CH(%u) MC_PC(%u). Error cause: %s", 9433 sei_data->hdr.is_critical ? "Critical" : "Non-critical", 9434 hbm_id, mc_id, sei_data->hdr.mc_channel, sei_data->hdr.mc_pseudo_channel, 9435 hbm_mc_sei_cause[cause_idx]); 9436 9437 /* Print error-specific info */ 9438 switch (cause_idx) { 9439 case HBM_SEI_CATTRIP: 9440 require_hard_reset = true; 9441 break; 9442 9443 case HBM_SEI_CMD_PARITY_EVEN: 9444 gaudi2_hbm_sei_print_ca_par_info(hdev, &sei_data->ca_parity_even_info, 9445 le32_to_cpu(sei_data->hdr.cnt)); 9446 require_hard_reset = true; 9447 break; 9448 9449 case HBM_SEI_CMD_PARITY_ODD: 9450 gaudi2_hbm_sei_print_ca_par_info(hdev, &sei_data->ca_parity_odd_info, 9451 le32_to_cpu(sei_data->hdr.cnt)); 9452 require_hard_reset = true; 9453 break; 9454 9455 case HBM_SEI_WRITE_DATA_PARITY_ERR: 9456 gaudi2_hbm_sei_print_wr_par_info(hdev, &sei_data->wr_parity_info, 9457 le32_to_cpu(sei_data->hdr.cnt)); 9458 require_hard_reset = true; 9459 break; 9460 9461 case HBM_SEI_READ_ERR: 9462 /* Unlike other SEI events, read error requires further processing of the 9463 * raw data in order to determine the root cause. 
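		 * A double-bit ECC error (DERR) or a read-parity error on any beat requires
		 * a hard reset; single-bit ECC errors (SERR) alone do not.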
		 */
		require_hard_reset = gaudi2_hbm_sei_handle_read_err(hdev,
				&sei_data->read_err_info,
				le32_to_cpu(sei_data->hdr.cnt));
		break;

	default:
		break;
	}

	require_hard_reset |= !!sei_data->hdr.is_critical;

	return require_hard_reset;
}

static int gaudi2_handle_hbm_cattrip(struct hl_device *hdev, u16 event_type,
		u64 intr_cause_data)
{
	if (intr_cause_data) {
		gaudi2_print_event(hdev, event_type, true,
			"temperature error cause: %#llx", intr_cause_data);
		return 1;
	}

	return 0;
}

static int gaudi2_handle_hbm_mc_spi(struct hl_device *hdev, u64 intr_cause_data)
{
	u32 i, error_count = 0;

	for (i = 0 ; i < GAUDI2_NUM_OF_HBM_MC_SPI_CAUSE ; i++)
		if (intr_cause_data & hbm_mc_spi[i].mask) {
			dev_dbg(hdev->dev, "HBM spi event: notification cause(%s)\n",
				hbm_mc_spi[i].cause);
			error_count++;
		}

	return error_count;
}

static void gaudi2_print_clk_change_info(struct hl_device *hdev, u16 event_type, u64 *event_mask)
{
	ktime_t zero_time = ktime_set(0, 0);

	mutex_lock(&hdev->clk_throttling.lock);

	switch (event_type) {
	case GAUDI2_EVENT_CPU_FIX_POWER_ENV_S:
		hdev->clk_throttling.current_reason |= HL_CLK_THROTTLE_POWER;
		hdev->clk_throttling.aggregated_reason |= HL_CLK_THROTTLE_POWER;
		hdev->clk_throttling.timestamp[HL_CLK_THROTTLE_TYPE_POWER].start = ktime_get();
		hdev->clk_throttling.timestamp[HL_CLK_THROTTLE_TYPE_POWER].end = zero_time;
		dev_dbg_ratelimited(hdev->dev, "Clock throttling due to power consumption\n");
		break;

	case GAUDI2_EVENT_CPU_FIX_POWER_ENV_E:
		hdev->clk_throttling.current_reason &= ~HL_CLK_THROTTLE_POWER;
		hdev->clk_throttling.timestamp[HL_CLK_THROTTLE_TYPE_POWER].end = ktime_get();
		dev_dbg_ratelimited(hdev->dev, "Power envelope is safe, back to optimal clock\n");
		break;

	case GAUDI2_EVENT_CPU_FIX_THERMAL_ENV_S:
		hdev->clk_throttling.current_reason |= HL_CLK_THROTTLE_THERMAL;
		hdev->clk_throttling.aggregated_reason |= HL_CLK_THROTTLE_THERMAL;
		hdev->clk_throttling.timestamp[HL_CLK_THROTTLE_TYPE_THERMAL].start = ktime_get();
		hdev->clk_throttling.timestamp[HL_CLK_THROTTLE_TYPE_THERMAL].end = zero_time;
		*event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR;
		dev_info_ratelimited(hdev->dev, "Clock throttling due to overheating\n");
		break;

	case GAUDI2_EVENT_CPU_FIX_THERMAL_ENV_E:
		hdev->clk_throttling.current_reason &= ~HL_CLK_THROTTLE_THERMAL;
		hdev->clk_throttling.timestamp[HL_CLK_THROTTLE_TYPE_THERMAL].end = ktime_get();
		*event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR;
		dev_info_ratelimited(hdev->dev, "Thermal envelope is safe, back to optimal clock\n");
		break;

	default:
		dev_err(hdev->dev, "Received invalid clock change event %d\n", event_type);
		break;
	}

	mutex_unlock(&hdev->clk_throttling.lock);
}

static void gaudi2_print_out_of_sync_info(struct hl_device *hdev, u16 event_type,
		struct cpucp_pkt_sync_err *sync_err)
{
	struct hl_hw_queue *q = &hdev->kernel_queues[GAUDI2_QUEUE_ID_CPU_PQ];

	gaudi2_print_event(hdev, event_type, false,
		"FW: pi=%u, ci=%u, LKD: pi=%u, ci=%d",
		le32_to_cpu(sync_err->pi), le32_to_cpu(sync_err->ci),
		q->pi, atomic_read(&q->ci));
}

static int gaudi2_handle_pcie_p2p_msix(struct hl_device *hdev, u16 event_type)
{
	u32 p2p_intr,
msix_gw_intr, error_count = 0; 9564 9565 p2p_intr = RREG32(mmPCIE_WRAP_P2P_INTR); 9566 msix_gw_intr = RREG32(mmPCIE_WRAP_MSIX_GW_INTR); 9567 9568 if (p2p_intr) { 9569 gaudi2_print_event(hdev, event_type, true, 9570 "pcie p2p transaction terminated due to security, req_id(0x%x)", 9571 RREG32(mmPCIE_WRAP_P2P_REQ_ID)); 9572 9573 WREG32(mmPCIE_WRAP_P2P_INTR, 0x1); 9574 error_count++; 9575 } 9576 9577 if (msix_gw_intr) { 9578 gaudi2_print_event(hdev, event_type, true, 9579 "pcie msi-x gen denied due to vector num check failure, vec(0x%X)", 9580 RREG32(mmPCIE_WRAP_MSIX_GW_VEC)); 9581 9582 WREG32(mmPCIE_WRAP_MSIX_GW_INTR, 0x1); 9583 error_count++; 9584 } 9585 9586 return error_count; 9587 } 9588 9589 static int gaudi2_handle_pcie_drain(struct hl_device *hdev, 9590 struct hl_eq_pcie_drain_ind_data *drain_data) 9591 { 9592 u64 cause, error_count = 0; 9593 9594 cause = le64_to_cpu(drain_data->intr_cause.intr_cause_data); 9595 9596 if (cause & BIT_ULL(0)) { 9597 dev_err_ratelimited(hdev->dev, "PCIE AXI drain LBW completed\n"); 9598 error_count++; 9599 } 9600 9601 if (cause & BIT_ULL(1)) { 9602 dev_err_ratelimited(hdev->dev, "PCIE AXI drain HBW completed\n"); 9603 error_count++; 9604 } 9605 9606 return error_count; 9607 } 9608 9609 static int gaudi2_handle_psoc_drain(struct hl_device *hdev, u64 intr_cause_data) 9610 { 9611 u32 error_count = 0; 9612 int i; 9613 9614 for (i = 0 ; i < GAUDI2_NUM_OF_AXI_DRAIN_ERR_CAUSE ; i++) { 9615 if (intr_cause_data & BIT_ULL(i)) { 9616 dev_err_ratelimited(hdev->dev, "PSOC %s completed\n", 9617 gaudi2_psoc_axi_drain_interrupts_cause[i]); 9618 error_count++; 9619 } 9620 } 9621 9622 hl_check_for_glbl_errors(hdev); 9623 9624 return error_count; 9625 } 9626 9627 static void gaudi2_print_cpu_pkt_failure_info(struct hl_device *hdev, u16 event_type, 9628 struct cpucp_pkt_sync_err *sync_err) 9629 { 9630 struct hl_hw_queue *q = &hdev->kernel_queues[GAUDI2_QUEUE_ID_CPU_PQ]; 9631 9632 gaudi2_print_event(hdev, event_type, false, 9633 "FW reported sanity check failure, FW: pi=%u, ci=%u, LKD: pi=%u, ci=%d", 9634 le32_to_cpu(sync_err->pi), le32_to_cpu(sync_err->ci), q->pi, atomic_read(&q->ci)); 9635 } 9636 9637 static int hl_arc_event_handle(struct hl_device *hdev, u16 event_type, 9638 struct hl_eq_engine_arc_intr_data *data) 9639 { 9640 struct hl_engine_arc_dccm_queue_full_irq *q; 9641 u32 intr_type, engine_id; 9642 u64 payload; 9643 9644 intr_type = le32_to_cpu(data->intr_type); 9645 engine_id = le32_to_cpu(data->engine_id); 9646 payload = le64_to_cpu(data->payload); 9647 9648 switch (intr_type) { 9649 case ENGINE_ARC_DCCM_QUEUE_FULL_IRQ: 9650 q = (struct hl_engine_arc_dccm_queue_full_irq *) &payload; 9651 9652 gaudi2_print_event(hdev, event_type, true, 9653 "ARC DCCM Full event: EngId: %u, Intr_type: %u, Qidx: %u", 9654 engine_id, intr_type, q->queue_index); 9655 return 1; 9656 default: 9657 gaudi2_print_event(hdev, event_type, true, "Unknown ARC event type"); 9658 return 0; 9659 } 9660 } 9661 9662 static u16 event_id_to_engine_id(struct hl_device *hdev, u16 event_type) 9663 { 9664 enum gaudi2_block_types type = GAUDI2_BLOCK_TYPE_MAX; 9665 u16 index; 9666 9667 switch (event_type) { 9668 case GAUDI2_EVENT_TPC0_AXI_ERR_RSP ... GAUDI2_EVENT_TPC24_AXI_ERR_RSP: 9669 index = event_type - GAUDI2_EVENT_TPC0_AXI_ERR_RSP; 9670 type = GAUDI2_BLOCK_TYPE_TPC; 9671 break; 9672 case GAUDI2_EVENT_TPC0_QM ... GAUDI2_EVENT_TPC24_QM: 9673 index = event_type - GAUDI2_EVENT_TPC0_QM; 9674 type = GAUDI2_BLOCK_TYPE_TPC; 9675 break; 9676 case GAUDI2_EVENT_MME0_SBTE0_AXI_ERR_RSP ... 
GAUDI2_EVENT_MME0_CTRL_AXI_ERROR_RESPONSE: 9677 case GAUDI2_EVENT_MME0_SPI_BASE ... GAUDI2_EVENT_MME0_WAP_SOURCE_RESULT_INVALID: 9678 case GAUDI2_EVENT_MME0_QM: 9679 index = 0; 9680 type = GAUDI2_BLOCK_TYPE_MME; 9681 break; 9682 case GAUDI2_EVENT_MME1_SBTE0_AXI_ERR_RSP ... GAUDI2_EVENT_MME1_CTRL_AXI_ERROR_RESPONSE: 9683 case GAUDI2_EVENT_MME1_SPI_BASE ... GAUDI2_EVENT_MME1_WAP_SOURCE_RESULT_INVALID: 9684 case GAUDI2_EVENT_MME1_QM: 9685 index = 1; 9686 type = GAUDI2_BLOCK_TYPE_MME; 9687 break; 9688 case GAUDI2_EVENT_MME2_SBTE0_AXI_ERR_RSP ... GAUDI2_EVENT_MME2_CTRL_AXI_ERROR_RESPONSE: 9689 case GAUDI2_EVENT_MME2_SPI_BASE ... GAUDI2_EVENT_MME2_WAP_SOURCE_RESULT_INVALID: 9690 case GAUDI2_EVENT_MME2_QM: 9691 index = 2; 9692 type = GAUDI2_BLOCK_TYPE_MME; 9693 break; 9694 case GAUDI2_EVENT_MME3_SBTE0_AXI_ERR_RSP ... GAUDI2_EVENT_MME3_CTRL_AXI_ERROR_RESPONSE: 9695 case GAUDI2_EVENT_MME3_SPI_BASE ... GAUDI2_EVENT_MME3_WAP_SOURCE_RESULT_INVALID: 9696 case GAUDI2_EVENT_MME3_QM: 9697 index = 3; 9698 type = GAUDI2_BLOCK_TYPE_MME; 9699 break; 9700 case GAUDI2_EVENT_KDMA_CH0_AXI_ERR_RSP: 9701 case GAUDI2_EVENT_KDMA_BM_SPMU: 9702 case GAUDI2_EVENT_KDMA0_CORE: 9703 return GAUDI2_ENGINE_ID_KDMA; 9704 case GAUDI2_EVENT_PDMA_CH0_AXI_ERR_RSP: 9705 case GAUDI2_EVENT_PDMA0_CORE: 9706 case GAUDI2_EVENT_PDMA0_BM_SPMU: 9707 case GAUDI2_EVENT_PDMA0_QM: 9708 return GAUDI2_ENGINE_ID_PDMA_0; 9709 case GAUDI2_EVENT_PDMA_CH1_AXI_ERR_RSP: 9710 case GAUDI2_EVENT_PDMA1_CORE: 9711 case GAUDI2_EVENT_PDMA1_BM_SPMU: 9712 case GAUDI2_EVENT_PDMA1_QM: 9713 return GAUDI2_ENGINE_ID_PDMA_1; 9714 case GAUDI2_EVENT_DEC0_AXI_ERR_RSPONSE ... GAUDI2_EVENT_DEC9_AXI_ERR_RSPONSE: 9715 index = event_type - GAUDI2_EVENT_DEC0_AXI_ERR_RSPONSE; 9716 type = GAUDI2_BLOCK_TYPE_DEC; 9717 break; 9718 case GAUDI2_EVENT_DEC0_SPI ... GAUDI2_EVENT_DEC9_BMON_SPMU: 9719 index = (event_type - GAUDI2_EVENT_DEC0_SPI) >> 1; 9720 type = GAUDI2_BLOCK_TYPE_DEC; 9721 break; 9722 case GAUDI2_EVENT_NIC0_AXI_ERROR_RESPONSE ... GAUDI2_EVENT_NIC11_AXI_ERROR_RESPONSE: 9723 index = event_type - GAUDI2_EVENT_NIC0_AXI_ERROR_RESPONSE; 9724 return GAUDI2_ENGINE_ID_NIC0_0 + (index * 2); 9725 case GAUDI2_EVENT_NIC0_QM0 ... GAUDI2_EVENT_NIC11_QM1: 9726 index = event_type - GAUDI2_EVENT_NIC0_QM0; 9727 return GAUDI2_ENGINE_ID_NIC0_0 + index; 9728 case GAUDI2_EVENT_NIC0_BMON_SPMU ... GAUDI2_EVENT_NIC11_SW_ERROR: 9729 index = event_type - GAUDI2_EVENT_NIC0_BMON_SPMU; 9730 return GAUDI2_ENGINE_ID_NIC0_0 + (index * 2); 9731 case GAUDI2_EVENT_TPC0_BMON_SPMU ... 
GAUDI2_EVENT_TPC24_KERNEL_ERR: 9732 index = (event_type - GAUDI2_EVENT_TPC0_BMON_SPMU) >> 1; 9733 type = GAUDI2_BLOCK_TYPE_TPC; 9734 break; 9735 case GAUDI2_EVENT_ROTATOR0_AXI_ERROR_RESPONSE: 9736 case GAUDI2_EVENT_ROTATOR0_BMON_SPMU: 9737 case GAUDI2_EVENT_ROTATOR0_ROT0_QM: 9738 return GAUDI2_ENGINE_ID_ROT_0; 9739 case GAUDI2_EVENT_ROTATOR1_AXI_ERROR_RESPONSE: 9740 case GAUDI2_EVENT_ROTATOR1_BMON_SPMU: 9741 case GAUDI2_EVENT_ROTATOR1_ROT1_QM: 9742 return GAUDI2_ENGINE_ID_ROT_1; 9743 case GAUDI2_EVENT_HDMA0_BM_SPMU: 9744 case GAUDI2_EVENT_HDMA0_QM: 9745 case GAUDI2_EVENT_HDMA0_CORE: 9746 return GAUDI2_DCORE0_ENGINE_ID_EDMA_0; 9747 case GAUDI2_EVENT_HDMA1_BM_SPMU: 9748 case GAUDI2_EVENT_HDMA1_QM: 9749 case GAUDI2_EVENT_HDMA1_CORE: 9750 return GAUDI2_DCORE0_ENGINE_ID_EDMA_1; 9751 case GAUDI2_EVENT_HDMA2_BM_SPMU: 9752 case GAUDI2_EVENT_HDMA2_QM: 9753 case GAUDI2_EVENT_HDMA2_CORE: 9754 return GAUDI2_DCORE1_ENGINE_ID_EDMA_0; 9755 case GAUDI2_EVENT_HDMA3_BM_SPMU: 9756 case GAUDI2_EVENT_HDMA3_QM: 9757 case GAUDI2_EVENT_HDMA3_CORE: 9758 return GAUDI2_DCORE1_ENGINE_ID_EDMA_1; 9759 case GAUDI2_EVENT_HDMA4_BM_SPMU: 9760 case GAUDI2_EVENT_HDMA4_QM: 9761 case GAUDI2_EVENT_HDMA4_CORE: 9762 return GAUDI2_DCORE2_ENGINE_ID_EDMA_0; 9763 case GAUDI2_EVENT_HDMA5_BM_SPMU: 9764 case GAUDI2_EVENT_HDMA5_QM: 9765 case GAUDI2_EVENT_HDMA5_CORE: 9766 return GAUDI2_DCORE2_ENGINE_ID_EDMA_1; 9767 case GAUDI2_EVENT_HDMA6_BM_SPMU: 9768 case GAUDI2_EVENT_HDMA6_QM: 9769 case GAUDI2_EVENT_HDMA6_CORE: 9770 return GAUDI2_DCORE3_ENGINE_ID_EDMA_0; 9771 case GAUDI2_EVENT_HDMA7_BM_SPMU: 9772 case GAUDI2_EVENT_HDMA7_QM: 9773 case GAUDI2_EVENT_HDMA7_CORE: 9774 return GAUDI2_DCORE3_ENGINE_ID_EDMA_1; 9775 default: 9776 break; 9777 } 9778 9779 switch (type) { 9780 case GAUDI2_BLOCK_TYPE_TPC: 9781 switch (index) { 9782 case TPC_ID_DCORE0_TPC0 ... TPC_ID_DCORE0_TPC5: 9783 return GAUDI2_DCORE0_ENGINE_ID_TPC_0 + index; 9784 case TPC_ID_DCORE1_TPC0 ... TPC_ID_DCORE1_TPC5: 9785 return GAUDI2_DCORE1_ENGINE_ID_TPC_0 + index - TPC_ID_DCORE1_TPC0; 9786 case TPC_ID_DCORE2_TPC0 ... TPC_ID_DCORE2_TPC5: 9787 return GAUDI2_DCORE2_ENGINE_ID_TPC_0 + index - TPC_ID_DCORE2_TPC0; 9788 case TPC_ID_DCORE3_TPC0 ... 
TPC_ID_DCORE3_TPC5: 9789 return GAUDI2_DCORE3_ENGINE_ID_TPC_0 + index - TPC_ID_DCORE3_TPC0; 9790 default: 9791 break; 9792 } 9793 break; 9794 case GAUDI2_BLOCK_TYPE_MME: 9795 switch (index) { 9796 case MME_ID_DCORE0: return GAUDI2_DCORE0_ENGINE_ID_MME; 9797 case MME_ID_DCORE1: return GAUDI2_DCORE1_ENGINE_ID_MME; 9798 case MME_ID_DCORE2: return GAUDI2_DCORE2_ENGINE_ID_MME; 9799 case MME_ID_DCORE3: return GAUDI2_DCORE3_ENGINE_ID_MME; 9800 default: 9801 break; 9802 } 9803 break; 9804 case GAUDI2_BLOCK_TYPE_DEC: 9805 switch (index) { 9806 case DEC_ID_DCORE0_DEC0: return GAUDI2_DCORE0_ENGINE_ID_DEC_0; 9807 case DEC_ID_DCORE0_DEC1: return GAUDI2_DCORE0_ENGINE_ID_DEC_1; 9808 case DEC_ID_DCORE1_DEC0: return GAUDI2_DCORE1_ENGINE_ID_DEC_0; 9809 case DEC_ID_DCORE1_DEC1: return GAUDI2_DCORE1_ENGINE_ID_DEC_1; 9810 case DEC_ID_DCORE2_DEC0: return GAUDI2_DCORE2_ENGINE_ID_DEC_0; 9811 case DEC_ID_DCORE2_DEC1: return GAUDI2_DCORE2_ENGINE_ID_DEC_1; 9812 case DEC_ID_DCORE3_DEC0: return GAUDI2_DCORE3_ENGINE_ID_DEC_0; 9813 case DEC_ID_DCORE3_DEC1: return GAUDI2_DCORE3_ENGINE_ID_DEC_1; 9814 case DEC_ID_PCIE_VDEC0: return GAUDI2_PCIE_ENGINE_ID_DEC_0; 9815 case DEC_ID_PCIE_VDEC1: return GAUDI2_PCIE_ENGINE_ID_DEC_1; 9816 default: 9817 break; 9818 } 9819 break; 9820 default: 9821 break; 9822 } 9823 9824 return U16_MAX; 9825 } 9826 9827 static void hl_eq_heartbeat_event_handle(struct hl_device *hdev) 9828 { 9829 hdev->eq_heartbeat_received = true; 9830 } 9831 9832 static void gaudi2_handle_eqe(struct hl_device *hdev, struct hl_eq_entry *eq_entry) 9833 { 9834 struct gaudi2_device *gaudi2 = hdev->asic_specific; 9835 bool reset_required = false, is_critical = false; 9836 u32 index, ctl, reset_flags = 0, error_count = 0; 9837 u64 event_mask = 0; 9838 u16 event_type; 9839 9840 ctl = le32_to_cpu(eq_entry->hdr.ctl); 9841 event_type = ((ctl & EQ_CTL_EVENT_TYPE_MASK) >> EQ_CTL_EVENT_TYPE_SHIFT); 9842 9843 if (event_type >= GAUDI2_EVENT_SIZE) { 9844 dev_err(hdev->dev, "Event type %u exceeds maximum of %u", 9845 event_type, GAUDI2_EVENT_SIZE - 1); 9846 return; 9847 } 9848 9849 gaudi2->events_stat[event_type]++; 9850 gaudi2->events_stat_aggregate[event_type]++; 9851 9852 switch (event_type) { 9853 case GAUDI2_EVENT_PCIE_CORE_SERR ... GAUDI2_EVENT_ARC0_ECC_DERR: 9854 fallthrough; 9855 case GAUDI2_EVENT_ROTATOR0_SERR ... GAUDI2_EVENT_ROTATOR1_DERR: 9856 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 9857 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 9858 reset_required = gaudi2_handle_ecc_event(hdev, event_type, &eq_entry->ecc_data); 9859 is_critical = eq_entry->ecc_data.is_critical; 9860 error_count++; 9861 break; 9862 9863 case GAUDI2_EVENT_TPC0_QM ... GAUDI2_EVENT_PDMA1_QM: 9864 fallthrough; 9865 case GAUDI2_EVENT_ROTATOR0_ROT0_QM ... GAUDI2_EVENT_ROTATOR1_ROT1_QM: 9866 fallthrough; 9867 case GAUDI2_EVENT_NIC0_QM0 ... 
GAUDI2_EVENT_NIC11_QM1: 9868 error_count = gaudi2_handle_qman_err(hdev, event_type, &event_mask); 9869 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9870 break; 9871 9872 case GAUDI2_EVENT_ARC_AXI_ERROR_RESPONSE_0: 9873 error_count = gaudi2_handle_arc_farm_sei_err(hdev, event_type, &event_mask); 9874 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9875 break; 9876 9877 case GAUDI2_EVENT_CPU_AXI_ERR_RSP: 9878 error_count = gaudi2_handle_cpu_sei_err(hdev, event_type); 9879 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 9880 event_mask |= HL_NOTIFIER_EVENT_CRITICL_FW_ERR; 9881 break; 9882 9883 case GAUDI2_EVENT_PDMA_CH0_AXI_ERR_RSP: 9884 case GAUDI2_EVENT_PDMA_CH1_AXI_ERR_RSP: 9885 error_count = gaudi2_handle_qm_sei_err(hdev, event_type, true, &event_mask); 9886 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9887 break; 9888 9889 case GAUDI2_EVENT_ROTATOR0_AXI_ERROR_RESPONSE: 9890 case GAUDI2_EVENT_ROTATOR1_AXI_ERROR_RESPONSE: 9891 index = event_type - GAUDI2_EVENT_ROTATOR0_AXI_ERROR_RESPONSE; 9892 error_count = gaudi2_handle_rot_err(hdev, index, event_type, 9893 &eq_entry->razwi_with_intr_cause, &event_mask); 9894 error_count += gaudi2_handle_qm_sei_err(hdev, event_type, false, &event_mask); 9895 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9896 break; 9897 9898 case GAUDI2_EVENT_TPC0_AXI_ERR_RSP ... GAUDI2_EVENT_TPC24_AXI_ERR_RSP: 9899 index = event_type - GAUDI2_EVENT_TPC0_AXI_ERR_RSP; 9900 error_count = gaudi2_tpc_ack_interrupts(hdev, index, event_type, 9901 &eq_entry->razwi_with_intr_cause, &event_mask); 9902 error_count += gaudi2_handle_qm_sei_err(hdev, event_type, false, &event_mask); 9903 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9904 break; 9905 9906 case GAUDI2_EVENT_DEC0_AXI_ERR_RSPONSE ... GAUDI2_EVENT_DEC9_AXI_ERR_RSPONSE: 9907 index = event_type - GAUDI2_EVENT_DEC0_AXI_ERR_RSPONSE; 9908 error_count = gaudi2_handle_dec_err(hdev, index, event_type, &event_mask); 9909 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9910 break; 9911 9912 case GAUDI2_EVENT_TPC0_KERNEL_ERR: 9913 case GAUDI2_EVENT_TPC1_KERNEL_ERR: 9914 case GAUDI2_EVENT_TPC2_KERNEL_ERR: 9915 case GAUDI2_EVENT_TPC3_KERNEL_ERR: 9916 case GAUDI2_EVENT_TPC4_KERNEL_ERR: 9917 case GAUDI2_EVENT_TPC5_KERNEL_ERR: 9918 case GAUDI2_EVENT_TPC6_KERNEL_ERR: 9919 case GAUDI2_EVENT_TPC7_KERNEL_ERR: 9920 case GAUDI2_EVENT_TPC8_KERNEL_ERR: 9921 case GAUDI2_EVENT_TPC9_KERNEL_ERR: 9922 case GAUDI2_EVENT_TPC10_KERNEL_ERR: 9923 case GAUDI2_EVENT_TPC11_KERNEL_ERR: 9924 case GAUDI2_EVENT_TPC12_KERNEL_ERR: 9925 case GAUDI2_EVENT_TPC13_KERNEL_ERR: 9926 case GAUDI2_EVENT_TPC14_KERNEL_ERR: 9927 case GAUDI2_EVENT_TPC15_KERNEL_ERR: 9928 case GAUDI2_EVENT_TPC16_KERNEL_ERR: 9929 case GAUDI2_EVENT_TPC17_KERNEL_ERR: 9930 case GAUDI2_EVENT_TPC18_KERNEL_ERR: 9931 case GAUDI2_EVENT_TPC19_KERNEL_ERR: 9932 case GAUDI2_EVENT_TPC20_KERNEL_ERR: 9933 case GAUDI2_EVENT_TPC21_KERNEL_ERR: 9934 case GAUDI2_EVENT_TPC22_KERNEL_ERR: 9935 case GAUDI2_EVENT_TPC23_KERNEL_ERR: 9936 case GAUDI2_EVENT_TPC24_KERNEL_ERR: 9937 index = (event_type - GAUDI2_EVENT_TPC0_KERNEL_ERR) / 9938 (GAUDI2_EVENT_TPC1_KERNEL_ERR - GAUDI2_EVENT_TPC0_KERNEL_ERR); 9939 error_count = gaudi2_tpc_ack_interrupts(hdev, index, event_type, 9940 &eq_entry->razwi_with_intr_cause, &event_mask); 9941 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9942 break; 9943 9944 case GAUDI2_EVENT_DEC0_SPI: 9945 case GAUDI2_EVENT_DEC1_SPI: 9946 case GAUDI2_EVENT_DEC2_SPI: 9947 case GAUDI2_EVENT_DEC3_SPI: 9948 case GAUDI2_EVENT_DEC4_SPI: 9949 case GAUDI2_EVENT_DEC5_SPI: 9950 case GAUDI2_EVENT_DEC6_SPI: 
9951 case GAUDI2_EVENT_DEC7_SPI: 9952 case GAUDI2_EVENT_DEC8_SPI: 9953 case GAUDI2_EVENT_DEC9_SPI: 9954 index = (event_type - GAUDI2_EVENT_DEC0_SPI) / 9955 (GAUDI2_EVENT_DEC1_SPI - GAUDI2_EVENT_DEC0_SPI); 9956 error_count = gaudi2_handle_dec_err(hdev, index, event_type, &event_mask); 9957 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9958 break; 9959 9960 case GAUDI2_EVENT_MME0_CTRL_AXI_ERROR_RESPONSE: 9961 case GAUDI2_EVENT_MME1_CTRL_AXI_ERROR_RESPONSE: 9962 case GAUDI2_EVENT_MME2_CTRL_AXI_ERROR_RESPONSE: 9963 case GAUDI2_EVENT_MME3_CTRL_AXI_ERROR_RESPONSE: 9964 index = (event_type - GAUDI2_EVENT_MME0_CTRL_AXI_ERROR_RESPONSE) / 9965 (GAUDI2_EVENT_MME1_CTRL_AXI_ERROR_RESPONSE - 9966 GAUDI2_EVENT_MME0_CTRL_AXI_ERROR_RESPONSE); 9967 error_count = gaudi2_handle_mme_err(hdev, index, event_type, &event_mask); 9968 error_count += gaudi2_handle_qm_sei_err(hdev, event_type, false, &event_mask); 9969 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9970 break; 9971 9972 case GAUDI2_EVENT_MME0_QMAN_SW_ERROR: 9973 case GAUDI2_EVENT_MME1_QMAN_SW_ERROR: 9974 case GAUDI2_EVENT_MME2_QMAN_SW_ERROR: 9975 case GAUDI2_EVENT_MME3_QMAN_SW_ERROR: 9976 index = (event_type - GAUDI2_EVENT_MME0_QMAN_SW_ERROR) / 9977 (GAUDI2_EVENT_MME1_QMAN_SW_ERROR - 9978 GAUDI2_EVENT_MME0_QMAN_SW_ERROR); 9979 error_count = gaudi2_handle_mme_err(hdev, index, event_type, &event_mask); 9980 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9981 break; 9982 9983 case GAUDI2_EVENT_MME0_WAP_SOURCE_RESULT_INVALID: 9984 case GAUDI2_EVENT_MME1_WAP_SOURCE_RESULT_INVALID: 9985 case GAUDI2_EVENT_MME2_WAP_SOURCE_RESULT_INVALID: 9986 case GAUDI2_EVENT_MME3_WAP_SOURCE_RESULT_INVALID: 9987 index = (event_type - GAUDI2_EVENT_MME0_WAP_SOURCE_RESULT_INVALID) / 9988 (GAUDI2_EVENT_MME1_WAP_SOURCE_RESULT_INVALID - 9989 GAUDI2_EVENT_MME0_WAP_SOURCE_RESULT_INVALID); 9990 error_count = gaudi2_handle_mme_wap_err(hdev, index, event_type, &event_mask); 9991 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 9992 break; 9993 9994 case GAUDI2_EVENT_KDMA_CH0_AXI_ERR_RSP: 9995 case GAUDI2_EVENT_KDMA0_CORE: 9996 error_count = gaudi2_handle_kdma_core_event(hdev, event_type, 9997 le64_to_cpu(eq_entry->intr_cause.intr_cause_data)); 9998 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 9999 break; 10000 10001 case GAUDI2_EVENT_HDMA2_CORE ... GAUDI2_EVENT_HDMA5_CORE: 10002 error_count = gaudi2_handle_dma_core_event(hdev, event_type, 10003 le64_to_cpu(eq_entry->intr_cause.intr_cause_data)); 10004 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 10005 break; 10006 10007 case GAUDI2_EVENT_PDMA0_CORE ... GAUDI2_EVENT_PDMA1_CORE: 10008 error_count = gaudi2_handle_dma_core_event(hdev, event_type, 10009 le64_to_cpu(eq_entry->intr_cause.intr_cause_data)); 10010 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 10011 break; 10012 10013 case GAUDI2_EVENT_PCIE_ADDR_DEC_ERR: 10014 error_count = gaudi2_print_pcie_addr_dec_info(hdev, event_type, 10015 le64_to_cpu(eq_entry->intr_cause.intr_cause_data), &event_mask); 10016 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10017 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10018 break; 10019 10020 case GAUDI2_EVENT_HMMU0_PAGE_FAULT_OR_WR_PERM ... GAUDI2_EVENT_HMMU12_SECURITY_ERROR: 10021 case GAUDI2_EVENT_HMMU_0_AXI_ERR_RSP ... GAUDI2_EVENT_HMMU_12_AXI_ERR_RSP: 10022 case GAUDI2_EVENT_PMMU0_PAGE_FAULT_WR_PERM ... 
GAUDI2_EVENT_PMMU0_SECURITY_ERROR: 10023 case GAUDI2_EVENT_PMMU_AXI_ERR_RSP_0: 10024 error_count = gaudi2_handle_mmu_spi_sei_err(hdev, event_type, &event_mask); 10025 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10026 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 10027 break; 10028 10029 case GAUDI2_EVENT_HIF0_FATAL ... GAUDI2_EVENT_HIF12_FATAL: 10030 error_count = gaudi2_handle_hif_fatal(hdev, event_type, 10031 le64_to_cpu(eq_entry->intr_cause.intr_cause_data)); 10032 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10033 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10034 break; 10035 10036 case GAUDI2_EVENT_PMMU_FATAL_0: 10037 error_count = gaudi2_handle_pif_fatal(hdev, event_type, 10038 le64_to_cpu(eq_entry->intr_cause.intr_cause_data)); 10039 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10040 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10041 break; 10042 10043 case GAUDI2_EVENT_PSOC63_RAZWI_OR_PID_MIN_MAX_INTERRUPT: 10044 error_count = gaudi2_ack_psoc_razwi_event_handler(hdev, &event_mask); 10045 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 10046 break; 10047 10048 case GAUDI2_EVENT_HBM0_MC0_SEI_SEVERE ... GAUDI2_EVENT_HBM5_MC1_SEI_NON_SEVERE: 10049 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10050 if (gaudi2_handle_hbm_mc_sei_err(hdev, event_type, &eq_entry->sei_data)) { 10051 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10052 reset_required = true; 10053 } 10054 error_count++; 10055 break; 10056 10057 case GAUDI2_EVENT_HBM_CATTRIP_0 ... GAUDI2_EVENT_HBM_CATTRIP_5: 10058 error_count = gaudi2_handle_hbm_cattrip(hdev, event_type, 10059 le64_to_cpu(eq_entry->intr_cause.intr_cause_data)); 10060 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10061 break; 10062 10063 case GAUDI2_EVENT_HBM0_MC0_SPI ... GAUDI2_EVENT_HBM5_MC1_SPI: 10064 error_count = gaudi2_handle_hbm_mc_spi(hdev, 10065 le64_to_cpu(eq_entry->intr_cause.intr_cause_data)); 10066 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10067 break; 10068 10069 case GAUDI2_EVENT_PCIE_DRAIN_COMPLETE: 10070 error_count = gaudi2_handle_pcie_drain(hdev, &eq_entry->pcie_drain_ind_data); 10071 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10072 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10073 if (hl_is_fw_sw_ver_equal_or_greater(hdev, 1, 13)) 10074 is_critical = true; 10075 break; 10076 10077 case GAUDI2_EVENT_PSOC59_RPM_ERROR_OR_DRAIN: 10078 error_count = gaudi2_handle_psoc_drain(hdev, 10079 le64_to_cpu(eq_entry->intr_cause.intr_cause_data)); 10080 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10081 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10082 break; 10083 10084 case GAUDI2_EVENT_CPU_AXI_ECC: 10085 error_count = GAUDI2_NA_EVENT_CAUSE; 10086 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10087 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10088 break; 10089 case GAUDI2_EVENT_CPU_L2_RAM_ECC: 10090 error_count = GAUDI2_NA_EVENT_CAUSE; 10091 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10092 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10093 break; 10094 case GAUDI2_EVENT_MME0_SBTE0_AXI_ERR_RSP ... GAUDI2_EVENT_MME0_SBTE4_AXI_ERR_RSP: 10095 case GAUDI2_EVENT_MME1_SBTE0_AXI_ERR_RSP ... GAUDI2_EVENT_MME1_SBTE4_AXI_ERR_RSP: 10096 case GAUDI2_EVENT_MME2_SBTE0_AXI_ERR_RSP ... GAUDI2_EVENT_MME2_SBTE4_AXI_ERR_RSP: 10097 case GAUDI2_EVENT_MME3_SBTE0_AXI_ERR_RSP ... GAUDI2_EVENT_MME3_SBTE4_AXI_ERR_RSP: 10098 error_count = gaudi2_handle_mme_sbte_err(hdev, event_type); 10099 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 10100 break; 10101 case GAUDI2_EVENT_VM0_ALARM_A ... 
GAUDI2_EVENT_VM3_ALARM_B: 10102 error_count = GAUDI2_NA_EVENT_CAUSE; 10103 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10104 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10105 break; 10106 case GAUDI2_EVENT_PSOC_AXI_ERR_RSP: 10107 error_count = GAUDI2_NA_EVENT_CAUSE; 10108 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10109 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10110 break; 10111 case GAUDI2_EVENT_PSOC_PRSTN_FALL: 10112 error_count = GAUDI2_NA_EVENT_CAUSE; 10113 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10114 break; 10115 case GAUDI2_EVENT_PCIE_APB_TIMEOUT: 10116 error_count = GAUDI2_NA_EVENT_CAUSE; 10117 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10118 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10119 break; 10120 case GAUDI2_EVENT_PCIE_FATAL_ERR: 10121 error_count = GAUDI2_NA_EVENT_CAUSE; 10122 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10123 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10124 break; 10125 case GAUDI2_EVENT_TPC0_BMON_SPMU: 10126 case GAUDI2_EVENT_TPC1_BMON_SPMU: 10127 case GAUDI2_EVENT_TPC2_BMON_SPMU: 10128 case GAUDI2_EVENT_TPC3_BMON_SPMU: 10129 case GAUDI2_EVENT_TPC4_BMON_SPMU: 10130 case GAUDI2_EVENT_TPC5_BMON_SPMU: 10131 case GAUDI2_EVENT_TPC6_BMON_SPMU: 10132 case GAUDI2_EVENT_TPC7_BMON_SPMU: 10133 case GAUDI2_EVENT_TPC8_BMON_SPMU: 10134 case GAUDI2_EVENT_TPC9_BMON_SPMU: 10135 case GAUDI2_EVENT_TPC10_BMON_SPMU: 10136 case GAUDI2_EVENT_TPC11_BMON_SPMU: 10137 case GAUDI2_EVENT_TPC12_BMON_SPMU: 10138 case GAUDI2_EVENT_TPC13_BMON_SPMU: 10139 case GAUDI2_EVENT_TPC14_BMON_SPMU: 10140 case GAUDI2_EVENT_TPC15_BMON_SPMU: 10141 case GAUDI2_EVENT_TPC16_BMON_SPMU: 10142 case GAUDI2_EVENT_TPC17_BMON_SPMU: 10143 case GAUDI2_EVENT_TPC18_BMON_SPMU: 10144 case GAUDI2_EVENT_TPC19_BMON_SPMU: 10145 case GAUDI2_EVENT_TPC20_BMON_SPMU: 10146 case GAUDI2_EVENT_TPC21_BMON_SPMU: 10147 case GAUDI2_EVENT_TPC22_BMON_SPMU: 10148 case GAUDI2_EVENT_TPC23_BMON_SPMU: 10149 case GAUDI2_EVENT_TPC24_BMON_SPMU: 10150 case GAUDI2_EVENT_MME0_CTRL_BMON_SPMU: 10151 case GAUDI2_EVENT_MME0_SBTE_BMON_SPMU: 10152 case GAUDI2_EVENT_MME0_WAP_BMON_SPMU: 10153 case GAUDI2_EVENT_MME1_CTRL_BMON_SPMU: 10154 case GAUDI2_EVENT_MME1_SBTE_BMON_SPMU: 10155 case GAUDI2_EVENT_MME1_WAP_BMON_SPMU: 10156 case GAUDI2_EVENT_MME2_CTRL_BMON_SPMU: 10157 case GAUDI2_EVENT_MME2_SBTE_BMON_SPMU: 10158 case GAUDI2_EVENT_MME2_WAP_BMON_SPMU: 10159 case GAUDI2_EVENT_MME3_CTRL_BMON_SPMU: 10160 case GAUDI2_EVENT_MME3_SBTE_BMON_SPMU: 10161 case GAUDI2_EVENT_MME3_WAP_BMON_SPMU: 10162 case GAUDI2_EVENT_HDMA2_BM_SPMU ... GAUDI2_EVENT_PDMA1_BM_SPMU: 10163 fallthrough; 10164 case GAUDI2_EVENT_DEC0_BMON_SPMU: 10165 case GAUDI2_EVENT_DEC1_BMON_SPMU: 10166 case GAUDI2_EVENT_DEC2_BMON_SPMU: 10167 case GAUDI2_EVENT_DEC3_BMON_SPMU: 10168 case GAUDI2_EVENT_DEC4_BMON_SPMU: 10169 case GAUDI2_EVENT_DEC5_BMON_SPMU: 10170 case GAUDI2_EVENT_DEC6_BMON_SPMU: 10171 case GAUDI2_EVENT_DEC7_BMON_SPMU: 10172 case GAUDI2_EVENT_DEC8_BMON_SPMU: 10173 case GAUDI2_EVENT_DEC9_BMON_SPMU: 10174 case GAUDI2_EVENT_ROTATOR0_BMON_SPMU ... 
GAUDI2_EVENT_SM3_BMON_SPMU: 10175 error_count = GAUDI2_NA_EVENT_CAUSE; 10176 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 10177 break; 10178 10179 case GAUDI2_EVENT_CPU_FIX_POWER_ENV_S: 10180 case GAUDI2_EVENT_CPU_FIX_POWER_ENV_E: 10181 case GAUDI2_EVENT_CPU_FIX_THERMAL_ENV_S: 10182 case GAUDI2_EVENT_CPU_FIX_THERMAL_ENV_E: 10183 gaudi2_print_clk_change_info(hdev, event_type, &event_mask); 10184 error_count = GAUDI2_NA_EVENT_CAUSE; 10185 break; 10186 10187 case GAUDI2_EVENT_CPU_PKT_QUEUE_OUT_SYNC: 10188 gaudi2_print_out_of_sync_info(hdev, event_type, &eq_entry->pkt_sync_err); 10189 error_count = GAUDI2_NA_EVENT_CAUSE; 10190 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10191 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10192 break; 10193 10194 case GAUDI2_EVENT_PCIE_FLR_REQUESTED: 10195 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10196 error_count = GAUDI2_NA_EVENT_CAUSE; 10197 /* Do nothing- FW will handle it */ 10198 break; 10199 10200 case GAUDI2_EVENT_PCIE_P2P_MSIX: 10201 error_count = gaudi2_handle_pcie_p2p_msix(hdev, event_type); 10202 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 10203 break; 10204 10205 case GAUDI2_EVENT_SM0_AXI_ERROR_RESPONSE ... GAUDI2_EVENT_SM3_AXI_ERROR_RESPONSE: 10206 index = event_type - GAUDI2_EVENT_SM0_AXI_ERROR_RESPONSE; 10207 error_count = gaudi2_handle_sm_err(hdev, event_type, index); 10208 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 10209 break; 10210 10211 case GAUDI2_EVENT_PSOC_MME_PLL_LOCK_ERR ... GAUDI2_EVENT_DCORE2_HBM_PLL_LOCK_ERR: 10212 error_count = GAUDI2_NA_EVENT_CAUSE; 10213 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10214 break; 10215 10216 case GAUDI2_EVENT_CPU_CPLD_SHUTDOWN_CAUSE: 10217 dev_info(hdev->dev, "CPLD shutdown cause, reset reason: 0x%llx\n", 10218 le64_to_cpu(eq_entry->data[0])); 10219 error_count = GAUDI2_NA_EVENT_CAUSE; 10220 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10221 break; 10222 case GAUDI2_EVENT_CPU_CPLD_SHUTDOWN_EVENT: 10223 dev_err(hdev->dev, "CPLD shutdown event, reset reason: 0x%llx\n", 10224 le64_to_cpu(eq_entry->data[0])); 10225 error_count = GAUDI2_NA_EVENT_CAUSE; 10226 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10227 break; 10228 10229 case GAUDI2_EVENT_CPU_PKT_SANITY_FAILED: 10230 gaudi2_print_cpu_pkt_failure_info(hdev, event_type, &eq_entry->pkt_sync_err); 10231 error_count = GAUDI2_NA_EVENT_CAUSE; 10232 reset_flags |= HL_DRV_RESET_FW_FATAL_ERR; 10233 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10234 break; 10235 10236 case GAUDI2_EVENT_ARC_DCCM_FULL: 10237 error_count = hl_arc_event_handle(hdev, event_type, &eq_entry->arc_data); 10238 event_mask |= HL_NOTIFIER_EVENT_USER_ENGINE_ERR; 10239 break; 10240 10241 case GAUDI2_EVENT_CPU_FP32_NOT_SUPPORTED: 10242 case GAUDI2_EVENT_CPU_DEV_RESET_REQ: 10243 event_mask |= HL_NOTIFIER_EVENT_GENERAL_HW_ERR; 10244 error_count = GAUDI2_NA_EVENT_CAUSE; 10245 is_critical = true; 10246 break; 10247 10248 case GAUDI2_EVENT_ARC_PWR_BRK_ENTRY: 10249 case GAUDI2_EVENT_ARC_PWR_BRK_EXT: 10250 case GAUDI2_EVENT_ARC_PWR_RD_MODE0: 10251 case GAUDI2_EVENT_ARC_PWR_RD_MODE1: 10252 case GAUDI2_EVENT_ARC_PWR_RD_MODE2: 10253 case GAUDI2_EVENT_ARC_PWR_RD_MODE3: 10254 error_count = GAUDI2_NA_EVENT_CAUSE; 10255 dev_info_ratelimited(hdev->dev, "%s event received\n", 10256 gaudi2_irq_map_table[event_type].name); 10257 break; 10258 10259 case GAUDI2_EVENT_ARC_EQ_HEARTBEAT: 10260 hl_eq_heartbeat_event_handle(hdev); 10261 error_count = GAUDI2_NA_EVENT_CAUSE; 10262 break; 10263 default: 10264 if (gaudi2_irq_map_table[event_type].valid) { 10265 
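			/* Valid event with no dedicated handler: report it here; the common
			 * unmask/notify handling after the switch still runs for it.
			 */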
dev_err_ratelimited(hdev->dev, "Cannot find handler for event %d\n", 10266 event_type); 10267 error_count = GAUDI2_NA_EVENT_CAUSE; 10268 } 10269 } 10270 10271 if (event_mask & HL_NOTIFIER_EVENT_USER_ENGINE_ERR) 10272 hl_capture_engine_err(hdev, event_id_to_engine_id(hdev, event_type), error_count); 10273 10274 /* Make sure to dump an error in case no error cause was printed so far. 10275 * Note that although we have counted the errors, we use this number as 10276 * a boolean. 10277 */ 10278 if (error_count == GAUDI2_NA_EVENT_CAUSE && !is_info_event(event_type)) 10279 gaudi2_print_event(hdev, event_type, true, "%d", event_type); 10280 else if (error_count == 0) 10281 gaudi2_print_event(hdev, event_type, true, 10282 "No error cause for H/W event %u", event_type); 10283 10284 if ((gaudi2_irq_map_table[event_type].reset != EVENT_RESET_TYPE_NONE) || 10285 reset_required) { 10286 if (reset_required || 10287 (gaudi2_irq_map_table[event_type].reset == EVENT_RESET_TYPE_HARD)) 10288 reset_flags |= HL_DRV_RESET_HARD; 10289 10290 if (hdev->hard_reset_on_fw_events || 10291 (hdev->asic_prop.fw_security_enabled && is_critical)) 10292 goto reset_device; 10293 } 10294 10295 /* Send unmask irq only for interrupts not classified as MSG */ 10296 if (!gaudi2_irq_map_table[event_type].msg) 10297 hl_fw_unmask_irq(hdev, event_type); 10298 10299 if (event_mask) 10300 hl_notifier_event_send_all(hdev, event_mask); 10301 10302 return; 10303 10304 reset_device: 10305 if (hdev->asic_prop.fw_security_enabled && is_critical) { 10306 reset_flags |= HL_DRV_RESET_BYPASS_REQ_TO_FW; 10307 event_mask |= HL_NOTIFIER_EVENT_DEVICE_UNAVAILABLE; 10308 } else { 10309 reset_flags |= HL_DRV_RESET_DELAY; 10310 } 10311 /* escalate general hw errors to critical/fatal error */ 10312 if (event_mask & HL_NOTIFIER_EVENT_GENERAL_HW_ERR) 10313 hl_handle_critical_hw_err(hdev, event_type, &event_mask); 10314 10315 event_mask |= HL_NOTIFIER_EVENT_DEVICE_RESET; 10316 hl_device_cond_reset(hdev, reset_flags, event_mask); 10317 } 10318 10319 static int gaudi2_memset_memory_chunk_using_edma_qm(struct hl_device *hdev, 10320 struct packet_lin_dma *lin_dma_pkt, 10321 u64 phys_addr, u32 hw_queue_id, u32 size, u64 addr, u32 val) 10322 { 10323 u32 ctl, pkt_size; 10324 int rc = 0, i; 10325 10326 ctl = FIELD_PREP(GAUDI2_PKT_CTL_OPCODE_MASK, PACKET_LIN_DMA); 10327 ctl |= FIELD_PREP(GAUDI2_PKT_LIN_DMA_CTL_MEMSET_MASK, 1); 10328 ctl |= FIELD_PREP(GAUDI2_PKT_LIN_DMA_CTL_WRCOMP_MASK, 1); 10329 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_EB_MASK, 1); 10330 10331 lin_dma_pkt->ctl = cpu_to_le32(ctl); 10332 lin_dma_pkt->src_addr = cpu_to_le64(val); 10333 lin_dma_pkt->dst_addr = cpu_to_le64(addr); 10334 lin_dma_pkt->tsize = cpu_to_le32(size); 10335 10336 pkt_size = sizeof(struct packet_lin_dma); 10337 10338 for (i = 0; i < 3; i++) { 10339 rc = hdev->asic_funcs->access_dev_mem(hdev, PCI_REGION_DRAM, 10340 phys_addr + (i * sizeof(u64)), 10341 ((u64 *)(lin_dma_pkt)) + i, DEBUGFS_WRITE64); 10342 if (rc) { 10343 dev_err(hdev->dev, "Failed to copy lin_dma packet to HBM (%#llx)\n", 10344 phys_addr); 10345 return rc; 10346 } 10347 } 10348 10349 rc = hl_hw_queue_send_cb_no_cmpl(hdev, hw_queue_id, pkt_size, phys_addr); 10350 if (rc) 10351 dev_err(hdev->dev, "Failed to send lin_dma packet to H/W queue %d\n", 10352 hw_queue_id); 10353 10354 return rc; 10355 } 10356 10357 static int gaudi2_memset_device_memory(struct hl_device *hdev, u64 addr, u64 size, u64 val) 10358 { 10359 u32 edma_queues_id[] = {GAUDI2_QUEUE_ID_DCORE0_EDMA_0_0, 10360 GAUDI2_QUEUE_ID_DCORE1_EDMA_0_0, 10361 
GAUDI2_QUEUE_ID_DCORE2_EDMA_0_0,
					GAUDI2_QUEUE_ID_DCORE3_EDMA_0_0};
	u32 chunk_size, dcore, edma_idx, sob_offset, sob_addr, comp_val,
		old_mmubp, mmubp, num_of_pkts, busy, pkt_size, cb_len;
	u64 comp_addr, cur_addr = addr, end_addr = addr + size;
	struct asic_fixed_properties *prop = &hdev->asic_prop;
	int rc = 0, dma_num = 0, i;
	void *lin_dma_pkts_arr;

	if (prop->edma_enabled_mask == 0) {
		dev_info(hdev->dev, "none of the EDMA engines is enabled - skipping DRAM scrubbing\n");
		return -EIO;
	}

	sob_offset = hdev->asic_prop.first_available_user_sob[0] * 4;
	sob_addr = mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + sob_offset;
	comp_addr = CFG_BASE + sob_addr;
	comp_val = FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_SOB_OBJ_INC_MASK, 1) |
		FIELD_PREP(DCORE0_SYNC_MNGR_OBJS_SOB_OBJ_VAL_MASK, 1);
	mmubp = FIELD_PREP(ARC_FARM_KDMA_CTX_AXUSER_HB_MMU_BP_WR_MASK, 1) |
		FIELD_PREP(ARC_FARM_KDMA_CTX_AXUSER_HB_MMU_BP_RD_MASK, 1);

	/* Calculate how many lin dma pkts we'll need */
	num_of_pkts = div64_u64(round_up(size, SZ_2G), SZ_2G);
	pkt_size = sizeof(struct packet_lin_dma);
	cb_len = pkt_size * num_of_pkts;

	/*
	 * If we're not scrubbing the HMMU or NIC reserved sections in HBM, then this is
	 * the scrubbing of the user section. As we use the start of the user section to
	 * store the CB of the EDMA QM, shift the start address of the scrubbing
	 * accordingly and scrub the CB section before leaving this function.
	 */
	if ((addr >= prop->dram_user_base_address) &&
				(addr < prop->dram_user_base_address + cb_len))
		cur_addr += (prop->dram_user_base_address + cb_len) - addr;

	lin_dma_pkts_arr = kvcalloc(num_of_pkts, pkt_size, GFP_KERNEL);
	if (!lin_dma_pkts_arr)
		return -ENOMEM;

	/*
	 * Set MMU bypass for the scrubbing - all EDMAs are configured the same, so save
	 * only the first one to restore later.
	 * Also set the SOB address for all EDMA cores for completion.
	 * Set QM as trusted to allow it to access physical address with MMU bp.
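	 * (the QM test mode toggled below appears to be what grants that trust; it is
	 * cleared again once scrubbing completes).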
10407 */ 10408 old_mmubp = RREG32(mmDCORE0_EDMA0_CORE_CTX_AXUSER_HB_MMU_BP); 10409 for (dcore = 0 ; dcore < NUM_OF_DCORES ; dcore++) { 10410 for (edma_idx = 0 ; edma_idx < NUM_OF_EDMA_PER_DCORE ; edma_idx++) { 10411 u32 edma_offset = dcore * DCORE_OFFSET + edma_idx * DCORE_EDMA_OFFSET; 10412 u32 edma_bit = dcore * NUM_OF_EDMA_PER_DCORE + edma_idx; 10413 10414 if (!(prop->edma_enabled_mask & BIT(edma_bit))) 10415 continue; 10416 10417 WREG32(mmDCORE0_EDMA0_CORE_CTX_AXUSER_HB_MMU_BP + 10418 edma_offset, mmubp); 10419 WREG32(mmDCORE0_EDMA0_CORE_CTX_WR_COMP_ADDR_LO + edma_offset, 10420 lower_32_bits(comp_addr)); 10421 WREG32(mmDCORE0_EDMA0_CORE_CTX_WR_COMP_ADDR_HI + edma_offset, 10422 upper_32_bits(comp_addr)); 10423 WREG32(mmDCORE0_EDMA0_CORE_CTX_WR_COMP_WDATA + edma_offset, 10424 comp_val); 10425 gaudi2_qman_set_test_mode(hdev, 10426 edma_queues_id[dcore] + 4 * edma_idx, true); 10427 } 10428 } 10429 10430 WREG32(sob_addr, 0); 10431 10432 while (cur_addr < end_addr) { 10433 for (dcore = 0 ; dcore < NUM_OF_DCORES ; dcore++) { 10434 for (edma_idx = 0 ; edma_idx < NUM_OF_EDMA_PER_DCORE ; edma_idx++) { 10435 u32 edma_bit = dcore * NUM_OF_EDMA_PER_DCORE + edma_idx; 10436 10437 if (!(prop->edma_enabled_mask & BIT(edma_bit))) 10438 continue; 10439 10440 chunk_size = min_t(u64, SZ_2G, end_addr - cur_addr); 10441 10442 rc = gaudi2_memset_memory_chunk_using_edma_qm(hdev, 10443 (struct packet_lin_dma *)lin_dma_pkts_arr + dma_num, 10444 prop->dram_user_base_address + (dma_num * pkt_size), 10445 edma_queues_id[dcore] + edma_idx * 4, 10446 chunk_size, cur_addr, val); 10447 if (rc) 10448 goto end; 10449 10450 dma_num++; 10451 cur_addr += chunk_size; 10452 if (cur_addr == end_addr) 10453 goto edma_wait; 10454 } 10455 } 10456 } 10457 10458 edma_wait: 10459 rc = hl_poll_timeout(hdev, sob_addr, busy, (busy == dma_num), 1000, 1000000); 10460 if (rc) { 10461 dev_err(hdev->dev, "DMA Timeout during HBM scrubbing(sob: 0x%x, dma_num: 0x%x)\n", 10462 busy, dma_num); 10463 goto end; 10464 } 10465 end: 10466 for (dcore = 0 ; dcore < NUM_OF_DCORES ; dcore++) { 10467 for (edma_idx = 0 ; edma_idx < NUM_OF_EDMA_PER_DCORE ; edma_idx++) { 10468 u32 edma_offset = dcore * DCORE_OFFSET + edma_idx * DCORE_EDMA_OFFSET; 10469 u32 edma_bit = dcore * NUM_OF_EDMA_PER_DCORE + edma_idx; 10470 10471 if (!(prop->edma_enabled_mask & BIT(edma_bit))) 10472 continue; 10473 10474 WREG32(mmDCORE0_EDMA0_CORE_CTX_AXUSER_HB_MMU_BP + edma_offset, old_mmubp); 10475 WREG32(mmDCORE0_EDMA0_CORE_CTX_WR_COMP_ADDR_LO + edma_offset, 0); 10476 WREG32(mmDCORE0_EDMA0_CORE_CTX_WR_COMP_ADDR_HI + edma_offset, 0); 10477 WREG32(mmDCORE0_EDMA0_CORE_CTX_WR_COMP_WDATA + edma_offset, 0); 10478 gaudi2_qman_set_test_mode(hdev, 10479 edma_queues_id[dcore] + 4 * edma_idx, false); 10480 } 10481 } 10482 10483 memset(lin_dma_pkts_arr, 0, sizeof(u64)); 10484 10485 /* Zero the HBM area where we copied the CB */ 10486 for (i = 0; i < cb_len / sizeof(u64); i += sizeof(u64)) 10487 rc = hdev->asic_funcs->access_dev_mem(hdev, PCI_REGION_DRAM, 10488 prop->dram_user_base_address + i, 10489 (u64 *)(lin_dma_pkts_arr), DEBUGFS_WRITE64); 10490 WREG32(sob_addr, 0); 10491 10492 kfree(lin_dma_pkts_arr); 10493 10494 return rc; 10495 } 10496 10497 static int gaudi2_scrub_device_dram(struct hl_device *hdev, u64 val) 10498 { 10499 int rc; 10500 struct asic_fixed_properties *prop = &hdev->asic_prop; 10501 u64 size = prop->dram_end_address - prop->dram_user_base_address; 10502 10503 rc = gaudi2_memset_device_memory(hdev, prop->dram_user_base_address, size, val); 10504 10505 if (rc) 10506 
dev_err(hdev->dev, "Failed to scrub dram, address: 0x%llx size: %llu\n", 10507 prop->dram_user_base_address, size); 10508 return rc; 10509 } 10510 10511 static int gaudi2_scrub_device_mem(struct hl_device *hdev) 10512 { 10513 int rc; 10514 struct asic_fixed_properties *prop = &hdev->asic_prop; 10515 u64 val = hdev->memory_scrub_val; 10516 u64 addr, size; 10517 10518 if (!hdev->memory_scrub) 10519 return 0; 10520 10521 /* scrub SRAM */ 10522 addr = prop->sram_user_base_address; 10523 size = hdev->pldm ? 0x10000 : (prop->sram_size - SRAM_USER_BASE_OFFSET); 10524 dev_dbg(hdev->dev, "Scrubbing SRAM: 0x%09llx - 0x%09llx, val: 0x%llx\n", 10525 addr, addr + size, val); 10526 rc = gaudi2_memset_device_memory(hdev, addr, size, val); 10527 if (rc) { 10528 dev_err(hdev->dev, "scrubbing SRAM failed (%d)\n", rc); 10529 return rc; 10530 } 10531 10532 /* scrub DRAM */ 10533 rc = gaudi2_scrub_device_dram(hdev, val); 10534 if (rc) { 10535 dev_err(hdev->dev, "scrubbing DRAM failed (%d)\n", rc); 10536 return rc; 10537 } 10538 return 0; 10539 } 10540 10541 static void gaudi2_restore_user_sm_registers(struct hl_device *hdev) 10542 { 10543 u64 addr, mon_sts_addr, mon_cfg_addr, cq_lbw_l_addr, cq_lbw_h_addr, 10544 cq_lbw_data_addr, cq_base_l_addr, cq_base_h_addr, cq_size_addr; 10545 u32 val, size, offset; 10546 int dcore_id; 10547 10548 offset = hdev->asic_prop.first_available_cq[0] * 4; 10549 cq_lbw_l_addr = mmDCORE0_SYNC_MNGR_GLBL_LBW_ADDR_L_0 + offset; 10550 cq_lbw_h_addr = mmDCORE0_SYNC_MNGR_GLBL_LBW_ADDR_H_0 + offset; 10551 cq_lbw_data_addr = mmDCORE0_SYNC_MNGR_GLBL_LBW_DATA_0 + offset; 10552 cq_base_l_addr = mmDCORE0_SYNC_MNGR_GLBL_CQ_BASE_ADDR_L_0 + offset; 10553 cq_base_h_addr = mmDCORE0_SYNC_MNGR_GLBL_CQ_BASE_ADDR_H_0 + offset; 10554 cq_size_addr = mmDCORE0_SYNC_MNGR_GLBL_CQ_SIZE_LOG2_0 + offset; 10555 size = mmDCORE0_SYNC_MNGR_GLBL_LBW_ADDR_H_0 - 10556 (mmDCORE0_SYNC_MNGR_GLBL_LBW_ADDR_L_0 + offset); 10557 10558 /* memset dcore0 CQ registers */ 10559 gaudi2_memset_device_lbw(hdev, cq_lbw_l_addr, size, 0); 10560 gaudi2_memset_device_lbw(hdev, cq_lbw_h_addr, size, 0); 10561 gaudi2_memset_device_lbw(hdev, cq_lbw_data_addr, size, 0); 10562 gaudi2_memset_device_lbw(hdev, cq_base_l_addr, size, 0); 10563 gaudi2_memset_device_lbw(hdev, cq_base_h_addr, size, 0); 10564 gaudi2_memset_device_lbw(hdev, cq_size_addr, size, 0); 10565 10566 cq_lbw_l_addr = mmDCORE0_SYNC_MNGR_GLBL_LBW_ADDR_L_0 + DCORE_OFFSET; 10567 cq_lbw_h_addr = mmDCORE0_SYNC_MNGR_GLBL_LBW_ADDR_H_0 + DCORE_OFFSET; 10568 cq_lbw_data_addr = mmDCORE0_SYNC_MNGR_GLBL_LBW_DATA_0 + DCORE_OFFSET; 10569 cq_base_l_addr = mmDCORE0_SYNC_MNGR_GLBL_CQ_BASE_ADDR_L_0 + DCORE_OFFSET; 10570 cq_base_h_addr = mmDCORE0_SYNC_MNGR_GLBL_CQ_BASE_ADDR_H_0 + DCORE_OFFSET; 10571 cq_size_addr = mmDCORE0_SYNC_MNGR_GLBL_CQ_SIZE_LOG2_0 + DCORE_OFFSET; 10572 size = mmDCORE0_SYNC_MNGR_GLBL_LBW_ADDR_H_0 - mmDCORE0_SYNC_MNGR_GLBL_LBW_ADDR_L_0; 10573 10574 for (dcore_id = 1 ; dcore_id < NUM_OF_DCORES ; dcore_id++) { 10575 gaudi2_memset_device_lbw(hdev, cq_lbw_l_addr, size, 0); 10576 gaudi2_memset_device_lbw(hdev, cq_lbw_h_addr, size, 0); 10577 gaudi2_memset_device_lbw(hdev, cq_lbw_data_addr, size, 0); 10578 gaudi2_memset_device_lbw(hdev, cq_base_l_addr, size, 0); 10579 gaudi2_memset_device_lbw(hdev, cq_base_h_addr, size, 0); 10580 gaudi2_memset_device_lbw(hdev, cq_size_addr, size, 0); 10581 10582 cq_lbw_l_addr += DCORE_OFFSET; 10583 cq_lbw_h_addr += DCORE_OFFSET; 10584 cq_lbw_data_addr += DCORE_OFFSET; 10585 cq_base_l_addr += DCORE_OFFSET; 10586 cq_base_h_addr += DCORE_OFFSET; 10587 
cq_size_addr += DCORE_OFFSET; 10588 } 10589 10590 offset = hdev->asic_prop.first_available_user_mon[0] * 4; 10591 addr = mmDCORE0_SYNC_MNGR_OBJS_MON_STATUS_0 + offset; 10592 val = 1 << DCORE0_SYNC_MNGR_OBJS_MON_STATUS_PROT_SHIFT; 10593 size = mmDCORE0_SYNC_MNGR_OBJS_SM_SEC_0 - (mmDCORE0_SYNC_MNGR_OBJS_MON_STATUS_0 + offset); 10594 10595 /* memset dcore0 monitors */ 10596 gaudi2_memset_device_lbw(hdev, addr, size, val); 10597 10598 addr = mmDCORE0_SYNC_MNGR_OBJS_MON_CONFIG_0 + offset; 10599 gaudi2_memset_device_lbw(hdev, addr, size, 0); 10600 10601 mon_sts_addr = mmDCORE0_SYNC_MNGR_OBJS_MON_STATUS_0 + DCORE_OFFSET; 10602 mon_cfg_addr = mmDCORE0_SYNC_MNGR_OBJS_MON_CONFIG_0 + DCORE_OFFSET; 10603 size = mmDCORE0_SYNC_MNGR_OBJS_SM_SEC_0 - mmDCORE0_SYNC_MNGR_OBJS_MON_STATUS_0; 10604 10605 for (dcore_id = 1 ; dcore_id < NUM_OF_DCORES ; dcore_id++) { 10606 gaudi2_memset_device_lbw(hdev, mon_sts_addr, size, val); 10607 gaudi2_memset_device_lbw(hdev, mon_cfg_addr, size, 0); 10608 mon_sts_addr += DCORE_OFFSET; 10609 mon_cfg_addr += DCORE_OFFSET; 10610 } 10611 10612 offset = hdev->asic_prop.first_available_user_sob[0] * 4; 10613 addr = mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + offset; 10614 val = 0; 10615 size = mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRL_0 - 10616 (mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + offset); 10617 10618 /* memset dcore0 sobs */ 10619 gaudi2_memset_device_lbw(hdev, addr, size, val); 10620 10621 addr = mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + DCORE_OFFSET; 10622 size = mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRL_0 - mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0; 10623 10624 for (dcore_id = 1 ; dcore_id < NUM_OF_DCORES ; dcore_id++) { 10625 gaudi2_memset_device_lbw(hdev, addr, size, val); 10626 addr += DCORE_OFFSET; 10627 } 10628 10629 /* Flush all WREG to prevent race */ 10630 val = RREG32(mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + offset); 10631 } 10632 10633 static void gaudi2_restore_user_qm_registers(struct hl_device *hdev) 10634 { 10635 u32 reg_base, hw_queue_id; 10636 10637 for (hw_queue_id = GAUDI2_QUEUE_ID_PDMA_0_0 ; hw_queue_id <= GAUDI2_QUEUE_ID_ROT_1_0; 10638 hw_queue_id += NUM_OF_PQ_PER_QMAN) { 10639 if (!gaudi2_is_queue_enabled(hdev, hw_queue_id)) 10640 continue; 10641 10642 gaudi2_clear_qm_fence_counters_common(hdev, hw_queue_id, false); 10643 10644 reg_base = gaudi2_qm_blocks_bases[hw_queue_id]; 10645 WREG32(reg_base + QM_ARB_CFG_0_OFFSET, 0); 10646 } 10647 10648 /* Flush all WREG to prevent race */ 10649 RREG32(mmPDMA0_QM_ARB_CFG_0); 10650 } 10651 10652 static void gaudi2_restore_nic_qm_registers(struct hl_device *hdev) 10653 { 10654 u32 reg_base, hw_queue_id; 10655 10656 for (hw_queue_id = GAUDI2_QUEUE_ID_NIC_0_0 ; hw_queue_id <= GAUDI2_QUEUE_ID_NIC_23_3; 10657 hw_queue_id += NUM_OF_PQ_PER_QMAN) { 10658 if (!gaudi2_is_queue_enabled(hdev, hw_queue_id)) 10659 continue; 10660 10661 gaudi2_clear_qm_fence_counters_common(hdev, hw_queue_id, false); 10662 10663 reg_base = gaudi2_qm_blocks_bases[hw_queue_id]; 10664 WREG32(reg_base + QM_ARB_CFG_0_OFFSET, 0); 10665 } 10666 10667 /* Flush all WREG to prevent race */ 10668 RREG32(mmPDMA0_QM_ARB_CFG_0); 10669 } 10670 10671 static int gaudi2_context_switch(struct hl_device *hdev, u32 asid) 10672 { 10673 return 0; 10674 } 10675 10676 static void gaudi2_restore_phase_topology(struct hl_device *hdev) 10677 { 10678 } 10679 10680 static void gaudi2_init_block_instances(struct hl_device *hdev, u32 block_idx, 10681 struct dup_block_ctx *cfg_ctx) 10682 { 10683 u64 block_base = cfg_ctx->base + block_idx * cfg_ctx->block_off; 10684 u8 seq; 10685 int i; 10686 10687 for (i = 0 ; i < 
cfg_ctx->instances ; i++) { 10688 seq = block_idx * cfg_ctx->instances + i; 10689 10690 /* skip disabled instance */ 10691 if (!(cfg_ctx->enabled_mask & BIT_ULL(seq))) 10692 continue; 10693 10694 cfg_ctx->instance_cfg_fn(hdev, block_base + i * cfg_ctx->instance_off, 10695 cfg_ctx->data); 10696 } 10697 } 10698 10699 static void gaudi2_init_blocks_with_mask(struct hl_device *hdev, struct dup_block_ctx *cfg_ctx, 10700 u64 mask) 10701 { 10702 int i; 10703 10704 cfg_ctx->enabled_mask = mask; 10705 10706 for (i = 0 ; i < cfg_ctx->blocks ; i++) 10707 gaudi2_init_block_instances(hdev, i, cfg_ctx); 10708 } 10709 10710 void gaudi2_init_blocks(struct hl_device *hdev, struct dup_block_ctx *cfg_ctx) 10711 { 10712 gaudi2_init_blocks_with_mask(hdev, cfg_ctx, U64_MAX); 10713 } 10714 10715 static int gaudi2_debugfs_read_dma(struct hl_device *hdev, u64 addr, u32 size, void *blob_addr) 10716 { 10717 void *host_mem_virtual_addr; 10718 dma_addr_t host_mem_dma_addr; 10719 u64 reserved_va_base; 10720 u32 pos, size_left, size_to_dma; 10721 struct hl_ctx *ctx; 10722 int rc = 0; 10723 10724 /* Fetch the ctx */ 10725 ctx = hl_get_compute_ctx(hdev); 10726 if (!ctx) { 10727 dev_err(hdev->dev, "No ctx available\n"); 10728 return -EINVAL; 10729 } 10730 10731 /* Allocate buffers for read and for poll */ 10732 host_mem_virtual_addr = hl_asic_dma_alloc_coherent(hdev, SZ_2M, &host_mem_dma_addr, 10733 GFP_KERNEL | __GFP_ZERO); 10734 if (host_mem_virtual_addr == NULL) { 10735 dev_err(hdev->dev, "Failed to allocate memory for KDMA read\n"); 10736 rc = -ENOMEM; 10737 goto put_ctx; 10738 } 10739 10740 /* Reserve VM region on asic side */ 10741 reserved_va_base = hl_reserve_va_block(hdev, ctx, HL_VA_RANGE_TYPE_HOST, SZ_2M, 10742 HL_MMU_VA_ALIGNMENT_NOT_NEEDED); 10743 if (!reserved_va_base) { 10744 dev_err(hdev->dev, "Failed to reserve vmem on asic\n"); 10745 rc = -ENOMEM; 10746 goto free_data_buffer; 10747 } 10748 10749 /* Create mapping on asic side */ 10750 mutex_lock(&hdev->mmu_lock); 10751 10752 rc = hl_mmu_map_contiguous(ctx, reserved_va_base, host_mem_dma_addr, SZ_2M); 10753 if (rc) { 10754 dev_err(hdev->dev, "Failed to create mapping on asic mmu\n"); 10755 goto unreserve_va; 10756 } 10757 10758 rc = hl_mmu_invalidate_cache_range(hdev, false, 10759 MMU_OP_USERPTR | MMU_OP_SKIP_LOW_CACHE_INV, 10760 ctx->asid, reserved_va_base, SZ_2M); 10761 if (rc) { 10762 hl_mmu_unmap_contiguous(ctx, reserved_va_base, SZ_2M); 10763 goto unreserve_va; 10764 } 10765 10766 mutex_unlock(&hdev->mmu_lock); 10767 10768 /* Enable MMU on KDMA */ 10769 gaudi2_kdma_set_mmbp_asid(hdev, false, ctx->asid); 10770 10771 pos = 0; 10772 size_left = size; 10773 size_to_dma = SZ_2M; 10774 10775 while (size_left > 0) { 10776 if (size_left < SZ_2M) 10777 size_to_dma = size_left; 10778 10779 rc = gaudi2_send_job_to_kdma(hdev, addr, reserved_va_base, size_to_dma, false); 10780 if (rc) 10781 break; 10782 10783 memcpy(blob_addr + pos, host_mem_virtual_addr, size_to_dma); 10784 10785 if (size_left <= SZ_2M) 10786 break; 10787 10788 pos += SZ_2M; 10789 addr += SZ_2M; 10790 size_left -= SZ_2M; 10791 } 10792 10793 gaudi2_kdma_set_mmbp_asid(hdev, true, HL_KERNEL_ASID_ID); 10794 10795 mutex_lock(&hdev->mmu_lock); 10796 10797 rc = hl_mmu_unmap_contiguous(ctx, reserved_va_base, SZ_2M); 10798 if (rc) 10799 goto unreserve_va; 10800 10801 rc = hl_mmu_invalidate_cache_range(hdev, false, MMU_OP_USERPTR, 10802 ctx->asid, reserved_va_base, SZ_2M); 10803 10804 unreserve_va: 10805 mutex_unlock(&hdev->mmu_lock); 10806 hl_unreserve_va_block(hdev, ctx, reserved_va_base, SZ_2M); 10807 
free_data_buffer: 10808 hl_asic_dma_free_coherent(hdev, SZ_2M, host_mem_virtual_addr, host_mem_dma_addr); 10809 put_ctx: 10810 hl_ctx_put(ctx); 10811 10812 return rc; 10813 } 10814 10815 static int gaudi2_internal_cb_pool_init(struct hl_device *hdev, struct hl_ctx *ctx) 10816 { 10817 struct gaudi2_device *gaudi2 = hdev->asic_specific; 10818 int min_alloc_order, rc; 10819 10820 if (!(gaudi2->hw_cap_initialized & HW_CAP_PMMU)) 10821 return 0; 10822 10823 hdev->internal_cb_pool_virt_addr = hl_asic_dma_alloc_coherent(hdev, 10824 HOST_SPACE_INTERNAL_CB_SZ, 10825 &hdev->internal_cb_pool_dma_addr, 10826 GFP_KERNEL | __GFP_ZERO); 10827 10828 if (!hdev->internal_cb_pool_virt_addr) 10829 return -ENOMEM; 10830 10831 min_alloc_order = ilog2(min(gaudi2_get_signal_cb_size(hdev), 10832 gaudi2_get_wait_cb_size(hdev))); 10833 10834 hdev->internal_cb_pool = gen_pool_create(min_alloc_order, -1); 10835 if (!hdev->internal_cb_pool) { 10836 dev_err(hdev->dev, "Failed to create internal CB pool\n"); 10837 rc = -ENOMEM; 10838 goto free_internal_cb_pool; 10839 } 10840 10841 rc = gen_pool_add(hdev->internal_cb_pool, (uintptr_t) hdev->internal_cb_pool_virt_addr, 10842 HOST_SPACE_INTERNAL_CB_SZ, -1); 10843 if (rc) { 10844 dev_err(hdev->dev, "Failed to add memory to internal CB pool\n"); 10845 rc = -EFAULT; 10846 goto destroy_internal_cb_pool; 10847 } 10848 10849 hdev->internal_cb_va_base = hl_reserve_va_block(hdev, ctx, HL_VA_RANGE_TYPE_HOST, 10850 HOST_SPACE_INTERNAL_CB_SZ, HL_MMU_VA_ALIGNMENT_NOT_NEEDED); 10851 10852 if (!hdev->internal_cb_va_base) { 10853 rc = -ENOMEM; 10854 goto destroy_internal_cb_pool; 10855 } 10856 10857 mutex_lock(&hdev->mmu_lock); 10858 10859 rc = hl_mmu_map_contiguous(ctx, hdev->internal_cb_va_base, hdev->internal_cb_pool_dma_addr, 10860 HOST_SPACE_INTERNAL_CB_SZ); 10861 if (rc) 10862 goto unreserve_internal_cb_pool; 10863 10864 rc = hl_mmu_invalidate_cache(hdev, false, MMU_OP_USERPTR); 10865 if (rc) 10866 goto unmap_internal_cb_pool; 10867 10868 mutex_unlock(&hdev->mmu_lock); 10869 10870 return 0; 10871 10872 unmap_internal_cb_pool: 10873 hl_mmu_unmap_contiguous(ctx, hdev->internal_cb_va_base, HOST_SPACE_INTERNAL_CB_SZ); 10874 unreserve_internal_cb_pool: 10875 mutex_unlock(&hdev->mmu_lock); 10876 hl_unreserve_va_block(hdev, ctx, hdev->internal_cb_va_base, HOST_SPACE_INTERNAL_CB_SZ); 10877 destroy_internal_cb_pool: 10878 gen_pool_destroy(hdev->internal_cb_pool); 10879 free_internal_cb_pool: 10880 hl_asic_dma_free_coherent(hdev, HOST_SPACE_INTERNAL_CB_SZ, hdev->internal_cb_pool_virt_addr, 10881 hdev->internal_cb_pool_dma_addr); 10882 10883 return rc; 10884 } 10885 10886 static void gaudi2_internal_cb_pool_fini(struct hl_device *hdev, struct hl_ctx *ctx) 10887 { 10888 struct gaudi2_device *gaudi2 = hdev->asic_specific; 10889 10890 if (!(gaudi2->hw_cap_initialized & HW_CAP_PMMU)) 10891 return; 10892 10893 mutex_lock(&hdev->mmu_lock); 10894 hl_mmu_unmap_contiguous(ctx, hdev->internal_cb_va_base, HOST_SPACE_INTERNAL_CB_SZ); 10895 hl_unreserve_va_block(hdev, ctx, hdev->internal_cb_va_base, HOST_SPACE_INTERNAL_CB_SZ); 10896 hl_mmu_invalidate_cache(hdev, true, MMU_OP_USERPTR); 10897 mutex_unlock(&hdev->mmu_lock); 10898 10899 gen_pool_destroy(hdev->internal_cb_pool); 10900 10901 hl_asic_dma_free_coherent(hdev, HOST_SPACE_INTERNAL_CB_SZ, hdev->internal_cb_pool_virt_addr, 10902 hdev->internal_cb_pool_dma_addr); 10903 } 10904 10905 static void gaudi2_restore_user_registers(struct hl_device *hdev) 10906 { 10907 gaudi2_restore_user_sm_registers(hdev); 10908 gaudi2_restore_user_qm_registers(hdev); 10909 } 
10910 10911 static int gaudi2_map_virtual_msix_doorbell_memory(struct hl_ctx *ctx) 10912 { 10913 struct hl_device *hdev = ctx->hdev; 10914 struct asic_fixed_properties *prop = &hdev->asic_prop; 10915 struct gaudi2_device *gaudi2 = hdev->asic_specific; 10916 int rc; 10917 10918 rc = hl_mmu_map_page(ctx, RESERVED_VA_FOR_VIRTUAL_MSIX_DOORBELL_START, 10919 gaudi2->virt_msix_db_dma_addr, prop->pmmu.page_size, true); 10920 if (rc) 10921 dev_err(hdev->dev, "Failed to map VA %#llx for virtual MSI-X doorbell memory\n", 10922 RESERVED_VA_FOR_VIRTUAL_MSIX_DOORBELL_START); 10923 10924 return rc; 10925 } 10926 10927 static void gaudi2_unmap_virtual_msix_doorbell_memory(struct hl_ctx *ctx) 10928 { 10929 struct hl_device *hdev = ctx->hdev; 10930 struct asic_fixed_properties *prop = &hdev->asic_prop; 10931 int rc; 10932 10933 rc = hl_mmu_unmap_page(ctx, RESERVED_VA_FOR_VIRTUAL_MSIX_DOORBELL_START, 10934 prop->pmmu.page_size, true); 10935 if (rc) 10936 dev_err(hdev->dev, "Failed to unmap VA %#llx of virtual MSI-X doorbell memory\n", 10937 RESERVED_VA_FOR_VIRTUAL_MSIX_DOORBELL_START); 10938 } 10939 10940 static int gaudi2_ctx_init(struct hl_ctx *ctx) 10941 { 10942 int rc; 10943 10944 if (ctx->asid == HL_KERNEL_ASID_ID) 10945 return 0; 10946 10947 rc = gaudi2_mmu_prepare(ctx->hdev, ctx->asid); 10948 if (rc) 10949 return rc; 10950 10951 /* No need to clear user registers if the device has just 10952 * performed reset, we restore only nic qm registers 10953 */ 10954 if (ctx->hdev->reset_upon_device_release) 10955 gaudi2_restore_nic_qm_registers(ctx->hdev); 10956 else 10957 gaudi2_restore_user_registers(ctx->hdev); 10958 10959 rc = gaudi2_internal_cb_pool_init(ctx->hdev, ctx); 10960 if (rc) 10961 return rc; 10962 10963 rc = gaudi2_map_virtual_msix_doorbell_memory(ctx); 10964 if (rc) 10965 gaudi2_internal_cb_pool_fini(ctx->hdev, ctx); 10966 10967 return rc; 10968 } 10969 10970 static void gaudi2_ctx_fini(struct hl_ctx *ctx) 10971 { 10972 if (ctx->asid == HL_KERNEL_ASID_ID) 10973 return; 10974 10975 gaudi2_internal_cb_pool_fini(ctx->hdev, ctx); 10976 10977 gaudi2_unmap_virtual_msix_doorbell_memory(ctx); 10978 } 10979 10980 static int gaudi2_pre_schedule_cs(struct hl_cs *cs) 10981 { 10982 struct hl_device *hdev = cs->ctx->hdev; 10983 int index = cs->sequence & (hdev->asic_prop.max_pending_cs - 1); 10984 u32 mon_payload, sob_id, mon_id; 10985 10986 if (!cs_needs_completion(cs)) 10987 return 0; 10988 10989 /* 10990 * First 64 SOB/MON are reserved for driver for QMAN auto completion 10991 * mechanism. Each SOB/MON pair are used for a pending CS with the same 10992 * cyclic index. The SOB value is increased when each of the CS jobs is 10993 * completed. When the SOB reaches the number of CS jobs, the monitor 10994 * generates MSI-X interrupt. 
10995 */ 10996 10997 sob_id = mon_id = index; 10998 mon_payload = (1 << CQ_ENTRY_SHADOW_INDEX_VALID_SHIFT) | 10999 (1 << CQ_ENTRY_READY_SHIFT) | index; 11000 11001 gaudi2_arm_cq_monitor(hdev, sob_id, mon_id, GAUDI2_RESERVED_CQ_CS_COMPLETION, mon_payload, 11002 cs->jobs_cnt); 11003 11004 return 0; 11005 } 11006 11007 static u32 gaudi2_get_queue_id_for_cq(struct hl_device *hdev, u32 cq_idx) 11008 { 11009 return HL_INVALID_QUEUE; 11010 } 11011 11012 static u32 gaudi2_gen_signal_cb(struct hl_device *hdev, void *data, u16 sob_id, u32 size, bool eb) 11013 { 11014 struct hl_cb *cb = data; 11015 struct packet_msg_short *pkt; 11016 u32 value, ctl, pkt_size = sizeof(*pkt); 11017 11018 pkt = (struct packet_msg_short *) (uintptr_t) (cb->kernel_address + size); 11019 memset(pkt, 0, pkt_size); 11020 11021 /* Inc by 1, Mode ADD */ 11022 value = FIELD_PREP(GAUDI2_PKT_SHORT_VAL_SOB_SYNC_VAL_MASK, 1); 11023 value |= FIELD_PREP(GAUDI2_PKT_SHORT_VAL_SOB_MOD_MASK, 1); 11024 11025 ctl = FIELD_PREP(GAUDI2_PKT_SHORT_CTL_ADDR_MASK, sob_id * 4); 11026 ctl |= FIELD_PREP(GAUDI2_PKT_SHORT_CTL_BASE_MASK, 1); /* SOB base */ 11027 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_OPCODE_MASK, PACKET_MSG_SHORT); 11028 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_EB_MASK, eb); 11029 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_MB_MASK, 1); 11030 11031 pkt->value = cpu_to_le32(value); 11032 pkt->ctl = cpu_to_le32(ctl); 11033 11034 return size + pkt_size; 11035 } 11036 11037 static u32 gaudi2_add_mon_msg_short(struct packet_msg_short *pkt, u32 value, u16 addr) 11038 { 11039 u32 ctl, pkt_size = sizeof(*pkt); 11040 11041 memset(pkt, 0, pkt_size); 11042 11043 ctl = FIELD_PREP(GAUDI2_PKT_SHORT_CTL_ADDR_MASK, addr); 11044 ctl |= FIELD_PREP(GAUDI2_PKT_SHORT_CTL_BASE_MASK, 0); /* MON base */ 11045 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_OPCODE_MASK, PACKET_MSG_SHORT); 11046 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_EB_MASK, 0); 11047 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_MB_MASK, 0); 11048 11049 pkt->value = cpu_to_le32(value); 11050 pkt->ctl = cpu_to_le32(ctl); 11051 11052 return pkt_size; 11053 } 11054 11055 static u32 gaudi2_add_arm_monitor_pkt(struct hl_device *hdev, struct packet_msg_short *pkt, 11056 u16 sob_base, u8 sob_mask, u16 sob_val, u16 addr) 11057 { 11058 u32 ctl, value, pkt_size = sizeof(*pkt); 11059 u8 mask; 11060 11061 if (hl_gen_sob_mask(sob_base, sob_mask, &mask)) { 11062 dev_err(hdev->dev, "sob_base %u (mask %#x) is not valid\n", sob_base, sob_mask); 11063 return 0; 11064 } 11065 11066 memset(pkt, 0, pkt_size); 11067 11068 value = FIELD_PREP(GAUDI2_PKT_SHORT_VAL_MON_SYNC_GID_MASK, sob_base / 8); 11069 value |= FIELD_PREP(GAUDI2_PKT_SHORT_VAL_MON_SYNC_VAL_MASK, sob_val); 11070 value |= FIELD_PREP(GAUDI2_PKT_SHORT_VAL_MON_MODE_MASK, 0); /* GREATER OR EQUAL*/ 11071 value |= FIELD_PREP(GAUDI2_PKT_SHORT_VAL_MON_MASK_MASK, mask); 11072 11073 ctl = FIELD_PREP(GAUDI2_PKT_SHORT_CTL_ADDR_MASK, addr); 11074 ctl |= FIELD_PREP(GAUDI2_PKT_SHORT_CTL_BASE_MASK, 0); /* MON base */ 11075 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_OPCODE_MASK, PACKET_MSG_SHORT); 11076 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_EB_MASK, 0); 11077 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_MB_MASK, 1); 11078 11079 pkt->value = cpu_to_le32(value); 11080 pkt->ctl = cpu_to_le32(ctl); 11081 11082 return pkt_size; 11083 } 11084 11085 static u32 gaudi2_add_fence_pkt(struct packet_fence *pkt) 11086 { 11087 u32 ctl, cfg, pkt_size = sizeof(*pkt); 11088 11089 memset(pkt, 0, pkt_size); 11090 11091 cfg = FIELD_PREP(GAUDI2_PKT_FENCE_CFG_DEC_VAL_MASK, 1); 11092 cfg |= FIELD_PREP(GAUDI2_PKT_FENCE_CFG_TARGET_VAL_MASK, 1); 11093 cfg |= 
FIELD_PREP(GAUDI2_PKT_FENCE_CFG_ID_MASK, 2); 11094 11095 ctl = FIELD_PREP(GAUDI2_PKT_CTL_OPCODE_MASK, PACKET_FENCE); 11096 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_EB_MASK, 0); 11097 ctl |= FIELD_PREP(GAUDI2_PKT_CTL_MB_MASK, 1); 11098 11099 pkt->cfg = cpu_to_le32(cfg); 11100 pkt->ctl = cpu_to_le32(ctl); 11101 11102 return pkt_size; 11103 } 11104 11105 static u32 gaudi2_gen_wait_cb(struct hl_device *hdev, struct hl_gen_wait_properties *prop) 11106 { 11107 struct hl_cb *cb = prop->data; 11108 void *buf = (void *) (uintptr_t) (cb->kernel_address); 11109 11110 u64 monitor_base, fence_addr = 0; 11111 u32 stream_index, size = prop->size; 11112 u16 msg_addr_offset; 11113 11114 stream_index = prop->q_idx % 4; 11115 fence_addr = CFG_BASE + gaudi2_qm_blocks_bases[prop->q_idx] + 11116 QM_FENCE2_OFFSET + stream_index * 4; 11117 11118 /* 11119 * monitor_base should be the content of the base0 address registers, 11120 * so it will be added to the msg short offsets 11121 */ 11122 monitor_base = mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRL_0; 11123 11124 /* First monitor config packet: low address of the sync */ 11125 msg_addr_offset = (mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRL_0 + prop->mon_id * 4) - 11126 monitor_base; 11127 11128 size += gaudi2_add_mon_msg_short(buf + size, (u32) fence_addr, msg_addr_offset); 11129 11130 /* Second monitor config packet: high address of the sync */ 11131 msg_addr_offset = (mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_ADDRH_0 + prop->mon_id * 4) - 11132 monitor_base; 11133 11134 size += gaudi2_add_mon_msg_short(buf + size, (u32) (fence_addr >> 32), msg_addr_offset); 11135 11136 /* 11137 * Third monitor config packet: the payload, i.e. what to write when the 11138 * sync triggers 11139 */ 11140 msg_addr_offset = (mmDCORE0_SYNC_MNGR_OBJS_MON_PAY_DATA_0 + prop->mon_id * 4) - 11141 monitor_base; 11142 11143 size += gaudi2_add_mon_msg_short(buf + size, 1, msg_addr_offset); 11144 11145 /* Fourth monitor config packet: bind the monitor to a sync object */ 11146 msg_addr_offset = (mmDCORE0_SYNC_MNGR_OBJS_MON_ARM_0 + prop->mon_id * 4) - monitor_base; 11147 11148 size += gaudi2_add_arm_monitor_pkt(hdev, buf + size, prop->sob_base, prop->sob_mask, 11149 prop->sob_val, msg_addr_offset); 11150 11151 /* Fence packet */ 11152 size += gaudi2_add_fence_pkt(buf + size); 11153 11154 return size; 11155 } 11156 11157 static void gaudi2_reset_sob(struct hl_device *hdev, void *data) 11158 { 11159 struct hl_hw_sob *hw_sob = data; 11160 11161 dev_dbg(hdev->dev, "reset SOB, q_idx: %d, sob_id: %d\n", hw_sob->q_idx, hw_sob->sob_id); 11162 11163 WREG32(mmDCORE0_SYNC_MNGR_OBJS_SOB_OBJ_0 + hw_sob->sob_id * 4, 0); 11164 11165 kref_init(&hw_sob->kref); 11166 } 11167 11168 static void gaudi2_reset_sob_group(struct hl_device *hdev, u16 sob_group) 11169 { 11170 } 11171 11172 static u64 gaudi2_get_device_time(struct hl_device *hdev) 11173 { 11174 u64 device_time = ((u64) RREG32(mmPSOC_TIMESTAMP_CNTCVU)) << 32; 11175 11176 return device_time | RREG32(mmPSOC_TIMESTAMP_CNTCVL); 11177 } 11178 11179 static int gaudi2_collective_wait_init_cs(struct hl_cs *cs) 11180 { 11181 return 0; 11182 } 11183 11184 static int gaudi2_collective_wait_create_jobs(struct hl_device *hdev, struct hl_ctx *ctx, 11185 struct hl_cs *cs, u32 wait_queue_id, 11186 u32 collective_engine_id, u32 encaps_signal_offset) 11187 { 11188 return -EINVAL; 11189 } 11190 11191 /* 11192 * hl_mmu_scramble - converts a dram (non power of 2) page-size aligned address 11193 * to DMMU page-size address (64MB) before mapping it in 11194 * the MMU. 
11195 * The operation is performed on both the virtual and physical addresses. 11196 * for device with 6 HBMs the scramble is: 11197 * (addr[47:0] / 48M) * 64M + addr % 48M + addr[63:48] 11198 * 11199 * Example: 11200 * ============================================================================= 11201 * Allocated DRAM Reserved VA scrambled VA for MMU mapping Scrambled PA 11202 * Phys address in MMU last 11203 * HOP 11204 * ============================================================================= 11205 * PA1 0x3000000 VA1 0x9C000000 SVA1= (VA1/48M)*64M 0xD0000000 <- PA1/48M 0x1 11206 * PA2 0x9000000 VA2 0x9F000000 SVA2= (VA2/48M)*64M 0xD4000000 <- PA2/48M 0x3 11207 * ============================================================================= 11208 */ 11209 static u64 gaudi2_mmu_scramble_addr(struct hl_device *hdev, u64 raw_addr) 11210 { 11211 struct asic_fixed_properties *prop = &hdev->asic_prop; 11212 u32 divisor, mod_va; 11213 u64 div_va; 11214 11215 /* accept any address in the DRAM address space */ 11216 if (hl_mem_area_inside_range(raw_addr, sizeof(raw_addr), DRAM_PHYS_BASE, 11217 VA_HBM_SPACE_END)) { 11218 11219 divisor = prop->num_functional_hbms * GAUDI2_HBM_MMU_SCRM_MEM_SIZE; 11220 div_va = div_u64_rem(raw_addr & GAUDI2_HBM_MMU_SCRM_ADDRESS_MASK, divisor, &mod_va); 11221 return (raw_addr & ~GAUDI2_HBM_MMU_SCRM_ADDRESS_MASK) | 11222 (div_va << GAUDI2_HBM_MMU_SCRM_DIV_SHIFT) | 11223 (mod_va << GAUDI2_HBM_MMU_SCRM_MOD_SHIFT); 11224 } 11225 11226 return raw_addr; 11227 } 11228 11229 static u64 gaudi2_mmu_descramble_addr(struct hl_device *hdev, u64 scrambled_addr) 11230 { 11231 struct asic_fixed_properties *prop = &hdev->asic_prop; 11232 u32 divisor, mod_va; 11233 u64 div_va; 11234 11235 /* accept any address in the DRAM address space */ 11236 if (hl_mem_area_inside_range(scrambled_addr, sizeof(scrambled_addr), DRAM_PHYS_BASE, 11237 VA_HBM_SPACE_END)) { 11238 11239 divisor = prop->num_functional_hbms * GAUDI2_HBM_MMU_SCRM_MEM_SIZE; 11240 div_va = div_u64_rem(scrambled_addr & GAUDI2_HBM_MMU_SCRM_ADDRESS_MASK, 11241 PAGE_SIZE_64MB, &mod_va); 11242 11243 return ((scrambled_addr & ~GAUDI2_HBM_MMU_SCRM_ADDRESS_MASK) + 11244 (div_va * divisor + mod_va)); 11245 } 11246 11247 return scrambled_addr; 11248 } 11249 11250 static u32 gaudi2_get_dec_base_addr(struct hl_device *hdev, u32 core_id) 11251 { 11252 u32 base = 0, dcore_id, dec_id; 11253 11254 if (core_id >= NUMBER_OF_DEC) { 11255 dev_err(hdev->dev, "Unexpected core number %d for DEC\n", core_id); 11256 goto out; 11257 } 11258 11259 if (core_id < 8) { 11260 dcore_id = core_id / NUM_OF_DEC_PER_DCORE; 11261 dec_id = core_id % NUM_OF_DEC_PER_DCORE; 11262 11263 base = mmDCORE0_DEC0_CMD_BASE + dcore_id * DCORE_OFFSET + 11264 dec_id * DCORE_VDEC_OFFSET; 11265 } else { 11266 /* PCIe Shared Decoder */ 11267 base = mmPCIE_DEC0_CMD_BASE + ((core_id % 8) * PCIE_VDEC_OFFSET); 11268 } 11269 out: 11270 return base; 11271 } 11272 11273 static int gaudi2_get_hw_block_id(struct hl_device *hdev, u64 block_addr, 11274 u32 *block_size, u32 *block_id) 11275 { 11276 struct gaudi2_device *gaudi2 = hdev->asic_specific; 11277 int i; 11278 11279 for (i = 0 ; i < NUM_USER_MAPPED_BLOCKS ; i++) { 11280 if (block_addr == CFG_BASE + gaudi2->mapped_blocks[i].address) { 11281 *block_id = i; 11282 if (block_size) 11283 *block_size = gaudi2->mapped_blocks[i].size; 11284 return 0; 11285 } 11286 } 11287 11288 dev_err(hdev->dev, "Invalid block address %#llx", block_addr); 11289 11290 return -EINVAL; 11291 } 11292 11293 static int gaudi2_block_mmap(struct hl_device *hdev, 
struct vm_area_struct *vma, 11294 u32 block_id, u32 block_size) 11295 { 11296 struct gaudi2_device *gaudi2 = hdev->asic_specific; 11297 u64 offset_in_bar; 11298 u64 address; 11299 int rc; 11300 11301 if (block_id >= NUM_USER_MAPPED_BLOCKS) { 11302 dev_err(hdev->dev, "Invalid block id %u", block_id); 11303 return -EINVAL; 11304 } 11305 11306 /* we allow mapping only an entire block */ 11307 if (block_size != gaudi2->mapped_blocks[block_id].size) { 11308 dev_err(hdev->dev, "Invalid block size %u", block_size); 11309 return -EINVAL; 11310 } 11311 11312 offset_in_bar = CFG_BASE + gaudi2->mapped_blocks[block_id].address - STM_FLASH_BASE_ADDR; 11313 11314 address = pci_resource_start(hdev->pdev, SRAM_CFG_BAR_ID) + offset_in_bar; 11315 11316 vm_flags_set(vma, VM_IO | VM_PFNMAP | VM_DONTEXPAND | VM_DONTDUMP | 11317 VM_DONTCOPY | VM_NORESERVE); 11318 11319 rc = remap_pfn_range(vma, vma->vm_start, address >> PAGE_SHIFT, 11320 block_size, vma->vm_page_prot); 11321 if (rc) 11322 dev_err(hdev->dev, "remap_pfn_range error %d", rc); 11323 11324 return rc; 11325 } 11326 11327 static void gaudi2_enable_events_from_fw(struct hl_device *hdev) 11328 { 11329 struct gaudi2_device *gaudi2 = hdev->asic_specific; 11330 11331 struct cpu_dyn_regs *dyn_regs = &hdev->fw_loader.dynamic_loader.comm_desc.cpu_dyn_regs; 11332 u32 irq_handler_offset = le32_to_cpu(dyn_regs->gic_host_ints_irq); 11333 11334 if (gaudi2->hw_cap_initialized & HW_CAP_CPU_Q) 11335 WREG32(irq_handler_offset, 11336 gaudi2_irq_map_table[GAUDI2_EVENT_CPU_INTS_REGISTER].cpu_id); 11337 } 11338 11339 static int gaudi2_get_mmu_base(struct hl_device *hdev, u64 mmu_id, u32 *mmu_base) 11340 { 11341 switch (mmu_id) { 11342 case HW_CAP_DCORE0_DMMU0: 11343 *mmu_base = mmDCORE0_HMMU0_MMU_BASE; 11344 break; 11345 case HW_CAP_DCORE0_DMMU1: 11346 *mmu_base = mmDCORE0_HMMU1_MMU_BASE; 11347 break; 11348 case HW_CAP_DCORE0_DMMU2: 11349 *mmu_base = mmDCORE0_HMMU2_MMU_BASE; 11350 break; 11351 case HW_CAP_DCORE0_DMMU3: 11352 *mmu_base = mmDCORE0_HMMU3_MMU_BASE; 11353 break; 11354 case HW_CAP_DCORE1_DMMU0: 11355 *mmu_base = mmDCORE1_HMMU0_MMU_BASE; 11356 break; 11357 case HW_CAP_DCORE1_DMMU1: 11358 *mmu_base = mmDCORE1_HMMU1_MMU_BASE; 11359 break; 11360 case HW_CAP_DCORE1_DMMU2: 11361 *mmu_base = mmDCORE1_HMMU2_MMU_BASE; 11362 break; 11363 case HW_CAP_DCORE1_DMMU3: 11364 *mmu_base = mmDCORE1_HMMU3_MMU_BASE; 11365 break; 11366 case HW_CAP_DCORE2_DMMU0: 11367 *mmu_base = mmDCORE2_HMMU0_MMU_BASE; 11368 break; 11369 case HW_CAP_DCORE2_DMMU1: 11370 *mmu_base = mmDCORE2_HMMU1_MMU_BASE; 11371 break; 11372 case HW_CAP_DCORE2_DMMU2: 11373 *mmu_base = mmDCORE2_HMMU2_MMU_BASE; 11374 break; 11375 case HW_CAP_DCORE2_DMMU3: 11376 *mmu_base = mmDCORE2_HMMU3_MMU_BASE; 11377 break; 11378 case HW_CAP_DCORE3_DMMU0: 11379 *mmu_base = mmDCORE3_HMMU0_MMU_BASE; 11380 break; 11381 case HW_CAP_DCORE3_DMMU1: 11382 *mmu_base = mmDCORE3_HMMU1_MMU_BASE; 11383 break; 11384 case HW_CAP_DCORE3_DMMU2: 11385 *mmu_base = mmDCORE3_HMMU2_MMU_BASE; 11386 break; 11387 case HW_CAP_DCORE3_DMMU3: 11388 *mmu_base = mmDCORE3_HMMU3_MMU_BASE; 11389 break; 11390 case HW_CAP_PMMU: 11391 *mmu_base = mmPMMU_HBW_MMU_BASE; 11392 break; 11393 default: 11394 return -EINVAL; 11395 } 11396 11397 return 0; 11398 } 11399 11400 static void gaudi2_ack_mmu_error(struct hl_device *hdev, u64 mmu_id) 11401 { 11402 bool is_pmmu = (mmu_id == HW_CAP_PMMU); 11403 struct gaudi2_device *gaudi2 = hdev->asic_specific; 11404 u32 mmu_base; 11405 11406 if (!(gaudi2->hw_cap_initialized & mmu_id)) 11407 return; 11408 11409 if 
(gaudi2_get_mmu_base(hdev, mmu_id, &mmu_base)) 11410 return; 11411 11412 gaudi2_handle_page_error(hdev, mmu_base, is_pmmu, NULL); 11413 gaudi2_handle_access_error(hdev, mmu_base, is_pmmu); 11414 } 11415 11416 static int gaudi2_ack_mmu_page_fault_or_access_error(struct hl_device *hdev, u64 mmu_cap_mask) 11417 { 11418 u32 i, mmu_id, num_of_hmmus = NUM_OF_HMMU_PER_DCORE * NUM_OF_DCORES; 11419 11420 /* check all HMMUs */ 11421 for (i = 0 ; i < num_of_hmmus ; i++) { 11422 mmu_id = HW_CAP_DCORE0_DMMU0 << i; 11423 11424 if (mmu_cap_mask & mmu_id) 11425 gaudi2_ack_mmu_error(hdev, mmu_id); 11426 } 11427 11428 /* check PMMU */ 11429 if (mmu_cap_mask & HW_CAP_PMMU) 11430 gaudi2_ack_mmu_error(hdev, HW_CAP_PMMU); 11431 11432 return 0; 11433 } 11434 11435 static void gaudi2_get_msi_info(__le32 *table) 11436 { 11437 table[CPUCP_EVENT_QUEUE_MSI_TYPE] = cpu_to_le32(GAUDI2_EVENT_QUEUE_MSIX_IDX); 11438 table[CPUCP_EVENT_QUEUE_ERR_MSI_TYPE] = cpu_to_le32(GAUDI2_IRQ_NUM_EQ_ERROR); 11439 } 11440 11441 static int gaudi2_map_pll_idx_to_fw_idx(u32 pll_idx) 11442 { 11443 switch (pll_idx) { 11444 case HL_GAUDI2_CPU_PLL: return CPU_PLL; 11445 case HL_GAUDI2_PCI_PLL: return PCI_PLL; 11446 case HL_GAUDI2_NIC_PLL: return NIC_PLL; 11447 case HL_GAUDI2_DMA_PLL: return DMA_PLL; 11448 case HL_GAUDI2_MESH_PLL: return MESH_PLL; 11449 case HL_GAUDI2_MME_PLL: return MME_PLL; 11450 case HL_GAUDI2_TPC_PLL: return TPC_PLL; 11451 case HL_GAUDI2_IF_PLL: return IF_PLL; 11452 case HL_GAUDI2_SRAM_PLL: return SRAM_PLL; 11453 case HL_GAUDI2_HBM_PLL: return HBM_PLL; 11454 case HL_GAUDI2_VID_PLL: return VID_PLL; 11455 case HL_GAUDI2_MSS_PLL: return MSS_PLL; 11456 default: return -EINVAL; 11457 } 11458 } 11459 11460 static int gaudi2_gen_sync_to_engine_map(struct hl_device *hdev, struct hl_sync_to_engine_map *map) 11461 { 11462 /* Not implemented */ 11463 return 0; 11464 } 11465 11466 static int gaudi2_monitor_valid(struct hl_mon_state_dump *mon) 11467 { 11468 /* Not implemented */ 11469 return 0; 11470 } 11471 11472 static int gaudi2_print_single_monitor(char **buf, size_t *size, size_t *offset, 11473 struct hl_device *hdev, struct hl_mon_state_dump *mon) 11474 { 11475 /* Not implemented */ 11476 return 0; 11477 } 11478 11479 11480 static int gaudi2_print_fences_single_engine(struct hl_device *hdev, u64 base_offset, 11481 u64 status_base_offset, enum hl_sync_engine_type engine_type, 11482 u32 engine_id, char **buf, size_t *size, size_t *offset) 11483 { 11484 /* Not implemented */ 11485 return 0; 11486 } 11487 11488 11489 static struct hl_state_dump_specs_funcs gaudi2_state_dump_funcs = { 11490 .monitor_valid = gaudi2_monitor_valid, 11491 .print_single_monitor = gaudi2_print_single_monitor, 11492 .gen_sync_to_engine_map = gaudi2_gen_sync_to_engine_map, 11493 .print_fences_single_engine = gaudi2_print_fences_single_engine, 11494 }; 11495 11496 static void gaudi2_state_dump_init(struct hl_device *hdev) 11497 { 11498 /* Not implemented */ 11499 hdev->state_dump_specs.props = gaudi2_state_dump_specs_props; 11500 hdev->state_dump_specs.funcs = gaudi2_state_dump_funcs; 11501 } 11502 11503 static u32 gaudi2_get_sob_addr(struct hl_device *hdev, u32 sob_id) 11504 { 11505 return 0; 11506 } 11507 11508 static u32 *gaudi2_get_stream_master_qid_arr(void) 11509 { 11510 return NULL; 11511 } 11512 11513 static void gaudi2_add_device_attr(struct hl_device *hdev, struct attribute_group *dev_clk_attr_grp, 11514 struct attribute_group *dev_vrm_attr_grp) 11515 { 11516 hl_sysfs_add_dev_clk_attr(hdev, dev_clk_attr_grp); 11517 hl_sysfs_add_dev_vrm_attr(hdev, 
dev_vrm_attr_grp); 11518 } 11519 11520 static int gaudi2_mmu_get_real_page_size(struct hl_device *hdev, struct hl_mmu_properties *mmu_prop, 11521 u32 page_size, u32 *real_page_size, bool is_dram_addr) 11522 { 11523 struct asic_fixed_properties *prop = &hdev->asic_prop; 11524 11525 /* for host pages the page size must be */ 11526 if (!is_dram_addr) { 11527 if (page_size % mmu_prop->page_size) 11528 goto page_size_err; 11529 11530 *real_page_size = mmu_prop->page_size; 11531 return 0; 11532 } 11533 11534 if ((page_size % prop->dram_page_size) || (prop->dram_page_size > mmu_prop->page_size)) 11535 goto page_size_err; 11536 11537 /* 11538 * MMU page size is different from DRAM page size (more precisely, DMMU page is greater 11539 * than DRAM page size). 11540 * for this reason work with the DRAM page size and let the MMU scrambling routine handle 11541 * this mismatch when calculating the address to place in the MMU page table. 11542 * (in that case also make sure that the dram_page_size is not greater than the 11543 * mmu page size) 11544 */ 11545 *real_page_size = prop->dram_page_size; 11546 11547 return 0; 11548 11549 page_size_err: 11550 dev_err(hdev->dev, "page size of 0x%X is not 0x%X aligned, can't map\n", 11551 page_size, mmu_prop->page_size >> 10); 11552 return -EFAULT; 11553 } 11554 11555 static int gaudi2_get_monitor_dump(struct hl_device *hdev, void *data) 11556 { 11557 return -EOPNOTSUPP; 11558 } 11559 11560 int gaudi2_send_device_activity(struct hl_device *hdev, bool open) 11561 { 11562 struct gaudi2_device *gaudi2 = hdev->asic_specific; 11563 11564 if (!(gaudi2->hw_cap_initialized & HW_CAP_CPU_Q)) 11565 return 0; 11566 11567 return hl_fw_send_device_activity(hdev, open); 11568 } 11569 11570 static u64 gaudi2_read_pte(struct hl_device *hdev, u64 addr) 11571 { 11572 struct gaudi2_device *gaudi2 = hdev->asic_specific; 11573 u64 val; 11574 11575 if (hdev->reset_info.hard_reset_pending) 11576 return U64_MAX; 11577 11578 val = readq(hdev->pcie_bar[DRAM_BAR_ID] + (addr - gaudi2->dram_bar_cur_addr)); 11579 11580 return val; 11581 } 11582 11583 static void gaudi2_write_pte(struct hl_device *hdev, u64 addr, u64 val) 11584 { 11585 struct gaudi2_device *gaudi2 = hdev->asic_specific; 11586 11587 if (hdev->reset_info.hard_reset_pending) 11588 return; 11589 11590 writeq(val, hdev->pcie_bar[DRAM_BAR_ID] + (addr - gaudi2->dram_bar_cur_addr)); 11591 } 11592 11593 static const struct hl_asic_funcs gaudi2_funcs = { 11594 .early_init = gaudi2_early_init, 11595 .early_fini = gaudi2_early_fini, 11596 .late_init = gaudi2_late_init, 11597 .late_fini = gaudi2_late_fini, 11598 .sw_init = gaudi2_sw_init, 11599 .sw_fini = gaudi2_sw_fini, 11600 .hw_init = gaudi2_hw_init, 11601 .hw_fini = gaudi2_hw_fini, 11602 .halt_engines = gaudi2_halt_engines, 11603 .suspend = gaudi2_suspend, 11604 .resume = gaudi2_resume, 11605 .mmap = gaudi2_mmap, 11606 .ring_doorbell = gaudi2_ring_doorbell, 11607 .pqe_write = gaudi2_pqe_write, 11608 .asic_dma_alloc_coherent = gaudi2_dma_alloc_coherent, 11609 .asic_dma_free_coherent = gaudi2_dma_free_coherent, 11610 .scrub_device_mem = gaudi2_scrub_device_mem, 11611 .scrub_device_dram = gaudi2_scrub_device_dram, 11612 .get_int_queue_base = NULL, 11613 .test_queues = gaudi2_test_queues, 11614 .asic_dma_pool_zalloc = gaudi2_dma_pool_zalloc, 11615 .asic_dma_pool_free = gaudi2_dma_pool_free, 11616 .cpu_accessible_dma_pool_alloc = gaudi2_cpu_accessible_dma_pool_alloc, 11617 .cpu_accessible_dma_pool_free = gaudi2_cpu_accessible_dma_pool_free, 11618 .dma_unmap_sgtable = 
hl_asic_dma_unmap_sgtable, 11619 .cs_parser = gaudi2_cs_parser, 11620 .dma_map_sgtable = hl_asic_dma_map_sgtable, 11621 .add_end_of_cb_packets = NULL, 11622 .update_eq_ci = gaudi2_update_eq_ci, 11623 .context_switch = gaudi2_context_switch, 11624 .restore_phase_topology = gaudi2_restore_phase_topology, 11625 .debugfs_read_dma = gaudi2_debugfs_read_dma, 11626 .add_device_attr = gaudi2_add_device_attr, 11627 .handle_eqe = gaudi2_handle_eqe, 11628 .get_events_stat = gaudi2_get_events_stat, 11629 .read_pte = gaudi2_read_pte, 11630 .write_pte = gaudi2_write_pte, 11631 .mmu_invalidate_cache = gaudi2_mmu_invalidate_cache, 11632 .mmu_invalidate_cache_range = gaudi2_mmu_invalidate_cache_range, 11633 .mmu_prefetch_cache_range = NULL, 11634 .send_heartbeat = gaudi2_send_heartbeat, 11635 .debug_coresight = gaudi2_debug_coresight, 11636 .is_device_idle = gaudi2_is_device_idle, 11637 .compute_reset_late_init = gaudi2_compute_reset_late_init, 11638 .hw_queues_lock = gaudi2_hw_queues_lock, 11639 .hw_queues_unlock = gaudi2_hw_queues_unlock, 11640 .get_pci_id = gaudi2_get_pci_id, 11641 .get_eeprom_data = gaudi2_get_eeprom_data, 11642 .get_monitor_dump = gaudi2_get_monitor_dump, 11643 .send_cpu_message = gaudi2_send_cpu_message, 11644 .pci_bars_map = gaudi2_pci_bars_map, 11645 .init_iatu = gaudi2_init_iatu, 11646 .rreg = hl_rreg, 11647 .wreg = hl_wreg, 11648 .halt_coresight = gaudi2_halt_coresight, 11649 .ctx_init = gaudi2_ctx_init, 11650 .ctx_fini = gaudi2_ctx_fini, 11651 .pre_schedule_cs = gaudi2_pre_schedule_cs, 11652 .get_queue_id_for_cq = gaudi2_get_queue_id_for_cq, 11653 .load_firmware_to_device = NULL, 11654 .load_boot_fit_to_device = NULL, 11655 .get_signal_cb_size = gaudi2_get_signal_cb_size, 11656 .get_wait_cb_size = gaudi2_get_wait_cb_size, 11657 .gen_signal_cb = gaudi2_gen_signal_cb, 11658 .gen_wait_cb = gaudi2_gen_wait_cb, 11659 .reset_sob = gaudi2_reset_sob, 11660 .reset_sob_group = gaudi2_reset_sob_group, 11661 .get_device_time = gaudi2_get_device_time, 11662 .pb_print_security_errors = gaudi2_pb_print_security_errors, 11663 .collective_wait_init_cs = gaudi2_collective_wait_init_cs, 11664 .collective_wait_create_jobs = gaudi2_collective_wait_create_jobs, 11665 .get_dec_base_addr = gaudi2_get_dec_base_addr, 11666 .scramble_addr = gaudi2_mmu_scramble_addr, 11667 .descramble_addr = gaudi2_mmu_descramble_addr, 11668 .ack_protection_bits_errors = gaudi2_ack_protection_bits_errors, 11669 .get_hw_block_id = gaudi2_get_hw_block_id, 11670 .hw_block_mmap = gaudi2_block_mmap, 11671 .enable_events_from_fw = gaudi2_enable_events_from_fw, 11672 .ack_mmu_errors = gaudi2_ack_mmu_page_fault_or_access_error, 11673 .get_msi_info = gaudi2_get_msi_info, 11674 .map_pll_idx_to_fw_idx = gaudi2_map_pll_idx_to_fw_idx, 11675 .init_firmware_preload_params = gaudi2_init_firmware_preload_params, 11676 .init_firmware_loader = gaudi2_init_firmware_loader, 11677 .init_cpu_scrambler_dram = gaudi2_init_scrambler_hbm, 11678 .state_dump_init = gaudi2_state_dump_init, 11679 .get_sob_addr = &gaudi2_get_sob_addr, 11680 .set_pci_memory_regions = gaudi2_set_pci_memory_regions, 11681 .get_stream_master_qid_arr = gaudi2_get_stream_master_qid_arr, 11682 .check_if_razwi_happened = gaudi2_check_if_razwi_happened, 11683 .mmu_get_real_page_size = gaudi2_mmu_get_real_page_size, 11684 .access_dev_mem = hl_access_dev_mem, 11685 .set_dram_bar_base = gaudi2_set_hbm_bar_base, 11686 .set_engine_cores = gaudi2_set_engine_cores, 11687 .set_engines = gaudi2_set_engines, 11688 .send_device_activity = gaudi2_send_device_activity, 11689 
.set_dram_properties = gaudi2_set_dram_properties, 11690 .set_binning_masks = gaudi2_set_binning_masks, 11691 }; 11692 11693 void gaudi2_set_asic_funcs(struct hl_device *hdev) 11694 { 11695 hdev->asic_funcs = &gaudi2_funcs; 11696 } 11697