/*
 * Copyright 2025 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */
#include "amdgpu.h"
#include "soc15.h"
#include "soc15_common.h"
#include "soc_v1_0.h"
#include "amdgpu_ip.h"
#include "amdgpu_imu.h"
#include "gfxhub_v12_1.h"
#include "sdma_v7_1.h"
#include "gfx_v12_1.h"

#include "gc/gc_12_1_0_offset.h"
#include "gc/gc_12_1_0_sh_mask.h"
#include "mp/mp_15_0_8_offset.h"

#define XCC_REG_RANGE_0_LOW  0x1260	/* XCC gfxdec0 lower bound */
#define XCC_REG_RANGE_0_HIGH 0x3C00	/* XCC gfxdec0 upper bound */
#define XCC_REG_RANGE_1_LOW  0xA000	/* XCC gfxdec1 lower bound */
#define XCC_REG_RANGE_1_HIGH 0x10000	/* XCC gfxdec1 upper bound */
#define NORMALIZE_XCC_REG_OFFSET(offset) \
	(offset & 0xFFFF)

/* Initialize the doorbells used by amdgpu, including multimedia.
 * KFD can use all the rest of the 2M doorbell BAR.
 */
static void soc_v1_0_doorbell_index_init(struct amdgpu_device *adev)
{
	int i;

	adev->doorbell_index.kiq = AMDGPU_SOC_V1_0_DOORBELL_KIQ_START;

	adev->doorbell_index.mec_ring0 = AMDGPU_SOC_V1_0_DOORBELL_MEC_RING_START;
	adev->doorbell_index.mes_ring0 = AMDGPU_SOC_V1_0_DOORBELL_MES_RING0;
	adev->doorbell_index.mes_ring1 = AMDGPU_SOC_V1_0_DOORBELL_MES_RING1;

	adev->doorbell_index.userqueue_start = AMDGPU_SOC_V1_0_DOORBELL_USERQUEUE_START;
	adev->doorbell_index.userqueue_end = AMDGPU_SOC_V1_0_DOORBELL_USERQUEUE_END;
	adev->doorbell_index.xcc_doorbell_range = AMDGPU_SOC_V1_0_DOORBELL_XCC_RANGE;
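
	/* Each SDMA engine below is spaced half of sdma_doorbell_range
	 * (20 >> 1 = 10) doorbell indices apart: engine 0 starts at
	 * AMDGPU_SOC_V1_0_DOORBELL_sDMA_ENGINE_START, engine 1 ten indices
	 * later, and so on.
	 */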
	adev->doorbell_index.sdma_doorbell_range = 20;
	for (i = 0; i < adev->sdma.num_instances; i++)
		adev->doorbell_index.sdma_engine[i] =
			AMDGPU_SOC_V1_0_DOORBELL_sDMA_ENGINE_START +
			i * (adev->doorbell_index.sdma_doorbell_range >> 1);

	adev->doorbell_index.ih = AMDGPU_SOC_V1_0_DOORBELL_IH;
	adev->doorbell_index.vcn.vcn_ring0_1 = AMDGPU_SOC_V1_0_DOORBELL_VCN_START;

	adev->doorbell_index.first_non_cp = AMDGPU_SOC_V1_0_DOORBELL_FIRST_NON_CP;
	adev->doorbell_index.last_non_cp = AMDGPU_SOC_V1_0_DOORBELL_LAST_NON_CP;

	adev->doorbell_index.max_assignment = AMDGPU_SOC_V1_0_DOORBELL_MAX_ASSIGNMENT << 1;
}

/* Fixed pattern for the upper 32 bits of SMN addressing.
 * bit[47:40]: socket ID
 * bit[39:34]: die ID
 * bit[32]: local or remote die in the same socket
 * The ext_id is composed of the socket ID and die ID:
 * ext_id = (socket_id << 6) | (die_id)
 */
u64 soc_v1_0_encode_ext_smn_addressing(int ext_id)
{
	u64 ext_offset;
	int socket_id, die_id;

	/* local die routing for MID0 on the local socket */
	if (ext_id == 0)
		return 0;

	die_id = ext_id & 0x3;
	socket_id = (ext_id >> 6) & 0xff;

	/* Initiated from the host, accessing non-MID0 is cross-die traffic */
	if (socket_id == 0)
		ext_offset = ((u64)die_id << 34) | (1ULL << 32);
	else if (socket_id != 0 && die_id != 0)
		ext_offset = ((u64)socket_id << 40) | ((u64)die_id << 34) |
			     (3ULL << 32);
	else
		ext_offset = ((u64)socket_id << 40) | (1ULL << 33);

	return ext_offset;
}
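
/* Example encodings, derived from the cases above (illustrative ext_id
 * values): ext_id 0x42 (socket 1, die 2) encodes to
 * (1ULL << 40) | (2ULL << 34) | (3ULL << 32); ext_id 0x1 (socket 0, die 1)
 * encodes to (1ULL << 34) | (1ULL << 32).
 */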

static u32 soc_v1_0_get_config_memsize(struct amdgpu_device *adev)
{
	return adev->nbio.funcs->get_memsize(adev);
}

static u32 soc_v1_0_get_xclk(struct amdgpu_device *adev)
{
	return adev->clock.spll.reference_freq;
}

void soc_v1_0_grbm_select(struct amdgpu_device *adev,
			  u32 me, u32 pipe,
			  u32 queue, u32 vmid,
			  int xcc_id)
{
	u32 grbm_gfx_cntl = 0;

	grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, PIPEID, pipe);
	grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, MEID, me);
	grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, VMID, vmid);
	grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, QUEUEID, queue);

	WREG32_SOC15_RLC_SHADOW(GC, xcc_id, regGRBM_GFX_CNTL, grbm_gfx_cntl);
}

static struct soc15_allowed_register_entry soc_v1_0_allowed_read_registers[] = {
	{ SOC15_REG_ENTRY(GC, 0, regGRBM_STATUS) },
	{ SOC15_REG_ENTRY(GC, 0, regGRBM_STATUS2) },
	{ SOC15_REG_ENTRY(GC, 0, regGRBM_STATUS3) },
	{ SOC15_REG_ENTRY(GC, 0, regGRBM_STATUS_SE0) },
	{ SOC15_REG_ENTRY(GC, 0, regGRBM_STATUS_SE1) },
	{ SOC15_REG_ENTRY(GC, 0, regCP_STAT) },
	{ SOC15_REG_ENTRY(GC, 0, regCP_STALLED_STAT1) },
	{ SOC15_REG_ENTRY(GC, 0, regCP_STALLED_STAT2) },
	{ SOC15_REG_ENTRY(GC, 0, regCP_STALLED_STAT3) },
	{ SOC15_REG_ENTRY(GC, 0, regCP_CPF_BUSY_STAT) },
	{ SOC15_REG_ENTRY(GC, 0, regCP_CPF_STALLED_STAT1) },
	{ SOC15_REG_ENTRY(GC, 0, regCP_CPF_STATUS) },
	{ SOC15_REG_ENTRY(GC, 0, regCP_CPC_BUSY_STAT) },
	{ SOC15_REG_ENTRY(GC, 0, regCP_CPC_STALLED_STAT1) },
	{ SOC15_REG_ENTRY(GC, 0, regCP_CPC_STATUS) },
	{ SOC15_REG_ENTRY(GC, 0, regGB_ADDR_CONFIG_1) },
};

static uint32_t soc_v1_0_read_indexed_register(struct amdgpu_device *adev,
					       u32 se_num,
					       u32 sh_num,
					       u32 reg_offset)
{
	uint32_t val;

	mutex_lock(&adev->grbm_idx_mutex);
	if (se_num != 0xffffffff || sh_num != 0xffffffff)
		amdgpu_gfx_select_se_sh(adev, se_num, sh_num, 0xffffffff, 0);

	val = RREG32(reg_offset);

	if (se_num != 0xffffffff || sh_num != 0xffffffff)
		amdgpu_gfx_select_se_sh(adev, 0xffffffff, 0xffffffff, 0xffffffff, 0);
	mutex_unlock(&adev->grbm_idx_mutex);
	return val;
}

static uint32_t soc_v1_0_get_register_value(struct amdgpu_device *adev,
					    bool indexed, u32 se_num,
					    u32 sh_num, u32 reg_offset)
{
	if (indexed) {
		return soc_v1_0_read_indexed_register(adev, se_num, sh_num, reg_offset);
	} else {
		if (reg_offset == SOC15_REG_OFFSET(GC, 0, regGB_ADDR_CONFIG_1) &&
		    adev->gfx.config.gb_addr_config)
			return adev->gfx.config.gb_addr_config;
		return RREG32(reg_offset);
	}
}

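/* soc_v1_0_read_register() is the asic_funcs->read_register hook, typically
 * reached from the AMDGPU_INFO ioctl's register-read path. A requested
 * offset is accepted only if it equals
 * adev->reg_offset[hwip][inst][seg] + reg_offset for one of the allowed
 * entries above; anything else returns -EINVAL.
 */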
static int soc_v1_0_read_register(struct amdgpu_device *adev,
				  u32 se_num, u32 sh_num,
				  u32 reg_offset, u32 *value)
{
	uint32_t i;
	struct soc15_allowed_register_entry *en;

	*value = 0;
	for (i = 0; i < ARRAY_SIZE(soc_v1_0_allowed_read_registers); i++) {
		en = &soc_v1_0_allowed_read_registers[i];
		if (!adev->reg_offset[en->hwip][en->inst])
			continue;
		else if (reg_offset != (adev->reg_offset[en->hwip][en->inst][en->seg]
					+ en->reg_offset))
			continue;

		*value = soc_v1_0_get_register_value(adev,
				soc_v1_0_allowed_read_registers[i].grbm_indexed,
				se_num, sh_num, reg_offset);
		return 0;
	}
	return -EINVAL;
}

static bool soc_v1_0_need_full_reset(struct amdgpu_device *adev)
{
	switch (amdgpu_ip_version(adev, GC_HWIP, 0)) {
	case IP_VERSION(12, 1, 0):
	default:
		return true;
	}
}

static bool soc_v1_0_need_reset_on_init(struct amdgpu_device *adev)
{
	u32 sol_reg;

	if (adev->flags & AMD_IS_APU)
		return false;

	/* Check the sOS sign-of-life register to confirm that the sys driver
	 * and sOS have already been loaded.
	 */
	sol_reg = RREG32_SOC15(MP0, 0, regMPASP_SMN_C2PMSG_81);
	if (sol_reg)
		return true;

	return false;
}

static int soc_v1_0_asic_reset(struct amdgpu_device *adev)
{
	return 0;
}

static const struct amdgpu_asic_funcs soc_v1_0_asic_funcs = {
	.read_bios_from_rom = &amdgpu_soc15_read_bios_from_rom,
	.read_register = &soc_v1_0_read_register,
	.get_config_memsize = &soc_v1_0_get_config_memsize,
	.get_xclk = &soc_v1_0_get_xclk,
	.need_full_reset = &soc_v1_0_need_full_reset,
	.init_doorbell_index = &soc_v1_0_doorbell_index_init,
	.need_reset_on_init = &soc_v1_0_need_reset_on_init,
	.encode_ext_smn_addressing = &soc_v1_0_encode_ext_smn_addressing,
	.reset = soc_v1_0_asic_reset,
};

static int soc_v1_0_common_early_init(struct amdgpu_ip_block *ip_block)
{
	struct amdgpu_device *adev = ip_block->adev;

	adev->smc_rreg = NULL;
	adev->smc_wreg = NULL;
	adev->pcie_rreg = &amdgpu_device_indirect_rreg;
	adev->pcie_wreg = &amdgpu_device_indirect_wreg;
	adev->pcie_rreg_ext = &amdgpu_device_indirect_rreg_ext;
	adev->pcie_wreg_ext = &amdgpu_device_indirect_wreg_ext;
	adev->pcie_rreg64 = &amdgpu_device_indirect_rreg64;
	adev->pcie_wreg64 = &amdgpu_device_indirect_wreg64;
	adev->pciep_rreg = amdgpu_device_pcie_port_rreg;
	adev->pciep_wreg = amdgpu_device_pcie_port_wreg;
	adev->pcie_rreg64_ext = &amdgpu_device_indirect_rreg64_ext;
	adev->pcie_wreg64_ext = &amdgpu_device_indirect_wreg64_ext;
	adev->uvd_ctx_rreg = NULL;
	adev->uvd_ctx_wreg = NULL;
	adev->didt_rreg = NULL;
	adev->didt_wreg = NULL;

	adev->asic_funcs = &soc_v1_0_asic_funcs;

	adev->rev_id = amdgpu_device_get_rev_id(adev);
	adev->external_rev_id = 0xff;

	switch (amdgpu_ip_version(adev, GC_HWIP, 0)) {
	case IP_VERSION(12, 1, 0):
		adev->cg_flags = 0;
		adev->pg_flags = 0;
		adev->external_rev_id = adev->rev_id + 0x50;
		break;
	default:
		/* FIXME: not supported yet */
		return -EINVAL;
	}

	return 0;
}

static int soc_v1_0_common_late_init(struct amdgpu_ip_block *ip_block)
{
	struct amdgpu_device *adev = ip_block->adev;

	/* Enable the self-ring doorbell aperture late because the doorbell
	 * BAR aperture will change if BAR resizing succeeds in gmc sw_init.
	 */
	adev->nbio.funcs->enable_doorbell_selfring_aperture(adev, true);

	return 0;
}

static int soc_v1_0_common_sw_init(struct amdgpu_ip_block *ip_block)
{
	return 0;
}

static int soc_v1_0_common_hw_init(struct amdgpu_ip_block *ip_block)
{
	struct amdgpu_device *adev = ip_block->adev;

	/* enable the doorbell aperture */
	adev->nbio.funcs->enable_doorbell_aperture(adev, true);

	return 0;
}

static int soc_v1_0_common_hw_fini(struct amdgpu_ip_block *ip_block)
{
	struct amdgpu_device *adev = ip_block->adev;

	adev->nbio.funcs->enable_doorbell_aperture(adev, false);
	adev->nbio.funcs->enable_doorbell_selfring_aperture(adev, false);

	return 0;
}

static int soc_v1_0_common_suspend(struct amdgpu_ip_block *ip_block)
{
	return soc_v1_0_common_hw_fini(ip_block);
}

static int soc_v1_0_common_resume(struct amdgpu_ip_block *ip_block)
{
	return soc_v1_0_common_hw_init(ip_block);
}

static bool soc_v1_0_common_is_idle(struct amdgpu_ip_block *ip_block)
{
	return true;
}

static int soc_v1_0_common_set_clockgating_state(struct amdgpu_ip_block *ip_block,
						 enum amd_clockgating_state state)
{
	return 0;
}

static int soc_v1_0_common_set_powergating_state(struct amdgpu_ip_block *ip_block,
						 enum amd_powergating_state state)
{
	return 0;
}

static void soc_v1_0_common_get_clockgating_state(struct amdgpu_ip_block *ip_block,
						  u64 *flags)
{
	return;
}

static const struct amd_ip_funcs soc_v1_0_common_ip_funcs = {
	.name = "soc_v1_0_common",
	.early_init = soc_v1_0_common_early_init,
	.late_init = soc_v1_0_common_late_init,
	.sw_init = soc_v1_0_common_sw_init,
	.hw_init = soc_v1_0_common_hw_init,
	.hw_fini = soc_v1_0_common_hw_fini,
	.suspend = soc_v1_0_common_suspend,
	.resume = soc_v1_0_common_resume,
	.is_idle = soc_v1_0_common_is_idle,
	.set_clockgating_state = soc_v1_0_common_set_clockgating_state,
	.set_powergating_state = soc_v1_0_common_set_powergating_state,
	.get_clockgating_state = soc_v1_0_common_get_clockgating_state,
};

const struct amdgpu_ip_block_version soc_v1_0_common_ip_block = {
	.type = AMD_IP_BLOCK_TYPE_COMMON,
	.major = 1,
	.minor = 0,
	.rev = 0,
	.funcs = &soc_v1_0_common_ip_funcs,
};

static enum amdgpu_gfx_partition __soc_v1_0_calc_xcp_mode(struct amdgpu_xcp_mgr *xcp_mgr)
{
	struct amdgpu_device *adev = xcp_mgr->adev;
	int num_xcc, num_xcc_per_xcp = 0, mode = 0;

	num_xcc = NUM_XCC(xcp_mgr->adev->gfx.xcc_mask);
	if (adev->gfx.funcs &&
	    adev->gfx.funcs->get_xccs_per_xcp)
		num_xcc_per_xcp = adev->gfx.funcs->get_xccs_per_xcp(adev);
	if ((num_xcc_per_xcp) && (num_xcc % num_xcc_per_xcp == 0))
		mode = num_xcc / num_xcc_per_xcp;

	if (num_xcc_per_xcp == 1)
		return AMDGPU_CPX_PARTITION_MODE;

	switch (mode) {
	case 1:
		return AMDGPU_SPX_PARTITION_MODE;
	case 2:
		return AMDGPU_DPX_PARTITION_MODE;
	case 3:
		return AMDGPU_TPX_PARTITION_MODE;
	case 4:
		return AMDGPU_QPX_PARTITION_MODE;
	default:
		return AMDGPU_UNKNOWN_COMPUTE_PARTITION_MODE;
	}

	return AMDGPU_UNKNOWN_COMPUTE_PARTITION_MODE;
}

static int soc_v1_0_query_partition_mode(struct amdgpu_xcp_mgr *xcp_mgr)
{
	enum amdgpu_gfx_partition derv_mode, mode;
	struct amdgpu_device *adev = xcp_mgr->adev;

	mode = AMDGPU_UNKNOWN_COMPUTE_PARTITION_MODE;
	derv_mode = __soc_v1_0_calc_xcp_mode(xcp_mgr);

	if (amdgpu_sriov_vf(adev) || !adev->psp.funcs)
		return derv_mode;

	if (adev->nbio.funcs &&
	    adev->nbio.funcs->get_compute_partition_mode) {
		mode = adev->nbio.funcs->get_compute_partition_mode(adev);
		if (mode != derv_mode)
			dev_warn(adev->dev,
				 "Mismatch in compute partition mode - reported : %d derived : %d",
				 mode, derv_mode);
	}

	return mode;
}

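/* Partition mode to XCCs-per-partition mapping (illustrative, assuming
 * 8 XCCs): SPX keeps all 8 XCCs in one partition, DPX gives 4 per
 * partition, QPX gives 2 and CPX gives 1; TPX only applies when the XCC
 * count is divisible by 3.
 */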
static int __soc_v1_0_get_xcc_per_xcp(struct amdgpu_xcp_mgr *xcp_mgr, int mode)
{
	int num_xcc, num_xcc_per_xcp = 0;

	num_xcc = NUM_XCC(xcp_mgr->adev->gfx.xcc_mask);

	switch (mode) {
	case AMDGPU_SPX_PARTITION_MODE:
		num_xcc_per_xcp = num_xcc;
		break;
	case AMDGPU_DPX_PARTITION_MODE:
		num_xcc_per_xcp = num_xcc / 2;
		break;
	case AMDGPU_TPX_PARTITION_MODE:
		num_xcc_per_xcp = num_xcc / 3;
		break;
	case AMDGPU_QPX_PARTITION_MODE:
		num_xcc_per_xcp = num_xcc / 4;
		break;
	case AMDGPU_CPX_PARTITION_MODE:
		num_xcc_per_xcp = 1;
		break;
	}

	return num_xcc_per_xcp;
}

static int __soc_v1_0_get_xcp_ip_info(struct amdgpu_xcp_mgr *xcp_mgr, int xcp_id,
				      enum AMDGPU_XCP_IP_BLOCK ip_id,
				      struct amdgpu_xcp_ip *ip)
{
	struct amdgpu_device *adev = xcp_mgr->adev;
	int num_sdma, num_vcn, num_shared_vcn, num_xcp;
	int num_xcc_xcp, num_sdma_xcp, num_vcn_xcp;

	num_sdma = adev->sdma.num_instances;
	num_vcn = adev->vcn.num_vcn_inst;
	num_shared_vcn = 1;

	num_xcc_xcp = adev->gfx.num_xcc_per_xcp;
	num_xcp = NUM_XCC(adev->gfx.xcc_mask) / num_xcc_xcp;

	switch (xcp_mgr->mode) {
	case AMDGPU_SPX_PARTITION_MODE:
	case AMDGPU_DPX_PARTITION_MODE:
	case AMDGPU_TPX_PARTITION_MODE:
	case AMDGPU_QPX_PARTITION_MODE:
	case AMDGPU_CPX_PARTITION_MODE:
		num_sdma_xcp = DIV_ROUND_UP(num_sdma, num_xcp);
		num_vcn_xcp = DIV_ROUND_UP(num_vcn, num_xcp);
		break;
	default:
		return -EINVAL;
	}

	if (num_vcn && num_xcp > num_vcn)
		num_shared_vcn = num_xcp / num_vcn;

	switch (ip_id) {
	case AMDGPU_XCP_GFXHUB:
		ip->inst_mask = XCP_INST_MASK(num_xcc_xcp, xcp_id);
		ip->ip_funcs = &gfxhub_v12_1_xcp_funcs;
		break;
	case AMDGPU_XCP_GFX:
		ip->inst_mask = XCP_INST_MASK(num_xcc_xcp, xcp_id);
		ip->ip_funcs = &gfx_v12_1_xcp_funcs;
		break;
	case AMDGPU_XCP_SDMA:
		ip->inst_mask = XCP_INST_MASK(num_sdma_xcp, xcp_id);
		ip->ip_funcs = &sdma_v7_1_xcp_funcs;
		break;
	case AMDGPU_XCP_VCN:
		ip->inst_mask =
			XCP_INST_MASK(num_vcn_xcp, xcp_id / num_shared_vcn);
		/* TODO : Assign IP funcs */
		break;
	default:
		return -EINVAL;
	}

	ip->ip_id = ip_id;

	return 0;
}

static int soc_v1_0_get_xcp_res_info(struct amdgpu_xcp_mgr *xcp_mgr,
				     int mode,
				     struct amdgpu_xcp_cfg *xcp_cfg)
{
	struct amdgpu_device *adev = xcp_mgr->adev;
	int max_res[AMDGPU_XCP_RES_MAX] = {};
	bool res_lt_xcp;
	int num_xcp, i;
	u16 nps_modes;

	if (!(xcp_mgr->supp_xcp_modes & BIT(mode)))
		return -EINVAL;

	max_res[AMDGPU_XCP_RES_XCC] = NUM_XCC(adev->gfx.xcc_mask);
	max_res[AMDGPU_XCP_RES_DMA] = adev->sdma.num_instances;
	max_res[AMDGPU_XCP_RES_DEC] = adev->vcn.num_vcn_inst;
	max_res[AMDGPU_XCP_RES_JPEG] = adev->jpeg.num_jpeg_inst;

	switch (mode) {
	case AMDGPU_SPX_PARTITION_MODE:
		num_xcp = 1;
		nps_modes = BIT(AMDGPU_NPS1_PARTITION_MODE);
		break;
	case AMDGPU_DPX_PARTITION_MODE:
		num_xcp = 2;
		nps_modes = BIT(AMDGPU_NPS1_PARTITION_MODE);
		break;
	case AMDGPU_TPX_PARTITION_MODE:
		num_xcp = 3;
		nps_modes = BIT(AMDGPU_NPS1_PARTITION_MODE) |
			    BIT(AMDGPU_NPS4_PARTITION_MODE);
		break;
	case AMDGPU_QPX_PARTITION_MODE:
		num_xcp = 4;
		nps_modes = BIT(AMDGPU_NPS1_PARTITION_MODE) |
			    BIT(AMDGPU_NPS4_PARTITION_MODE);
		break;
	case AMDGPU_CPX_PARTITION_MODE:
		num_xcp = NUM_XCC(adev->gfx.xcc_mask);
		nps_modes = BIT(AMDGPU_NPS1_PARTITION_MODE) |
			    BIT(AMDGPU_NPS4_PARTITION_MODE);
		break;
	default:
		return -EINVAL;
	}

	xcp_cfg->compatible_nps_modes =
		(adev->gmc.supported_nps_modes & nps_modes);
	xcp_cfg->num_res = ARRAY_SIZE(max_res);
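
	/* Split each resource across partitions: num_inst is max_res / num_xcp,
	 * floored at 1, and num_shared records how many partitions share one
	 * instance when there are fewer instances than partitions. For example
	 * (illustrative counts), 4 VCN instances in CPX mode with 8 partitions
	 * give num_inst = 1 and num_shared = 2. JPEG is counted per ring.
	 */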
	for (i = 0; i < xcp_cfg->num_res; i++) {
		res_lt_xcp = max_res[i] < num_xcp;
		xcp_cfg->xcp_res[i].id = i;
		xcp_cfg->xcp_res[i].num_inst =
			res_lt_xcp ? 1 : max_res[i] / num_xcp;
		xcp_cfg->xcp_res[i].num_inst =
			i == AMDGPU_XCP_RES_JPEG ?
			xcp_cfg->xcp_res[i].num_inst *
			adev->jpeg.num_jpeg_rings : xcp_cfg->xcp_res[i].num_inst;
		xcp_cfg->xcp_res[i].num_shared =
			res_lt_xcp ? num_xcp / max_res[i] : 1;
	}

	return 0;
}

static enum amdgpu_gfx_partition __soc_v1_0_get_auto_mode(struct amdgpu_xcp_mgr *xcp_mgr)
{
	struct amdgpu_device *adev = xcp_mgr->adev;
	int num_xcc;

	num_xcc = NUM_XCC(xcp_mgr->adev->gfx.xcc_mask);

	if (adev->gmc.num_mem_partitions == 1)
		return AMDGPU_SPX_PARTITION_MODE;

	if (adev->gmc.num_mem_partitions == num_xcc)
		return AMDGPU_CPX_PARTITION_MODE;

	if (adev->gmc.num_mem_partitions == 2)
		return AMDGPU_DPX_PARTITION_MODE;

	return AMDGPU_UNKNOWN_COMPUTE_PARTITION_MODE;
}

static bool __soc_v1_0_is_valid_mode(struct amdgpu_xcp_mgr *xcp_mgr,
				     enum amdgpu_gfx_partition mode)
{
	struct amdgpu_device *adev = xcp_mgr->adev;
	int num_xcc, num_xccs_per_xcp;

	num_xcc = NUM_XCC(adev->gfx.xcc_mask);
	switch (mode) {
	case AMDGPU_SPX_PARTITION_MODE:
		return adev->gmc.num_mem_partitions == 1 && num_xcc > 0;
	case AMDGPU_DPX_PARTITION_MODE:
		return adev->gmc.num_mem_partitions <= 2 && (num_xcc % 4) == 0;
	case AMDGPU_TPX_PARTITION_MODE:
		return (adev->gmc.num_mem_partitions == 1 ||
			adev->gmc.num_mem_partitions == 3) &&
		       ((num_xcc % 3) == 0);
	case AMDGPU_QPX_PARTITION_MODE:
		num_xccs_per_xcp = num_xcc / 4;
		return (adev->gmc.num_mem_partitions == 1 ||
			adev->gmc.num_mem_partitions == 4) &&
		       (num_xccs_per_xcp >= 2);
	case AMDGPU_CPX_PARTITION_MODE:
		/* (num_xcc > 1) because 1 XCC is considered SPX, not CPX.
		 * (num_xcc % adev->gmc.num_mem_partitions) == 0 because
		 * num_compute_partitions can't be less than num_mem_partitions.
		 */
		return ((num_xcc > 1) &&
			(num_xcc % adev->gmc.num_mem_partitions) == 0);
	default:
		return false;
	}

	return false;
}

static void __soc_v1_0_update_available_partition_mode(struct amdgpu_xcp_mgr *xcp_mgr)
{
	int mode;

	xcp_mgr->avail_xcp_modes = 0;

	for_each_inst(mode, xcp_mgr->supp_xcp_modes) {
		if (__soc_v1_0_is_valid_mode(xcp_mgr, mode))
			xcp_mgr->avail_xcp_modes |= BIT(mode);
	}
}

static int soc_v1_0_switch_partition_mode(struct amdgpu_xcp_mgr *xcp_mgr,
					  int mode, int *num_xcps)
{
	int num_xcc_per_xcp, num_xcc, ret;
	struct amdgpu_device *adev;
	u32 flags = 0;

	adev = xcp_mgr->adev;
	num_xcc = NUM_XCC(adev->gfx.xcc_mask);

	if (mode == AMDGPU_AUTO_COMPUTE_PARTITION_MODE) {
		mode = __soc_v1_0_get_auto_mode(xcp_mgr);
		if (mode == AMDGPU_UNKNOWN_COMPUTE_PARTITION_MODE) {
			dev_err(adev->dev,
				"Invalid config, no compatible compute partition mode found, available memory partitions: %d",
				adev->gmc.num_mem_partitions);
			return -EINVAL;
		}
	} else if (!__soc_v1_0_is_valid_mode(xcp_mgr, mode)) {
		dev_err(adev->dev,
			"Invalid compute partition mode requested, requested: %s, available memory partitions: %d",
			amdgpu_gfx_compute_mode_desc(mode), adev->gmc.num_mem_partitions);
		return -EINVAL;
	}

	if (adev->kfd.init_complete && !amdgpu_in_reset(adev))
		flags |= AMDGPU_XCP_OPS_KFD;

	if (flags & AMDGPU_XCP_OPS_KFD) {
		ret = amdgpu_amdkfd_check_and_lock_kfd(adev);
		if (ret)
			goto out;
	}

	ret = amdgpu_xcp_pre_partition_switch(xcp_mgr, flags);
	if (ret)
		goto unlock;

	num_xcc_per_xcp = __soc_v1_0_get_xcc_per_xcp(xcp_mgr, mode);
	if (adev->gfx.imu.funcs &&
	    adev->gfx.imu.funcs->switch_compute_partition) {
		ret = adev->gfx.imu.funcs->switch_compute_partition(xcp_mgr->adev, num_xcc_per_xcp, mode);
		if (ret)
			goto unlock;
	}
	if (adev->gfx.imu.funcs &&
	    adev->gfx.imu.funcs->init_mcm_addr_lut &&
	    amdgpu_emu_mode)
		adev->gfx.imu.funcs->init_mcm_addr_lut(adev);

	/* Init info about new xcps */
	*num_xcps = num_xcc / num_xcc_per_xcp;
	amdgpu_xcp_init(xcp_mgr, *num_xcps, mode);

	ret = amdgpu_xcp_post_partition_switch(xcp_mgr, flags);
	if (!ret)
		__soc_v1_0_update_available_partition_mode(xcp_mgr);
unlock:
	if (flags & AMDGPU_XCP_OPS_KFD)
		amdgpu_amdkfd_unlock_kfd(adev);
out:
	return ret;
}

#ifdef HAVE_ACPI_DEV_GET_FIRST_MATCH_DEV
static int __soc_v1_0_get_xcp_mem_id(struct amdgpu_device *adev,
				     int xcc_id, uint8_t *mem_id)
{
	/* memory/spatial modes validation check is already done */
	*mem_id = xcc_id / adev->gfx.num_xcc_per_xcp;
	*mem_id /= adev->xcp_mgr->num_xcp_per_mem_partition;

	return 0;
}

static int soc_v1_0_get_xcp_mem_id(struct amdgpu_xcp_mgr *xcp_mgr,
				   struct amdgpu_xcp *xcp, uint8_t *mem_id)
{
	struct amdgpu_numa_info numa_info;
	struct amdgpu_device *adev;
	uint32_t xcc_mask;
	int r, i, xcc_id;

	adev = xcp_mgr->adev;
	/* TODO: BIOS is not returning the right info now
	 * Check on this later
	 */
	/*
	if (adev->gmc.gmc_funcs->query_mem_partition_mode)
		mode = adev->gmc.gmc_funcs->query_mem_partition_mode(adev);
	*/
	if (adev->gmc.num_mem_partitions == 1) {
		/* Only one range */
		*mem_id = 0;
		return 0;
	}

	r = amdgpu_xcp_get_inst_details(xcp, AMDGPU_XCP_GFX, &xcc_mask);
	if (r || !xcc_mask)
		return -EINVAL;

	xcc_id = ffs(xcc_mask) - 1;
	if (!adev->gmc.is_app_apu)
		return __soc_v1_0_get_xcp_mem_id(adev, xcc_id, mem_id);

	r = amdgpu_acpi_get_mem_info(adev, xcc_id, &numa_info);

	if (r)
		return r;

	r = -EINVAL;
	for (i = 0; i < adev->gmc.num_mem_partitions; ++i) {
		if (adev->gmc.mem_partitions[i].numa.node == numa_info.nid) {
			*mem_id = i;
			r = 0;
			break;
		}
	}

	return r;
}
#endif

static int soc_v1_0_get_xcp_ip_details(struct amdgpu_xcp_mgr *xcp_mgr, int xcp_id,
				       enum AMDGPU_XCP_IP_BLOCK ip_id,
				       struct amdgpu_xcp_ip *ip)
{
	if (!ip)
		return -EINVAL;

	return __soc_v1_0_get_xcp_ip_info(xcp_mgr, xcp_id, ip_id, ip);
}

struct amdgpu_xcp_mgr_funcs soc_v1_0_xcp_funcs = {
	.switch_partition_mode = &soc_v1_0_switch_partition_mode,
	.query_partition_mode = &soc_v1_0_query_partition_mode,
	.get_ip_details = &soc_v1_0_get_xcp_ip_details,
	.get_xcp_res_info = &soc_v1_0_get_xcp_res_info,
#ifdef HAVE_ACPI_DEV_GET_FIRST_MATCH_DEV
	.get_xcp_mem_id = &soc_v1_0_get_xcp_mem_id,
#endif
};

static int soc_v1_0_xcp_mgr_init(struct amdgpu_device *adev)
{
	int ret;

	if (amdgpu_sriov_vf(adev))
		soc_v1_0_xcp_funcs.switch_partition_mode = NULL;

	ret = amdgpu_xcp_mgr_init(adev, AMDGPU_UNKNOWN_COMPUTE_PARTITION_MODE,
				  1, &soc_v1_0_xcp_funcs);
	if (ret)
		return ret;

	amdgpu_xcp_update_supported_modes(adev->xcp_mgr);
	/* TODO: Default memory node affinity init */

	return ret;
}

int soc_v1_0_init_soc_config(struct amdgpu_device *adev)
{
	int ret, i;
	int xcc_inst_per_aid = 4;
	uint16_t xcc_mask;

	xcc_mask = adev->gfx.xcc_mask;
	adev->aid_mask = 0;
	for (i = 0; xcc_mask; xcc_mask >>= xcc_inst_per_aid, i++) {
		if (xcc_mask & ((1U << xcc_inst_per_aid) - 1))
			adev->aid_mask |= (1 << i);
	}

	adev->sdma.num_inst_per_xcc = 2;
	adev->sdma.num_instances =
		NUM_XCC(adev->gfx.xcc_mask) * adev->sdma.num_inst_per_xcc;
	adev->sdma.sdma_mask =
		GENMASK(adev->sdma.num_instances - 1, 0);

	ret = soc_v1_0_xcp_mgr_init(adev);
	if (ret)
		return ret;

	amdgpu_ip_map_init(adev);

	return 0;
}

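/* Worked example of the normalization below (illustrative offsets): a
 * per-XCC dword offset of 0x42A40 masks down to 0x2A40, which falls in the
 * gfxdec0 range [0x1260, 0x3C00), so soc_v1_0_normalize_xcc_reg_offset()
 * returns 0x2A40; an offset whose low 16 bits land outside both gfxdec
 * ranges (e.g. 0x48000 -> 0x8000) is returned unchanged.
 */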
bool soc_v1_0_normalize_xcc_reg_range(uint32_t reg)
{
	if (((reg >= XCC_REG_RANGE_0_LOW) && (reg < XCC_REG_RANGE_0_HIGH)) ||
	    ((reg >= XCC_REG_RANGE_1_LOW) && (reg < XCC_REG_RANGE_1_HIGH)))
		return true;
	else
		return false;
}

uint32_t soc_v1_0_normalize_xcc_reg_offset(uint32_t reg)
{
	uint32_t normalized_reg = NORMALIZE_XCC_REG_OFFSET(reg);

	/* If it is an XCC reg, normalize the reg to keep
	 * the lower 16 bits local to the XCC.
	 */
	if (soc_v1_0_normalize_xcc_reg_range(normalized_reg))
		return normalized_reg;
	else
		return reg;
}