1 /* 2 * Copyright 2016 Advanced Micro Devices, Inc. 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice shall be included in 12 * all copies or substantial portions of the Software. 13 * 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20 * OTHER DEALINGS IN THE SOFTWARE. 21 * 22 */ 23 #include <linux/firmware.h> 24 #include <linux/slab.h> 25 #include <linux/module.h> 26 #include <linux/pci.h> 27 28 #include <drm/amdgpu_drm.h> 29 30 #include "amdgpu.h" 31 #include "amdgpu_atombios.h" 32 #include "amdgpu_ih.h" 33 #include "amdgpu_uvd.h" 34 #include "amdgpu_vce.h" 35 #include "amdgpu_ucode.h" 36 #include "amdgpu_psp.h" 37 #include "atom.h" 38 #include "amd_pcie.h" 39 40 #include "uvd/uvd_7_0_offset.h" 41 #include "gc/gc_9_0_offset.h" 42 #include "gc/gc_9_0_sh_mask.h" 43 #include "sdma0/sdma0_4_0_offset.h" 44 #include "sdma1/sdma1_4_0_offset.h" 45 #include "nbio/nbio_7_0_default.h" 46 #include "nbio/nbio_7_0_offset.h" 47 #include "nbio/nbio_7_0_sh_mask.h" 48 #include "nbio/nbio_7_0_smn.h" 49 #include "mp/mp_9_0_offset.h" 50 51 #include "soc15.h" 52 #include "soc15_common.h" 53 #include "gfx_v9_0.h" 54 #include "gmc_v9_0.h" 55 #include "gfxhub_v1_0.h" 56 #include "mmhub_v1_0.h" 57 #include "df_v1_7.h" 58 #include "df_v3_6.h" 59 #include "nbio_v6_1.h" 60 #include "nbio_v7_0.h" 61 #include "nbio_v7_4.h" 62 #include "hdp_v4_0.h" 63 #include "vega10_ih.h" 64 #include "vega20_ih.h" 65 #include "navi10_ih.h" 66 #include "sdma_v4_0.h" 67 #include "uvd_v7_0.h" 68 #include "vce_v4_0.h" 69 #include "vcn_v1_0.h" 70 #include "vcn_v2_0.h" 71 #include "jpeg_v2_0.h" 72 #include "vcn_v2_5.h" 73 #include "jpeg_v2_5.h" 74 #include "smuio_v9_0.h" 75 #include "smuio_v11_0.h" 76 #include "smuio_v13_0.h" 77 #include "amdgpu_vkms.h" 78 #include "mxgpu_ai.h" 79 #include "amdgpu_ras.h" 80 #include "amdgpu_xgmi.h" 81 #include <uapi/linux/kfd_ioctl.h> 82 83 #define mmMP0_MISC_CGTT_CTRL0 0x01b9 84 #define mmMP0_MISC_CGTT_CTRL0_BASE_IDX 0 85 #define mmMP0_MISC_LIGHT_SLEEP_CTRL 0x01ba 86 #define mmMP0_MISC_LIGHT_SLEEP_CTRL_BASE_IDX 0 87 88 static const struct amd_ip_funcs soc15_common_ip_funcs; 89 90 /* Vega, Raven, Arcturus */ 91 static const struct amdgpu_video_codec_info vega_video_codecs_encode_array[] = 92 { 93 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4_AVC, 4096, 2304, 0)}, 94 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_HEVC, 4096, 2304, 0)}, 95 }; 96 97 static const struct amdgpu_video_codecs vega_video_codecs_encode = 98 { 99 .codec_count = ARRAY_SIZE(vega_video_codecs_encode_array), 100 .codec_array = vega_video_codecs_encode_array, 101 }; 102 103 /* Vega */ 104 static const struct amdgpu_video_codec_info vega_video_codecs_decode_array[] = 105 { 106 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG2, 4096, 4906, 3)}, 107 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4, 4096, 4906, 5)}, 108 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4_AVC, 4096, 4906, 52)}, 109 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VC1, 4096, 4906, 4)}, 110 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_HEVC, 4096, 4096, 186)}, 111 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_JPEG, 4096, 4096, 0)}, 112 }; 113 114 static const struct amdgpu_video_codecs vega_video_codecs_decode = 115 { 116 .codec_count = ARRAY_SIZE(vega_video_codecs_decode_array), 117 .codec_array = vega_video_codecs_decode_array, 118 }; 119 120 /* Raven */ 121 static const struct amdgpu_video_codec_info rv_video_codecs_decode_array[] = 122 { 123 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG2, 4096, 4906, 3)}, 124 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4, 4096, 4906, 5)}, 125 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4_AVC, 4096, 4906, 52)}, 126 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VC1, 4096, 4906, 4)}, 127 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_HEVC, 4096, 4096, 186)}, 128 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_JPEG, 4096, 4096, 0)}, 129 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VP9, 4096, 4096, 0)}, 130 }; 131 132 static const struct amdgpu_video_codecs rv_video_codecs_decode = 133 { 134 .codec_count = ARRAY_SIZE(rv_video_codecs_decode_array), 135 .codec_array = rv_video_codecs_decode_array, 136 }; 137 138 /* Renoir, Arcturus */ 139 static const struct amdgpu_video_codec_info rn_video_codecs_decode_array[] = 140 { 141 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG2, 4096, 4906, 3)}, 142 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4, 4096, 4906, 5)}, 143 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_MPEG4_AVC, 4096, 4906, 52)}, 144 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VC1, 4096, 4906, 4)}, 145 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_HEVC, 8192, 4352, 186)}, 146 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_JPEG, 4096, 4096, 0)}, 147 {codec_info_build(AMDGPU_INFO_VIDEO_CAPS_CODEC_IDX_VP9, 8192, 4352, 0)}, 148 }; 149 150 static const struct amdgpu_video_codecs rn_video_codecs_decode = 151 { 152 .codec_count = ARRAY_SIZE(rn_video_codecs_decode_array), 153 .codec_array = rn_video_codecs_decode_array, 154 }; 155 156 static int soc15_query_video_codecs(struct amdgpu_device *adev, bool encode, 157 const struct amdgpu_video_codecs **codecs) 158 { 159 if (adev->ip_versions[VCE_HWIP][0]) { 160 switch (adev->ip_versions[VCE_HWIP][0]) { 161 case IP_VERSION(4, 0, 0): 162 case IP_VERSION(4, 1, 0): 163 if (encode) 164 *codecs = &vega_video_codecs_encode; 165 else 166 *codecs = &vega_video_codecs_decode; 167 return 0; 168 default: 169 return -EINVAL; 170 } 171 } else { 172 switch (adev->ip_versions[UVD_HWIP][0]) { 173 case IP_VERSION(1, 0, 0): 174 case IP_VERSION(1, 0, 1): 175 if (encode) 176 *codecs = &vega_video_codecs_encode; 177 else 178 *codecs = &rv_video_codecs_decode; 179 return 0; 180 case IP_VERSION(2, 5, 0): 181 case IP_VERSION(2, 6, 0): 182 case IP_VERSION(2, 2, 0): 183 if (encode) 184 *codecs = &vega_video_codecs_encode; 185 else 186 *codecs = &rn_video_codecs_decode; 187 return 0; 188 default: 189 return -EINVAL; 190 } 191 } 192 } 193 194 /* 195 * Indirect registers accessor 196 */ 197 static u32 soc15_pcie_rreg(struct amdgpu_device *adev, u32 reg) 198 { 199 unsigned long address, data; 200 address = adev->nbio.funcs->get_pcie_index_offset(adev); 201 data = adev->nbio.funcs->get_pcie_data_offset(adev); 202 203 return amdgpu_device_indirect_rreg(adev, address, data, reg); 204 } 205 206 static void soc15_pcie_wreg(struct amdgpu_device *adev, u32 reg, u32 v) 207 { 208 unsigned long address, data; 209 210 address = adev->nbio.funcs->get_pcie_index_offset(adev); 211 data = adev->nbio.funcs->get_pcie_data_offset(adev); 212 213 amdgpu_device_indirect_wreg(adev, address, data, reg, v); 214 } 215 216 static u64 soc15_pcie_rreg64(struct amdgpu_device *adev, u32 reg) 217 { 218 unsigned long address, data; 219 address = adev->nbio.funcs->get_pcie_index_offset(adev); 220 data = adev->nbio.funcs->get_pcie_data_offset(adev); 221 222 return amdgpu_device_indirect_rreg64(adev, address, data, reg); 223 } 224 225 static void soc15_pcie_wreg64(struct amdgpu_device *adev, u32 reg, u64 v) 226 { 227 unsigned long address, data; 228 229 address = adev->nbio.funcs->get_pcie_index_offset(adev); 230 data = adev->nbio.funcs->get_pcie_data_offset(adev); 231 232 amdgpu_device_indirect_wreg64(adev, address, data, reg, v); 233 } 234 235 static u32 soc15_uvd_ctx_rreg(struct amdgpu_device *adev, u32 reg) 236 { 237 unsigned long flags, address, data; 238 u32 r; 239 240 address = SOC15_REG_OFFSET(UVD, 0, mmUVD_CTX_INDEX); 241 data = SOC15_REG_OFFSET(UVD, 0, mmUVD_CTX_DATA); 242 243 spin_lock_irqsave(&adev->uvd_ctx_idx_lock, flags); 244 WREG32(address, ((reg) & 0x1ff)); 245 r = RREG32(data); 246 spin_unlock_irqrestore(&adev->uvd_ctx_idx_lock, flags); 247 return r; 248 } 249 250 static void soc15_uvd_ctx_wreg(struct amdgpu_device *adev, u32 reg, u32 v) 251 { 252 unsigned long flags, address, data; 253 254 address = SOC15_REG_OFFSET(UVD, 0, mmUVD_CTX_INDEX); 255 data = SOC15_REG_OFFSET(UVD, 0, mmUVD_CTX_DATA); 256 257 spin_lock_irqsave(&adev->uvd_ctx_idx_lock, flags); 258 WREG32(address, ((reg) & 0x1ff)); 259 WREG32(data, (v)); 260 spin_unlock_irqrestore(&adev->uvd_ctx_idx_lock, flags); 261 } 262 263 static u32 soc15_didt_rreg(struct amdgpu_device *adev, u32 reg) 264 { 265 unsigned long flags, address, data; 266 u32 r; 267 268 address = SOC15_REG_OFFSET(GC, 0, mmDIDT_IND_INDEX); 269 data = SOC15_REG_OFFSET(GC, 0, mmDIDT_IND_DATA); 270 271 spin_lock_irqsave(&adev->didt_idx_lock, flags); 272 WREG32(address, (reg)); 273 r = RREG32(data); 274 spin_unlock_irqrestore(&adev->didt_idx_lock, flags); 275 return r; 276 } 277 278 static void soc15_didt_wreg(struct amdgpu_device *adev, u32 reg, u32 v) 279 { 280 unsigned long flags, address, data; 281 282 address = SOC15_REG_OFFSET(GC, 0, mmDIDT_IND_INDEX); 283 data = SOC15_REG_OFFSET(GC, 0, mmDIDT_IND_DATA); 284 285 spin_lock_irqsave(&adev->didt_idx_lock, flags); 286 WREG32(address, (reg)); 287 WREG32(data, (v)); 288 spin_unlock_irqrestore(&adev->didt_idx_lock, flags); 289 } 290 291 static u32 soc15_gc_cac_rreg(struct amdgpu_device *adev, u32 reg) 292 { 293 unsigned long flags; 294 u32 r; 295 296 spin_lock_irqsave(&adev->gc_cac_idx_lock, flags); 297 WREG32_SOC15(GC, 0, mmGC_CAC_IND_INDEX, (reg)); 298 r = RREG32_SOC15(GC, 0, mmGC_CAC_IND_DATA); 299 spin_unlock_irqrestore(&adev->gc_cac_idx_lock, flags); 300 return r; 301 } 302 303 static void soc15_gc_cac_wreg(struct amdgpu_device *adev, u32 reg, u32 v) 304 { 305 unsigned long flags; 306 307 spin_lock_irqsave(&adev->gc_cac_idx_lock, flags); 308 WREG32_SOC15(GC, 0, mmGC_CAC_IND_INDEX, (reg)); 309 WREG32_SOC15(GC, 0, mmGC_CAC_IND_DATA, (v)); 310 spin_unlock_irqrestore(&adev->gc_cac_idx_lock, flags); 311 } 312 313 static u32 soc15_se_cac_rreg(struct amdgpu_device *adev, u32 reg) 314 { 315 unsigned long flags; 316 u32 r; 317 318 spin_lock_irqsave(&adev->se_cac_idx_lock, flags); 319 WREG32_SOC15(GC, 0, mmSE_CAC_IND_INDEX, (reg)); 320 r = RREG32_SOC15(GC, 0, mmSE_CAC_IND_DATA); 321 spin_unlock_irqrestore(&adev->se_cac_idx_lock, flags); 322 return r; 323 } 324 325 static void soc15_se_cac_wreg(struct amdgpu_device *adev, u32 reg, u32 v) 326 { 327 unsigned long flags; 328 329 spin_lock_irqsave(&adev->se_cac_idx_lock, flags); 330 WREG32_SOC15(GC, 0, mmSE_CAC_IND_INDEX, (reg)); 331 WREG32_SOC15(GC, 0, mmSE_CAC_IND_DATA, (v)); 332 spin_unlock_irqrestore(&adev->se_cac_idx_lock, flags); 333 } 334 335 static u32 soc15_get_config_memsize(struct amdgpu_device *adev) 336 { 337 return adev->nbio.funcs->get_memsize(adev); 338 } 339 340 static u32 soc15_get_xclk(struct amdgpu_device *adev) 341 { 342 u32 reference_clock = adev->clock.spll.reference_freq; 343 344 if (adev->ip_versions[MP1_HWIP][0] == IP_VERSION(12, 0, 0) || 345 adev->ip_versions[MP1_HWIP][0] == IP_VERSION(12, 0, 1)) 346 return 10000; 347 if (adev->ip_versions[MP1_HWIP][0] == IP_VERSION(10, 0, 0) || 348 adev->ip_versions[MP1_HWIP][0] == IP_VERSION(10, 0, 1)) 349 return reference_clock / 4; 350 351 return reference_clock; 352 } 353 354 355 void soc15_grbm_select(struct amdgpu_device *adev, 356 u32 me, u32 pipe, u32 queue, u32 vmid) 357 { 358 u32 grbm_gfx_cntl = 0; 359 grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, PIPEID, pipe); 360 grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, MEID, me); 361 grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, VMID, vmid); 362 grbm_gfx_cntl = REG_SET_FIELD(grbm_gfx_cntl, GRBM_GFX_CNTL, QUEUEID, queue); 363 364 WREG32_SOC15_RLC_SHADOW(GC, 0, mmGRBM_GFX_CNTL, grbm_gfx_cntl); 365 } 366 367 static void soc15_vga_set_state(struct amdgpu_device *adev, bool state) 368 { 369 /* todo */ 370 } 371 372 static bool soc15_read_disabled_bios(struct amdgpu_device *adev) 373 { 374 /* todo */ 375 return false; 376 } 377 378 static bool soc15_read_bios_from_rom(struct amdgpu_device *adev, 379 u8 *bios, u32 length_bytes) 380 { 381 u32 *dw_ptr; 382 u32 i, length_dw; 383 uint32_t rom_index_offset; 384 uint32_t rom_data_offset; 385 386 if (bios == NULL) 387 return false; 388 if (length_bytes == 0) 389 return false; 390 /* APU vbios image is part of sbios image */ 391 if (adev->flags & AMD_IS_APU) 392 return false; 393 394 dw_ptr = (u32 *)bios; 395 length_dw = ALIGN(length_bytes, 4) / 4; 396 397 rom_index_offset = 398 adev->smuio.funcs->get_rom_index_offset(adev); 399 rom_data_offset = 400 adev->smuio.funcs->get_rom_data_offset(adev); 401 402 /* set rom index to 0 */ 403 WREG32(rom_index_offset, 0); 404 /* read out the rom data */ 405 for (i = 0; i < length_dw; i++) 406 dw_ptr[i] = RREG32(rom_data_offset); 407 408 return true; 409 } 410 411 static struct soc15_allowed_register_entry soc15_allowed_read_registers[] = { 412 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS)}, 413 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS2)}, 414 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS_SE0)}, 415 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS_SE1)}, 416 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS_SE2)}, 417 { SOC15_REG_ENTRY(GC, 0, mmGRBM_STATUS_SE3)}, 418 { SOC15_REG_ENTRY(SDMA0, 0, mmSDMA0_STATUS_REG)}, 419 { SOC15_REG_ENTRY(SDMA1, 0, mmSDMA1_STATUS_REG)}, 420 { SOC15_REG_ENTRY(GC, 0, mmCP_STAT)}, 421 { SOC15_REG_ENTRY(GC, 0, mmCP_STALLED_STAT1)}, 422 { SOC15_REG_ENTRY(GC, 0, mmCP_STALLED_STAT2)}, 423 { SOC15_REG_ENTRY(GC, 0, mmCP_STALLED_STAT3)}, 424 { SOC15_REG_ENTRY(GC, 0, mmCP_CPF_BUSY_STAT)}, 425 { SOC15_REG_ENTRY(GC, 0, mmCP_CPF_STALLED_STAT1)}, 426 { SOC15_REG_ENTRY(GC, 0, mmCP_CPF_STATUS)}, 427 { SOC15_REG_ENTRY(GC, 0, mmCP_CPC_BUSY_STAT)}, 428 { SOC15_REG_ENTRY(GC, 0, mmCP_CPC_STALLED_STAT1)}, 429 { SOC15_REG_ENTRY(GC, 0, mmCP_CPC_STATUS)}, 430 { SOC15_REG_ENTRY(GC, 0, mmGB_ADDR_CONFIG)}, 431 { SOC15_REG_ENTRY(GC, 0, mmDB_DEBUG2)}, 432 }; 433 434 static uint32_t soc15_read_indexed_register(struct amdgpu_device *adev, u32 se_num, 435 u32 sh_num, u32 reg_offset) 436 { 437 uint32_t val; 438 439 mutex_lock(&adev->grbm_idx_mutex); 440 if (se_num != 0xffffffff || sh_num != 0xffffffff) 441 amdgpu_gfx_select_se_sh(adev, se_num, sh_num, 0xffffffff); 442 443 val = RREG32(reg_offset); 444 445 if (se_num != 0xffffffff || sh_num != 0xffffffff) 446 amdgpu_gfx_select_se_sh(adev, 0xffffffff, 0xffffffff, 0xffffffff); 447 mutex_unlock(&adev->grbm_idx_mutex); 448 return val; 449 } 450 451 static uint32_t soc15_get_register_value(struct amdgpu_device *adev, 452 bool indexed, u32 se_num, 453 u32 sh_num, u32 reg_offset) 454 { 455 if (indexed) { 456 return soc15_read_indexed_register(adev, se_num, sh_num, reg_offset); 457 } else { 458 if (reg_offset == SOC15_REG_OFFSET(GC, 0, mmGB_ADDR_CONFIG)) 459 return adev->gfx.config.gb_addr_config; 460 else if (reg_offset == SOC15_REG_OFFSET(GC, 0, mmDB_DEBUG2)) 461 return adev->gfx.config.db_debug2; 462 return RREG32(reg_offset); 463 } 464 } 465 466 static int soc15_read_register(struct amdgpu_device *adev, u32 se_num, 467 u32 sh_num, u32 reg_offset, u32 *value) 468 { 469 uint32_t i; 470 struct soc15_allowed_register_entry *en; 471 472 *value = 0; 473 for (i = 0; i < ARRAY_SIZE(soc15_allowed_read_registers); i++) { 474 en = &soc15_allowed_read_registers[i]; 475 if (adev->reg_offset[en->hwip][en->inst] && 476 reg_offset != (adev->reg_offset[en->hwip][en->inst][en->seg] 477 + en->reg_offset)) 478 continue; 479 480 *value = soc15_get_register_value(adev, 481 soc15_allowed_read_registers[i].grbm_indexed, 482 se_num, sh_num, reg_offset); 483 return 0; 484 } 485 return -EINVAL; 486 } 487 488 489 /** 490 * soc15_program_register_sequence - program an array of registers. 491 * 492 * @adev: amdgpu_device pointer 493 * @regs: pointer to the register array 494 * @array_size: size of the register array 495 * 496 * Programs an array or registers with and and or masks. 497 * This is a helper for setting golden registers. 498 */ 499 500 void soc15_program_register_sequence(struct amdgpu_device *adev, 501 const struct soc15_reg_golden *regs, 502 const u32 array_size) 503 { 504 const struct soc15_reg_golden *entry; 505 u32 tmp, reg; 506 int i; 507 508 for (i = 0; i < array_size; ++i) { 509 entry = ®s[i]; 510 reg = adev->reg_offset[entry->hwip][entry->instance][entry->segment] + entry->reg; 511 512 if (entry->and_mask == 0xffffffff) { 513 tmp = entry->or_mask; 514 } else { 515 tmp = (entry->hwip == GC_HWIP) ? 516 RREG32_SOC15_IP(GC, reg) : RREG32(reg); 517 518 tmp &= ~(entry->and_mask); 519 tmp |= (entry->or_mask & entry->and_mask); 520 } 521 522 if (reg == SOC15_REG_OFFSET(GC, 0, mmPA_SC_BINNER_EVENT_CNTL_3) || 523 reg == SOC15_REG_OFFSET(GC, 0, mmPA_SC_ENHANCE) || 524 reg == SOC15_REG_OFFSET(GC, 0, mmPA_SC_ENHANCE_1) || 525 reg == SOC15_REG_OFFSET(GC, 0, mmSH_MEM_CONFIG)) 526 WREG32_RLC(reg, tmp); 527 else 528 (entry->hwip == GC_HWIP) ? 529 WREG32_SOC15_IP(GC, reg, tmp) : WREG32(reg, tmp); 530 531 } 532 533 } 534 535 static int soc15_asic_baco_reset(struct amdgpu_device *adev) 536 { 537 struct amdgpu_ras *ras = amdgpu_ras_get_context(adev); 538 int ret = 0; 539 540 /* avoid NBIF got stuck when do RAS recovery in BACO reset */ 541 if (ras && adev->ras_enabled) 542 adev->nbio.funcs->enable_doorbell_interrupt(adev, false); 543 544 ret = amdgpu_dpm_baco_reset(adev); 545 if (ret) 546 return ret; 547 548 /* re-enable doorbell interrupt after BACO exit */ 549 if (ras && adev->ras_enabled) 550 adev->nbio.funcs->enable_doorbell_interrupt(adev, true); 551 552 return 0; 553 } 554 555 static enum amd_reset_method 556 soc15_asic_reset_method(struct amdgpu_device *adev) 557 { 558 bool baco_reset = false; 559 bool connected_to_cpu = false; 560 struct amdgpu_ras *ras = amdgpu_ras_get_context(adev); 561 562 if (adev->gmc.xgmi.supported && adev->gmc.xgmi.connected_to_cpu) 563 connected_to_cpu = true; 564 565 if (amdgpu_reset_method == AMD_RESET_METHOD_MODE1 || 566 amdgpu_reset_method == AMD_RESET_METHOD_MODE2 || 567 amdgpu_reset_method == AMD_RESET_METHOD_BACO || 568 amdgpu_reset_method == AMD_RESET_METHOD_PCI) { 569 /* If connected to cpu, driver only support mode2 */ 570 if (connected_to_cpu) 571 return AMD_RESET_METHOD_MODE2; 572 return amdgpu_reset_method; 573 } 574 575 if (amdgpu_reset_method != -1) 576 dev_warn(adev->dev, "Specified reset method:%d isn't supported, using AUTO instead.\n", 577 amdgpu_reset_method); 578 579 switch (adev->ip_versions[MP1_HWIP][0]) { 580 case IP_VERSION(10, 0, 0): 581 case IP_VERSION(10, 0, 1): 582 case IP_VERSION(12, 0, 0): 583 case IP_VERSION(12, 0, 1): 584 return AMD_RESET_METHOD_MODE2; 585 case IP_VERSION(9, 0, 0): 586 case IP_VERSION(11, 0, 2): 587 if (adev->asic_type == CHIP_VEGA20) { 588 if (adev->psp.sos.fw_version >= 0x80067) 589 baco_reset = amdgpu_dpm_is_baco_supported(adev); 590 /* 591 * 1. PMFW version > 0x284300: all cases use baco 592 * 2. PMFW version <= 0x284300: only sGPU w/o RAS use baco 593 */ 594 if (ras && adev->ras_enabled && 595 adev->pm.fw_version <= 0x283400) 596 baco_reset = false; 597 } else { 598 baco_reset = amdgpu_dpm_is_baco_supported(adev); 599 } 600 break; 601 case IP_VERSION(13, 0, 2): 602 /* 603 * 1.connected to cpu: driver issue mode2 reset 604 * 2.discret gpu: driver issue mode1 reset 605 */ 606 if (connected_to_cpu) 607 return AMD_RESET_METHOD_MODE2; 608 break; 609 default: 610 break; 611 } 612 613 if (baco_reset) 614 return AMD_RESET_METHOD_BACO; 615 else 616 return AMD_RESET_METHOD_MODE1; 617 } 618 619 static int soc15_asic_reset(struct amdgpu_device *adev) 620 { 621 /* original raven doesn't have full asic reset */ 622 if ((adev->apu_flags & AMD_APU_IS_RAVEN) && 623 !(adev->apu_flags & AMD_APU_IS_RAVEN2)) 624 return 0; 625 626 switch (soc15_asic_reset_method(adev)) { 627 case AMD_RESET_METHOD_PCI: 628 dev_info(adev->dev, "PCI reset\n"); 629 return amdgpu_device_pci_reset(adev); 630 case AMD_RESET_METHOD_BACO: 631 dev_info(adev->dev, "BACO reset\n"); 632 return soc15_asic_baco_reset(adev); 633 case AMD_RESET_METHOD_MODE2: 634 dev_info(adev->dev, "MODE2 reset\n"); 635 return amdgpu_dpm_mode2_reset(adev); 636 default: 637 dev_info(adev->dev, "MODE1 reset\n"); 638 return amdgpu_device_mode1_reset(adev); 639 } 640 } 641 642 static bool soc15_supports_baco(struct amdgpu_device *adev) 643 { 644 switch (adev->ip_versions[MP1_HWIP][0]) { 645 case IP_VERSION(9, 0, 0): 646 case IP_VERSION(11, 0, 2): 647 if (adev->asic_type == CHIP_VEGA20) { 648 if (adev->psp.sos.fw_version >= 0x80067) 649 return amdgpu_dpm_is_baco_supported(adev); 650 return false; 651 } else { 652 return amdgpu_dpm_is_baco_supported(adev); 653 } 654 break; 655 default: 656 return false; 657 } 658 } 659 660 /*static int soc15_set_uvd_clock(struct amdgpu_device *adev, u32 clock, 661 u32 cntl_reg, u32 status_reg) 662 { 663 return 0; 664 }*/ 665 666 static int soc15_set_uvd_clocks(struct amdgpu_device *adev, u32 vclk, u32 dclk) 667 { 668 /*int r; 669 670 r = soc15_set_uvd_clock(adev, vclk, ixCG_VCLK_CNTL, ixCG_VCLK_STATUS); 671 if (r) 672 return r; 673 674 r = soc15_set_uvd_clock(adev, dclk, ixCG_DCLK_CNTL, ixCG_DCLK_STATUS); 675 */ 676 return 0; 677 } 678 679 static int soc15_set_vce_clocks(struct amdgpu_device *adev, u32 evclk, u32 ecclk) 680 { 681 /* todo */ 682 683 return 0; 684 } 685 686 static void soc15_pcie_gen3_enable(struct amdgpu_device *adev) 687 { 688 if (pci_is_root_bus(adev->pdev->bus)) 689 return; 690 691 if (amdgpu_pcie_gen2 == 0) 692 return; 693 694 if (adev->flags & AMD_IS_APU) 695 return; 696 697 if (!(adev->pm.pcie_gen_mask & (CAIL_PCIE_LINK_SPEED_SUPPORT_GEN2 | 698 CAIL_PCIE_LINK_SPEED_SUPPORT_GEN3))) 699 return; 700 701 /* todo */ 702 } 703 704 static void soc15_program_aspm(struct amdgpu_device *adev) 705 { 706 if (!amdgpu_aspm) 707 return; 708 709 if (!(adev->flags & AMD_IS_APU) && 710 (adev->nbio.funcs->program_aspm)) 711 adev->nbio.funcs->program_aspm(adev); 712 } 713 714 static void soc15_enable_doorbell_aperture(struct amdgpu_device *adev, 715 bool enable) 716 { 717 adev->nbio.funcs->enable_doorbell_aperture(adev, enable); 718 adev->nbio.funcs->enable_doorbell_selfring_aperture(adev, enable); 719 } 720 721 const struct amdgpu_ip_block_version vega10_common_ip_block = 722 { 723 .type = AMD_IP_BLOCK_TYPE_COMMON, 724 .major = 2, 725 .minor = 0, 726 .rev = 0, 727 .funcs = &soc15_common_ip_funcs, 728 }; 729 730 static uint32_t soc15_get_rev_id(struct amdgpu_device *adev) 731 { 732 return adev->nbio.funcs->get_rev_id(adev); 733 } 734 735 static void soc15_reg_base_init(struct amdgpu_device *adev) 736 { 737 int r; 738 739 /* Set IP register base before any HW register access */ 740 switch (adev->asic_type) { 741 case CHIP_VEGA10: 742 case CHIP_VEGA12: 743 case CHIP_RAVEN: 744 vega10_reg_base_init(adev); 745 break; 746 case CHIP_RENOIR: 747 /* It's safe to do ip discovery here for Renoir, 748 * it doesn't support SRIOV. */ 749 if (amdgpu_discovery) { 750 r = amdgpu_discovery_reg_base_init(adev); 751 if (r == 0) 752 break; 753 DRM_WARN("failed to init reg base from ip discovery table, " 754 "fallback to legacy init method\n"); 755 } 756 vega10_reg_base_init(adev); 757 break; 758 case CHIP_VEGA20: 759 vega20_reg_base_init(adev); 760 break; 761 case CHIP_ARCTURUS: 762 arct_reg_base_init(adev); 763 break; 764 case CHIP_ALDEBARAN: 765 aldebaran_reg_base_init(adev); 766 break; 767 default: 768 DRM_ERROR("Unsupported asic type: %d!\n", adev->asic_type); 769 break; 770 } 771 } 772 773 void soc15_set_virt_ops(struct amdgpu_device *adev) 774 { 775 adev->virt.ops = &xgpu_ai_virt_ops; 776 777 /* init soc15 reg base early enough so we can 778 * request request full access for sriov before 779 * set_ip_blocks. */ 780 soc15_reg_base_init(adev); 781 } 782 783 static bool soc15_need_full_reset(struct amdgpu_device *adev) 784 { 785 /* change this when we implement soft reset */ 786 return true; 787 } 788 789 static void soc15_get_pcie_usage(struct amdgpu_device *adev, uint64_t *count0, 790 uint64_t *count1) 791 { 792 uint32_t perfctr = 0; 793 uint64_t cnt0_of, cnt1_of; 794 int tmp; 795 796 /* This reports 0 on APUs, so return to avoid writing/reading registers 797 * that may or may not be different from their GPU counterparts 798 */ 799 if (adev->flags & AMD_IS_APU) 800 return; 801 802 /* Set the 2 events that we wish to watch, defined above */ 803 /* Reg 40 is # received msgs */ 804 /* Reg 104 is # of posted requests sent */ 805 perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK, EVENT0_SEL, 40); 806 perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK, EVENT1_SEL, 104); 807 808 /* Write to enable desired perf counters */ 809 WREG32_PCIE(smnPCIE_PERF_CNTL_TXCLK, perfctr); 810 /* Zero out and enable the perf counters 811 * Write 0x5: 812 * Bit 0 = Start all counters(1) 813 * Bit 2 = Global counter reset enable(1) 814 */ 815 WREG32_PCIE(smnPCIE_PERF_COUNT_CNTL, 0x00000005); 816 817 msleep(1000); 818 819 /* Load the shadow and disable the perf counters 820 * Write 0x2: 821 * Bit 0 = Stop counters(0) 822 * Bit 1 = Load the shadow counters(1) 823 */ 824 WREG32_PCIE(smnPCIE_PERF_COUNT_CNTL, 0x00000002); 825 826 /* Read register values to get any >32bit overflow */ 827 tmp = RREG32_PCIE(smnPCIE_PERF_CNTL_TXCLK); 828 cnt0_of = REG_GET_FIELD(tmp, PCIE_PERF_CNTL_TXCLK, COUNTER0_UPPER); 829 cnt1_of = REG_GET_FIELD(tmp, PCIE_PERF_CNTL_TXCLK, COUNTER1_UPPER); 830 831 /* Get the values and add the overflow */ 832 *count0 = RREG32_PCIE(smnPCIE_PERF_COUNT0_TXCLK) | (cnt0_of << 32); 833 *count1 = RREG32_PCIE(smnPCIE_PERF_COUNT1_TXCLK) | (cnt1_of << 32); 834 } 835 836 static void vega20_get_pcie_usage(struct amdgpu_device *adev, uint64_t *count0, 837 uint64_t *count1) 838 { 839 uint32_t perfctr = 0; 840 uint64_t cnt0_of, cnt1_of; 841 int tmp; 842 843 /* This reports 0 on APUs, so return to avoid writing/reading registers 844 * that may or may not be different from their GPU counterparts 845 */ 846 if (adev->flags & AMD_IS_APU) 847 return; 848 849 /* Set the 2 events that we wish to watch, defined above */ 850 /* Reg 40 is # received msgs */ 851 /* Reg 108 is # of posted requests sent on VG20 */ 852 perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK3, 853 EVENT0_SEL, 40); 854 perfctr = REG_SET_FIELD(perfctr, PCIE_PERF_CNTL_TXCLK3, 855 EVENT1_SEL, 108); 856 857 /* Write to enable desired perf counters */ 858 WREG32_PCIE(smnPCIE_PERF_CNTL_TXCLK3, perfctr); 859 /* Zero out and enable the perf counters 860 * Write 0x5: 861 * Bit 0 = Start all counters(1) 862 * Bit 2 = Global counter reset enable(1) 863 */ 864 WREG32_PCIE(smnPCIE_PERF_COUNT_CNTL, 0x00000005); 865 866 msleep(1000); 867 868 /* Load the shadow and disable the perf counters 869 * Write 0x2: 870 * Bit 0 = Stop counters(0) 871 * Bit 1 = Load the shadow counters(1) 872 */ 873 WREG32_PCIE(smnPCIE_PERF_COUNT_CNTL, 0x00000002); 874 875 /* Read register values to get any >32bit overflow */ 876 tmp = RREG32_PCIE(smnPCIE_PERF_CNTL_TXCLK3); 877 cnt0_of = REG_GET_FIELD(tmp, PCIE_PERF_CNTL_TXCLK3, COUNTER0_UPPER); 878 cnt1_of = REG_GET_FIELD(tmp, PCIE_PERF_CNTL_TXCLK3, COUNTER1_UPPER); 879 880 /* Get the values and add the overflow */ 881 *count0 = RREG32_PCIE(smnPCIE_PERF_COUNT0_TXCLK3) | (cnt0_of << 32); 882 *count1 = RREG32_PCIE(smnPCIE_PERF_COUNT1_TXCLK3) | (cnt1_of << 32); 883 } 884 885 static bool soc15_need_reset_on_init(struct amdgpu_device *adev) 886 { 887 u32 sol_reg; 888 889 /* Just return false for soc15 GPUs. Reset does not seem to 890 * be necessary. 891 */ 892 if (!amdgpu_passthrough(adev)) 893 return false; 894 895 if (adev->flags & AMD_IS_APU) 896 return false; 897 898 /* Check sOS sign of life register to confirm sys driver and sOS 899 * are already been loaded. 900 */ 901 sol_reg = RREG32_SOC15(MP0, 0, mmMP0_SMN_C2PMSG_81); 902 if (sol_reg) 903 return true; 904 905 return false; 906 } 907 908 static uint64_t soc15_get_pcie_replay_count(struct amdgpu_device *adev) 909 { 910 uint64_t nak_r, nak_g; 911 912 /* Get the number of NAKs received and generated */ 913 nak_r = RREG32_PCIE(smnPCIE_RX_NUM_NAK); 914 nak_g = RREG32_PCIE(smnPCIE_RX_NUM_NAK_GENERATED); 915 916 /* Add the total number of NAKs, i.e the number of replays */ 917 return (nak_r + nak_g); 918 } 919 920 static void soc15_pre_asic_init(struct amdgpu_device *adev) 921 { 922 gmc_v9_0_restore_registers(adev); 923 } 924 925 static const struct amdgpu_asic_funcs soc15_asic_funcs = 926 { 927 .read_disabled_bios = &soc15_read_disabled_bios, 928 .read_bios_from_rom = &soc15_read_bios_from_rom, 929 .read_register = &soc15_read_register, 930 .reset = &soc15_asic_reset, 931 .reset_method = &soc15_asic_reset_method, 932 .set_vga_state = &soc15_vga_set_state, 933 .get_xclk = &soc15_get_xclk, 934 .set_uvd_clocks = &soc15_set_uvd_clocks, 935 .set_vce_clocks = &soc15_set_vce_clocks, 936 .get_config_memsize = &soc15_get_config_memsize, 937 .need_full_reset = &soc15_need_full_reset, 938 .init_doorbell_index = &vega10_doorbell_index_init, 939 .get_pcie_usage = &soc15_get_pcie_usage, 940 .need_reset_on_init = &soc15_need_reset_on_init, 941 .get_pcie_replay_count = &soc15_get_pcie_replay_count, 942 .supports_baco = &soc15_supports_baco, 943 .pre_asic_init = &soc15_pre_asic_init, 944 .query_video_codecs = &soc15_query_video_codecs, 945 }; 946 947 static const struct amdgpu_asic_funcs vega20_asic_funcs = 948 { 949 .read_disabled_bios = &soc15_read_disabled_bios, 950 .read_bios_from_rom = &soc15_read_bios_from_rom, 951 .read_register = &soc15_read_register, 952 .reset = &soc15_asic_reset, 953 .reset_method = &soc15_asic_reset_method, 954 .set_vga_state = &soc15_vga_set_state, 955 .get_xclk = &soc15_get_xclk, 956 .set_uvd_clocks = &soc15_set_uvd_clocks, 957 .set_vce_clocks = &soc15_set_vce_clocks, 958 .get_config_memsize = &soc15_get_config_memsize, 959 .need_full_reset = &soc15_need_full_reset, 960 .init_doorbell_index = &vega20_doorbell_index_init, 961 .get_pcie_usage = &vega20_get_pcie_usage, 962 .need_reset_on_init = &soc15_need_reset_on_init, 963 .get_pcie_replay_count = &soc15_get_pcie_replay_count, 964 .supports_baco = &soc15_supports_baco, 965 .pre_asic_init = &soc15_pre_asic_init, 966 .query_video_codecs = &soc15_query_video_codecs, 967 }; 968 969 static int soc15_common_early_init(void *handle) 970 { 971 #define MMIO_REG_HOLE_OFFSET (0x80000 - PAGE_SIZE) 972 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 973 974 if (!amdgpu_sriov_vf(adev)) { 975 adev->rmmio_remap.reg_offset = MMIO_REG_HOLE_OFFSET; 976 adev->rmmio_remap.bus_addr = adev->rmmio_base + MMIO_REG_HOLE_OFFSET; 977 } 978 adev->smc_rreg = NULL; 979 adev->smc_wreg = NULL; 980 adev->pcie_rreg = &soc15_pcie_rreg; 981 adev->pcie_wreg = &soc15_pcie_wreg; 982 adev->pcie_rreg64 = &soc15_pcie_rreg64; 983 adev->pcie_wreg64 = &soc15_pcie_wreg64; 984 adev->uvd_ctx_rreg = &soc15_uvd_ctx_rreg; 985 adev->uvd_ctx_wreg = &soc15_uvd_ctx_wreg; 986 adev->didt_rreg = &soc15_didt_rreg; 987 adev->didt_wreg = &soc15_didt_wreg; 988 adev->gc_cac_rreg = &soc15_gc_cac_rreg; 989 adev->gc_cac_wreg = &soc15_gc_cac_wreg; 990 adev->se_cac_rreg = &soc15_se_cac_rreg; 991 adev->se_cac_wreg = &soc15_se_cac_wreg; 992 993 adev->rev_id = soc15_get_rev_id(adev); 994 adev->external_rev_id = 0xFF; 995 /* TODO: split the GC and PG flags based on the relevant IP version for which 996 * they are relevant. 997 */ 998 switch (adev->ip_versions[GC_HWIP][0]) { 999 case IP_VERSION(9, 0, 1): 1000 adev->asic_funcs = &soc15_asic_funcs; 1001 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG | 1002 AMD_CG_SUPPORT_GFX_MGLS | 1003 AMD_CG_SUPPORT_GFX_RLC_LS | 1004 AMD_CG_SUPPORT_GFX_CP_LS | 1005 AMD_CG_SUPPORT_GFX_3D_CGCG | 1006 AMD_CG_SUPPORT_GFX_3D_CGLS | 1007 AMD_CG_SUPPORT_GFX_CGCG | 1008 AMD_CG_SUPPORT_GFX_CGLS | 1009 AMD_CG_SUPPORT_BIF_MGCG | 1010 AMD_CG_SUPPORT_BIF_LS | 1011 AMD_CG_SUPPORT_HDP_LS | 1012 AMD_CG_SUPPORT_DRM_MGCG | 1013 AMD_CG_SUPPORT_DRM_LS | 1014 AMD_CG_SUPPORT_ROM_MGCG | 1015 AMD_CG_SUPPORT_DF_MGCG | 1016 AMD_CG_SUPPORT_SDMA_MGCG | 1017 AMD_CG_SUPPORT_SDMA_LS | 1018 AMD_CG_SUPPORT_MC_MGCG | 1019 AMD_CG_SUPPORT_MC_LS; 1020 adev->pg_flags = 0; 1021 adev->external_rev_id = 0x1; 1022 break; 1023 case IP_VERSION(9, 2, 1): 1024 adev->asic_funcs = &soc15_asic_funcs; 1025 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG | 1026 AMD_CG_SUPPORT_GFX_MGLS | 1027 AMD_CG_SUPPORT_GFX_CGCG | 1028 AMD_CG_SUPPORT_GFX_CGLS | 1029 AMD_CG_SUPPORT_GFX_3D_CGCG | 1030 AMD_CG_SUPPORT_GFX_3D_CGLS | 1031 AMD_CG_SUPPORT_GFX_CP_LS | 1032 AMD_CG_SUPPORT_MC_LS | 1033 AMD_CG_SUPPORT_MC_MGCG | 1034 AMD_CG_SUPPORT_SDMA_MGCG | 1035 AMD_CG_SUPPORT_SDMA_LS | 1036 AMD_CG_SUPPORT_BIF_MGCG | 1037 AMD_CG_SUPPORT_BIF_LS | 1038 AMD_CG_SUPPORT_HDP_MGCG | 1039 AMD_CG_SUPPORT_HDP_LS | 1040 AMD_CG_SUPPORT_ROM_MGCG | 1041 AMD_CG_SUPPORT_VCE_MGCG | 1042 AMD_CG_SUPPORT_UVD_MGCG; 1043 adev->pg_flags = 0; 1044 adev->external_rev_id = adev->rev_id + 0x14; 1045 break; 1046 case IP_VERSION(9, 4, 0): 1047 adev->asic_funcs = &vega20_asic_funcs; 1048 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG | 1049 AMD_CG_SUPPORT_GFX_MGLS | 1050 AMD_CG_SUPPORT_GFX_CGCG | 1051 AMD_CG_SUPPORT_GFX_CGLS | 1052 AMD_CG_SUPPORT_GFX_3D_CGCG | 1053 AMD_CG_SUPPORT_GFX_3D_CGLS | 1054 AMD_CG_SUPPORT_GFX_CP_LS | 1055 AMD_CG_SUPPORT_MC_LS | 1056 AMD_CG_SUPPORT_MC_MGCG | 1057 AMD_CG_SUPPORT_SDMA_MGCG | 1058 AMD_CG_SUPPORT_SDMA_LS | 1059 AMD_CG_SUPPORT_BIF_MGCG | 1060 AMD_CG_SUPPORT_BIF_LS | 1061 AMD_CG_SUPPORT_HDP_MGCG | 1062 AMD_CG_SUPPORT_HDP_LS | 1063 AMD_CG_SUPPORT_ROM_MGCG | 1064 AMD_CG_SUPPORT_VCE_MGCG | 1065 AMD_CG_SUPPORT_UVD_MGCG; 1066 adev->pg_flags = 0; 1067 adev->external_rev_id = adev->rev_id + 0x28; 1068 break; 1069 case IP_VERSION(9, 1, 0): 1070 case IP_VERSION(9, 2, 2): 1071 adev->asic_funcs = &soc15_asic_funcs; 1072 1073 if (adev->rev_id >= 0x8) 1074 adev->apu_flags |= AMD_APU_IS_RAVEN2; 1075 1076 if (adev->apu_flags & AMD_APU_IS_RAVEN2) 1077 adev->external_rev_id = adev->rev_id + 0x79; 1078 else if (adev->apu_flags & AMD_APU_IS_PICASSO) 1079 adev->external_rev_id = adev->rev_id + 0x41; 1080 else if (adev->rev_id == 1) 1081 adev->external_rev_id = adev->rev_id + 0x20; 1082 else 1083 adev->external_rev_id = adev->rev_id + 0x01; 1084 1085 if (adev->apu_flags & AMD_APU_IS_RAVEN2) { 1086 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG | 1087 AMD_CG_SUPPORT_GFX_MGLS | 1088 AMD_CG_SUPPORT_GFX_CP_LS | 1089 AMD_CG_SUPPORT_GFX_3D_CGCG | 1090 AMD_CG_SUPPORT_GFX_3D_CGLS | 1091 AMD_CG_SUPPORT_GFX_CGCG | 1092 AMD_CG_SUPPORT_GFX_CGLS | 1093 AMD_CG_SUPPORT_BIF_LS | 1094 AMD_CG_SUPPORT_HDP_LS | 1095 AMD_CG_SUPPORT_MC_MGCG | 1096 AMD_CG_SUPPORT_MC_LS | 1097 AMD_CG_SUPPORT_SDMA_MGCG | 1098 AMD_CG_SUPPORT_SDMA_LS | 1099 AMD_CG_SUPPORT_VCN_MGCG; 1100 1101 adev->pg_flags = AMD_PG_SUPPORT_SDMA | AMD_PG_SUPPORT_VCN; 1102 } else if (adev->apu_flags & AMD_APU_IS_PICASSO) { 1103 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG | 1104 AMD_CG_SUPPORT_GFX_MGLS | 1105 AMD_CG_SUPPORT_GFX_CP_LS | 1106 AMD_CG_SUPPORT_GFX_3D_CGLS | 1107 AMD_CG_SUPPORT_GFX_CGCG | 1108 AMD_CG_SUPPORT_GFX_CGLS | 1109 AMD_CG_SUPPORT_BIF_LS | 1110 AMD_CG_SUPPORT_HDP_LS | 1111 AMD_CG_SUPPORT_MC_MGCG | 1112 AMD_CG_SUPPORT_MC_LS | 1113 AMD_CG_SUPPORT_SDMA_MGCG | 1114 AMD_CG_SUPPORT_SDMA_LS | 1115 AMD_CG_SUPPORT_VCN_MGCG; 1116 1117 adev->pg_flags = AMD_PG_SUPPORT_SDMA | 1118 AMD_PG_SUPPORT_MMHUB | 1119 AMD_PG_SUPPORT_VCN; 1120 } else { 1121 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG | 1122 AMD_CG_SUPPORT_GFX_MGLS | 1123 AMD_CG_SUPPORT_GFX_RLC_LS | 1124 AMD_CG_SUPPORT_GFX_CP_LS | 1125 AMD_CG_SUPPORT_GFX_3D_CGLS | 1126 AMD_CG_SUPPORT_GFX_CGCG | 1127 AMD_CG_SUPPORT_GFX_CGLS | 1128 AMD_CG_SUPPORT_BIF_MGCG | 1129 AMD_CG_SUPPORT_BIF_LS | 1130 AMD_CG_SUPPORT_HDP_MGCG | 1131 AMD_CG_SUPPORT_HDP_LS | 1132 AMD_CG_SUPPORT_DRM_MGCG | 1133 AMD_CG_SUPPORT_DRM_LS | 1134 AMD_CG_SUPPORT_MC_MGCG | 1135 AMD_CG_SUPPORT_MC_LS | 1136 AMD_CG_SUPPORT_SDMA_MGCG | 1137 AMD_CG_SUPPORT_SDMA_LS | 1138 AMD_CG_SUPPORT_VCN_MGCG; 1139 1140 adev->pg_flags = AMD_PG_SUPPORT_SDMA | AMD_PG_SUPPORT_VCN; 1141 } 1142 break; 1143 case IP_VERSION(9, 4, 1): 1144 adev->asic_funcs = &vega20_asic_funcs; 1145 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG | 1146 AMD_CG_SUPPORT_GFX_MGLS | 1147 AMD_CG_SUPPORT_GFX_CGCG | 1148 AMD_CG_SUPPORT_GFX_CGLS | 1149 AMD_CG_SUPPORT_GFX_CP_LS | 1150 AMD_CG_SUPPORT_HDP_MGCG | 1151 AMD_CG_SUPPORT_HDP_LS | 1152 AMD_CG_SUPPORT_SDMA_MGCG | 1153 AMD_CG_SUPPORT_SDMA_LS | 1154 AMD_CG_SUPPORT_MC_MGCG | 1155 AMD_CG_SUPPORT_MC_LS | 1156 AMD_CG_SUPPORT_IH_CG | 1157 AMD_CG_SUPPORT_VCN_MGCG | 1158 AMD_CG_SUPPORT_JPEG_MGCG; 1159 adev->pg_flags = AMD_PG_SUPPORT_VCN | AMD_PG_SUPPORT_VCN_DPG; 1160 adev->external_rev_id = adev->rev_id + 0x32; 1161 break; 1162 case IP_VERSION(9, 3, 0): 1163 adev->asic_funcs = &soc15_asic_funcs; 1164 1165 if (adev->apu_flags & AMD_APU_IS_RENOIR) 1166 adev->external_rev_id = adev->rev_id + 0x91; 1167 else 1168 adev->external_rev_id = adev->rev_id + 0xa1; 1169 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG | 1170 AMD_CG_SUPPORT_GFX_MGLS | 1171 AMD_CG_SUPPORT_GFX_3D_CGCG | 1172 AMD_CG_SUPPORT_GFX_3D_CGLS | 1173 AMD_CG_SUPPORT_GFX_CGCG | 1174 AMD_CG_SUPPORT_GFX_CGLS | 1175 AMD_CG_SUPPORT_GFX_CP_LS | 1176 AMD_CG_SUPPORT_MC_MGCG | 1177 AMD_CG_SUPPORT_MC_LS | 1178 AMD_CG_SUPPORT_SDMA_MGCG | 1179 AMD_CG_SUPPORT_SDMA_LS | 1180 AMD_CG_SUPPORT_BIF_LS | 1181 AMD_CG_SUPPORT_HDP_LS | 1182 AMD_CG_SUPPORT_VCN_MGCG | 1183 AMD_CG_SUPPORT_JPEG_MGCG | 1184 AMD_CG_SUPPORT_IH_CG | 1185 AMD_CG_SUPPORT_ATHUB_LS | 1186 AMD_CG_SUPPORT_ATHUB_MGCG | 1187 AMD_CG_SUPPORT_DF_MGCG; 1188 adev->pg_flags = AMD_PG_SUPPORT_SDMA | 1189 AMD_PG_SUPPORT_VCN | 1190 AMD_PG_SUPPORT_JPEG | 1191 AMD_PG_SUPPORT_VCN_DPG; 1192 break; 1193 case IP_VERSION(9, 4, 2): 1194 adev->asic_funcs = &vega20_asic_funcs; 1195 adev->cg_flags = AMD_CG_SUPPORT_GFX_MGCG | 1196 AMD_CG_SUPPORT_GFX_MGLS | 1197 AMD_CG_SUPPORT_GFX_CP_LS | 1198 AMD_CG_SUPPORT_HDP_LS | 1199 AMD_CG_SUPPORT_SDMA_MGCG | 1200 AMD_CG_SUPPORT_SDMA_LS | 1201 AMD_CG_SUPPORT_IH_CG | 1202 AMD_CG_SUPPORT_VCN_MGCG | AMD_CG_SUPPORT_JPEG_MGCG; 1203 adev->pg_flags = AMD_PG_SUPPORT_VCN_DPG; 1204 adev->external_rev_id = adev->rev_id + 0x3c; 1205 break; 1206 default: 1207 /* FIXME: not supported yet */ 1208 return -EINVAL; 1209 } 1210 1211 if (amdgpu_sriov_vf(adev)) { 1212 amdgpu_virt_init_setting(adev); 1213 xgpu_ai_mailbox_set_irq_funcs(adev); 1214 } 1215 1216 return 0; 1217 } 1218 1219 static int soc15_common_late_init(void *handle) 1220 { 1221 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 1222 int r = 0; 1223 1224 if (amdgpu_sriov_vf(adev)) 1225 xgpu_ai_mailbox_get_irq(adev); 1226 1227 if (adev->nbio.ras_funcs && 1228 adev->nbio.ras_funcs->ras_late_init) 1229 r = adev->nbio.ras_funcs->ras_late_init(adev); 1230 1231 return r; 1232 } 1233 1234 static int soc15_common_sw_init(void *handle) 1235 { 1236 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 1237 1238 if (amdgpu_sriov_vf(adev)) 1239 xgpu_ai_mailbox_add_irq_id(adev); 1240 1241 if (adev->df.funcs && 1242 adev->df.funcs->sw_init) 1243 adev->df.funcs->sw_init(adev); 1244 1245 return 0; 1246 } 1247 1248 static int soc15_common_sw_fini(void *handle) 1249 { 1250 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 1251 1252 if (adev->nbio.ras_funcs && 1253 adev->nbio.ras_funcs->ras_fini) 1254 adev->nbio.ras_funcs->ras_fini(adev); 1255 1256 if (adev->df.funcs && 1257 adev->df.funcs->sw_fini) 1258 adev->df.funcs->sw_fini(adev); 1259 return 0; 1260 } 1261 1262 static void soc15_doorbell_range_init(struct amdgpu_device *adev) 1263 { 1264 int i; 1265 struct amdgpu_ring *ring; 1266 1267 /* sdma/ih doorbell range are programed by hypervisor */ 1268 if (!amdgpu_sriov_vf(adev)) { 1269 for (i = 0; i < adev->sdma.num_instances; i++) { 1270 ring = &adev->sdma.instance[i].ring; 1271 adev->nbio.funcs->sdma_doorbell_range(adev, i, 1272 ring->use_doorbell, ring->doorbell_index, 1273 adev->doorbell_index.sdma_doorbell_range); 1274 } 1275 1276 adev->nbio.funcs->ih_doorbell_range(adev, adev->irq.ih.use_doorbell, 1277 adev->irq.ih.doorbell_index); 1278 } 1279 } 1280 1281 static int soc15_common_hw_init(void *handle) 1282 { 1283 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 1284 1285 /* enable pcie gen2/3 link */ 1286 soc15_pcie_gen3_enable(adev); 1287 /* enable aspm */ 1288 soc15_program_aspm(adev); 1289 /* setup nbio registers */ 1290 adev->nbio.funcs->init_registers(adev); 1291 /* remap HDP registers to a hole in mmio space, 1292 * for the purpose of expose those registers 1293 * to process space 1294 */ 1295 if (adev->nbio.funcs->remap_hdp_registers && !amdgpu_sriov_vf(adev)) 1296 adev->nbio.funcs->remap_hdp_registers(adev); 1297 1298 /* enable the doorbell aperture */ 1299 soc15_enable_doorbell_aperture(adev, true); 1300 /* HW doorbell routing policy: doorbell writing not 1301 * in SDMA/IH/MM/ACV range will be routed to CP. So 1302 * we need to init SDMA/IH/MM/ACV doorbell range prior 1303 * to CP ip block init and ring test. 1304 */ 1305 soc15_doorbell_range_init(adev); 1306 1307 return 0; 1308 } 1309 1310 static int soc15_common_hw_fini(void *handle) 1311 { 1312 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 1313 1314 /* disable the doorbell aperture */ 1315 soc15_enable_doorbell_aperture(adev, false); 1316 if (amdgpu_sriov_vf(adev)) 1317 xgpu_ai_mailbox_put_irq(adev); 1318 1319 if (adev->nbio.ras_if && 1320 amdgpu_ras_is_supported(adev, adev->nbio.ras_if->block)) { 1321 if (adev->nbio.ras_funcs && 1322 adev->nbio.ras_funcs->init_ras_controller_interrupt) 1323 amdgpu_irq_put(adev, &adev->nbio.ras_controller_irq, 0); 1324 if (adev->nbio.ras_funcs && 1325 adev->nbio.ras_funcs->init_ras_err_event_athub_interrupt) 1326 amdgpu_irq_put(adev, &adev->nbio.ras_err_event_athub_irq, 0); 1327 } 1328 1329 return 0; 1330 } 1331 1332 static int soc15_common_suspend(void *handle) 1333 { 1334 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 1335 1336 return soc15_common_hw_fini(adev); 1337 } 1338 1339 static int soc15_common_resume(void *handle) 1340 { 1341 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 1342 1343 return soc15_common_hw_init(adev); 1344 } 1345 1346 static bool soc15_common_is_idle(void *handle) 1347 { 1348 return true; 1349 } 1350 1351 static int soc15_common_wait_for_idle(void *handle) 1352 { 1353 return 0; 1354 } 1355 1356 static int soc15_common_soft_reset(void *handle) 1357 { 1358 return 0; 1359 } 1360 1361 static void soc15_update_drm_clock_gating(struct amdgpu_device *adev, bool enable) 1362 { 1363 uint32_t def, data; 1364 1365 def = data = RREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_CGTT_CTRL0)); 1366 1367 if (enable && (adev->cg_flags & AMD_CG_SUPPORT_DRM_MGCG)) 1368 data &= ~(0x01000000 | 1369 0x02000000 | 1370 0x04000000 | 1371 0x08000000 | 1372 0x10000000 | 1373 0x20000000 | 1374 0x40000000 | 1375 0x80000000); 1376 else 1377 data |= (0x01000000 | 1378 0x02000000 | 1379 0x04000000 | 1380 0x08000000 | 1381 0x10000000 | 1382 0x20000000 | 1383 0x40000000 | 1384 0x80000000); 1385 1386 if (def != data) 1387 WREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_CGTT_CTRL0), data); 1388 } 1389 1390 static void soc15_update_drm_light_sleep(struct amdgpu_device *adev, bool enable) 1391 { 1392 uint32_t def, data; 1393 1394 def = data = RREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_LIGHT_SLEEP_CTRL)); 1395 1396 if (enable && (adev->cg_flags & AMD_CG_SUPPORT_DRM_LS)) 1397 data |= 1; 1398 else 1399 data &= ~1; 1400 1401 if (def != data) 1402 WREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_LIGHT_SLEEP_CTRL), data); 1403 } 1404 1405 static int soc15_common_set_clockgating_state(void *handle, 1406 enum amd_clockgating_state state) 1407 { 1408 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 1409 1410 if (amdgpu_sriov_vf(adev)) 1411 return 0; 1412 1413 switch (adev->ip_versions[NBIO_HWIP][0]) { 1414 case IP_VERSION(6, 1, 0): 1415 case IP_VERSION(6, 2, 0): 1416 case IP_VERSION(7, 4, 0): 1417 adev->nbio.funcs->update_medium_grain_clock_gating(adev, 1418 state == AMD_CG_STATE_GATE); 1419 adev->nbio.funcs->update_medium_grain_light_sleep(adev, 1420 state == AMD_CG_STATE_GATE); 1421 adev->hdp.funcs->update_clock_gating(adev, 1422 state == AMD_CG_STATE_GATE); 1423 soc15_update_drm_clock_gating(adev, 1424 state == AMD_CG_STATE_GATE); 1425 soc15_update_drm_light_sleep(adev, 1426 state == AMD_CG_STATE_GATE); 1427 adev->smuio.funcs->update_rom_clock_gating(adev, 1428 state == AMD_CG_STATE_GATE); 1429 adev->df.funcs->update_medium_grain_clock_gating(adev, 1430 state == AMD_CG_STATE_GATE); 1431 break; 1432 case IP_VERSION(7, 0, 0): 1433 case IP_VERSION(7, 0, 1): 1434 case IP_VERSION(2, 5, 0): 1435 adev->nbio.funcs->update_medium_grain_clock_gating(adev, 1436 state == AMD_CG_STATE_GATE); 1437 adev->nbio.funcs->update_medium_grain_light_sleep(adev, 1438 state == AMD_CG_STATE_GATE); 1439 adev->hdp.funcs->update_clock_gating(adev, 1440 state == AMD_CG_STATE_GATE); 1441 soc15_update_drm_clock_gating(adev, 1442 state == AMD_CG_STATE_GATE); 1443 soc15_update_drm_light_sleep(adev, 1444 state == AMD_CG_STATE_GATE); 1445 break; 1446 case IP_VERSION(7, 4, 1): 1447 case IP_VERSION(7, 4, 4): 1448 adev->hdp.funcs->update_clock_gating(adev, 1449 state == AMD_CG_STATE_GATE); 1450 break; 1451 default: 1452 break; 1453 } 1454 return 0; 1455 } 1456 1457 static void soc15_common_get_clockgating_state(void *handle, u32 *flags) 1458 { 1459 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 1460 int data; 1461 1462 if (amdgpu_sriov_vf(adev)) 1463 *flags = 0; 1464 1465 adev->nbio.funcs->get_clockgating_state(adev, flags); 1466 1467 adev->hdp.funcs->get_clock_gating_state(adev, flags); 1468 1469 if (adev->ip_versions[MP0_HWIP][0] != IP_VERSION(13, 0, 2)) { 1470 1471 /* AMD_CG_SUPPORT_DRM_MGCG */ 1472 data = RREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_CGTT_CTRL0)); 1473 if (!(data & 0x01000000)) 1474 *flags |= AMD_CG_SUPPORT_DRM_MGCG; 1475 1476 /* AMD_CG_SUPPORT_DRM_LS */ 1477 data = RREG32(SOC15_REG_OFFSET(MP0, 0, mmMP0_MISC_LIGHT_SLEEP_CTRL)); 1478 if (data & 0x1) 1479 *flags |= AMD_CG_SUPPORT_DRM_LS; 1480 } 1481 1482 /* AMD_CG_SUPPORT_ROM_MGCG */ 1483 adev->smuio.funcs->get_clock_gating_state(adev, flags); 1484 1485 adev->df.funcs->get_clockgating_state(adev, flags); 1486 } 1487 1488 static int soc15_common_set_powergating_state(void *handle, 1489 enum amd_powergating_state state) 1490 { 1491 /* todo */ 1492 return 0; 1493 } 1494 1495 static const struct amd_ip_funcs soc15_common_ip_funcs = { 1496 .name = "soc15_common", 1497 .early_init = soc15_common_early_init, 1498 .late_init = soc15_common_late_init, 1499 .sw_init = soc15_common_sw_init, 1500 .sw_fini = soc15_common_sw_fini, 1501 .hw_init = soc15_common_hw_init, 1502 .hw_fini = soc15_common_hw_fini, 1503 .suspend = soc15_common_suspend, 1504 .resume = soc15_common_resume, 1505 .is_idle = soc15_common_is_idle, 1506 .wait_for_idle = soc15_common_wait_for_idle, 1507 .soft_reset = soc15_common_soft_reset, 1508 .set_clockgating_state = soc15_common_set_clockgating_state, 1509 .set_powergating_state = soc15_common_set_powergating_state, 1510 .get_clockgating_state= soc15_common_get_clockgating_state, 1511 }; 1512