1aaa36a97SAlex Deucher /* 2aaa36a97SAlex Deucher * Copyright 2014 Advanced Micro Devices, Inc. 3aaa36a97SAlex Deucher * All Rights Reserved. 4aaa36a97SAlex Deucher * 5aaa36a97SAlex Deucher * Permission is hereby granted, free of charge, to any person obtaining a 6aaa36a97SAlex Deucher * copy of this software and associated documentation files (the 7aaa36a97SAlex Deucher * "Software"), to deal in the Software without restriction, including 8aaa36a97SAlex Deucher * without limitation the rights to use, copy, modify, merge, publish, 9aaa36a97SAlex Deucher * distribute, sub license, and/or sell copies of the Software, and to 10aaa36a97SAlex Deucher * permit persons to whom the Software is furnished to do so, subject to 11aaa36a97SAlex Deucher * the following conditions: 12aaa36a97SAlex Deucher * 13aaa36a97SAlex Deucher * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 14aaa36a97SAlex Deucher * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 15aaa36a97SAlex Deucher * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL 16aaa36a97SAlex Deucher * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, 17aaa36a97SAlex Deucher * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 18aaa36a97SAlex Deucher * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 19aaa36a97SAlex Deucher * USE OR OTHER DEALINGS IN THE SOFTWARE. 20aaa36a97SAlex Deucher * 21aaa36a97SAlex Deucher * The above copyright notice and this permission notice (including the 22aaa36a97SAlex Deucher * next paragraph) shall be included in all copies or substantial portions 23aaa36a97SAlex Deucher * of the Software. 24aaa36a97SAlex Deucher * 25aaa36a97SAlex Deucher * Authors: Christian König <christian.koenig@amd.com> 26aaa36a97SAlex Deucher */ 27aaa36a97SAlex Deucher 28aaa36a97SAlex Deucher #include <linux/firmware.h> 29aaa36a97SAlex Deucher #include <drm/drmP.h> 30aaa36a97SAlex Deucher #include "amdgpu.h" 31aaa36a97SAlex Deucher #include "amdgpu_vce.h" 32aaa36a97SAlex Deucher #include "vid.h" 33aaa36a97SAlex Deucher #include "vce/vce_3_0_d.h" 34aaa36a97SAlex Deucher #include "vce/vce_3_0_sh_mask.h" 35be4f38e2SAlex Deucher #include "oss/oss_3_0_d.h" 36be4f38e2SAlex Deucher #include "oss/oss_3_0_sh_mask.h" 375bbc553aSLeo Liu #include "gca/gfx_8_0_d.h" 386a585777SAlex Deucher #include "smu/smu_7_1_2_d.h" 396a585777SAlex Deucher #include "smu/smu_7_1_2_sh_mask.h" 405bbc553aSLeo Liu 415bbc553aSLeo Liu #define GRBM_GFX_INDEX__VCE_INSTANCE__SHIFT 0x04 425bbc553aSLeo Liu #define GRBM_GFX_INDEX__VCE_INSTANCE_MASK 0x10 433c0ff9f1SLeo Liu #define mmVCE_LMI_VCPU_CACHE_40BIT_BAR0 0x8616 443c0ff9f1SLeo Liu #define mmVCE_LMI_VCPU_CACHE_40BIT_BAR1 0x8617 453c0ff9f1SLeo Liu #define mmVCE_LMI_VCPU_CACHE_40BIT_BAR2 0x8618 46aaa36a97SAlex Deucher 47e9822622SLeo Liu #define VCE_V3_0_FW_SIZE (384 * 1024) 48e9822622SLeo Liu #define VCE_V3_0_STACK_SIZE (64 * 1024) 49e9822622SLeo Liu #define VCE_V3_0_DATA_SIZE ((16 * 1024 * AMDGPU_MAX_VCE_HANDLES) + (52 * 1024)) 50e9822622SLeo Liu 515bbc553aSLeo Liu static void vce_v3_0_mc_resume(struct amdgpu_device *adev, int idx); 52aaa36a97SAlex Deucher static void vce_v3_0_set_ring_funcs(struct amdgpu_device *adev); 53aaa36a97SAlex Deucher static void vce_v3_0_set_irq_funcs(struct amdgpu_device *adev); 54aaa36a97SAlex Deucher 55aaa36a97SAlex Deucher /** 56aaa36a97SAlex Deucher * vce_v3_0_ring_get_rptr - get read pointer 57aaa36a97SAlex Deucher * 58aaa36a97SAlex Deucher * @ring: amdgpu_ring pointer 59aaa36a97SAlex Deucher * 60aaa36a97SAlex Deucher * Returns the current hardware read pointer 61aaa36a97SAlex Deucher */ 62aaa36a97SAlex Deucher static uint32_t vce_v3_0_ring_get_rptr(struct amdgpu_ring *ring) 63aaa36a97SAlex Deucher { 64aaa36a97SAlex Deucher struct amdgpu_device *adev = ring->adev; 65aaa36a97SAlex Deucher 66aaa36a97SAlex Deucher if (ring == &adev->vce.ring[0]) 67aaa36a97SAlex Deucher return RREG32(mmVCE_RB_RPTR); 68aaa36a97SAlex Deucher else 69aaa36a97SAlex Deucher return RREG32(mmVCE_RB_RPTR2); 70aaa36a97SAlex Deucher } 71aaa36a97SAlex Deucher 72aaa36a97SAlex Deucher /** 73aaa36a97SAlex Deucher * vce_v3_0_ring_get_wptr - get write pointer 74aaa36a97SAlex Deucher * 75aaa36a97SAlex Deucher * @ring: amdgpu_ring pointer 76aaa36a97SAlex Deucher * 77aaa36a97SAlex Deucher * Returns the current hardware write pointer 78aaa36a97SAlex Deucher */ 79aaa36a97SAlex Deucher static uint32_t vce_v3_0_ring_get_wptr(struct amdgpu_ring *ring) 80aaa36a97SAlex Deucher { 81aaa36a97SAlex Deucher struct amdgpu_device *adev = ring->adev; 82aaa36a97SAlex Deucher 83aaa36a97SAlex Deucher if (ring == &adev->vce.ring[0]) 84aaa36a97SAlex Deucher return RREG32(mmVCE_RB_WPTR); 85aaa36a97SAlex Deucher else 86aaa36a97SAlex Deucher return RREG32(mmVCE_RB_WPTR2); 87aaa36a97SAlex Deucher } 88aaa36a97SAlex Deucher 89aaa36a97SAlex Deucher /** 90aaa36a97SAlex Deucher * vce_v3_0_ring_set_wptr - set write pointer 91aaa36a97SAlex Deucher * 92aaa36a97SAlex Deucher * @ring: amdgpu_ring pointer 93aaa36a97SAlex Deucher * 94aaa36a97SAlex Deucher * Commits the write pointer to the hardware 95aaa36a97SAlex Deucher */ 96aaa36a97SAlex Deucher static void vce_v3_0_ring_set_wptr(struct amdgpu_ring *ring) 97aaa36a97SAlex Deucher { 98aaa36a97SAlex Deucher struct amdgpu_device *adev = ring->adev; 99aaa36a97SAlex Deucher 100aaa36a97SAlex Deucher if (ring == &adev->vce.ring[0]) 101aaa36a97SAlex Deucher WREG32(mmVCE_RB_WPTR, ring->wptr); 102aaa36a97SAlex Deucher else 103aaa36a97SAlex Deucher WREG32(mmVCE_RB_WPTR2, ring->wptr); 104aaa36a97SAlex Deucher } 105aaa36a97SAlex Deucher 1060689a570SEric Huang static void vce_v3_0_override_vce_clock_gating(struct amdgpu_device *adev, bool override) 1070689a570SEric Huang { 1080689a570SEric Huang u32 tmp, data; 1090689a570SEric Huang 1100689a570SEric Huang tmp = data = RREG32(mmVCE_RB_ARB_CTRL); 1110689a570SEric Huang if (override) 1120689a570SEric Huang data |= VCE_RB_ARB_CTRL__VCE_CGTT_OVERRIDE_MASK; 1130689a570SEric Huang else 1140689a570SEric Huang data &= ~VCE_RB_ARB_CTRL__VCE_CGTT_OVERRIDE_MASK; 1150689a570SEric Huang 1160689a570SEric Huang if (tmp != data) 1170689a570SEric Huang WREG32(mmVCE_RB_ARB_CTRL, data); 1180689a570SEric Huang } 1190689a570SEric Huang 1200689a570SEric Huang static void vce_v3_0_set_vce_sw_clock_gating(struct amdgpu_device *adev, 1210689a570SEric Huang bool gated) 1220689a570SEric Huang { 1230689a570SEric Huang u32 tmp, data; 1240689a570SEric Huang /* Set Override to disable Clock Gating */ 1250689a570SEric Huang vce_v3_0_override_vce_clock_gating(adev, true); 1260689a570SEric Huang 1270689a570SEric Huang if (!gated) { 1280689a570SEric Huang /* Force CLOCK ON for VCE_CLOCK_GATING_B, 1290689a570SEric Huang * {*_FORCE_ON, *_FORCE_OFF} = {1, 0} 1300689a570SEric Huang * VREG can be FORCE ON or set to Dynamic, but can't be OFF 1310689a570SEric Huang */ 1320689a570SEric Huang tmp = data = RREG32(mmVCE_CLOCK_GATING_B); 1330689a570SEric Huang data |= 0x1ff; 1340689a570SEric Huang data &= ~0xef0000; 1350689a570SEric Huang if (tmp != data) 1360689a570SEric Huang WREG32(mmVCE_CLOCK_GATING_B, data); 1370689a570SEric Huang 1380689a570SEric Huang /* Force CLOCK ON for VCE_UENC_CLOCK_GATING, 1390689a570SEric Huang * {*_FORCE_ON, *_FORCE_OFF} = {1, 0} 1400689a570SEric Huang */ 1410689a570SEric Huang tmp = data = RREG32(mmVCE_UENC_CLOCK_GATING); 1420689a570SEric Huang data |= 0x3ff000; 1430689a570SEric Huang data &= ~0xffc00000; 1440689a570SEric Huang if (tmp != data) 1450689a570SEric Huang WREG32(mmVCE_UENC_CLOCK_GATING, data); 1460689a570SEric Huang 1470689a570SEric Huang /* set VCE_UENC_CLOCK_GATING_2 */ 1480689a570SEric Huang tmp = data = RREG32(mmVCE_UENC_CLOCK_GATING_2); 1490689a570SEric Huang data |= 0x2; 1500689a570SEric Huang data &= ~0x2; 1510689a570SEric Huang if (tmp != data) 1520689a570SEric Huang WREG32(mmVCE_UENC_CLOCK_GATING_2, data); 1530689a570SEric Huang 1540689a570SEric Huang /* Force CLOCK ON for VCE_UENC_REG_CLOCK_GATING */ 1550689a570SEric Huang tmp = data = RREG32(mmVCE_UENC_REG_CLOCK_GATING); 1560689a570SEric Huang data |= 0x37f; 1570689a570SEric Huang if (tmp != data) 1580689a570SEric Huang WREG32(mmVCE_UENC_REG_CLOCK_GATING, data); 1590689a570SEric Huang 1600689a570SEric Huang /* Force VCE_UENC_DMA_DCLK_CTRL Clock ON */ 1610689a570SEric Huang tmp = data = RREG32(mmVCE_UENC_DMA_DCLK_CTRL); 1620689a570SEric Huang data |= VCE_UENC_DMA_DCLK_CTRL__WRDMCLK_FORCEON_MASK | 1630689a570SEric Huang VCE_UENC_DMA_DCLK_CTRL__RDDMCLK_FORCEON_MASK | 1640689a570SEric Huang VCE_UENC_DMA_DCLK_CTRL__REGCLK_FORCEON_MASK | 1650689a570SEric Huang 0x8; 1660689a570SEric Huang if (tmp != data) 1670689a570SEric Huang WREG32(mmVCE_UENC_DMA_DCLK_CTRL, data); 1680689a570SEric Huang } else { 1690689a570SEric Huang /* Force CLOCK OFF for VCE_CLOCK_GATING_B, 1700689a570SEric Huang * {*, *_FORCE_OFF} = {*, 1} 1710689a570SEric Huang * set VREG to Dynamic, as it can't be OFF 1720689a570SEric Huang */ 1730689a570SEric Huang tmp = data = RREG32(mmVCE_CLOCK_GATING_B); 1740689a570SEric Huang data &= ~0x80010; 1750689a570SEric Huang data |= 0xe70008; 1760689a570SEric Huang if (tmp != data) 1770689a570SEric Huang WREG32(mmVCE_CLOCK_GATING_B, data); 1780689a570SEric Huang /* Force CLOCK OFF for VCE_UENC_CLOCK_GATING, 1790689a570SEric Huang * Force ClOCK OFF takes precedent over Force CLOCK ON setting. 1800689a570SEric Huang * {*_FORCE_ON, *_FORCE_OFF} = {*, 1} 1810689a570SEric Huang */ 1820689a570SEric Huang tmp = data = RREG32(mmVCE_UENC_CLOCK_GATING); 1830689a570SEric Huang data |= 0xffc00000; 1840689a570SEric Huang if (tmp != data) 1850689a570SEric Huang WREG32(mmVCE_UENC_CLOCK_GATING, data); 1860689a570SEric Huang /* Set VCE_UENC_CLOCK_GATING_2 */ 1870689a570SEric Huang tmp = data = RREG32(mmVCE_UENC_CLOCK_GATING_2); 1880689a570SEric Huang data |= 0x10000; 1890689a570SEric Huang if (tmp != data) 1900689a570SEric Huang WREG32(mmVCE_UENC_CLOCK_GATING_2, data); 1910689a570SEric Huang /* Set VCE_UENC_REG_CLOCK_GATING to dynamic */ 1920689a570SEric Huang tmp = data = RREG32(mmVCE_UENC_REG_CLOCK_GATING); 1930689a570SEric Huang data &= ~0xffc00000; 1940689a570SEric Huang if (tmp != data) 1950689a570SEric Huang WREG32(mmVCE_UENC_REG_CLOCK_GATING, data); 1960689a570SEric Huang /* Set VCE_UENC_DMA_DCLK_CTRL CG always in dynamic mode */ 1970689a570SEric Huang tmp = data = RREG32(mmVCE_UENC_DMA_DCLK_CTRL); 1980689a570SEric Huang data &= ~(VCE_UENC_DMA_DCLK_CTRL__WRDMCLK_FORCEON_MASK | 1990689a570SEric Huang VCE_UENC_DMA_DCLK_CTRL__RDDMCLK_FORCEON_MASK | 2000689a570SEric Huang VCE_UENC_DMA_DCLK_CTRL__REGCLK_FORCEON_MASK | 2010689a570SEric Huang 0x8); 2020689a570SEric Huang if (tmp != data) 2030689a570SEric Huang WREG32(mmVCE_UENC_DMA_DCLK_CTRL, data); 2040689a570SEric Huang } 2050689a570SEric Huang vce_v3_0_override_vce_clock_gating(adev, false); 2060689a570SEric Huang } 2070689a570SEric Huang 208aaa36a97SAlex Deucher /** 209aaa36a97SAlex Deucher * vce_v3_0_start - start VCE block 210aaa36a97SAlex Deucher * 211aaa36a97SAlex Deucher * @adev: amdgpu_device pointer 212aaa36a97SAlex Deucher * 213aaa36a97SAlex Deucher * Setup and start the VCE block 214aaa36a97SAlex Deucher */ 215aaa36a97SAlex Deucher static int vce_v3_0_start(struct amdgpu_device *adev) 216aaa36a97SAlex Deucher { 217aaa36a97SAlex Deucher struct amdgpu_ring *ring; 2185bbc553aSLeo Liu int idx, i, j, r; 219aaa36a97SAlex Deucher 2205bbc553aSLeo Liu mutex_lock(&adev->grbm_idx_mutex); 2215bbc553aSLeo Liu for (idx = 0; idx < 2; ++idx) { 2226a585777SAlex Deucher 2236a585777SAlex Deucher if (adev->vce.harvest_config & (1 << idx)) 2246a585777SAlex Deucher continue; 2256a585777SAlex Deucher 2265bbc553aSLeo Liu if (idx == 0) 2275bbc553aSLeo Liu WREG32_P(mmGRBM_GFX_INDEX, 0, 2285bbc553aSLeo Liu ~GRBM_GFX_INDEX__VCE_INSTANCE_MASK); 2295bbc553aSLeo Liu else 2305bbc553aSLeo Liu WREG32_P(mmGRBM_GFX_INDEX, 2315bbc553aSLeo Liu GRBM_GFX_INDEX__VCE_INSTANCE_MASK, 2325bbc553aSLeo Liu ~GRBM_GFX_INDEX__VCE_INSTANCE_MASK); 2335bbc553aSLeo Liu 2345bbc553aSLeo Liu vce_v3_0_mc_resume(adev, idx); 235aaa36a97SAlex Deucher 236aaa36a97SAlex Deucher /* set BUSY flag */ 237aaa36a97SAlex Deucher WREG32_P(mmVCE_STATUS, 1, ~1); 2383c0ff9f1SLeo Liu if (adev->asic_type >= CHIP_STONEY) 2393c0ff9f1SLeo Liu WREG32_P(mmVCE_VCPU_CNTL, 1, ~0x200001); 2403c0ff9f1SLeo Liu else 2415bbc553aSLeo Liu WREG32_P(mmVCE_VCPU_CNTL, VCE_VCPU_CNTL__CLK_EN_MASK, 2425bbc553aSLeo Liu ~VCE_VCPU_CNTL__CLK_EN_MASK); 243aaa36a97SAlex Deucher 244aaa36a97SAlex Deucher WREG32_P(mmVCE_SOFT_RESET, 245aaa36a97SAlex Deucher VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK, 246aaa36a97SAlex Deucher ~VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK); 247aaa36a97SAlex Deucher 248aaa36a97SAlex Deucher mdelay(100); 249aaa36a97SAlex Deucher 2505bbc553aSLeo Liu WREG32_P(mmVCE_SOFT_RESET, 0, 2515bbc553aSLeo Liu ~VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK); 252aaa36a97SAlex Deucher 253aaa36a97SAlex Deucher for (i = 0; i < 10; ++i) { 254aaa36a97SAlex Deucher uint32_t status; 255aaa36a97SAlex Deucher for (j = 0; j < 100; ++j) { 256aaa36a97SAlex Deucher status = RREG32(mmVCE_STATUS); 257aaa36a97SAlex Deucher if (status & 2) 258aaa36a97SAlex Deucher break; 259aaa36a97SAlex Deucher mdelay(10); 260aaa36a97SAlex Deucher } 261aaa36a97SAlex Deucher r = 0; 262aaa36a97SAlex Deucher if (status & 2) 263aaa36a97SAlex Deucher break; 264aaa36a97SAlex Deucher 265aaa36a97SAlex Deucher DRM_ERROR("VCE not responding, trying to reset the ECPU!!!\n"); 2665bbc553aSLeo Liu WREG32_P(mmVCE_SOFT_RESET, 2675bbc553aSLeo Liu VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK, 268aaa36a97SAlex Deucher ~VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK); 269aaa36a97SAlex Deucher mdelay(10); 2705bbc553aSLeo Liu WREG32_P(mmVCE_SOFT_RESET, 0, 2715bbc553aSLeo Liu ~VCE_SOFT_RESET__ECPU_SOFT_RESET_MASK); 272aaa36a97SAlex Deucher mdelay(10); 273aaa36a97SAlex Deucher r = -1; 274aaa36a97SAlex Deucher } 275aaa36a97SAlex Deucher 276aaa36a97SAlex Deucher /* clear BUSY flag */ 277aaa36a97SAlex Deucher WREG32_P(mmVCE_STATUS, 0, ~1); 278aaa36a97SAlex Deucher 2790689a570SEric Huang /* Set Clock-Gating off */ 2800689a570SEric Huang if (adev->cg_flags & AMDGPU_CG_SUPPORT_VCE_MGCG) 2810689a570SEric Huang vce_v3_0_set_vce_sw_clock_gating(adev, false); 2820689a570SEric Huang 283aaa36a97SAlex Deucher if (r) { 284aaa36a97SAlex Deucher DRM_ERROR("VCE not responding, giving up!!!\n"); 2855bbc553aSLeo Liu mutex_unlock(&adev->grbm_idx_mutex); 286aaa36a97SAlex Deucher return r; 287aaa36a97SAlex Deucher } 2885bbc553aSLeo Liu } 2895bbc553aSLeo Liu 2905bbc553aSLeo Liu WREG32_P(mmGRBM_GFX_INDEX, 0, ~GRBM_GFX_INDEX__VCE_INSTANCE_MASK); 2915bbc553aSLeo Liu mutex_unlock(&adev->grbm_idx_mutex); 2925bbc553aSLeo Liu 2935bbc553aSLeo Liu ring = &adev->vce.ring[0]; 2945bbc553aSLeo Liu WREG32(mmVCE_RB_RPTR, ring->wptr); 2955bbc553aSLeo Liu WREG32(mmVCE_RB_WPTR, ring->wptr); 2965bbc553aSLeo Liu WREG32(mmVCE_RB_BASE_LO, ring->gpu_addr); 2975bbc553aSLeo Liu WREG32(mmVCE_RB_BASE_HI, upper_32_bits(ring->gpu_addr)); 2985bbc553aSLeo Liu WREG32(mmVCE_RB_SIZE, ring->ring_size / 4); 2995bbc553aSLeo Liu 3005bbc553aSLeo Liu ring = &adev->vce.ring[1]; 3015bbc553aSLeo Liu WREG32(mmVCE_RB_RPTR2, ring->wptr); 3025bbc553aSLeo Liu WREG32(mmVCE_RB_WPTR2, ring->wptr); 3035bbc553aSLeo Liu WREG32(mmVCE_RB_BASE_LO2, ring->gpu_addr); 3045bbc553aSLeo Liu WREG32(mmVCE_RB_BASE_HI2, upper_32_bits(ring->gpu_addr)); 3055bbc553aSLeo Liu WREG32(mmVCE_RB_SIZE2, ring->ring_size / 4); 306aaa36a97SAlex Deucher 307aaa36a97SAlex Deucher return 0; 308aaa36a97SAlex Deucher } 309aaa36a97SAlex Deucher 3106a585777SAlex Deucher #define ixVCE_HARVEST_FUSE_MACRO__ADDRESS 0xC0014074 3116a585777SAlex Deucher #define VCE_HARVEST_FUSE_MACRO__SHIFT 27 3126a585777SAlex Deucher #define VCE_HARVEST_FUSE_MACRO__MASK 0x18000000 3136a585777SAlex Deucher 3146a585777SAlex Deucher static unsigned vce_v3_0_get_harvest_config(struct amdgpu_device *adev) 3156a585777SAlex Deucher { 3166a585777SAlex Deucher u32 tmp; 3176a585777SAlex Deucher 318cfaba566SSamuel Li /* Fiji, Stoney are single pipe */ 319cfaba566SSamuel Li if ((adev->asic_type == CHIP_FIJI) || 3201dab5f06STom St Denis (adev->asic_type == CHIP_STONEY)) 3211dab5f06STom St Denis return AMDGPU_VCE_HARVEST_VCE1; 322188a9bcdSAlex Deucher 323188a9bcdSAlex Deucher /* Tonga and CZ are dual or single pipe */ 3242f7d10b3SJammy Zhou if (adev->flags & AMD_IS_APU) 3256a585777SAlex Deucher tmp = (RREG32_SMC(ixVCE_HARVEST_FUSE_MACRO__ADDRESS) & 3266a585777SAlex Deucher VCE_HARVEST_FUSE_MACRO__MASK) >> 3276a585777SAlex Deucher VCE_HARVEST_FUSE_MACRO__SHIFT; 3286a585777SAlex Deucher else 3296a585777SAlex Deucher tmp = (RREG32_SMC(ixCC_HARVEST_FUSES) & 3306a585777SAlex Deucher CC_HARVEST_FUSES__VCE_DISABLE_MASK) >> 3316a585777SAlex Deucher CC_HARVEST_FUSES__VCE_DISABLE__SHIFT; 3326a585777SAlex Deucher 3336a585777SAlex Deucher switch (tmp) { 3346a585777SAlex Deucher case 1: 3351dab5f06STom St Denis return AMDGPU_VCE_HARVEST_VCE0; 3366a585777SAlex Deucher case 2: 3371dab5f06STom St Denis return AMDGPU_VCE_HARVEST_VCE1; 3386a585777SAlex Deucher case 3: 3391dab5f06STom St Denis return AMDGPU_VCE_HARVEST_VCE0 | AMDGPU_VCE_HARVEST_VCE1; 3406a585777SAlex Deucher default: 3411dab5f06STom St Denis return 0; 3426a585777SAlex Deucher } 3436a585777SAlex Deucher } 3446a585777SAlex Deucher 3455fc3aeebSyanyang1 static int vce_v3_0_early_init(void *handle) 346aaa36a97SAlex Deucher { 3475fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 3485fc3aeebSyanyang1 3496a585777SAlex Deucher adev->vce.harvest_config = vce_v3_0_get_harvest_config(adev); 3506a585777SAlex Deucher 3516a585777SAlex Deucher if ((adev->vce.harvest_config & 3526a585777SAlex Deucher (AMDGPU_VCE_HARVEST_VCE0 | AMDGPU_VCE_HARVEST_VCE1)) == 3536a585777SAlex Deucher (AMDGPU_VCE_HARVEST_VCE0 | AMDGPU_VCE_HARVEST_VCE1)) 3546a585777SAlex Deucher return -ENOENT; 3556a585777SAlex Deucher 356aaa36a97SAlex Deucher vce_v3_0_set_ring_funcs(adev); 357aaa36a97SAlex Deucher vce_v3_0_set_irq_funcs(adev); 358aaa36a97SAlex Deucher 359aaa36a97SAlex Deucher return 0; 360aaa36a97SAlex Deucher } 361aaa36a97SAlex Deucher 3625fc3aeebSyanyang1 static int vce_v3_0_sw_init(void *handle) 363aaa36a97SAlex Deucher { 3645fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 365aaa36a97SAlex Deucher struct amdgpu_ring *ring; 366aaa36a97SAlex Deucher int r; 367aaa36a97SAlex Deucher 368aaa36a97SAlex Deucher /* VCE */ 369aaa36a97SAlex Deucher r = amdgpu_irq_add_id(adev, 167, &adev->vce.irq); 370aaa36a97SAlex Deucher if (r) 371aaa36a97SAlex Deucher return r; 372aaa36a97SAlex Deucher 373e9822622SLeo Liu r = amdgpu_vce_sw_init(adev, VCE_V3_0_FW_SIZE + 374e9822622SLeo Liu (VCE_V3_0_STACK_SIZE + VCE_V3_0_DATA_SIZE) * 2); 375aaa36a97SAlex Deucher if (r) 376aaa36a97SAlex Deucher return r; 377aaa36a97SAlex Deucher 378aaa36a97SAlex Deucher r = amdgpu_vce_resume(adev); 379aaa36a97SAlex Deucher if (r) 380aaa36a97SAlex Deucher return r; 381aaa36a97SAlex Deucher 382aaa36a97SAlex Deucher ring = &adev->vce.ring[0]; 383aaa36a97SAlex Deucher sprintf(ring->name, "vce0"); 384aaa36a97SAlex Deucher r = amdgpu_ring_init(adev, ring, 4096, VCE_CMD_NO_OP, 0xf, 385aaa36a97SAlex Deucher &adev->vce.irq, 0, AMDGPU_RING_TYPE_VCE); 386aaa36a97SAlex Deucher if (r) 387aaa36a97SAlex Deucher return r; 388aaa36a97SAlex Deucher 389aaa36a97SAlex Deucher ring = &adev->vce.ring[1]; 390aaa36a97SAlex Deucher sprintf(ring->name, "vce1"); 391aaa36a97SAlex Deucher r = amdgpu_ring_init(adev, ring, 4096, VCE_CMD_NO_OP, 0xf, 392aaa36a97SAlex Deucher &adev->vce.irq, 0, AMDGPU_RING_TYPE_VCE); 393aaa36a97SAlex Deucher if (r) 394aaa36a97SAlex Deucher return r; 395aaa36a97SAlex Deucher 396aaa36a97SAlex Deucher return r; 397aaa36a97SAlex Deucher } 398aaa36a97SAlex Deucher 3995fc3aeebSyanyang1 static int vce_v3_0_sw_fini(void *handle) 400aaa36a97SAlex Deucher { 401aaa36a97SAlex Deucher int r; 4025fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 403aaa36a97SAlex Deucher 404aaa36a97SAlex Deucher r = amdgpu_vce_suspend(adev); 405aaa36a97SAlex Deucher if (r) 406aaa36a97SAlex Deucher return r; 407aaa36a97SAlex Deucher 408aaa36a97SAlex Deucher r = amdgpu_vce_sw_fini(adev); 409aaa36a97SAlex Deucher if (r) 410aaa36a97SAlex Deucher return r; 411aaa36a97SAlex Deucher 412aaa36a97SAlex Deucher return r; 413aaa36a97SAlex Deucher } 414aaa36a97SAlex Deucher 4155fc3aeebSyanyang1 static int vce_v3_0_hw_init(void *handle) 416aaa36a97SAlex Deucher { 417aaa36a97SAlex Deucher struct amdgpu_ring *ring; 418aaa36a97SAlex Deucher int r; 4195fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 420aaa36a97SAlex Deucher 421aaa36a97SAlex Deucher r = vce_v3_0_start(adev); 422aaa36a97SAlex Deucher if (r) 423aaa36a97SAlex Deucher return r; 424aaa36a97SAlex Deucher 425aaa36a97SAlex Deucher ring = &adev->vce.ring[0]; 426aaa36a97SAlex Deucher ring->ready = true; 427aaa36a97SAlex Deucher r = amdgpu_ring_test_ring(ring); 428aaa36a97SAlex Deucher if (r) { 429aaa36a97SAlex Deucher ring->ready = false; 430aaa36a97SAlex Deucher return r; 431aaa36a97SAlex Deucher } 432aaa36a97SAlex Deucher 433aaa36a97SAlex Deucher ring = &adev->vce.ring[1]; 434aaa36a97SAlex Deucher ring->ready = true; 435aaa36a97SAlex Deucher r = amdgpu_ring_test_ring(ring); 436aaa36a97SAlex Deucher if (r) { 437aaa36a97SAlex Deucher ring->ready = false; 438aaa36a97SAlex Deucher return r; 439aaa36a97SAlex Deucher } 440aaa36a97SAlex Deucher 441aaa36a97SAlex Deucher DRM_INFO("VCE initialized successfully.\n"); 442aaa36a97SAlex Deucher 443aaa36a97SAlex Deucher return 0; 444aaa36a97SAlex Deucher } 445aaa36a97SAlex Deucher 4465fc3aeebSyanyang1 static int vce_v3_0_hw_fini(void *handle) 447aaa36a97SAlex Deucher { 448aaa36a97SAlex Deucher return 0; 449aaa36a97SAlex Deucher } 450aaa36a97SAlex Deucher 4515fc3aeebSyanyang1 static int vce_v3_0_suspend(void *handle) 452aaa36a97SAlex Deucher { 453aaa36a97SAlex Deucher int r; 4545fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 455aaa36a97SAlex Deucher 456aaa36a97SAlex Deucher r = vce_v3_0_hw_fini(adev); 457aaa36a97SAlex Deucher if (r) 458aaa36a97SAlex Deucher return r; 459aaa36a97SAlex Deucher 460aaa36a97SAlex Deucher r = amdgpu_vce_suspend(adev); 461aaa36a97SAlex Deucher if (r) 462aaa36a97SAlex Deucher return r; 463aaa36a97SAlex Deucher 464aaa36a97SAlex Deucher return r; 465aaa36a97SAlex Deucher } 466aaa36a97SAlex Deucher 4675fc3aeebSyanyang1 static int vce_v3_0_resume(void *handle) 468aaa36a97SAlex Deucher { 469aaa36a97SAlex Deucher int r; 4705fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 471aaa36a97SAlex Deucher 472aaa36a97SAlex Deucher r = amdgpu_vce_resume(adev); 473aaa36a97SAlex Deucher if (r) 474aaa36a97SAlex Deucher return r; 475aaa36a97SAlex Deucher 476aaa36a97SAlex Deucher r = vce_v3_0_hw_init(adev); 477aaa36a97SAlex Deucher if (r) 478aaa36a97SAlex Deucher return r; 479aaa36a97SAlex Deucher 480aaa36a97SAlex Deucher return r; 481aaa36a97SAlex Deucher } 482aaa36a97SAlex Deucher 4835bbc553aSLeo Liu static void vce_v3_0_mc_resume(struct amdgpu_device *adev, int idx) 484aaa36a97SAlex Deucher { 485aaa36a97SAlex Deucher uint32_t offset, size; 486aaa36a97SAlex Deucher 487aaa36a97SAlex Deucher WREG32_P(mmVCE_CLOCK_GATING_A, 0, ~(1 << 16)); 488aaa36a97SAlex Deucher WREG32_P(mmVCE_UENC_CLOCK_GATING, 0x1FF000, ~0xFF9FF000); 489aaa36a97SAlex Deucher WREG32_P(mmVCE_UENC_REG_CLOCK_GATING, 0x3F, ~0x3F); 490aaa36a97SAlex Deucher WREG32(mmVCE_CLOCK_GATING_B, 0xf7); 491aaa36a97SAlex Deucher 492aaa36a97SAlex Deucher WREG32(mmVCE_LMI_CTRL, 0x00398000); 493aaa36a97SAlex Deucher WREG32_P(mmVCE_LMI_CACHE_CTRL, 0x0, ~0x1); 494aaa36a97SAlex Deucher WREG32(mmVCE_LMI_SWAP_CNTL, 0); 495aaa36a97SAlex Deucher WREG32(mmVCE_LMI_SWAP_CNTL1, 0); 496aaa36a97SAlex Deucher WREG32(mmVCE_LMI_VM_CTRL, 0); 4973c0ff9f1SLeo Liu if (adev->asic_type >= CHIP_STONEY) { 4983c0ff9f1SLeo Liu WREG32(mmVCE_LMI_VCPU_CACHE_40BIT_BAR0, (adev->vce.gpu_addr >> 8)); 4993c0ff9f1SLeo Liu WREG32(mmVCE_LMI_VCPU_CACHE_40BIT_BAR1, (adev->vce.gpu_addr >> 8)); 5003c0ff9f1SLeo Liu WREG32(mmVCE_LMI_VCPU_CACHE_40BIT_BAR2, (adev->vce.gpu_addr >> 8)); 5013c0ff9f1SLeo Liu } else 502aaa36a97SAlex Deucher WREG32(mmVCE_LMI_VCPU_CACHE_40BIT_BAR, (adev->vce.gpu_addr >> 8)); 503aaa36a97SAlex Deucher offset = AMDGPU_VCE_FIRMWARE_OFFSET; 504e9822622SLeo Liu size = VCE_V3_0_FW_SIZE; 505aaa36a97SAlex Deucher WREG32(mmVCE_VCPU_CACHE_OFFSET0, offset & 0x7fffffff); 506aaa36a97SAlex Deucher WREG32(mmVCE_VCPU_CACHE_SIZE0, size); 507aaa36a97SAlex Deucher 5085bbc553aSLeo Liu if (idx == 0) { 509aaa36a97SAlex Deucher offset += size; 510e9822622SLeo Liu size = VCE_V3_0_STACK_SIZE; 511aaa36a97SAlex Deucher WREG32(mmVCE_VCPU_CACHE_OFFSET1, offset & 0x7fffffff); 512aaa36a97SAlex Deucher WREG32(mmVCE_VCPU_CACHE_SIZE1, size); 513aaa36a97SAlex Deucher offset += size; 514e9822622SLeo Liu size = VCE_V3_0_DATA_SIZE; 515aaa36a97SAlex Deucher WREG32(mmVCE_VCPU_CACHE_OFFSET2, offset & 0x7fffffff); 516aaa36a97SAlex Deucher WREG32(mmVCE_VCPU_CACHE_SIZE2, size); 5175bbc553aSLeo Liu } else { 5185bbc553aSLeo Liu offset += size + VCE_V3_0_STACK_SIZE + VCE_V3_0_DATA_SIZE; 5195bbc553aSLeo Liu size = VCE_V3_0_STACK_SIZE; 5205bbc553aSLeo Liu WREG32(mmVCE_VCPU_CACHE_OFFSET1, offset & 0xfffffff); 5215bbc553aSLeo Liu WREG32(mmVCE_VCPU_CACHE_SIZE1, size); 5225bbc553aSLeo Liu offset += size; 5235bbc553aSLeo Liu size = VCE_V3_0_DATA_SIZE; 5245bbc553aSLeo Liu WREG32(mmVCE_VCPU_CACHE_OFFSET2, offset & 0xfffffff); 5255bbc553aSLeo Liu WREG32(mmVCE_VCPU_CACHE_SIZE2, size); 5265bbc553aSLeo Liu } 527aaa36a97SAlex Deucher 528aaa36a97SAlex Deucher WREG32_P(mmVCE_LMI_CTRL2, 0x0, ~0x100); 529aaa36a97SAlex Deucher 530aaa36a97SAlex Deucher WREG32_P(mmVCE_SYS_INT_EN, VCE_SYS_INT_EN__VCE_SYS_INT_TRAP_INTERRUPT_EN_MASK, 531aaa36a97SAlex Deucher ~VCE_SYS_INT_EN__VCE_SYS_INT_TRAP_INTERRUPT_EN_MASK); 532aaa36a97SAlex Deucher } 533aaa36a97SAlex Deucher 5345fc3aeebSyanyang1 static bool vce_v3_0_is_idle(void *handle) 535aaa36a97SAlex Deucher { 5365fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 537be4f38e2SAlex Deucher u32 mask = 0; 538be4f38e2SAlex Deucher int idx; 5395fc3aeebSyanyang1 540be4f38e2SAlex Deucher for (idx = 0; idx < 2; ++idx) { 541be4f38e2SAlex Deucher if (adev->vce.harvest_config & (1 << idx)) 542be4f38e2SAlex Deucher continue; 543be4f38e2SAlex Deucher 544be4f38e2SAlex Deucher if (idx == 0) 545be4f38e2SAlex Deucher mask |= SRBM_STATUS2__VCE0_BUSY_MASK; 546be4f38e2SAlex Deucher else 547be4f38e2SAlex Deucher mask |= SRBM_STATUS2__VCE1_BUSY_MASK; 548be4f38e2SAlex Deucher } 549be4f38e2SAlex Deucher 550be4f38e2SAlex Deucher return !(RREG32(mmSRBM_STATUS2) & mask); 551aaa36a97SAlex Deucher } 552aaa36a97SAlex Deucher 5535fc3aeebSyanyang1 static int vce_v3_0_wait_for_idle(void *handle) 554aaa36a97SAlex Deucher { 555aaa36a97SAlex Deucher unsigned i; 5565fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 557be4f38e2SAlex Deucher u32 mask = 0; 558be4f38e2SAlex Deucher int idx; 559be4f38e2SAlex Deucher 560be4f38e2SAlex Deucher for (idx = 0; idx < 2; ++idx) { 561be4f38e2SAlex Deucher if (adev->vce.harvest_config & (1 << idx)) 562be4f38e2SAlex Deucher continue; 563be4f38e2SAlex Deucher 564be4f38e2SAlex Deucher if (idx == 0) 565be4f38e2SAlex Deucher mask |= SRBM_STATUS2__VCE0_BUSY_MASK; 566be4f38e2SAlex Deucher else 567be4f38e2SAlex Deucher mask |= SRBM_STATUS2__VCE1_BUSY_MASK; 568be4f38e2SAlex Deucher } 569aaa36a97SAlex Deucher 570aaa36a97SAlex Deucher for (i = 0; i < adev->usec_timeout; i++) { 571be4f38e2SAlex Deucher if (!(RREG32(mmSRBM_STATUS2) & mask)) 572aaa36a97SAlex Deucher return 0; 573aaa36a97SAlex Deucher } 574aaa36a97SAlex Deucher return -ETIMEDOUT; 575aaa36a97SAlex Deucher } 576aaa36a97SAlex Deucher 5775fc3aeebSyanyang1 static int vce_v3_0_soft_reset(void *handle) 578aaa36a97SAlex Deucher { 5795fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 580be4f38e2SAlex Deucher u32 mask = 0; 581be4f38e2SAlex Deucher int idx; 5825fc3aeebSyanyang1 583be4f38e2SAlex Deucher for (idx = 0; idx < 2; ++idx) { 584be4f38e2SAlex Deucher if (adev->vce.harvest_config & (1 << idx)) 585be4f38e2SAlex Deucher continue; 586be4f38e2SAlex Deucher 587be4f38e2SAlex Deucher if (idx == 0) 588be4f38e2SAlex Deucher mask |= SRBM_SOFT_RESET__SOFT_RESET_VCE0_MASK; 589be4f38e2SAlex Deucher else 590be4f38e2SAlex Deucher mask |= SRBM_SOFT_RESET__SOFT_RESET_VCE1_MASK; 591be4f38e2SAlex Deucher } 592be4f38e2SAlex Deucher WREG32_P(mmSRBM_SOFT_RESET, mask, 593be4f38e2SAlex Deucher ~(SRBM_SOFT_RESET__SOFT_RESET_VCE0_MASK | 594be4f38e2SAlex Deucher SRBM_SOFT_RESET__SOFT_RESET_VCE1_MASK)); 595aaa36a97SAlex Deucher mdelay(5); 596aaa36a97SAlex Deucher 597aaa36a97SAlex Deucher return vce_v3_0_start(adev); 598aaa36a97SAlex Deucher } 599aaa36a97SAlex Deucher 6005fc3aeebSyanyang1 static void vce_v3_0_print_status(void *handle) 601aaa36a97SAlex Deucher { 6025fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 6035fc3aeebSyanyang1 604aaa36a97SAlex Deucher dev_info(adev->dev, "VCE 3.0 registers\n"); 605aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_STATUS=0x%08X\n", 606aaa36a97SAlex Deucher RREG32(mmVCE_STATUS)); 607aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_VCPU_CNTL=0x%08X\n", 608aaa36a97SAlex Deucher RREG32(mmVCE_VCPU_CNTL)); 609aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_VCPU_CACHE_OFFSET0=0x%08X\n", 610aaa36a97SAlex Deucher RREG32(mmVCE_VCPU_CACHE_OFFSET0)); 611aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_VCPU_CACHE_SIZE0=0x%08X\n", 612aaa36a97SAlex Deucher RREG32(mmVCE_VCPU_CACHE_SIZE0)); 613aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_VCPU_CACHE_OFFSET1=0x%08X\n", 614aaa36a97SAlex Deucher RREG32(mmVCE_VCPU_CACHE_OFFSET1)); 615aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_VCPU_CACHE_SIZE1=0x%08X\n", 616aaa36a97SAlex Deucher RREG32(mmVCE_VCPU_CACHE_SIZE1)); 617aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_VCPU_CACHE_OFFSET2=0x%08X\n", 618aaa36a97SAlex Deucher RREG32(mmVCE_VCPU_CACHE_OFFSET2)); 619aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_VCPU_CACHE_SIZE2=0x%08X\n", 620aaa36a97SAlex Deucher RREG32(mmVCE_VCPU_CACHE_SIZE2)); 621aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_SOFT_RESET=0x%08X\n", 622aaa36a97SAlex Deucher RREG32(mmVCE_SOFT_RESET)); 623aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_RB_BASE_LO2=0x%08X\n", 624aaa36a97SAlex Deucher RREG32(mmVCE_RB_BASE_LO2)); 625aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_RB_BASE_HI2=0x%08X\n", 626aaa36a97SAlex Deucher RREG32(mmVCE_RB_BASE_HI2)); 627aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_RB_SIZE2=0x%08X\n", 628aaa36a97SAlex Deucher RREG32(mmVCE_RB_SIZE2)); 629aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_RB_RPTR2=0x%08X\n", 630aaa36a97SAlex Deucher RREG32(mmVCE_RB_RPTR2)); 631aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_RB_WPTR2=0x%08X\n", 632aaa36a97SAlex Deucher RREG32(mmVCE_RB_WPTR2)); 633aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_RB_BASE_LO=0x%08X\n", 634aaa36a97SAlex Deucher RREG32(mmVCE_RB_BASE_LO)); 635aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_RB_BASE_HI=0x%08X\n", 636aaa36a97SAlex Deucher RREG32(mmVCE_RB_BASE_HI)); 637aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_RB_SIZE=0x%08X\n", 638aaa36a97SAlex Deucher RREG32(mmVCE_RB_SIZE)); 639aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_RB_RPTR=0x%08X\n", 640aaa36a97SAlex Deucher RREG32(mmVCE_RB_RPTR)); 641aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_RB_WPTR=0x%08X\n", 642aaa36a97SAlex Deucher RREG32(mmVCE_RB_WPTR)); 643aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_CLOCK_GATING_A=0x%08X\n", 644aaa36a97SAlex Deucher RREG32(mmVCE_CLOCK_GATING_A)); 645aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_CLOCK_GATING_B=0x%08X\n", 646aaa36a97SAlex Deucher RREG32(mmVCE_CLOCK_GATING_B)); 647aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_UENC_CLOCK_GATING=0x%08X\n", 648aaa36a97SAlex Deucher RREG32(mmVCE_UENC_CLOCK_GATING)); 649aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_UENC_REG_CLOCK_GATING=0x%08X\n", 650aaa36a97SAlex Deucher RREG32(mmVCE_UENC_REG_CLOCK_GATING)); 651aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_SYS_INT_EN=0x%08X\n", 652aaa36a97SAlex Deucher RREG32(mmVCE_SYS_INT_EN)); 653aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_LMI_CTRL2=0x%08X\n", 654aaa36a97SAlex Deucher RREG32(mmVCE_LMI_CTRL2)); 655aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_LMI_CTRL=0x%08X\n", 656aaa36a97SAlex Deucher RREG32(mmVCE_LMI_CTRL)); 657aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_LMI_VM_CTRL=0x%08X\n", 658aaa36a97SAlex Deucher RREG32(mmVCE_LMI_VM_CTRL)); 659aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_LMI_SWAP_CNTL=0x%08X\n", 660aaa36a97SAlex Deucher RREG32(mmVCE_LMI_SWAP_CNTL)); 661aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_LMI_SWAP_CNTL1=0x%08X\n", 662aaa36a97SAlex Deucher RREG32(mmVCE_LMI_SWAP_CNTL1)); 663aaa36a97SAlex Deucher dev_info(adev->dev, " VCE_LMI_CACHE_CTRL=0x%08X\n", 664aaa36a97SAlex Deucher RREG32(mmVCE_LMI_CACHE_CTRL)); 665aaa36a97SAlex Deucher } 666aaa36a97SAlex Deucher 667aaa36a97SAlex Deucher static int vce_v3_0_set_interrupt_state(struct amdgpu_device *adev, 668aaa36a97SAlex Deucher struct amdgpu_irq_src *source, 669aaa36a97SAlex Deucher unsigned type, 670aaa36a97SAlex Deucher enum amdgpu_interrupt_state state) 671aaa36a97SAlex Deucher { 672aaa36a97SAlex Deucher uint32_t val = 0; 673aaa36a97SAlex Deucher 674aaa36a97SAlex Deucher if (state == AMDGPU_IRQ_STATE_ENABLE) 675aaa36a97SAlex Deucher val |= VCE_SYS_INT_EN__VCE_SYS_INT_TRAP_INTERRUPT_EN_MASK; 676aaa36a97SAlex Deucher 677aaa36a97SAlex Deucher WREG32_P(mmVCE_SYS_INT_EN, val, ~VCE_SYS_INT_EN__VCE_SYS_INT_TRAP_INTERRUPT_EN_MASK); 678aaa36a97SAlex Deucher return 0; 679aaa36a97SAlex Deucher } 680aaa36a97SAlex Deucher 681aaa36a97SAlex Deucher static int vce_v3_0_process_interrupt(struct amdgpu_device *adev, 682aaa36a97SAlex Deucher struct amdgpu_irq_src *source, 683aaa36a97SAlex Deucher struct amdgpu_iv_entry *entry) 684aaa36a97SAlex Deucher { 685aaa36a97SAlex Deucher DRM_DEBUG("IH: VCE\n"); 686d6c29c30SLeo Liu 687d6c29c30SLeo Liu WREG32_P(mmVCE_SYS_INT_STATUS, 688d6c29c30SLeo Liu VCE_SYS_INT_STATUS__VCE_SYS_INT_TRAP_INTERRUPT_INT_MASK, 689d6c29c30SLeo Liu ~VCE_SYS_INT_STATUS__VCE_SYS_INT_TRAP_INTERRUPT_INT_MASK); 690d6c29c30SLeo Liu 691aaa36a97SAlex Deucher switch (entry->src_data) { 692aaa36a97SAlex Deucher case 0: 693aaa36a97SAlex Deucher amdgpu_fence_process(&adev->vce.ring[0]); 694aaa36a97SAlex Deucher break; 695aaa36a97SAlex Deucher case 1: 696aaa36a97SAlex Deucher amdgpu_fence_process(&adev->vce.ring[1]); 697aaa36a97SAlex Deucher break; 698aaa36a97SAlex Deucher default: 699aaa36a97SAlex Deucher DRM_ERROR("Unhandled interrupt: %d %d\n", 700aaa36a97SAlex Deucher entry->src_id, entry->src_data); 701aaa36a97SAlex Deucher break; 702aaa36a97SAlex Deucher } 703aaa36a97SAlex Deucher 704aaa36a97SAlex Deucher return 0; 705aaa36a97SAlex Deucher } 706aaa36a97SAlex Deucher 7075fc3aeebSyanyang1 static int vce_v3_0_set_clockgating_state(void *handle, 7085fc3aeebSyanyang1 enum amd_clockgating_state state) 709aaa36a97SAlex Deucher { 7100689a570SEric Huang struct amdgpu_device *adev = (struct amdgpu_device *)handle; 7110689a570SEric Huang bool enable = (state == AMD_CG_STATE_GATE) ? true : false; 7120689a570SEric Huang int i; 7130689a570SEric Huang 7140689a570SEric Huang if (!(adev->cg_flags & AMDGPU_CG_SUPPORT_VCE_MGCG)) 7150689a570SEric Huang return 0; 7160689a570SEric Huang 7170689a570SEric Huang mutex_lock(&adev->grbm_idx_mutex); 7180689a570SEric Huang for (i = 0; i < 2; i++) { 7190689a570SEric Huang /* Program VCE Instance 0 or 1 if not harvested */ 7200689a570SEric Huang if (adev->vce.harvest_config & (1 << i)) 7210689a570SEric Huang continue; 7220689a570SEric Huang 7230689a570SEric Huang if (i == 0) 7240689a570SEric Huang WREG32_P(mmGRBM_GFX_INDEX, 0, 7250689a570SEric Huang ~GRBM_GFX_INDEX__VCE_INSTANCE_MASK); 7260689a570SEric Huang else 7270689a570SEric Huang WREG32_P(mmGRBM_GFX_INDEX, 7280689a570SEric Huang GRBM_GFX_INDEX__VCE_INSTANCE_MASK, 7290689a570SEric Huang ~GRBM_GFX_INDEX__VCE_INSTANCE_MASK); 7300689a570SEric Huang 7310689a570SEric Huang if (enable) { 7320689a570SEric Huang /* initialize VCE_CLOCK_GATING_A: Clock ON/OFF delay */ 7330689a570SEric Huang uint32_t data = RREG32(mmVCE_CLOCK_GATING_A); 7340689a570SEric Huang data &= ~(0xf | 0xff0); 7350689a570SEric Huang data |= ((0x0 << 0) | (0x04 << 4)); 7360689a570SEric Huang WREG32(mmVCE_CLOCK_GATING_A, data); 7370689a570SEric Huang 7380689a570SEric Huang /* initialize VCE_UENC_CLOCK_GATING: Clock ON/OFF delay */ 7390689a570SEric Huang data = RREG32(mmVCE_UENC_CLOCK_GATING); 7400689a570SEric Huang data &= ~(0xf | 0xff0); 7410689a570SEric Huang data |= ((0x0 << 0) | (0x04 << 4)); 7420689a570SEric Huang WREG32(mmVCE_UENC_CLOCK_GATING, data); 7430689a570SEric Huang } 7440689a570SEric Huang 7450689a570SEric Huang vce_v3_0_set_vce_sw_clock_gating(adev, enable); 7460689a570SEric Huang } 7470689a570SEric Huang 7480689a570SEric Huang WREG32_P(mmGRBM_GFX_INDEX, 0, ~GRBM_GFX_INDEX__VCE_INSTANCE_MASK); 7490689a570SEric Huang mutex_unlock(&adev->grbm_idx_mutex); 7500689a570SEric Huang 751aaa36a97SAlex Deucher return 0; 752aaa36a97SAlex Deucher } 753aaa36a97SAlex Deucher 7545fc3aeebSyanyang1 static int vce_v3_0_set_powergating_state(void *handle, 7555fc3aeebSyanyang1 enum amd_powergating_state state) 756aaa36a97SAlex Deucher { 757aaa36a97SAlex Deucher /* This doesn't actually powergate the VCE block. 758aaa36a97SAlex Deucher * That's done in the dpm code via the SMC. This 759aaa36a97SAlex Deucher * just re-inits the block as necessary. The actual 760aaa36a97SAlex Deucher * gating still happens in the dpm code. We should 761aaa36a97SAlex Deucher * revisit this when there is a cleaner line between 762aaa36a97SAlex Deucher * the smc and the hw blocks 763aaa36a97SAlex Deucher */ 7645fc3aeebSyanyang1 struct amdgpu_device *adev = (struct amdgpu_device *)handle; 7655fc3aeebSyanyang1 7665fc3aeebSyanyang1 if (state == AMD_PG_STATE_GATE) 767aaa36a97SAlex Deucher /* XXX do we need a vce_v3_0_stop()? */ 768aaa36a97SAlex Deucher return 0; 769aaa36a97SAlex Deucher else 770aaa36a97SAlex Deucher return vce_v3_0_start(adev); 771aaa36a97SAlex Deucher } 772aaa36a97SAlex Deucher 7735fc3aeebSyanyang1 const struct amd_ip_funcs vce_v3_0_ip_funcs = { 774aaa36a97SAlex Deucher .early_init = vce_v3_0_early_init, 775aaa36a97SAlex Deucher .late_init = NULL, 776aaa36a97SAlex Deucher .sw_init = vce_v3_0_sw_init, 777aaa36a97SAlex Deucher .sw_fini = vce_v3_0_sw_fini, 778aaa36a97SAlex Deucher .hw_init = vce_v3_0_hw_init, 779aaa36a97SAlex Deucher .hw_fini = vce_v3_0_hw_fini, 780aaa36a97SAlex Deucher .suspend = vce_v3_0_suspend, 781aaa36a97SAlex Deucher .resume = vce_v3_0_resume, 782aaa36a97SAlex Deucher .is_idle = vce_v3_0_is_idle, 783aaa36a97SAlex Deucher .wait_for_idle = vce_v3_0_wait_for_idle, 784aaa36a97SAlex Deucher .soft_reset = vce_v3_0_soft_reset, 785aaa36a97SAlex Deucher .print_status = vce_v3_0_print_status, 786aaa36a97SAlex Deucher .set_clockgating_state = vce_v3_0_set_clockgating_state, 787aaa36a97SAlex Deucher .set_powergating_state = vce_v3_0_set_powergating_state, 788aaa36a97SAlex Deucher }; 789aaa36a97SAlex Deucher 790aaa36a97SAlex Deucher static const struct amdgpu_ring_funcs vce_v3_0_ring_funcs = { 791aaa36a97SAlex Deucher .get_rptr = vce_v3_0_ring_get_rptr, 792aaa36a97SAlex Deucher .get_wptr = vce_v3_0_ring_get_wptr, 793aaa36a97SAlex Deucher .set_wptr = vce_v3_0_ring_set_wptr, 794aaa36a97SAlex Deucher .parse_cs = amdgpu_vce_ring_parse_cs, 795aaa36a97SAlex Deucher .emit_ib = amdgpu_vce_ring_emit_ib, 796aaa36a97SAlex Deucher .emit_fence = amdgpu_vce_ring_emit_fence, 797aaa36a97SAlex Deucher .emit_semaphore = amdgpu_vce_ring_emit_semaphore, 798aaa36a97SAlex Deucher .test_ring = amdgpu_vce_ring_test_ring, 799aaa36a97SAlex Deucher .test_ib = amdgpu_vce_ring_test_ib, 800edff0e28SJammy Zhou .insert_nop = amdgpu_ring_insert_nop, 801aaa36a97SAlex Deucher }; 802aaa36a97SAlex Deucher 803aaa36a97SAlex Deucher static void vce_v3_0_set_ring_funcs(struct amdgpu_device *adev) 804aaa36a97SAlex Deucher { 805aaa36a97SAlex Deucher adev->vce.ring[0].funcs = &vce_v3_0_ring_funcs; 806aaa36a97SAlex Deucher adev->vce.ring[1].funcs = &vce_v3_0_ring_funcs; 807aaa36a97SAlex Deucher } 808aaa36a97SAlex Deucher 809aaa36a97SAlex Deucher static const struct amdgpu_irq_src_funcs vce_v3_0_irq_funcs = { 810aaa36a97SAlex Deucher .set = vce_v3_0_set_interrupt_state, 811aaa36a97SAlex Deucher .process = vce_v3_0_process_interrupt, 812aaa36a97SAlex Deucher }; 813aaa36a97SAlex Deucher 814aaa36a97SAlex Deucher static void vce_v3_0_set_irq_funcs(struct amdgpu_device *adev) 815aaa36a97SAlex Deucher { 816aaa36a97SAlex Deucher adev->vce.irq.num_types = 1; 817aaa36a97SAlex Deucher adev->vce.irq.funcs = &vce_v3_0_irq_funcs; 818aaa36a97SAlex Deucher }; 819