1771fe6b9SJerome Glisse /* 2771fe6b9SJerome Glisse * Copyright 2008 Advanced Micro Devices, Inc. 3771fe6b9SJerome Glisse * Copyright 2008 Red Hat Inc. 4771fe6b9SJerome Glisse * Copyright 2009 Jerome Glisse. 5771fe6b9SJerome Glisse * 6771fe6b9SJerome Glisse * Permission is hereby granted, free of charge, to any person obtaining a 7771fe6b9SJerome Glisse * copy of this software and associated documentation files (the "Software"), 8771fe6b9SJerome Glisse * to deal in the Software without restriction, including without limitation 9771fe6b9SJerome Glisse * the rights to use, copy, modify, merge, publish, distribute, sublicense, 10771fe6b9SJerome Glisse * and/or sell copies of the Software, and to permit persons to whom the 11771fe6b9SJerome Glisse * Software is furnished to do so, subject to the following conditions: 12771fe6b9SJerome Glisse * 13771fe6b9SJerome Glisse * The above copyright notice and this permission notice shall be included in 14771fe6b9SJerome Glisse * all copies or substantial portions of the Software. 15771fe6b9SJerome Glisse * 16771fe6b9SJerome Glisse * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17771fe6b9SJerome Glisse * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18771fe6b9SJerome Glisse * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19771fe6b9SJerome Glisse * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 20771fe6b9SJerome Glisse * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 21771fe6b9SJerome Glisse * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 22771fe6b9SJerome Glisse * OTHER DEALINGS IN THE SOFTWARE. 23771fe6b9SJerome Glisse * 24771fe6b9SJerome Glisse * Authors: Dave Airlie 25771fe6b9SJerome Glisse * Alex Deucher 26771fe6b9SJerome Glisse * Jerome Glisse 27771fe6b9SJerome Glisse */ 28771fe6b9SJerome Glisse #include <linux/seq_file.h> 29771fe6b9SJerome Glisse #include "drmP.h" 30771fe6b9SJerome Glisse #include "drm.h" 31771fe6b9SJerome Glisse #include "radeon_drm.h" 32771fe6b9SJerome Glisse #include "radeon_microcode.h" 33771fe6b9SJerome Glisse #include "radeon_reg.h" 34771fe6b9SJerome Glisse #include "radeon.h" 35771fe6b9SJerome Glisse 36771fe6b9SJerome Glisse /* This files gather functions specifics to: 37771fe6b9SJerome Glisse * r100,rv100,rs100,rv200,rs200,r200,rv250,rs300,rv280 38771fe6b9SJerome Glisse * 39771fe6b9SJerome Glisse * Some of these functions might be used by newer ASICs. 40771fe6b9SJerome Glisse */ 41771fe6b9SJerome Glisse void r100_hdp_reset(struct radeon_device *rdev); 42771fe6b9SJerome Glisse void r100_gpu_init(struct radeon_device *rdev); 43771fe6b9SJerome Glisse int r100_gui_wait_for_idle(struct radeon_device *rdev); 44771fe6b9SJerome Glisse int r100_mc_wait_for_idle(struct radeon_device *rdev); 45771fe6b9SJerome Glisse void r100_gpu_wait_for_vsync(struct radeon_device *rdev); 46771fe6b9SJerome Glisse void r100_gpu_wait_for_vsync2(struct radeon_device *rdev); 47771fe6b9SJerome Glisse int r100_debugfs_mc_info_init(struct radeon_device *rdev); 48771fe6b9SJerome Glisse 49771fe6b9SJerome Glisse 50771fe6b9SJerome Glisse /* 51771fe6b9SJerome Glisse * PCI GART 52771fe6b9SJerome Glisse */ 53771fe6b9SJerome Glisse void r100_pci_gart_tlb_flush(struct radeon_device *rdev) 54771fe6b9SJerome Glisse { 55771fe6b9SJerome Glisse /* TODO: can we do somethings here ? */ 56771fe6b9SJerome Glisse /* It seems hw only cache one entry so we should discard this 57771fe6b9SJerome Glisse * entry otherwise if first GPU GART read hit this entry it 58771fe6b9SJerome Glisse * could end up in wrong address. */ 59771fe6b9SJerome Glisse } 60771fe6b9SJerome Glisse 61771fe6b9SJerome Glisse int r100_pci_gart_enable(struct radeon_device *rdev) 62771fe6b9SJerome Glisse { 63771fe6b9SJerome Glisse uint32_t tmp; 64771fe6b9SJerome Glisse int r; 65771fe6b9SJerome Glisse 66771fe6b9SJerome Glisse /* Initialize common gart structure */ 67771fe6b9SJerome Glisse r = radeon_gart_init(rdev); 68771fe6b9SJerome Glisse if (r) { 69771fe6b9SJerome Glisse return r; 70771fe6b9SJerome Glisse } 71771fe6b9SJerome Glisse if (rdev->gart.table.ram.ptr == NULL) { 72771fe6b9SJerome Glisse rdev->gart.table_size = rdev->gart.num_gpu_pages * 4; 73771fe6b9SJerome Glisse r = radeon_gart_table_ram_alloc(rdev); 74771fe6b9SJerome Glisse if (r) { 75771fe6b9SJerome Glisse return r; 76771fe6b9SJerome Glisse } 77771fe6b9SJerome Glisse } 78771fe6b9SJerome Glisse /* discard memory request outside of configured range */ 79771fe6b9SJerome Glisse tmp = RREG32(RADEON_AIC_CNTL) | RADEON_DIS_OUT_OF_PCI_GART_ACCESS; 80771fe6b9SJerome Glisse WREG32(RADEON_AIC_CNTL, tmp); 81771fe6b9SJerome Glisse /* set address range for PCI address translate */ 82771fe6b9SJerome Glisse WREG32(RADEON_AIC_LO_ADDR, rdev->mc.gtt_location); 83771fe6b9SJerome Glisse tmp = rdev->mc.gtt_location + rdev->mc.gtt_size - 1; 84771fe6b9SJerome Glisse WREG32(RADEON_AIC_HI_ADDR, tmp); 85771fe6b9SJerome Glisse /* Enable bus mastering */ 86771fe6b9SJerome Glisse tmp = RREG32(RADEON_BUS_CNTL) & ~RADEON_BUS_MASTER_DIS; 87771fe6b9SJerome Glisse WREG32(RADEON_BUS_CNTL, tmp); 88771fe6b9SJerome Glisse /* set PCI GART page-table base address */ 89771fe6b9SJerome Glisse WREG32(RADEON_AIC_PT_BASE, rdev->gart.table_addr); 90771fe6b9SJerome Glisse tmp = RREG32(RADEON_AIC_CNTL) | RADEON_PCIGART_TRANSLATE_EN; 91771fe6b9SJerome Glisse WREG32(RADEON_AIC_CNTL, tmp); 92771fe6b9SJerome Glisse r100_pci_gart_tlb_flush(rdev); 93771fe6b9SJerome Glisse rdev->gart.ready = true; 94771fe6b9SJerome Glisse return 0; 95771fe6b9SJerome Glisse } 96771fe6b9SJerome Glisse 97771fe6b9SJerome Glisse void r100_pci_gart_disable(struct radeon_device *rdev) 98771fe6b9SJerome Glisse { 99771fe6b9SJerome Glisse uint32_t tmp; 100771fe6b9SJerome Glisse 101771fe6b9SJerome Glisse /* discard memory request outside of configured range */ 102771fe6b9SJerome Glisse tmp = RREG32(RADEON_AIC_CNTL) | RADEON_DIS_OUT_OF_PCI_GART_ACCESS; 103771fe6b9SJerome Glisse WREG32(RADEON_AIC_CNTL, tmp & ~RADEON_PCIGART_TRANSLATE_EN); 104771fe6b9SJerome Glisse WREG32(RADEON_AIC_LO_ADDR, 0); 105771fe6b9SJerome Glisse WREG32(RADEON_AIC_HI_ADDR, 0); 106771fe6b9SJerome Glisse } 107771fe6b9SJerome Glisse 108771fe6b9SJerome Glisse int r100_pci_gart_set_page(struct radeon_device *rdev, int i, uint64_t addr) 109771fe6b9SJerome Glisse { 110771fe6b9SJerome Glisse if (i < 0 || i > rdev->gart.num_gpu_pages) { 111771fe6b9SJerome Glisse return -EINVAL; 112771fe6b9SJerome Glisse } 113ed10f95dSDave Airlie rdev->gart.table.ram.ptr[i] = cpu_to_le32(lower_32_bits(addr)); 114771fe6b9SJerome Glisse return 0; 115771fe6b9SJerome Glisse } 116771fe6b9SJerome Glisse 117771fe6b9SJerome Glisse int r100_gart_enable(struct radeon_device *rdev) 118771fe6b9SJerome Glisse { 119771fe6b9SJerome Glisse if (rdev->flags & RADEON_IS_AGP) { 120771fe6b9SJerome Glisse r100_pci_gart_disable(rdev); 121771fe6b9SJerome Glisse return 0; 122771fe6b9SJerome Glisse } 123771fe6b9SJerome Glisse return r100_pci_gart_enable(rdev); 124771fe6b9SJerome Glisse } 125771fe6b9SJerome Glisse 126771fe6b9SJerome Glisse 127771fe6b9SJerome Glisse /* 128771fe6b9SJerome Glisse * MC 129771fe6b9SJerome Glisse */ 130771fe6b9SJerome Glisse void r100_mc_disable_clients(struct radeon_device *rdev) 131771fe6b9SJerome Glisse { 132771fe6b9SJerome Glisse uint32_t ov0_scale_cntl, crtc_ext_cntl, crtc_gen_cntl, crtc2_gen_cntl; 133771fe6b9SJerome Glisse 134771fe6b9SJerome Glisse /* FIXME: is this function correct for rs100,rs200,rs300 ? */ 135771fe6b9SJerome Glisse if (r100_gui_wait_for_idle(rdev)) { 136771fe6b9SJerome Glisse printk(KERN_WARNING "Failed to wait GUI idle while " 137771fe6b9SJerome Glisse "programming pipes. Bad things might happen.\n"); 138771fe6b9SJerome Glisse } 139771fe6b9SJerome Glisse 140771fe6b9SJerome Glisse /* stop display and memory access */ 141771fe6b9SJerome Glisse ov0_scale_cntl = RREG32(RADEON_OV0_SCALE_CNTL); 142771fe6b9SJerome Glisse WREG32(RADEON_OV0_SCALE_CNTL, ov0_scale_cntl & ~RADEON_SCALER_ENABLE); 143771fe6b9SJerome Glisse crtc_ext_cntl = RREG32(RADEON_CRTC_EXT_CNTL); 144771fe6b9SJerome Glisse WREG32(RADEON_CRTC_EXT_CNTL, crtc_ext_cntl | RADEON_CRTC_DISPLAY_DIS); 145771fe6b9SJerome Glisse crtc_gen_cntl = RREG32(RADEON_CRTC_GEN_CNTL); 146771fe6b9SJerome Glisse 147771fe6b9SJerome Glisse r100_gpu_wait_for_vsync(rdev); 148771fe6b9SJerome Glisse 149771fe6b9SJerome Glisse WREG32(RADEON_CRTC_GEN_CNTL, 150771fe6b9SJerome Glisse (crtc_gen_cntl & ~(RADEON_CRTC_CUR_EN | RADEON_CRTC_ICON_EN)) | 151771fe6b9SJerome Glisse RADEON_CRTC_DISP_REQ_EN_B | RADEON_CRTC_EXT_DISP_EN); 152771fe6b9SJerome Glisse 153771fe6b9SJerome Glisse if (!(rdev->flags & RADEON_SINGLE_CRTC)) { 154771fe6b9SJerome Glisse crtc2_gen_cntl = RREG32(RADEON_CRTC2_GEN_CNTL); 155771fe6b9SJerome Glisse 156771fe6b9SJerome Glisse r100_gpu_wait_for_vsync2(rdev); 157771fe6b9SJerome Glisse WREG32(RADEON_CRTC2_GEN_CNTL, 158771fe6b9SJerome Glisse (crtc2_gen_cntl & 159771fe6b9SJerome Glisse ~(RADEON_CRTC2_CUR_EN | RADEON_CRTC2_ICON_EN)) | 160771fe6b9SJerome Glisse RADEON_CRTC2_DISP_REQ_EN_B); 161771fe6b9SJerome Glisse } 162771fe6b9SJerome Glisse 163771fe6b9SJerome Glisse udelay(500); 164771fe6b9SJerome Glisse } 165771fe6b9SJerome Glisse 166771fe6b9SJerome Glisse void r100_mc_setup(struct radeon_device *rdev) 167771fe6b9SJerome Glisse { 168771fe6b9SJerome Glisse uint32_t tmp; 169771fe6b9SJerome Glisse int r; 170771fe6b9SJerome Glisse 171771fe6b9SJerome Glisse r = r100_debugfs_mc_info_init(rdev); 172771fe6b9SJerome Glisse if (r) { 173771fe6b9SJerome Glisse DRM_ERROR("Failed to register debugfs file for R100 MC !\n"); 174771fe6b9SJerome Glisse } 175771fe6b9SJerome Glisse /* Write VRAM size in case we are limiting it */ 176771fe6b9SJerome Glisse WREG32(RADEON_CONFIG_MEMSIZE, rdev->mc.vram_size); 177771fe6b9SJerome Glisse tmp = rdev->mc.vram_location + rdev->mc.vram_size - 1; 178771fe6b9SJerome Glisse tmp = REG_SET(RADEON_MC_FB_TOP, tmp >> 16); 179771fe6b9SJerome Glisse tmp |= REG_SET(RADEON_MC_FB_START, rdev->mc.vram_location >> 16); 180771fe6b9SJerome Glisse WREG32(RADEON_MC_FB_LOCATION, tmp); 181771fe6b9SJerome Glisse 182771fe6b9SJerome Glisse /* Enable bus mastering */ 183771fe6b9SJerome Glisse tmp = RREG32(RADEON_BUS_CNTL) & ~RADEON_BUS_MASTER_DIS; 184771fe6b9SJerome Glisse WREG32(RADEON_BUS_CNTL, tmp); 185771fe6b9SJerome Glisse 186771fe6b9SJerome Glisse if (rdev->flags & RADEON_IS_AGP) { 187771fe6b9SJerome Glisse tmp = rdev->mc.gtt_location + rdev->mc.gtt_size - 1; 188771fe6b9SJerome Glisse tmp = REG_SET(RADEON_MC_AGP_TOP, tmp >> 16); 189771fe6b9SJerome Glisse tmp |= REG_SET(RADEON_MC_AGP_START, rdev->mc.gtt_location >> 16); 190771fe6b9SJerome Glisse WREG32(RADEON_MC_AGP_LOCATION, tmp); 191771fe6b9SJerome Glisse WREG32(RADEON_AGP_BASE, rdev->mc.agp_base); 192771fe6b9SJerome Glisse } else { 193771fe6b9SJerome Glisse WREG32(RADEON_MC_AGP_LOCATION, 0x0FFFFFFF); 194771fe6b9SJerome Glisse WREG32(RADEON_AGP_BASE, 0); 195771fe6b9SJerome Glisse } 196771fe6b9SJerome Glisse 197771fe6b9SJerome Glisse tmp = RREG32(RADEON_HOST_PATH_CNTL) & RADEON_HDP_APER_CNTL; 198771fe6b9SJerome Glisse tmp |= (7 << 28); 199771fe6b9SJerome Glisse WREG32(RADEON_HOST_PATH_CNTL, tmp | RADEON_HDP_SOFT_RESET | RADEON_HDP_READ_BUFFER_INVALIDATE); 200771fe6b9SJerome Glisse (void)RREG32(RADEON_HOST_PATH_CNTL); 201771fe6b9SJerome Glisse WREG32(RADEON_HOST_PATH_CNTL, tmp); 202771fe6b9SJerome Glisse (void)RREG32(RADEON_HOST_PATH_CNTL); 203771fe6b9SJerome Glisse } 204771fe6b9SJerome Glisse 205771fe6b9SJerome Glisse int r100_mc_init(struct radeon_device *rdev) 206771fe6b9SJerome Glisse { 207771fe6b9SJerome Glisse int r; 208771fe6b9SJerome Glisse 209771fe6b9SJerome Glisse if (r100_debugfs_rbbm_init(rdev)) { 210771fe6b9SJerome Glisse DRM_ERROR("Failed to register debugfs file for RBBM !\n"); 211771fe6b9SJerome Glisse } 212771fe6b9SJerome Glisse 213771fe6b9SJerome Glisse r100_gpu_init(rdev); 214771fe6b9SJerome Glisse /* Disable gart which also disable out of gart access */ 215771fe6b9SJerome Glisse r100_pci_gart_disable(rdev); 216771fe6b9SJerome Glisse 217771fe6b9SJerome Glisse /* Setup GPU memory space */ 218771fe6b9SJerome Glisse rdev->mc.gtt_location = 0xFFFFFFFFUL; 219771fe6b9SJerome Glisse if (rdev->flags & RADEON_IS_AGP) { 220771fe6b9SJerome Glisse r = radeon_agp_init(rdev); 221771fe6b9SJerome Glisse if (r) { 222771fe6b9SJerome Glisse printk(KERN_WARNING "[drm] Disabling AGP\n"); 223771fe6b9SJerome Glisse rdev->flags &= ~RADEON_IS_AGP; 224771fe6b9SJerome Glisse rdev->mc.gtt_size = radeon_gart_size * 1024 * 1024; 225771fe6b9SJerome Glisse } else { 226771fe6b9SJerome Glisse rdev->mc.gtt_location = rdev->mc.agp_base; 227771fe6b9SJerome Glisse } 228771fe6b9SJerome Glisse } 229771fe6b9SJerome Glisse r = radeon_mc_setup(rdev); 230771fe6b9SJerome Glisse if (r) { 231771fe6b9SJerome Glisse return r; 232771fe6b9SJerome Glisse } 233771fe6b9SJerome Glisse 234771fe6b9SJerome Glisse r100_mc_disable_clients(rdev); 235771fe6b9SJerome Glisse if (r100_mc_wait_for_idle(rdev)) { 236771fe6b9SJerome Glisse printk(KERN_WARNING "Failed to wait MC idle while " 237771fe6b9SJerome Glisse "programming pipes. Bad things might happen.\n"); 238771fe6b9SJerome Glisse } 239771fe6b9SJerome Glisse 240771fe6b9SJerome Glisse r100_mc_setup(rdev); 241771fe6b9SJerome Glisse return 0; 242771fe6b9SJerome Glisse } 243771fe6b9SJerome Glisse 244771fe6b9SJerome Glisse void r100_mc_fini(struct radeon_device *rdev) 245771fe6b9SJerome Glisse { 246771fe6b9SJerome Glisse r100_pci_gart_disable(rdev); 247771fe6b9SJerome Glisse radeon_gart_table_ram_free(rdev); 248771fe6b9SJerome Glisse radeon_gart_fini(rdev); 249771fe6b9SJerome Glisse } 250771fe6b9SJerome Glisse 251771fe6b9SJerome Glisse 252771fe6b9SJerome Glisse /* 253771fe6b9SJerome Glisse * Fence emission 254771fe6b9SJerome Glisse */ 255771fe6b9SJerome Glisse void r100_fence_ring_emit(struct radeon_device *rdev, 256771fe6b9SJerome Glisse struct radeon_fence *fence) 257771fe6b9SJerome Glisse { 258771fe6b9SJerome Glisse /* Who ever call radeon_fence_emit should call ring_lock and ask 259771fe6b9SJerome Glisse * for enough space (today caller are ib schedule and buffer move) */ 260771fe6b9SJerome Glisse /* Wait until IDLE & CLEAN */ 261771fe6b9SJerome Glisse radeon_ring_write(rdev, PACKET0(0x1720, 0)); 262771fe6b9SJerome Glisse radeon_ring_write(rdev, (1 << 16) | (1 << 17)); 263771fe6b9SJerome Glisse /* Emit fence sequence & fire IRQ */ 264771fe6b9SJerome Glisse radeon_ring_write(rdev, PACKET0(rdev->fence_drv.scratch_reg, 0)); 265771fe6b9SJerome Glisse radeon_ring_write(rdev, fence->seq); 266771fe6b9SJerome Glisse radeon_ring_write(rdev, PACKET0(RADEON_GEN_INT_STATUS, 0)); 267771fe6b9SJerome Glisse radeon_ring_write(rdev, RADEON_SW_INT_FIRE); 268771fe6b9SJerome Glisse } 269771fe6b9SJerome Glisse 270771fe6b9SJerome Glisse 271771fe6b9SJerome Glisse /* 272771fe6b9SJerome Glisse * Writeback 273771fe6b9SJerome Glisse */ 274771fe6b9SJerome Glisse int r100_wb_init(struct radeon_device *rdev) 275771fe6b9SJerome Glisse { 276771fe6b9SJerome Glisse int r; 277771fe6b9SJerome Glisse 278771fe6b9SJerome Glisse if (rdev->wb.wb_obj == NULL) { 279771fe6b9SJerome Glisse r = radeon_object_create(rdev, NULL, 4096, 280771fe6b9SJerome Glisse true, 281771fe6b9SJerome Glisse RADEON_GEM_DOMAIN_GTT, 282771fe6b9SJerome Glisse false, &rdev->wb.wb_obj); 283771fe6b9SJerome Glisse if (r) { 284771fe6b9SJerome Glisse DRM_ERROR("radeon: failed to create WB buffer (%d).\n", r); 285771fe6b9SJerome Glisse return r; 286771fe6b9SJerome Glisse } 287771fe6b9SJerome Glisse r = radeon_object_pin(rdev->wb.wb_obj, 288771fe6b9SJerome Glisse RADEON_GEM_DOMAIN_GTT, 289771fe6b9SJerome Glisse &rdev->wb.gpu_addr); 290771fe6b9SJerome Glisse if (r) { 291771fe6b9SJerome Glisse DRM_ERROR("radeon: failed to pin WB buffer (%d).\n", r); 292771fe6b9SJerome Glisse return r; 293771fe6b9SJerome Glisse } 294771fe6b9SJerome Glisse r = radeon_object_kmap(rdev->wb.wb_obj, (void **)&rdev->wb.wb); 295771fe6b9SJerome Glisse if (r) { 296771fe6b9SJerome Glisse DRM_ERROR("radeon: failed to map WB buffer (%d).\n", r); 297771fe6b9SJerome Glisse return r; 298771fe6b9SJerome Glisse } 299771fe6b9SJerome Glisse } 300771fe6b9SJerome Glisse WREG32(0x774, rdev->wb.gpu_addr); 301771fe6b9SJerome Glisse WREG32(0x70C, rdev->wb.gpu_addr + 1024); 302771fe6b9SJerome Glisse WREG32(0x770, 0xff); 303771fe6b9SJerome Glisse return 0; 304771fe6b9SJerome Glisse } 305771fe6b9SJerome Glisse 306771fe6b9SJerome Glisse void r100_wb_fini(struct radeon_device *rdev) 307771fe6b9SJerome Glisse { 308771fe6b9SJerome Glisse if (rdev->wb.wb_obj) { 309771fe6b9SJerome Glisse radeon_object_kunmap(rdev->wb.wb_obj); 310771fe6b9SJerome Glisse radeon_object_unpin(rdev->wb.wb_obj); 311771fe6b9SJerome Glisse radeon_object_unref(&rdev->wb.wb_obj); 312771fe6b9SJerome Glisse rdev->wb.wb = NULL; 313771fe6b9SJerome Glisse rdev->wb.wb_obj = NULL; 314771fe6b9SJerome Glisse } 315771fe6b9SJerome Glisse } 316771fe6b9SJerome Glisse 317771fe6b9SJerome Glisse int r100_copy_blit(struct radeon_device *rdev, 318771fe6b9SJerome Glisse uint64_t src_offset, 319771fe6b9SJerome Glisse uint64_t dst_offset, 320771fe6b9SJerome Glisse unsigned num_pages, 321771fe6b9SJerome Glisse struct radeon_fence *fence) 322771fe6b9SJerome Glisse { 323771fe6b9SJerome Glisse uint32_t cur_pages; 324771fe6b9SJerome Glisse uint32_t stride_bytes = PAGE_SIZE; 325771fe6b9SJerome Glisse uint32_t pitch; 326771fe6b9SJerome Glisse uint32_t stride_pixels; 327771fe6b9SJerome Glisse unsigned ndw; 328771fe6b9SJerome Glisse int num_loops; 329771fe6b9SJerome Glisse int r = 0; 330771fe6b9SJerome Glisse 331771fe6b9SJerome Glisse /* radeon limited to 16k stride */ 332771fe6b9SJerome Glisse stride_bytes &= 0x3fff; 333771fe6b9SJerome Glisse /* radeon pitch is /64 */ 334771fe6b9SJerome Glisse pitch = stride_bytes / 64; 335771fe6b9SJerome Glisse stride_pixels = stride_bytes / 4; 336771fe6b9SJerome Glisse num_loops = DIV_ROUND_UP(num_pages, 8191); 337771fe6b9SJerome Glisse 338771fe6b9SJerome Glisse /* Ask for enough room for blit + flush + fence */ 339771fe6b9SJerome Glisse ndw = 64 + (10 * num_loops); 340771fe6b9SJerome Glisse r = radeon_ring_lock(rdev, ndw); 341771fe6b9SJerome Glisse if (r) { 342771fe6b9SJerome Glisse DRM_ERROR("radeon: moving bo (%d) asking for %u dw.\n", r, ndw); 343771fe6b9SJerome Glisse return -EINVAL; 344771fe6b9SJerome Glisse } 345771fe6b9SJerome Glisse while (num_pages > 0) { 346771fe6b9SJerome Glisse cur_pages = num_pages; 347771fe6b9SJerome Glisse if (cur_pages > 8191) { 348771fe6b9SJerome Glisse cur_pages = 8191; 349771fe6b9SJerome Glisse } 350771fe6b9SJerome Glisse num_pages -= cur_pages; 351771fe6b9SJerome Glisse 352771fe6b9SJerome Glisse /* pages are in Y direction - height 353771fe6b9SJerome Glisse page width in X direction - width */ 354771fe6b9SJerome Glisse radeon_ring_write(rdev, PACKET3(PACKET3_BITBLT_MULTI, 8)); 355771fe6b9SJerome Glisse radeon_ring_write(rdev, 356771fe6b9SJerome Glisse RADEON_GMC_SRC_PITCH_OFFSET_CNTL | 357771fe6b9SJerome Glisse RADEON_GMC_DST_PITCH_OFFSET_CNTL | 358771fe6b9SJerome Glisse RADEON_GMC_SRC_CLIPPING | 359771fe6b9SJerome Glisse RADEON_GMC_DST_CLIPPING | 360771fe6b9SJerome Glisse RADEON_GMC_BRUSH_NONE | 361771fe6b9SJerome Glisse (RADEON_COLOR_FORMAT_ARGB8888 << 8) | 362771fe6b9SJerome Glisse RADEON_GMC_SRC_DATATYPE_COLOR | 363771fe6b9SJerome Glisse RADEON_ROP3_S | 364771fe6b9SJerome Glisse RADEON_DP_SRC_SOURCE_MEMORY | 365771fe6b9SJerome Glisse RADEON_GMC_CLR_CMP_CNTL_DIS | 366771fe6b9SJerome Glisse RADEON_GMC_WR_MSK_DIS); 367771fe6b9SJerome Glisse radeon_ring_write(rdev, (pitch << 22) | (src_offset >> 10)); 368771fe6b9SJerome Glisse radeon_ring_write(rdev, (pitch << 22) | (dst_offset >> 10)); 369771fe6b9SJerome Glisse radeon_ring_write(rdev, (0x1fff) | (0x1fff << 16)); 370771fe6b9SJerome Glisse radeon_ring_write(rdev, 0); 371771fe6b9SJerome Glisse radeon_ring_write(rdev, (0x1fff) | (0x1fff << 16)); 372771fe6b9SJerome Glisse radeon_ring_write(rdev, num_pages); 373771fe6b9SJerome Glisse radeon_ring_write(rdev, num_pages); 374771fe6b9SJerome Glisse radeon_ring_write(rdev, cur_pages | (stride_pixels << 16)); 375771fe6b9SJerome Glisse } 376771fe6b9SJerome Glisse radeon_ring_write(rdev, PACKET0(RADEON_DSTCACHE_CTLSTAT, 0)); 377771fe6b9SJerome Glisse radeon_ring_write(rdev, RADEON_RB2D_DC_FLUSH_ALL); 378771fe6b9SJerome Glisse radeon_ring_write(rdev, PACKET0(RADEON_WAIT_UNTIL, 0)); 379771fe6b9SJerome Glisse radeon_ring_write(rdev, 380771fe6b9SJerome Glisse RADEON_WAIT_2D_IDLECLEAN | 381771fe6b9SJerome Glisse RADEON_WAIT_HOST_IDLECLEAN | 382771fe6b9SJerome Glisse RADEON_WAIT_DMA_GUI_IDLE); 383771fe6b9SJerome Glisse if (fence) { 384771fe6b9SJerome Glisse r = radeon_fence_emit(rdev, fence); 385771fe6b9SJerome Glisse } 386771fe6b9SJerome Glisse radeon_ring_unlock_commit(rdev); 387771fe6b9SJerome Glisse return r; 388771fe6b9SJerome Glisse } 389771fe6b9SJerome Glisse 390771fe6b9SJerome Glisse 391771fe6b9SJerome Glisse /* 392771fe6b9SJerome Glisse * CP 393771fe6b9SJerome Glisse */ 394771fe6b9SJerome Glisse void r100_ring_start(struct radeon_device *rdev) 395771fe6b9SJerome Glisse { 396771fe6b9SJerome Glisse int r; 397771fe6b9SJerome Glisse 398771fe6b9SJerome Glisse r = radeon_ring_lock(rdev, 2); 399771fe6b9SJerome Glisse if (r) { 400771fe6b9SJerome Glisse return; 401771fe6b9SJerome Glisse } 402771fe6b9SJerome Glisse radeon_ring_write(rdev, PACKET0(RADEON_ISYNC_CNTL, 0)); 403771fe6b9SJerome Glisse radeon_ring_write(rdev, 404771fe6b9SJerome Glisse RADEON_ISYNC_ANY2D_IDLE3D | 405771fe6b9SJerome Glisse RADEON_ISYNC_ANY3D_IDLE2D | 406771fe6b9SJerome Glisse RADEON_ISYNC_WAIT_IDLEGUI | 407771fe6b9SJerome Glisse RADEON_ISYNC_CPSCRATCH_IDLEGUI); 408771fe6b9SJerome Glisse radeon_ring_unlock_commit(rdev); 409771fe6b9SJerome Glisse } 410771fe6b9SJerome Glisse 411771fe6b9SJerome Glisse static void r100_cp_load_microcode(struct radeon_device *rdev) 412771fe6b9SJerome Glisse { 413771fe6b9SJerome Glisse int i; 414771fe6b9SJerome Glisse 415771fe6b9SJerome Glisse if (r100_gui_wait_for_idle(rdev)) { 416771fe6b9SJerome Glisse printk(KERN_WARNING "Failed to wait GUI idle while " 417771fe6b9SJerome Glisse "programming pipes. Bad things might happen.\n"); 418771fe6b9SJerome Glisse } 419771fe6b9SJerome Glisse 420771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_ADDR, 0); 421771fe6b9SJerome Glisse if ((rdev->family == CHIP_R100) || (rdev->family == CHIP_RV100) || 422771fe6b9SJerome Glisse (rdev->family == CHIP_RV200) || (rdev->family == CHIP_RS100) || 423771fe6b9SJerome Glisse (rdev->family == CHIP_RS200)) { 424771fe6b9SJerome Glisse DRM_INFO("Loading R100 Microcode\n"); 425771fe6b9SJerome Glisse for (i = 0; i < 256; i++) { 426771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAH, R100_cp_microcode[i][1]); 427771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAL, R100_cp_microcode[i][0]); 428771fe6b9SJerome Glisse } 429771fe6b9SJerome Glisse } else if ((rdev->family == CHIP_R200) || 430771fe6b9SJerome Glisse (rdev->family == CHIP_RV250) || 431771fe6b9SJerome Glisse (rdev->family == CHIP_RV280) || 432771fe6b9SJerome Glisse (rdev->family == CHIP_RS300)) { 433771fe6b9SJerome Glisse DRM_INFO("Loading R200 Microcode\n"); 434771fe6b9SJerome Glisse for (i = 0; i < 256; i++) { 435771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAH, R200_cp_microcode[i][1]); 436771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAL, R200_cp_microcode[i][0]); 437771fe6b9SJerome Glisse } 438771fe6b9SJerome Glisse } else if ((rdev->family == CHIP_R300) || 439771fe6b9SJerome Glisse (rdev->family == CHIP_R350) || 440771fe6b9SJerome Glisse (rdev->family == CHIP_RV350) || 441771fe6b9SJerome Glisse (rdev->family == CHIP_RV380) || 442771fe6b9SJerome Glisse (rdev->family == CHIP_RS400) || 443771fe6b9SJerome Glisse (rdev->family == CHIP_RS480)) { 444771fe6b9SJerome Glisse DRM_INFO("Loading R300 Microcode\n"); 445771fe6b9SJerome Glisse for (i = 0; i < 256; i++) { 446771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAH, R300_cp_microcode[i][1]); 447771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAL, R300_cp_microcode[i][0]); 448771fe6b9SJerome Glisse } 449771fe6b9SJerome Glisse } else if ((rdev->family == CHIP_R420) || 450771fe6b9SJerome Glisse (rdev->family == CHIP_R423) || 451771fe6b9SJerome Glisse (rdev->family == CHIP_RV410)) { 452771fe6b9SJerome Glisse DRM_INFO("Loading R400 Microcode\n"); 453771fe6b9SJerome Glisse for (i = 0; i < 256; i++) { 454771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAH, R420_cp_microcode[i][1]); 455771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAL, R420_cp_microcode[i][0]); 456771fe6b9SJerome Glisse } 457771fe6b9SJerome Glisse } else if ((rdev->family == CHIP_RS690) || 458771fe6b9SJerome Glisse (rdev->family == CHIP_RS740)) { 459771fe6b9SJerome Glisse DRM_INFO("Loading RS690/RS740 Microcode\n"); 460771fe6b9SJerome Glisse for (i = 0; i < 256; i++) { 461771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAH, RS690_cp_microcode[i][1]); 462771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAL, RS690_cp_microcode[i][0]); 463771fe6b9SJerome Glisse } 464771fe6b9SJerome Glisse } else if (rdev->family == CHIP_RS600) { 465771fe6b9SJerome Glisse DRM_INFO("Loading RS600 Microcode\n"); 466771fe6b9SJerome Glisse for (i = 0; i < 256; i++) { 467771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAH, RS600_cp_microcode[i][1]); 468771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAL, RS600_cp_microcode[i][0]); 469771fe6b9SJerome Glisse } 470771fe6b9SJerome Glisse } else if ((rdev->family == CHIP_RV515) || 471771fe6b9SJerome Glisse (rdev->family == CHIP_R520) || 472771fe6b9SJerome Glisse (rdev->family == CHIP_RV530) || 473771fe6b9SJerome Glisse (rdev->family == CHIP_R580) || 474771fe6b9SJerome Glisse (rdev->family == CHIP_RV560) || 475771fe6b9SJerome Glisse (rdev->family == CHIP_RV570)) { 476771fe6b9SJerome Glisse DRM_INFO("Loading R500 Microcode\n"); 477771fe6b9SJerome Glisse for (i = 0; i < 256; i++) { 478771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAH, R520_cp_microcode[i][1]); 479771fe6b9SJerome Glisse WREG32(RADEON_CP_ME_RAM_DATAL, R520_cp_microcode[i][0]); 480771fe6b9SJerome Glisse } 481771fe6b9SJerome Glisse } 482771fe6b9SJerome Glisse } 483771fe6b9SJerome Glisse 484771fe6b9SJerome Glisse int r100_cp_init(struct radeon_device *rdev, unsigned ring_size) 485771fe6b9SJerome Glisse { 486771fe6b9SJerome Glisse unsigned rb_bufsz; 487771fe6b9SJerome Glisse unsigned rb_blksz; 488771fe6b9SJerome Glisse unsigned max_fetch; 489771fe6b9SJerome Glisse unsigned pre_write_timer; 490771fe6b9SJerome Glisse unsigned pre_write_limit; 491771fe6b9SJerome Glisse unsigned indirect2_start; 492771fe6b9SJerome Glisse unsigned indirect1_start; 493771fe6b9SJerome Glisse uint32_t tmp; 494771fe6b9SJerome Glisse int r; 495771fe6b9SJerome Glisse 496771fe6b9SJerome Glisse if (r100_debugfs_cp_init(rdev)) { 497771fe6b9SJerome Glisse DRM_ERROR("Failed to register debugfs file for CP !\n"); 498771fe6b9SJerome Glisse } 499771fe6b9SJerome Glisse /* Reset CP */ 500771fe6b9SJerome Glisse tmp = RREG32(RADEON_CP_CSQ_STAT); 501771fe6b9SJerome Glisse if ((tmp & (1 << 31))) { 502771fe6b9SJerome Glisse DRM_INFO("radeon: cp busy (0x%08X) resetting\n", tmp); 503771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_MODE, 0); 504771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_CNTL, 0); 505771fe6b9SJerome Glisse WREG32(RADEON_RBBM_SOFT_RESET, RADEON_SOFT_RESET_CP); 506771fe6b9SJerome Glisse tmp = RREG32(RADEON_RBBM_SOFT_RESET); 507771fe6b9SJerome Glisse mdelay(2); 508771fe6b9SJerome Glisse WREG32(RADEON_RBBM_SOFT_RESET, 0); 509771fe6b9SJerome Glisse tmp = RREG32(RADEON_RBBM_SOFT_RESET); 510771fe6b9SJerome Glisse mdelay(2); 511771fe6b9SJerome Glisse tmp = RREG32(RADEON_CP_CSQ_STAT); 512771fe6b9SJerome Glisse if ((tmp & (1 << 31))) { 513771fe6b9SJerome Glisse DRM_INFO("radeon: cp reset failed (0x%08X)\n", tmp); 514771fe6b9SJerome Glisse } 515771fe6b9SJerome Glisse } else { 516771fe6b9SJerome Glisse DRM_INFO("radeon: cp idle (0x%08X)\n", tmp); 517771fe6b9SJerome Glisse } 518771fe6b9SJerome Glisse /* Align ring size */ 519771fe6b9SJerome Glisse rb_bufsz = drm_order(ring_size / 8); 520771fe6b9SJerome Glisse ring_size = (1 << (rb_bufsz + 1)) * 4; 521771fe6b9SJerome Glisse r100_cp_load_microcode(rdev); 522771fe6b9SJerome Glisse r = radeon_ring_init(rdev, ring_size); 523771fe6b9SJerome Glisse if (r) { 524771fe6b9SJerome Glisse return r; 525771fe6b9SJerome Glisse } 526771fe6b9SJerome Glisse /* Each time the cp read 1024 bytes (16 dword/quadword) update 527771fe6b9SJerome Glisse * the rptr copy in system ram */ 528771fe6b9SJerome Glisse rb_blksz = 9; 529771fe6b9SJerome Glisse /* cp will read 128bytes at a time (4 dwords) */ 530771fe6b9SJerome Glisse max_fetch = 1; 531771fe6b9SJerome Glisse rdev->cp.align_mask = 16 - 1; 532771fe6b9SJerome Glisse /* Write to CP_RB_WPTR will be delayed for pre_write_timer clocks */ 533771fe6b9SJerome Glisse pre_write_timer = 64; 534771fe6b9SJerome Glisse /* Force CP_RB_WPTR write if written more than one time before the 535771fe6b9SJerome Glisse * delay expire 536771fe6b9SJerome Glisse */ 537771fe6b9SJerome Glisse pre_write_limit = 0; 538771fe6b9SJerome Glisse /* Setup the cp cache like this (cache size is 96 dwords) : 539771fe6b9SJerome Glisse * RING 0 to 15 540771fe6b9SJerome Glisse * INDIRECT1 16 to 79 541771fe6b9SJerome Glisse * INDIRECT2 80 to 95 542771fe6b9SJerome Glisse * So ring cache size is 16dwords (> (2 * max_fetch = 2 * 4dwords)) 543771fe6b9SJerome Glisse * indirect1 cache size is 64dwords (> (2 * max_fetch = 2 * 4dwords)) 544771fe6b9SJerome Glisse * indirect2 cache size is 16dwords (> (2 * max_fetch = 2 * 4dwords)) 545771fe6b9SJerome Glisse * Idea being that most of the gpu cmd will be through indirect1 buffer 546771fe6b9SJerome Glisse * so it gets the bigger cache. 547771fe6b9SJerome Glisse */ 548771fe6b9SJerome Glisse indirect2_start = 80; 549771fe6b9SJerome Glisse indirect1_start = 16; 550771fe6b9SJerome Glisse /* cp setup */ 551771fe6b9SJerome Glisse WREG32(0x718, pre_write_timer | (pre_write_limit << 28)); 552771fe6b9SJerome Glisse WREG32(RADEON_CP_RB_CNTL, 5534e484e7dSMichel Dänzer #ifdef __BIG_ENDIAN 5544e484e7dSMichel Dänzer RADEON_BUF_SWAP_32BIT | 5554e484e7dSMichel Dänzer #endif 556771fe6b9SJerome Glisse REG_SET(RADEON_RB_BUFSZ, rb_bufsz) | 557771fe6b9SJerome Glisse REG_SET(RADEON_RB_BLKSZ, rb_blksz) | 558771fe6b9SJerome Glisse REG_SET(RADEON_MAX_FETCH, max_fetch) | 559771fe6b9SJerome Glisse RADEON_RB_NO_UPDATE); 560771fe6b9SJerome Glisse /* Set ring address */ 561771fe6b9SJerome Glisse DRM_INFO("radeon: ring at 0x%016lX\n", (unsigned long)rdev->cp.gpu_addr); 562771fe6b9SJerome Glisse WREG32(RADEON_CP_RB_BASE, rdev->cp.gpu_addr); 563771fe6b9SJerome Glisse /* Force read & write ptr to 0 */ 564771fe6b9SJerome Glisse tmp = RREG32(RADEON_CP_RB_CNTL); 565771fe6b9SJerome Glisse WREG32(RADEON_CP_RB_CNTL, tmp | RADEON_RB_RPTR_WR_ENA); 566771fe6b9SJerome Glisse WREG32(RADEON_CP_RB_RPTR_WR, 0); 567771fe6b9SJerome Glisse WREG32(RADEON_CP_RB_WPTR, 0); 568771fe6b9SJerome Glisse WREG32(RADEON_CP_RB_CNTL, tmp); 569771fe6b9SJerome Glisse udelay(10); 570771fe6b9SJerome Glisse rdev->cp.rptr = RREG32(RADEON_CP_RB_RPTR); 571771fe6b9SJerome Glisse rdev->cp.wptr = RREG32(RADEON_CP_RB_WPTR); 572771fe6b9SJerome Glisse /* Set cp mode to bus mastering & enable cp*/ 573771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_MODE, 574771fe6b9SJerome Glisse REG_SET(RADEON_INDIRECT2_START, indirect2_start) | 575771fe6b9SJerome Glisse REG_SET(RADEON_INDIRECT1_START, indirect1_start)); 576771fe6b9SJerome Glisse WREG32(0x718, 0); 577771fe6b9SJerome Glisse WREG32(0x744, 0x00004D4D); 578771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_CNTL, RADEON_CSQ_PRIBM_INDBM); 579771fe6b9SJerome Glisse radeon_ring_start(rdev); 580771fe6b9SJerome Glisse r = radeon_ring_test(rdev); 581771fe6b9SJerome Glisse if (r) { 582771fe6b9SJerome Glisse DRM_ERROR("radeon: cp isn't working (%d).\n", r); 583771fe6b9SJerome Glisse return r; 584771fe6b9SJerome Glisse } 585771fe6b9SJerome Glisse rdev->cp.ready = true; 586771fe6b9SJerome Glisse return 0; 587771fe6b9SJerome Glisse } 588771fe6b9SJerome Glisse 589771fe6b9SJerome Glisse void r100_cp_fini(struct radeon_device *rdev) 590771fe6b9SJerome Glisse { 591771fe6b9SJerome Glisse /* Disable ring */ 592771fe6b9SJerome Glisse rdev->cp.ready = false; 593771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_CNTL, 0); 594771fe6b9SJerome Glisse radeon_ring_fini(rdev); 595771fe6b9SJerome Glisse DRM_INFO("radeon: cp finalized\n"); 596771fe6b9SJerome Glisse } 597771fe6b9SJerome Glisse 598771fe6b9SJerome Glisse void r100_cp_disable(struct radeon_device *rdev) 599771fe6b9SJerome Glisse { 600771fe6b9SJerome Glisse /* Disable ring */ 601771fe6b9SJerome Glisse rdev->cp.ready = false; 602771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_MODE, 0); 603771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_CNTL, 0); 604771fe6b9SJerome Glisse if (r100_gui_wait_for_idle(rdev)) { 605771fe6b9SJerome Glisse printk(KERN_WARNING "Failed to wait GUI idle while " 606771fe6b9SJerome Glisse "programming pipes. Bad things might happen.\n"); 607771fe6b9SJerome Glisse } 608771fe6b9SJerome Glisse } 609771fe6b9SJerome Glisse 610771fe6b9SJerome Glisse int r100_cp_reset(struct radeon_device *rdev) 611771fe6b9SJerome Glisse { 612771fe6b9SJerome Glisse uint32_t tmp; 613771fe6b9SJerome Glisse bool reinit_cp; 614771fe6b9SJerome Glisse int i; 615771fe6b9SJerome Glisse 616771fe6b9SJerome Glisse reinit_cp = rdev->cp.ready; 617771fe6b9SJerome Glisse rdev->cp.ready = false; 618771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_MODE, 0); 619771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_CNTL, 0); 620771fe6b9SJerome Glisse WREG32(RADEON_RBBM_SOFT_RESET, RADEON_SOFT_RESET_CP); 621771fe6b9SJerome Glisse (void)RREG32(RADEON_RBBM_SOFT_RESET); 622771fe6b9SJerome Glisse udelay(200); 623771fe6b9SJerome Glisse WREG32(RADEON_RBBM_SOFT_RESET, 0); 624771fe6b9SJerome Glisse /* Wait to prevent race in RBBM_STATUS */ 625771fe6b9SJerome Glisse mdelay(1); 626771fe6b9SJerome Glisse for (i = 0; i < rdev->usec_timeout; i++) { 627771fe6b9SJerome Glisse tmp = RREG32(RADEON_RBBM_STATUS); 628771fe6b9SJerome Glisse if (!(tmp & (1 << 16))) { 629771fe6b9SJerome Glisse DRM_INFO("CP reset succeed (RBBM_STATUS=0x%08X)\n", 630771fe6b9SJerome Glisse tmp); 631771fe6b9SJerome Glisse if (reinit_cp) { 632771fe6b9SJerome Glisse return r100_cp_init(rdev, rdev->cp.ring_size); 633771fe6b9SJerome Glisse } 634771fe6b9SJerome Glisse return 0; 635771fe6b9SJerome Glisse } 636771fe6b9SJerome Glisse DRM_UDELAY(1); 637771fe6b9SJerome Glisse } 638771fe6b9SJerome Glisse tmp = RREG32(RADEON_RBBM_STATUS); 639771fe6b9SJerome Glisse DRM_ERROR("Failed to reset CP (RBBM_STATUS=0x%08X)!\n", tmp); 640771fe6b9SJerome Glisse return -1; 641771fe6b9SJerome Glisse } 642771fe6b9SJerome Glisse 643771fe6b9SJerome Glisse 644771fe6b9SJerome Glisse /* 645771fe6b9SJerome Glisse * CS functions 646771fe6b9SJerome Glisse */ 647771fe6b9SJerome Glisse int r100_cs_parse_packet0(struct radeon_cs_parser *p, 648771fe6b9SJerome Glisse struct radeon_cs_packet *pkt, 649068a117cSJerome Glisse const unsigned *auth, unsigned n, 650771fe6b9SJerome Glisse radeon_packet0_check_t check) 651771fe6b9SJerome Glisse { 652771fe6b9SJerome Glisse unsigned reg; 653771fe6b9SJerome Glisse unsigned i, j, m; 654771fe6b9SJerome Glisse unsigned idx; 655771fe6b9SJerome Glisse int r; 656771fe6b9SJerome Glisse 657771fe6b9SJerome Glisse idx = pkt->idx + 1; 658771fe6b9SJerome Glisse reg = pkt->reg; 659068a117cSJerome Glisse /* Check that register fall into register range 660068a117cSJerome Glisse * determined by the number of entry (n) in the 661068a117cSJerome Glisse * safe register bitmap. 662068a117cSJerome Glisse */ 663771fe6b9SJerome Glisse if (pkt->one_reg_wr) { 664771fe6b9SJerome Glisse if ((reg >> 7) > n) { 665771fe6b9SJerome Glisse return -EINVAL; 666771fe6b9SJerome Glisse } 667771fe6b9SJerome Glisse } else { 668771fe6b9SJerome Glisse if (((reg + (pkt->count << 2)) >> 7) > n) { 669771fe6b9SJerome Glisse return -EINVAL; 670771fe6b9SJerome Glisse } 671771fe6b9SJerome Glisse } 672771fe6b9SJerome Glisse for (i = 0; i <= pkt->count; i++, idx++) { 673771fe6b9SJerome Glisse j = (reg >> 7); 674771fe6b9SJerome Glisse m = 1 << ((reg >> 2) & 31); 675771fe6b9SJerome Glisse if (auth[j] & m) { 676771fe6b9SJerome Glisse r = check(p, pkt, idx, reg); 677771fe6b9SJerome Glisse if (r) { 678771fe6b9SJerome Glisse return r; 679771fe6b9SJerome Glisse } 680771fe6b9SJerome Glisse } 681771fe6b9SJerome Glisse if (pkt->one_reg_wr) { 682771fe6b9SJerome Glisse if (!(auth[j] & m)) { 683771fe6b9SJerome Glisse break; 684771fe6b9SJerome Glisse } 685771fe6b9SJerome Glisse } else { 686771fe6b9SJerome Glisse reg += 4; 687771fe6b9SJerome Glisse } 688771fe6b9SJerome Glisse } 689771fe6b9SJerome Glisse return 0; 690771fe6b9SJerome Glisse } 691771fe6b9SJerome Glisse 692771fe6b9SJerome Glisse void r100_cs_dump_packet(struct radeon_cs_parser *p, 693771fe6b9SJerome Glisse struct radeon_cs_packet *pkt) 694771fe6b9SJerome Glisse { 695771fe6b9SJerome Glisse struct radeon_cs_chunk *ib_chunk; 696771fe6b9SJerome Glisse volatile uint32_t *ib; 697771fe6b9SJerome Glisse unsigned i; 698771fe6b9SJerome Glisse unsigned idx; 699771fe6b9SJerome Glisse 700771fe6b9SJerome Glisse ib = p->ib->ptr; 701771fe6b9SJerome Glisse ib_chunk = &p->chunks[p->chunk_ib_idx]; 702771fe6b9SJerome Glisse idx = pkt->idx; 703771fe6b9SJerome Glisse for (i = 0; i <= (pkt->count + 1); i++, idx++) { 704771fe6b9SJerome Glisse DRM_INFO("ib[%d]=0x%08X\n", idx, ib[idx]); 705771fe6b9SJerome Glisse } 706771fe6b9SJerome Glisse } 707771fe6b9SJerome Glisse 708771fe6b9SJerome Glisse /** 709771fe6b9SJerome Glisse * r100_cs_packet_parse() - parse cp packet and point ib index to next packet 710771fe6b9SJerome Glisse * @parser: parser structure holding parsing context. 711771fe6b9SJerome Glisse * @pkt: where to store packet informations 712771fe6b9SJerome Glisse * 713771fe6b9SJerome Glisse * Assume that chunk_ib_index is properly set. Will return -EINVAL 714771fe6b9SJerome Glisse * if packet is bigger than remaining ib size. or if packets is unknown. 715771fe6b9SJerome Glisse **/ 716771fe6b9SJerome Glisse int r100_cs_packet_parse(struct radeon_cs_parser *p, 717771fe6b9SJerome Glisse struct radeon_cs_packet *pkt, 718771fe6b9SJerome Glisse unsigned idx) 719771fe6b9SJerome Glisse { 720771fe6b9SJerome Glisse struct radeon_cs_chunk *ib_chunk = &p->chunks[p->chunk_ib_idx]; 721771fe6b9SJerome Glisse uint32_t header = ib_chunk->kdata[idx]; 722771fe6b9SJerome Glisse 723771fe6b9SJerome Glisse if (idx >= ib_chunk->length_dw) { 724771fe6b9SJerome Glisse DRM_ERROR("Can not parse packet at %d after CS end %d !\n", 725771fe6b9SJerome Glisse idx, ib_chunk->length_dw); 726771fe6b9SJerome Glisse return -EINVAL; 727771fe6b9SJerome Glisse } 728771fe6b9SJerome Glisse pkt->idx = idx; 729771fe6b9SJerome Glisse pkt->type = CP_PACKET_GET_TYPE(header); 730771fe6b9SJerome Glisse pkt->count = CP_PACKET_GET_COUNT(header); 731771fe6b9SJerome Glisse switch (pkt->type) { 732771fe6b9SJerome Glisse case PACKET_TYPE0: 733771fe6b9SJerome Glisse pkt->reg = CP_PACKET0_GET_REG(header); 734771fe6b9SJerome Glisse pkt->one_reg_wr = CP_PACKET0_GET_ONE_REG_WR(header); 735771fe6b9SJerome Glisse break; 736771fe6b9SJerome Glisse case PACKET_TYPE3: 737771fe6b9SJerome Glisse pkt->opcode = CP_PACKET3_GET_OPCODE(header); 738771fe6b9SJerome Glisse break; 739771fe6b9SJerome Glisse case PACKET_TYPE2: 740771fe6b9SJerome Glisse pkt->count = -1; 741771fe6b9SJerome Glisse break; 742771fe6b9SJerome Glisse default: 743771fe6b9SJerome Glisse DRM_ERROR("Unknown packet type %d at %d !\n", pkt->type, idx); 744771fe6b9SJerome Glisse return -EINVAL; 745771fe6b9SJerome Glisse } 746771fe6b9SJerome Glisse if ((pkt->count + 1 + pkt->idx) >= ib_chunk->length_dw) { 747771fe6b9SJerome Glisse DRM_ERROR("Packet (%d:%d:%d) end after CS buffer (%d) !\n", 748771fe6b9SJerome Glisse pkt->idx, pkt->type, pkt->count, ib_chunk->length_dw); 749771fe6b9SJerome Glisse return -EINVAL; 750771fe6b9SJerome Glisse } 751771fe6b9SJerome Glisse return 0; 752771fe6b9SJerome Glisse } 753771fe6b9SJerome Glisse 754771fe6b9SJerome Glisse /** 755531369e6SDave Airlie * r100_cs_packet_next_vline() - parse userspace VLINE packet 756531369e6SDave Airlie * @parser: parser structure holding parsing context. 757531369e6SDave Airlie * 758531369e6SDave Airlie * Userspace sends a special sequence for VLINE waits. 759531369e6SDave Airlie * PACKET0 - VLINE_START_END + value 760531369e6SDave Airlie * PACKET0 - WAIT_UNTIL +_value 761531369e6SDave Airlie * RELOC (P3) - crtc_id in reloc. 762531369e6SDave Airlie * 763531369e6SDave Airlie * This function parses this and relocates the VLINE START END 764531369e6SDave Airlie * and WAIT UNTIL packets to the correct crtc. 765531369e6SDave Airlie * It also detects a switched off crtc and nulls out the 766531369e6SDave Airlie * wait in that case. 767531369e6SDave Airlie */ 768531369e6SDave Airlie int r100_cs_packet_parse_vline(struct radeon_cs_parser *p) 769531369e6SDave Airlie { 770531369e6SDave Airlie struct radeon_cs_chunk *ib_chunk; 771531369e6SDave Airlie struct drm_mode_object *obj; 772531369e6SDave Airlie struct drm_crtc *crtc; 773531369e6SDave Airlie struct radeon_crtc *radeon_crtc; 774531369e6SDave Airlie struct radeon_cs_packet p3reloc, waitreloc; 775531369e6SDave Airlie int crtc_id; 776531369e6SDave Airlie int r; 777531369e6SDave Airlie uint32_t header, h_idx, reg; 778531369e6SDave Airlie 779531369e6SDave Airlie ib_chunk = &p->chunks[p->chunk_ib_idx]; 780531369e6SDave Airlie 781531369e6SDave Airlie /* parse the wait until */ 782531369e6SDave Airlie r = r100_cs_packet_parse(p, &waitreloc, p->idx); 783531369e6SDave Airlie if (r) 784531369e6SDave Airlie return r; 785531369e6SDave Airlie 786531369e6SDave Airlie /* check its a wait until and only 1 count */ 787531369e6SDave Airlie if (waitreloc.reg != RADEON_WAIT_UNTIL || 788531369e6SDave Airlie waitreloc.count != 0) { 789531369e6SDave Airlie DRM_ERROR("vline wait had illegal wait until segment\n"); 790531369e6SDave Airlie r = -EINVAL; 791531369e6SDave Airlie return r; 792531369e6SDave Airlie } 793531369e6SDave Airlie 794531369e6SDave Airlie if (ib_chunk->kdata[waitreloc.idx + 1] != RADEON_WAIT_CRTC_VLINE) { 795531369e6SDave Airlie DRM_ERROR("vline wait had illegal wait until\n"); 796531369e6SDave Airlie r = -EINVAL; 797531369e6SDave Airlie return r; 798531369e6SDave Airlie } 799531369e6SDave Airlie 800531369e6SDave Airlie /* jump over the NOP */ 801531369e6SDave Airlie r = r100_cs_packet_parse(p, &p3reloc, p->idx); 802531369e6SDave Airlie if (r) 803531369e6SDave Airlie return r; 804531369e6SDave Airlie 805531369e6SDave Airlie h_idx = p->idx - 2; 806531369e6SDave Airlie p->idx += waitreloc.count; 807531369e6SDave Airlie p->idx += p3reloc.count; 808531369e6SDave Airlie 809531369e6SDave Airlie header = ib_chunk->kdata[h_idx]; 810531369e6SDave Airlie crtc_id = ib_chunk->kdata[h_idx + 5]; 811531369e6SDave Airlie reg = ib_chunk->kdata[h_idx] >> 2; 812531369e6SDave Airlie mutex_lock(&p->rdev->ddev->mode_config.mutex); 813531369e6SDave Airlie obj = drm_mode_object_find(p->rdev->ddev, crtc_id, DRM_MODE_OBJECT_CRTC); 814531369e6SDave Airlie if (!obj) { 815531369e6SDave Airlie DRM_ERROR("cannot find crtc %d\n", crtc_id); 816531369e6SDave Airlie r = -EINVAL; 817531369e6SDave Airlie goto out; 818531369e6SDave Airlie } 819531369e6SDave Airlie crtc = obj_to_crtc(obj); 820531369e6SDave Airlie radeon_crtc = to_radeon_crtc(crtc); 821531369e6SDave Airlie crtc_id = radeon_crtc->crtc_id; 822531369e6SDave Airlie 823531369e6SDave Airlie if (!crtc->enabled) { 824531369e6SDave Airlie /* if the CRTC isn't enabled - we need to nop out the wait until */ 825531369e6SDave Airlie ib_chunk->kdata[h_idx + 2] = PACKET2(0); 826531369e6SDave Airlie ib_chunk->kdata[h_idx + 3] = PACKET2(0); 827531369e6SDave Airlie } else if (crtc_id == 1) { 828531369e6SDave Airlie switch (reg) { 829531369e6SDave Airlie case AVIVO_D1MODE_VLINE_START_END: 830531369e6SDave Airlie header &= R300_CP_PACKET0_REG_MASK; 831531369e6SDave Airlie header |= AVIVO_D2MODE_VLINE_START_END >> 2; 832531369e6SDave Airlie break; 833531369e6SDave Airlie case RADEON_CRTC_GUI_TRIG_VLINE: 834531369e6SDave Airlie header &= R300_CP_PACKET0_REG_MASK; 835531369e6SDave Airlie header |= RADEON_CRTC2_GUI_TRIG_VLINE >> 2; 836531369e6SDave Airlie break; 837531369e6SDave Airlie default: 838531369e6SDave Airlie DRM_ERROR("unknown crtc reloc\n"); 839531369e6SDave Airlie r = -EINVAL; 840531369e6SDave Airlie goto out; 841531369e6SDave Airlie } 842531369e6SDave Airlie ib_chunk->kdata[h_idx] = header; 843531369e6SDave Airlie ib_chunk->kdata[h_idx + 3] |= RADEON_ENG_DISPLAY_SELECT_CRTC1; 844531369e6SDave Airlie } 845531369e6SDave Airlie out: 846531369e6SDave Airlie mutex_unlock(&p->rdev->ddev->mode_config.mutex); 847531369e6SDave Airlie return r; 848531369e6SDave Airlie } 849531369e6SDave Airlie 850531369e6SDave Airlie /** 851771fe6b9SJerome Glisse * r100_cs_packet_next_reloc() - parse next packet which should be reloc packet3 852771fe6b9SJerome Glisse * @parser: parser structure holding parsing context. 853771fe6b9SJerome Glisse * @data: pointer to relocation data 854771fe6b9SJerome Glisse * @offset_start: starting offset 855771fe6b9SJerome Glisse * @offset_mask: offset mask (to align start offset on) 856771fe6b9SJerome Glisse * @reloc: reloc informations 857771fe6b9SJerome Glisse * 858771fe6b9SJerome Glisse * Check next packet is relocation packet3, do bo validation and compute 859771fe6b9SJerome Glisse * GPU offset using the provided start. 860771fe6b9SJerome Glisse **/ 861771fe6b9SJerome Glisse int r100_cs_packet_next_reloc(struct radeon_cs_parser *p, 862771fe6b9SJerome Glisse struct radeon_cs_reloc **cs_reloc) 863771fe6b9SJerome Glisse { 864771fe6b9SJerome Glisse struct radeon_cs_chunk *ib_chunk; 865771fe6b9SJerome Glisse struct radeon_cs_chunk *relocs_chunk; 866771fe6b9SJerome Glisse struct radeon_cs_packet p3reloc; 867771fe6b9SJerome Glisse unsigned idx; 868771fe6b9SJerome Glisse int r; 869771fe6b9SJerome Glisse 870771fe6b9SJerome Glisse if (p->chunk_relocs_idx == -1) { 871771fe6b9SJerome Glisse DRM_ERROR("No relocation chunk !\n"); 872771fe6b9SJerome Glisse return -EINVAL; 873771fe6b9SJerome Glisse } 874771fe6b9SJerome Glisse *cs_reloc = NULL; 875771fe6b9SJerome Glisse ib_chunk = &p->chunks[p->chunk_ib_idx]; 876771fe6b9SJerome Glisse relocs_chunk = &p->chunks[p->chunk_relocs_idx]; 877771fe6b9SJerome Glisse r = r100_cs_packet_parse(p, &p3reloc, p->idx); 878771fe6b9SJerome Glisse if (r) { 879771fe6b9SJerome Glisse return r; 880771fe6b9SJerome Glisse } 881771fe6b9SJerome Glisse p->idx += p3reloc.count + 2; 882771fe6b9SJerome Glisse if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) { 883771fe6b9SJerome Glisse DRM_ERROR("No packet3 for relocation for packet at %d.\n", 884771fe6b9SJerome Glisse p3reloc.idx); 885771fe6b9SJerome Glisse r100_cs_dump_packet(p, &p3reloc); 886771fe6b9SJerome Glisse return -EINVAL; 887771fe6b9SJerome Glisse } 888771fe6b9SJerome Glisse idx = ib_chunk->kdata[p3reloc.idx + 1]; 889771fe6b9SJerome Glisse if (idx >= relocs_chunk->length_dw) { 890771fe6b9SJerome Glisse DRM_ERROR("Relocs at %d after relocations chunk end %d !\n", 891771fe6b9SJerome Glisse idx, relocs_chunk->length_dw); 892771fe6b9SJerome Glisse r100_cs_dump_packet(p, &p3reloc); 893771fe6b9SJerome Glisse return -EINVAL; 894771fe6b9SJerome Glisse } 895771fe6b9SJerome Glisse /* FIXME: we assume reloc size is 4 dwords */ 896771fe6b9SJerome Glisse *cs_reloc = p->relocs_ptr[(idx / 4)]; 897771fe6b9SJerome Glisse return 0; 898771fe6b9SJerome Glisse } 899771fe6b9SJerome Glisse 900771fe6b9SJerome Glisse static int r100_packet0_check(struct radeon_cs_parser *p, 901771fe6b9SJerome Glisse struct radeon_cs_packet *pkt) 902771fe6b9SJerome Glisse { 903771fe6b9SJerome Glisse struct radeon_cs_chunk *ib_chunk; 904771fe6b9SJerome Glisse struct radeon_cs_reloc *reloc; 905771fe6b9SJerome Glisse volatile uint32_t *ib; 906771fe6b9SJerome Glisse uint32_t tmp; 907771fe6b9SJerome Glisse unsigned reg; 908771fe6b9SJerome Glisse unsigned i; 909771fe6b9SJerome Glisse unsigned idx; 910771fe6b9SJerome Glisse bool onereg; 911771fe6b9SJerome Glisse int r; 912*e024e110SDave Airlie u32 tile_flags = 0; 913771fe6b9SJerome Glisse 914771fe6b9SJerome Glisse ib = p->ib->ptr; 915771fe6b9SJerome Glisse ib_chunk = &p->chunks[p->chunk_ib_idx]; 916771fe6b9SJerome Glisse idx = pkt->idx + 1; 917771fe6b9SJerome Glisse reg = pkt->reg; 918771fe6b9SJerome Glisse onereg = false; 919771fe6b9SJerome Glisse if (CP_PACKET0_GET_ONE_REG_WR(ib_chunk->kdata[pkt->idx])) { 920771fe6b9SJerome Glisse onereg = true; 921771fe6b9SJerome Glisse } 922771fe6b9SJerome Glisse for (i = 0; i <= pkt->count; i++, idx++, reg += 4) { 923771fe6b9SJerome Glisse switch (reg) { 924531369e6SDave Airlie case RADEON_CRTC_GUI_TRIG_VLINE: 925531369e6SDave Airlie r = r100_cs_packet_parse_vline(p); 926531369e6SDave Airlie if (r) { 927531369e6SDave Airlie DRM_ERROR("No reloc for ib[%d]=0x%04X\n", 928531369e6SDave Airlie idx, reg); 929531369e6SDave Airlie r100_cs_dump_packet(p, pkt); 930531369e6SDave Airlie return r; 931531369e6SDave Airlie } 932531369e6SDave Airlie break; 933771fe6b9SJerome Glisse /* FIXME: only allow PACKET3 blit? easier to check for out of 934771fe6b9SJerome Glisse * range access */ 935771fe6b9SJerome Glisse case RADEON_DST_PITCH_OFFSET: 936771fe6b9SJerome Glisse case RADEON_SRC_PITCH_OFFSET: 937771fe6b9SJerome Glisse r = r100_cs_packet_next_reloc(p, &reloc); 938771fe6b9SJerome Glisse if (r) { 939771fe6b9SJerome Glisse DRM_ERROR("No reloc for ib[%d]=0x%04X\n", 940771fe6b9SJerome Glisse idx, reg); 941771fe6b9SJerome Glisse r100_cs_dump_packet(p, pkt); 942771fe6b9SJerome Glisse return r; 943771fe6b9SJerome Glisse } 944771fe6b9SJerome Glisse tmp = ib_chunk->kdata[idx] & 0x003fffff; 945771fe6b9SJerome Glisse tmp += (((u32)reloc->lobj.gpu_offset) >> 10); 946*e024e110SDave Airlie 947*e024e110SDave Airlie if (reloc->lobj.tiling_flags & RADEON_TILING_MACRO) 948*e024e110SDave Airlie tile_flags |= RADEON_DST_TILE_MACRO; 949*e024e110SDave Airlie if (reloc->lobj.tiling_flags & RADEON_TILING_MICRO) { 950*e024e110SDave Airlie if (reg == RADEON_SRC_PITCH_OFFSET) { 951*e024e110SDave Airlie DRM_ERROR("Cannot src blit from microtiled surface\n"); 952*e024e110SDave Airlie r100_cs_dump_packet(p, pkt); 953*e024e110SDave Airlie return -EINVAL; 954*e024e110SDave Airlie } 955*e024e110SDave Airlie tile_flags |= RADEON_DST_TILE_MICRO; 956*e024e110SDave Airlie } 957*e024e110SDave Airlie 958*e024e110SDave Airlie tmp |= tile_flags; 959*e024e110SDave Airlie ib[idx] = (ib_chunk->kdata[idx] & 0x3fc00000) | tmp; 960771fe6b9SJerome Glisse break; 961771fe6b9SJerome Glisse case RADEON_RB3D_DEPTHOFFSET: 962771fe6b9SJerome Glisse case RADEON_RB3D_COLOROFFSET: 963771fe6b9SJerome Glisse case R300_RB3D_COLOROFFSET0: 964771fe6b9SJerome Glisse case R300_ZB_DEPTHOFFSET: 965771fe6b9SJerome Glisse case R200_PP_TXOFFSET_0: 966771fe6b9SJerome Glisse case R200_PP_TXOFFSET_1: 967771fe6b9SJerome Glisse case R200_PP_TXOFFSET_2: 968771fe6b9SJerome Glisse case R200_PP_TXOFFSET_3: 969771fe6b9SJerome Glisse case R200_PP_TXOFFSET_4: 970771fe6b9SJerome Glisse case R200_PP_TXOFFSET_5: 971771fe6b9SJerome Glisse case RADEON_PP_TXOFFSET_0: 972771fe6b9SJerome Glisse case RADEON_PP_TXOFFSET_1: 973771fe6b9SJerome Glisse case RADEON_PP_TXOFFSET_2: 974771fe6b9SJerome Glisse case R300_TX_OFFSET_0: 975771fe6b9SJerome Glisse case R300_TX_OFFSET_0+4: 976771fe6b9SJerome Glisse case R300_TX_OFFSET_0+8: 977771fe6b9SJerome Glisse case R300_TX_OFFSET_0+12: 978771fe6b9SJerome Glisse case R300_TX_OFFSET_0+16: 979771fe6b9SJerome Glisse case R300_TX_OFFSET_0+20: 980771fe6b9SJerome Glisse case R300_TX_OFFSET_0+24: 981771fe6b9SJerome Glisse case R300_TX_OFFSET_0+28: 982771fe6b9SJerome Glisse case R300_TX_OFFSET_0+32: 983771fe6b9SJerome Glisse case R300_TX_OFFSET_0+36: 984771fe6b9SJerome Glisse case R300_TX_OFFSET_0+40: 985771fe6b9SJerome Glisse case R300_TX_OFFSET_0+44: 986771fe6b9SJerome Glisse case R300_TX_OFFSET_0+48: 987771fe6b9SJerome Glisse case R300_TX_OFFSET_0+52: 988771fe6b9SJerome Glisse case R300_TX_OFFSET_0+56: 989771fe6b9SJerome Glisse case R300_TX_OFFSET_0+60: 990b995e433SDave Airlie /* rn50 has no 3D engine so fail on any 3d setup */ 991b995e433SDave Airlie if (ASIC_IS_RN50(p->rdev)) { 992b995e433SDave Airlie DRM_ERROR("attempt to use RN50 3D engine failed\n"); 993b995e433SDave Airlie return -EINVAL; 994b995e433SDave Airlie } 995771fe6b9SJerome Glisse r = r100_cs_packet_next_reloc(p, &reloc); 996771fe6b9SJerome Glisse if (r) { 997771fe6b9SJerome Glisse DRM_ERROR("No reloc for ib[%d]=0x%04X\n", 998771fe6b9SJerome Glisse idx, reg); 999771fe6b9SJerome Glisse r100_cs_dump_packet(p, pkt); 1000771fe6b9SJerome Glisse return r; 1001771fe6b9SJerome Glisse } 1002771fe6b9SJerome Glisse ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset); 1003771fe6b9SJerome Glisse break; 1004*e024e110SDave Airlie case R300_RB3D_COLORPITCH0: 1005*e024e110SDave Airlie case RADEON_RB3D_COLORPITCH: 1006*e024e110SDave Airlie r = r100_cs_packet_next_reloc(p, &reloc); 1007*e024e110SDave Airlie if (r) { 1008*e024e110SDave Airlie DRM_ERROR("No reloc for ib[%d]=0x%04X\n", 1009*e024e110SDave Airlie idx, reg); 1010*e024e110SDave Airlie r100_cs_dump_packet(p, pkt); 1011*e024e110SDave Airlie return r; 1012*e024e110SDave Airlie } 1013*e024e110SDave Airlie 1014*e024e110SDave Airlie if (reloc->lobj.tiling_flags & RADEON_TILING_MACRO) 1015*e024e110SDave Airlie tile_flags |= RADEON_COLOR_TILE_ENABLE; 1016*e024e110SDave Airlie if (reloc->lobj.tiling_flags & RADEON_TILING_MICRO) 1017*e024e110SDave Airlie tile_flags |= RADEON_COLOR_MICROTILE_ENABLE; 1018*e024e110SDave Airlie 1019*e024e110SDave Airlie tmp = ib_chunk->kdata[idx] & ~(0x7 << 16); 1020*e024e110SDave Airlie tmp |= tile_flags; 1021*e024e110SDave Airlie ib[idx] = tmp; 1022*e024e110SDave Airlie break; 1023771fe6b9SJerome Glisse default: 1024771fe6b9SJerome Glisse /* FIXME: we don't want to allow anyothers packet */ 1025771fe6b9SJerome Glisse break; 1026771fe6b9SJerome Glisse } 1027771fe6b9SJerome Glisse if (onereg) { 1028771fe6b9SJerome Glisse /* FIXME: forbid onereg write to register on relocate */ 1029771fe6b9SJerome Glisse break; 1030771fe6b9SJerome Glisse } 1031771fe6b9SJerome Glisse } 1032771fe6b9SJerome Glisse return 0; 1033771fe6b9SJerome Glisse } 1034771fe6b9SJerome Glisse 1035068a117cSJerome Glisse int r100_cs_track_check_pkt3_indx_buffer(struct radeon_cs_parser *p, 1036068a117cSJerome Glisse struct radeon_cs_packet *pkt, 1037068a117cSJerome Glisse struct radeon_object *robj) 1038068a117cSJerome Glisse { 1039068a117cSJerome Glisse struct radeon_cs_chunk *ib_chunk; 1040068a117cSJerome Glisse unsigned idx; 1041068a117cSJerome Glisse 1042068a117cSJerome Glisse ib_chunk = &p->chunks[p->chunk_ib_idx]; 1043068a117cSJerome Glisse idx = pkt->idx + 1; 1044068a117cSJerome Glisse if ((ib_chunk->kdata[idx+2] + 1) > radeon_object_size(robj)) { 1045068a117cSJerome Glisse DRM_ERROR("[drm] Buffer too small for PACKET3 INDX_BUFFER " 1046068a117cSJerome Glisse "(need %u have %lu) !\n", 1047068a117cSJerome Glisse ib_chunk->kdata[idx+2] + 1, 1048068a117cSJerome Glisse radeon_object_size(robj)); 1049068a117cSJerome Glisse return -EINVAL; 1050068a117cSJerome Glisse } 1051068a117cSJerome Glisse return 0; 1052068a117cSJerome Glisse } 1053068a117cSJerome Glisse 1054771fe6b9SJerome Glisse static int r100_packet3_check(struct radeon_cs_parser *p, 1055771fe6b9SJerome Glisse struct radeon_cs_packet *pkt) 1056771fe6b9SJerome Glisse { 1057771fe6b9SJerome Glisse struct radeon_cs_chunk *ib_chunk; 1058771fe6b9SJerome Glisse struct radeon_cs_reloc *reloc; 1059771fe6b9SJerome Glisse unsigned idx; 1060771fe6b9SJerome Glisse unsigned i, c; 1061771fe6b9SJerome Glisse volatile uint32_t *ib; 1062771fe6b9SJerome Glisse int r; 1063771fe6b9SJerome Glisse 1064771fe6b9SJerome Glisse ib = p->ib->ptr; 1065771fe6b9SJerome Glisse ib_chunk = &p->chunks[p->chunk_ib_idx]; 1066771fe6b9SJerome Glisse idx = pkt->idx + 1; 1067771fe6b9SJerome Glisse switch (pkt->opcode) { 1068771fe6b9SJerome Glisse case PACKET3_3D_LOAD_VBPNTR: 1069771fe6b9SJerome Glisse c = ib_chunk->kdata[idx++]; 1070771fe6b9SJerome Glisse for (i = 0; i < (c - 1); i += 2, idx += 3) { 1071771fe6b9SJerome Glisse r = r100_cs_packet_next_reloc(p, &reloc); 1072771fe6b9SJerome Glisse if (r) { 1073771fe6b9SJerome Glisse DRM_ERROR("No reloc for packet3 %d\n", 1074771fe6b9SJerome Glisse pkt->opcode); 1075771fe6b9SJerome Glisse r100_cs_dump_packet(p, pkt); 1076771fe6b9SJerome Glisse return r; 1077771fe6b9SJerome Glisse } 1078771fe6b9SJerome Glisse ib[idx+1] = ib_chunk->kdata[idx+1] + ((u32)reloc->lobj.gpu_offset); 1079771fe6b9SJerome Glisse r = r100_cs_packet_next_reloc(p, &reloc); 1080771fe6b9SJerome Glisse if (r) { 1081771fe6b9SJerome Glisse DRM_ERROR("No reloc for packet3 %d\n", 1082771fe6b9SJerome Glisse pkt->opcode); 1083771fe6b9SJerome Glisse r100_cs_dump_packet(p, pkt); 1084771fe6b9SJerome Glisse return r; 1085771fe6b9SJerome Glisse } 1086771fe6b9SJerome Glisse ib[idx+2] = ib_chunk->kdata[idx+2] + ((u32)reloc->lobj.gpu_offset); 1087771fe6b9SJerome Glisse } 1088771fe6b9SJerome Glisse if (c & 1) { 1089771fe6b9SJerome Glisse r = r100_cs_packet_next_reloc(p, &reloc); 1090771fe6b9SJerome Glisse if (r) { 1091771fe6b9SJerome Glisse DRM_ERROR("No reloc for packet3 %d\n", 1092771fe6b9SJerome Glisse pkt->opcode); 1093771fe6b9SJerome Glisse r100_cs_dump_packet(p, pkt); 1094771fe6b9SJerome Glisse return r; 1095771fe6b9SJerome Glisse } 1096771fe6b9SJerome Glisse ib[idx+1] = ib_chunk->kdata[idx+1] + ((u32)reloc->lobj.gpu_offset); 1097771fe6b9SJerome Glisse } 1098771fe6b9SJerome Glisse break; 1099771fe6b9SJerome Glisse case PACKET3_INDX_BUFFER: 1100771fe6b9SJerome Glisse r = r100_cs_packet_next_reloc(p, &reloc); 1101771fe6b9SJerome Glisse if (r) { 1102771fe6b9SJerome Glisse DRM_ERROR("No reloc for packet3 %d\n", pkt->opcode); 1103771fe6b9SJerome Glisse r100_cs_dump_packet(p, pkt); 1104771fe6b9SJerome Glisse return r; 1105771fe6b9SJerome Glisse } 1106771fe6b9SJerome Glisse ib[idx+1] = ib_chunk->kdata[idx+1] + ((u32)reloc->lobj.gpu_offset); 1107068a117cSJerome Glisse r = r100_cs_track_check_pkt3_indx_buffer(p, pkt, reloc->robj); 1108068a117cSJerome Glisse if (r) { 1109068a117cSJerome Glisse return r; 1110068a117cSJerome Glisse } 1111771fe6b9SJerome Glisse break; 1112771fe6b9SJerome Glisse case 0x23: 1113771fe6b9SJerome Glisse /* FIXME: cleanup */ 1114771fe6b9SJerome Glisse /* 3D_RNDR_GEN_INDX_PRIM on r100/r200 */ 1115771fe6b9SJerome Glisse r = r100_cs_packet_next_reloc(p, &reloc); 1116771fe6b9SJerome Glisse if (r) { 1117771fe6b9SJerome Glisse DRM_ERROR("No reloc for packet3 %d\n", pkt->opcode); 1118771fe6b9SJerome Glisse r100_cs_dump_packet(p, pkt); 1119771fe6b9SJerome Glisse return r; 1120771fe6b9SJerome Glisse } 1121771fe6b9SJerome Glisse ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset); 1122771fe6b9SJerome Glisse break; 1123771fe6b9SJerome Glisse case PACKET3_3D_DRAW_IMMD: 1124771fe6b9SJerome Glisse /* triggers drawing using in-packet vertex data */ 1125771fe6b9SJerome Glisse case PACKET3_3D_DRAW_IMMD_2: 1126771fe6b9SJerome Glisse /* triggers drawing using in-packet vertex data */ 1127771fe6b9SJerome Glisse case PACKET3_3D_DRAW_VBUF_2: 1128771fe6b9SJerome Glisse /* triggers drawing of vertex buffers setup elsewhere */ 1129771fe6b9SJerome Glisse case PACKET3_3D_DRAW_INDX_2: 1130771fe6b9SJerome Glisse /* triggers drawing using indices to vertex buffer */ 1131771fe6b9SJerome Glisse case PACKET3_3D_DRAW_VBUF: 1132771fe6b9SJerome Glisse /* triggers drawing of vertex buffers setup elsewhere */ 1133771fe6b9SJerome Glisse case PACKET3_3D_DRAW_INDX: 1134771fe6b9SJerome Glisse /* triggers drawing using indices to vertex buffer */ 1135771fe6b9SJerome Glisse case PACKET3_NOP: 1136771fe6b9SJerome Glisse break; 1137771fe6b9SJerome Glisse default: 1138771fe6b9SJerome Glisse DRM_ERROR("Packet3 opcode %x not supported\n", pkt->opcode); 1139771fe6b9SJerome Glisse return -EINVAL; 1140771fe6b9SJerome Glisse } 1141771fe6b9SJerome Glisse return 0; 1142771fe6b9SJerome Glisse } 1143771fe6b9SJerome Glisse 1144771fe6b9SJerome Glisse int r100_cs_parse(struct radeon_cs_parser *p) 1145771fe6b9SJerome Glisse { 1146771fe6b9SJerome Glisse struct radeon_cs_packet pkt; 1147771fe6b9SJerome Glisse int r; 1148771fe6b9SJerome Glisse 1149771fe6b9SJerome Glisse do { 1150771fe6b9SJerome Glisse r = r100_cs_packet_parse(p, &pkt, p->idx); 1151771fe6b9SJerome Glisse if (r) { 1152771fe6b9SJerome Glisse return r; 1153771fe6b9SJerome Glisse } 1154771fe6b9SJerome Glisse p->idx += pkt.count + 2; 1155771fe6b9SJerome Glisse switch (pkt.type) { 1156771fe6b9SJerome Glisse case PACKET_TYPE0: 1157771fe6b9SJerome Glisse r = r100_packet0_check(p, &pkt); 1158771fe6b9SJerome Glisse break; 1159771fe6b9SJerome Glisse case PACKET_TYPE2: 1160771fe6b9SJerome Glisse break; 1161771fe6b9SJerome Glisse case PACKET_TYPE3: 1162771fe6b9SJerome Glisse r = r100_packet3_check(p, &pkt); 1163771fe6b9SJerome Glisse break; 1164771fe6b9SJerome Glisse default: 1165771fe6b9SJerome Glisse DRM_ERROR("Unknown packet type %d !\n", 1166771fe6b9SJerome Glisse pkt.type); 1167771fe6b9SJerome Glisse return -EINVAL; 1168771fe6b9SJerome Glisse } 1169771fe6b9SJerome Glisse if (r) { 1170771fe6b9SJerome Glisse return r; 1171771fe6b9SJerome Glisse } 1172771fe6b9SJerome Glisse } while (p->idx < p->chunks[p->chunk_ib_idx].length_dw); 1173771fe6b9SJerome Glisse return 0; 1174771fe6b9SJerome Glisse } 1175771fe6b9SJerome Glisse 1176771fe6b9SJerome Glisse 1177771fe6b9SJerome Glisse /* 1178771fe6b9SJerome Glisse * Global GPU functions 1179771fe6b9SJerome Glisse */ 1180771fe6b9SJerome Glisse void r100_errata(struct radeon_device *rdev) 1181771fe6b9SJerome Glisse { 1182771fe6b9SJerome Glisse rdev->pll_errata = 0; 1183771fe6b9SJerome Glisse 1184771fe6b9SJerome Glisse if (rdev->family == CHIP_RV200 || rdev->family == CHIP_RS200) { 1185771fe6b9SJerome Glisse rdev->pll_errata |= CHIP_ERRATA_PLL_DUMMYREADS; 1186771fe6b9SJerome Glisse } 1187771fe6b9SJerome Glisse 1188771fe6b9SJerome Glisse if (rdev->family == CHIP_RV100 || 1189771fe6b9SJerome Glisse rdev->family == CHIP_RS100 || 1190771fe6b9SJerome Glisse rdev->family == CHIP_RS200) { 1191771fe6b9SJerome Glisse rdev->pll_errata |= CHIP_ERRATA_PLL_DELAY; 1192771fe6b9SJerome Glisse } 1193771fe6b9SJerome Glisse } 1194771fe6b9SJerome Glisse 1195771fe6b9SJerome Glisse /* Wait for vertical sync on primary CRTC */ 1196771fe6b9SJerome Glisse void r100_gpu_wait_for_vsync(struct radeon_device *rdev) 1197771fe6b9SJerome Glisse { 1198771fe6b9SJerome Glisse uint32_t crtc_gen_cntl, tmp; 1199771fe6b9SJerome Glisse int i; 1200771fe6b9SJerome Glisse 1201771fe6b9SJerome Glisse crtc_gen_cntl = RREG32(RADEON_CRTC_GEN_CNTL); 1202771fe6b9SJerome Glisse if ((crtc_gen_cntl & RADEON_CRTC_DISP_REQ_EN_B) || 1203771fe6b9SJerome Glisse !(crtc_gen_cntl & RADEON_CRTC_EN)) { 1204771fe6b9SJerome Glisse return; 1205771fe6b9SJerome Glisse } 1206771fe6b9SJerome Glisse /* Clear the CRTC_VBLANK_SAVE bit */ 1207771fe6b9SJerome Glisse WREG32(RADEON_CRTC_STATUS, RADEON_CRTC_VBLANK_SAVE_CLEAR); 1208771fe6b9SJerome Glisse for (i = 0; i < rdev->usec_timeout; i++) { 1209771fe6b9SJerome Glisse tmp = RREG32(RADEON_CRTC_STATUS); 1210771fe6b9SJerome Glisse if (tmp & RADEON_CRTC_VBLANK_SAVE) { 1211771fe6b9SJerome Glisse return; 1212771fe6b9SJerome Glisse } 1213771fe6b9SJerome Glisse DRM_UDELAY(1); 1214771fe6b9SJerome Glisse } 1215771fe6b9SJerome Glisse } 1216771fe6b9SJerome Glisse 1217771fe6b9SJerome Glisse /* Wait for vertical sync on secondary CRTC */ 1218771fe6b9SJerome Glisse void r100_gpu_wait_for_vsync2(struct radeon_device *rdev) 1219771fe6b9SJerome Glisse { 1220771fe6b9SJerome Glisse uint32_t crtc2_gen_cntl, tmp; 1221771fe6b9SJerome Glisse int i; 1222771fe6b9SJerome Glisse 1223771fe6b9SJerome Glisse crtc2_gen_cntl = RREG32(RADEON_CRTC2_GEN_CNTL); 1224771fe6b9SJerome Glisse if ((crtc2_gen_cntl & RADEON_CRTC2_DISP_REQ_EN_B) || 1225771fe6b9SJerome Glisse !(crtc2_gen_cntl & RADEON_CRTC2_EN)) 1226771fe6b9SJerome Glisse return; 1227771fe6b9SJerome Glisse 1228771fe6b9SJerome Glisse /* Clear the CRTC_VBLANK_SAVE bit */ 1229771fe6b9SJerome Glisse WREG32(RADEON_CRTC2_STATUS, RADEON_CRTC2_VBLANK_SAVE_CLEAR); 1230771fe6b9SJerome Glisse for (i = 0; i < rdev->usec_timeout; i++) { 1231771fe6b9SJerome Glisse tmp = RREG32(RADEON_CRTC2_STATUS); 1232771fe6b9SJerome Glisse if (tmp & RADEON_CRTC2_VBLANK_SAVE) { 1233771fe6b9SJerome Glisse return; 1234771fe6b9SJerome Glisse } 1235771fe6b9SJerome Glisse DRM_UDELAY(1); 1236771fe6b9SJerome Glisse } 1237771fe6b9SJerome Glisse } 1238771fe6b9SJerome Glisse 1239771fe6b9SJerome Glisse int r100_rbbm_fifo_wait_for_entry(struct radeon_device *rdev, unsigned n) 1240771fe6b9SJerome Glisse { 1241771fe6b9SJerome Glisse unsigned i; 1242771fe6b9SJerome Glisse uint32_t tmp; 1243771fe6b9SJerome Glisse 1244771fe6b9SJerome Glisse for (i = 0; i < rdev->usec_timeout; i++) { 1245771fe6b9SJerome Glisse tmp = RREG32(RADEON_RBBM_STATUS) & RADEON_RBBM_FIFOCNT_MASK; 1246771fe6b9SJerome Glisse if (tmp >= n) { 1247771fe6b9SJerome Glisse return 0; 1248771fe6b9SJerome Glisse } 1249771fe6b9SJerome Glisse DRM_UDELAY(1); 1250771fe6b9SJerome Glisse } 1251771fe6b9SJerome Glisse return -1; 1252771fe6b9SJerome Glisse } 1253771fe6b9SJerome Glisse 1254771fe6b9SJerome Glisse int r100_gui_wait_for_idle(struct radeon_device *rdev) 1255771fe6b9SJerome Glisse { 1256771fe6b9SJerome Glisse unsigned i; 1257771fe6b9SJerome Glisse uint32_t tmp; 1258771fe6b9SJerome Glisse 1259771fe6b9SJerome Glisse if (r100_rbbm_fifo_wait_for_entry(rdev, 64)) { 1260771fe6b9SJerome Glisse printk(KERN_WARNING "radeon: wait for empty RBBM fifo failed !" 1261771fe6b9SJerome Glisse " Bad things might happen.\n"); 1262771fe6b9SJerome Glisse } 1263771fe6b9SJerome Glisse for (i = 0; i < rdev->usec_timeout; i++) { 1264771fe6b9SJerome Glisse tmp = RREG32(RADEON_RBBM_STATUS); 1265771fe6b9SJerome Glisse if (!(tmp & (1 << 31))) { 1266771fe6b9SJerome Glisse return 0; 1267771fe6b9SJerome Glisse } 1268771fe6b9SJerome Glisse DRM_UDELAY(1); 1269771fe6b9SJerome Glisse } 1270771fe6b9SJerome Glisse return -1; 1271771fe6b9SJerome Glisse } 1272771fe6b9SJerome Glisse 1273771fe6b9SJerome Glisse int r100_mc_wait_for_idle(struct radeon_device *rdev) 1274771fe6b9SJerome Glisse { 1275771fe6b9SJerome Glisse unsigned i; 1276771fe6b9SJerome Glisse uint32_t tmp; 1277771fe6b9SJerome Glisse 1278771fe6b9SJerome Glisse for (i = 0; i < rdev->usec_timeout; i++) { 1279771fe6b9SJerome Glisse /* read MC_STATUS */ 1280771fe6b9SJerome Glisse tmp = RREG32(0x0150); 1281771fe6b9SJerome Glisse if (tmp & (1 << 2)) { 1282771fe6b9SJerome Glisse return 0; 1283771fe6b9SJerome Glisse } 1284771fe6b9SJerome Glisse DRM_UDELAY(1); 1285771fe6b9SJerome Glisse } 1286771fe6b9SJerome Glisse return -1; 1287771fe6b9SJerome Glisse } 1288771fe6b9SJerome Glisse 1289771fe6b9SJerome Glisse void r100_gpu_init(struct radeon_device *rdev) 1290771fe6b9SJerome Glisse { 1291771fe6b9SJerome Glisse /* TODO: anythings to do here ? pipes ? */ 1292771fe6b9SJerome Glisse r100_hdp_reset(rdev); 1293771fe6b9SJerome Glisse } 1294771fe6b9SJerome Glisse 1295771fe6b9SJerome Glisse void r100_hdp_reset(struct radeon_device *rdev) 1296771fe6b9SJerome Glisse { 1297771fe6b9SJerome Glisse uint32_t tmp; 1298771fe6b9SJerome Glisse 1299771fe6b9SJerome Glisse tmp = RREG32(RADEON_HOST_PATH_CNTL) & RADEON_HDP_APER_CNTL; 1300771fe6b9SJerome Glisse tmp |= (7 << 28); 1301771fe6b9SJerome Glisse WREG32(RADEON_HOST_PATH_CNTL, tmp | RADEON_HDP_SOFT_RESET | RADEON_HDP_READ_BUFFER_INVALIDATE); 1302771fe6b9SJerome Glisse (void)RREG32(RADEON_HOST_PATH_CNTL); 1303771fe6b9SJerome Glisse udelay(200); 1304771fe6b9SJerome Glisse WREG32(RADEON_RBBM_SOFT_RESET, 0); 1305771fe6b9SJerome Glisse WREG32(RADEON_HOST_PATH_CNTL, tmp); 1306771fe6b9SJerome Glisse (void)RREG32(RADEON_HOST_PATH_CNTL); 1307771fe6b9SJerome Glisse } 1308771fe6b9SJerome Glisse 1309771fe6b9SJerome Glisse int r100_rb2d_reset(struct radeon_device *rdev) 1310771fe6b9SJerome Glisse { 1311771fe6b9SJerome Glisse uint32_t tmp; 1312771fe6b9SJerome Glisse int i; 1313771fe6b9SJerome Glisse 1314771fe6b9SJerome Glisse WREG32(RADEON_RBBM_SOFT_RESET, RADEON_SOFT_RESET_E2); 1315771fe6b9SJerome Glisse (void)RREG32(RADEON_RBBM_SOFT_RESET); 1316771fe6b9SJerome Glisse udelay(200); 1317771fe6b9SJerome Glisse WREG32(RADEON_RBBM_SOFT_RESET, 0); 1318771fe6b9SJerome Glisse /* Wait to prevent race in RBBM_STATUS */ 1319771fe6b9SJerome Glisse mdelay(1); 1320771fe6b9SJerome Glisse for (i = 0; i < rdev->usec_timeout; i++) { 1321771fe6b9SJerome Glisse tmp = RREG32(RADEON_RBBM_STATUS); 1322771fe6b9SJerome Glisse if (!(tmp & (1 << 26))) { 1323771fe6b9SJerome Glisse DRM_INFO("RB2D reset succeed (RBBM_STATUS=0x%08X)\n", 1324771fe6b9SJerome Glisse tmp); 1325771fe6b9SJerome Glisse return 0; 1326771fe6b9SJerome Glisse } 1327771fe6b9SJerome Glisse DRM_UDELAY(1); 1328771fe6b9SJerome Glisse } 1329771fe6b9SJerome Glisse tmp = RREG32(RADEON_RBBM_STATUS); 1330771fe6b9SJerome Glisse DRM_ERROR("Failed to reset RB2D (RBBM_STATUS=0x%08X)!\n", tmp); 1331771fe6b9SJerome Glisse return -1; 1332771fe6b9SJerome Glisse } 1333771fe6b9SJerome Glisse 1334771fe6b9SJerome Glisse int r100_gpu_reset(struct radeon_device *rdev) 1335771fe6b9SJerome Glisse { 1336771fe6b9SJerome Glisse uint32_t status; 1337771fe6b9SJerome Glisse 1338771fe6b9SJerome Glisse /* reset order likely matter */ 1339771fe6b9SJerome Glisse status = RREG32(RADEON_RBBM_STATUS); 1340771fe6b9SJerome Glisse /* reset HDP */ 1341771fe6b9SJerome Glisse r100_hdp_reset(rdev); 1342771fe6b9SJerome Glisse /* reset rb2d */ 1343771fe6b9SJerome Glisse if (status & ((1 << 17) | (1 << 18) | (1 << 27))) { 1344771fe6b9SJerome Glisse r100_rb2d_reset(rdev); 1345771fe6b9SJerome Glisse } 1346771fe6b9SJerome Glisse /* TODO: reset 3D engine */ 1347771fe6b9SJerome Glisse /* reset CP */ 1348771fe6b9SJerome Glisse status = RREG32(RADEON_RBBM_STATUS); 1349771fe6b9SJerome Glisse if (status & (1 << 16)) { 1350771fe6b9SJerome Glisse r100_cp_reset(rdev); 1351771fe6b9SJerome Glisse } 1352771fe6b9SJerome Glisse /* Check if GPU is idle */ 1353771fe6b9SJerome Glisse status = RREG32(RADEON_RBBM_STATUS); 1354771fe6b9SJerome Glisse if (status & (1 << 31)) { 1355771fe6b9SJerome Glisse DRM_ERROR("Failed to reset GPU (RBBM_STATUS=0x%08X)\n", status); 1356771fe6b9SJerome Glisse return -1; 1357771fe6b9SJerome Glisse } 1358771fe6b9SJerome Glisse DRM_INFO("GPU reset succeed (RBBM_STATUS=0x%08X)\n", status); 1359771fe6b9SJerome Glisse return 0; 1360771fe6b9SJerome Glisse } 1361771fe6b9SJerome Glisse 1362771fe6b9SJerome Glisse 1363771fe6b9SJerome Glisse /* 1364771fe6b9SJerome Glisse * VRAM info 1365771fe6b9SJerome Glisse */ 1366771fe6b9SJerome Glisse static void r100_vram_get_type(struct radeon_device *rdev) 1367771fe6b9SJerome Glisse { 1368771fe6b9SJerome Glisse uint32_t tmp; 1369771fe6b9SJerome Glisse 1370771fe6b9SJerome Glisse rdev->mc.vram_is_ddr = false; 1371771fe6b9SJerome Glisse if (rdev->flags & RADEON_IS_IGP) 1372771fe6b9SJerome Glisse rdev->mc.vram_is_ddr = true; 1373771fe6b9SJerome Glisse else if (RREG32(RADEON_MEM_SDRAM_MODE_REG) & RADEON_MEM_CFG_TYPE_DDR) 1374771fe6b9SJerome Glisse rdev->mc.vram_is_ddr = true; 1375771fe6b9SJerome Glisse if ((rdev->family == CHIP_RV100) || 1376771fe6b9SJerome Glisse (rdev->family == CHIP_RS100) || 1377771fe6b9SJerome Glisse (rdev->family == CHIP_RS200)) { 1378771fe6b9SJerome Glisse tmp = RREG32(RADEON_MEM_CNTL); 1379771fe6b9SJerome Glisse if (tmp & RV100_HALF_MODE) { 1380771fe6b9SJerome Glisse rdev->mc.vram_width = 32; 1381771fe6b9SJerome Glisse } else { 1382771fe6b9SJerome Glisse rdev->mc.vram_width = 64; 1383771fe6b9SJerome Glisse } 1384771fe6b9SJerome Glisse if (rdev->flags & RADEON_SINGLE_CRTC) { 1385771fe6b9SJerome Glisse rdev->mc.vram_width /= 4; 1386771fe6b9SJerome Glisse rdev->mc.vram_is_ddr = true; 1387771fe6b9SJerome Glisse } 1388771fe6b9SJerome Glisse } else if (rdev->family <= CHIP_RV280) { 1389771fe6b9SJerome Glisse tmp = RREG32(RADEON_MEM_CNTL); 1390771fe6b9SJerome Glisse if (tmp & RADEON_MEM_NUM_CHANNELS_MASK) { 1391771fe6b9SJerome Glisse rdev->mc.vram_width = 128; 1392771fe6b9SJerome Glisse } else { 1393771fe6b9SJerome Glisse rdev->mc.vram_width = 64; 1394771fe6b9SJerome Glisse } 1395771fe6b9SJerome Glisse } else { 1396771fe6b9SJerome Glisse /* newer IGPs */ 1397771fe6b9SJerome Glisse rdev->mc.vram_width = 128; 1398771fe6b9SJerome Glisse } 1399771fe6b9SJerome Glisse } 1400771fe6b9SJerome Glisse 14012a0f8918SDave Airlie static u32 r100_get_accessible_vram(struct radeon_device *rdev) 1402771fe6b9SJerome Glisse { 14032a0f8918SDave Airlie u32 aper_size; 14042a0f8918SDave Airlie u8 byte; 14052a0f8918SDave Airlie 14062a0f8918SDave Airlie aper_size = RREG32(RADEON_CONFIG_APER_SIZE); 14072a0f8918SDave Airlie 14082a0f8918SDave Airlie /* Set HDP_APER_CNTL only on cards that are known not to be broken, 14092a0f8918SDave Airlie * that is has the 2nd generation multifunction PCI interface 14102a0f8918SDave Airlie */ 14112a0f8918SDave Airlie if (rdev->family == CHIP_RV280 || 14122a0f8918SDave Airlie rdev->family >= CHIP_RV350) { 14132a0f8918SDave Airlie WREG32_P(RADEON_HOST_PATH_CNTL, RADEON_HDP_APER_CNTL, 14142a0f8918SDave Airlie ~RADEON_HDP_APER_CNTL); 14152a0f8918SDave Airlie DRM_INFO("Generation 2 PCI interface, using max accessible memory\n"); 14162a0f8918SDave Airlie return aper_size * 2; 14172a0f8918SDave Airlie } 14182a0f8918SDave Airlie 14192a0f8918SDave Airlie /* Older cards have all sorts of funny issues to deal with. First 14202a0f8918SDave Airlie * check if it's a multifunction card by reading the PCI config 14212a0f8918SDave Airlie * header type... Limit those to one aperture size 14222a0f8918SDave Airlie */ 14232a0f8918SDave Airlie pci_read_config_byte(rdev->pdev, 0xe, &byte); 14242a0f8918SDave Airlie if (byte & 0x80) { 14252a0f8918SDave Airlie DRM_INFO("Generation 1 PCI interface in multifunction mode\n"); 14262a0f8918SDave Airlie DRM_INFO("Limiting VRAM to one aperture\n"); 14272a0f8918SDave Airlie return aper_size; 14282a0f8918SDave Airlie } 14292a0f8918SDave Airlie 14302a0f8918SDave Airlie /* Single function older card. We read HDP_APER_CNTL to see how the BIOS 14312a0f8918SDave Airlie * have set it up. We don't write this as it's broken on some ASICs but 14322a0f8918SDave Airlie * we expect the BIOS to have done the right thing (might be too optimistic...) 14332a0f8918SDave Airlie */ 14342a0f8918SDave Airlie if (RREG32(RADEON_HOST_PATH_CNTL) & RADEON_HDP_APER_CNTL) 14352a0f8918SDave Airlie return aper_size * 2; 14362a0f8918SDave Airlie return aper_size; 14372a0f8918SDave Airlie } 14382a0f8918SDave Airlie 14392a0f8918SDave Airlie void r100_vram_init_sizes(struct radeon_device *rdev) 14402a0f8918SDave Airlie { 14412a0f8918SDave Airlie u64 config_aper_size; 14422a0f8918SDave Airlie u32 accessible; 14432a0f8918SDave Airlie 14442a0f8918SDave Airlie config_aper_size = RREG32(RADEON_CONFIG_APER_SIZE); 1445771fe6b9SJerome Glisse 1446771fe6b9SJerome Glisse if (rdev->flags & RADEON_IS_IGP) { 1447771fe6b9SJerome Glisse uint32_t tom; 1448771fe6b9SJerome Glisse /* read NB_TOM to get the amount of ram stolen for the GPU */ 1449771fe6b9SJerome Glisse tom = RREG32(RADEON_NB_TOM); 1450771fe6b9SJerome Glisse rdev->mc.vram_size = (((tom >> 16) - (tom & 0xffff) + 1) << 16); 14513e43d821SDave Airlie /* for IGPs we need to keep VRAM where it was put by the BIOS */ 14523e43d821SDave Airlie rdev->mc.vram_location = (tom & 0xffff) << 16; 1453771fe6b9SJerome Glisse WREG32(RADEON_CONFIG_MEMSIZE, rdev->mc.vram_size); 1454771fe6b9SJerome Glisse } else { 1455771fe6b9SJerome Glisse rdev->mc.vram_size = RREG32(RADEON_CONFIG_MEMSIZE); 1456771fe6b9SJerome Glisse /* Some production boards of m6 will report 0 1457771fe6b9SJerome Glisse * if it's 8 MB 1458771fe6b9SJerome Glisse */ 1459771fe6b9SJerome Glisse if (rdev->mc.vram_size == 0) { 1460771fe6b9SJerome Glisse rdev->mc.vram_size = 8192 * 1024; 1461771fe6b9SJerome Glisse WREG32(RADEON_CONFIG_MEMSIZE, rdev->mc.vram_size); 1462771fe6b9SJerome Glisse } 14633e43d821SDave Airlie /* let driver place VRAM */ 14643e43d821SDave Airlie rdev->mc.vram_location = 0xFFFFFFFFUL; 14652a0f8918SDave Airlie /* Fix for RN50, M6, M7 with 8/16/32(??) MBs of VRAM - 14662a0f8918SDave Airlie * Novell bug 204882 + along with lots of ubuntu ones */ 14672a0f8918SDave Airlie if (config_aper_size > rdev->mc.vram_size) 14682a0f8918SDave Airlie rdev->mc.vram_size = config_aper_size; 1469771fe6b9SJerome Glisse } 1470771fe6b9SJerome Glisse 14712a0f8918SDave Airlie /* work out accessible VRAM */ 14722a0f8918SDave Airlie accessible = r100_get_accessible_vram(rdev); 14732a0f8918SDave Airlie 1474771fe6b9SJerome Glisse rdev->mc.aper_base = drm_get_resource_start(rdev->ddev, 0); 1475771fe6b9SJerome Glisse rdev->mc.aper_size = drm_get_resource_len(rdev->ddev, 0); 14762a0f8918SDave Airlie 14772a0f8918SDave Airlie if (accessible > rdev->mc.aper_size) 14782a0f8918SDave Airlie accessible = rdev->mc.aper_size; 14792a0f8918SDave Airlie 14802a0f8918SDave Airlie if (rdev->mc.vram_size > rdev->mc.aper_size) 14812a0f8918SDave Airlie rdev->mc.vram_size = rdev->mc.aper_size; 14822a0f8918SDave Airlie } 14832a0f8918SDave Airlie 14842a0f8918SDave Airlie void r100_vram_info(struct radeon_device *rdev) 14852a0f8918SDave Airlie { 14862a0f8918SDave Airlie r100_vram_get_type(rdev); 14872a0f8918SDave Airlie 14882a0f8918SDave Airlie r100_vram_init_sizes(rdev); 1489771fe6b9SJerome Glisse } 1490771fe6b9SJerome Glisse 1491771fe6b9SJerome Glisse 1492771fe6b9SJerome Glisse /* 1493771fe6b9SJerome Glisse * Indirect registers accessor 1494771fe6b9SJerome Glisse */ 1495771fe6b9SJerome Glisse void r100_pll_errata_after_index(struct radeon_device *rdev) 1496771fe6b9SJerome Glisse { 1497771fe6b9SJerome Glisse if (!(rdev->pll_errata & CHIP_ERRATA_PLL_DUMMYREADS)) { 1498771fe6b9SJerome Glisse return; 1499771fe6b9SJerome Glisse } 1500771fe6b9SJerome Glisse (void)RREG32(RADEON_CLOCK_CNTL_DATA); 1501771fe6b9SJerome Glisse (void)RREG32(RADEON_CRTC_GEN_CNTL); 1502771fe6b9SJerome Glisse } 1503771fe6b9SJerome Glisse 1504771fe6b9SJerome Glisse static void r100_pll_errata_after_data(struct radeon_device *rdev) 1505771fe6b9SJerome Glisse { 1506771fe6b9SJerome Glisse /* This workarounds is necessary on RV100, RS100 and RS200 chips 1507771fe6b9SJerome Glisse * or the chip could hang on a subsequent access 1508771fe6b9SJerome Glisse */ 1509771fe6b9SJerome Glisse if (rdev->pll_errata & CHIP_ERRATA_PLL_DELAY) { 1510771fe6b9SJerome Glisse udelay(5000); 1511771fe6b9SJerome Glisse } 1512771fe6b9SJerome Glisse 1513771fe6b9SJerome Glisse /* This function is required to workaround a hardware bug in some (all?) 1514771fe6b9SJerome Glisse * revisions of the R300. This workaround should be called after every 1515771fe6b9SJerome Glisse * CLOCK_CNTL_INDEX register access. If not, register reads afterward 1516771fe6b9SJerome Glisse * may not be correct. 1517771fe6b9SJerome Glisse */ 1518771fe6b9SJerome Glisse if (rdev->pll_errata & CHIP_ERRATA_R300_CG) { 1519771fe6b9SJerome Glisse uint32_t save, tmp; 1520771fe6b9SJerome Glisse 1521771fe6b9SJerome Glisse save = RREG32(RADEON_CLOCK_CNTL_INDEX); 1522771fe6b9SJerome Glisse tmp = save & ~(0x3f | RADEON_PLL_WR_EN); 1523771fe6b9SJerome Glisse WREG32(RADEON_CLOCK_CNTL_INDEX, tmp); 1524771fe6b9SJerome Glisse tmp = RREG32(RADEON_CLOCK_CNTL_DATA); 1525771fe6b9SJerome Glisse WREG32(RADEON_CLOCK_CNTL_INDEX, save); 1526771fe6b9SJerome Glisse } 1527771fe6b9SJerome Glisse } 1528771fe6b9SJerome Glisse 1529771fe6b9SJerome Glisse uint32_t r100_pll_rreg(struct radeon_device *rdev, uint32_t reg) 1530771fe6b9SJerome Glisse { 1531771fe6b9SJerome Glisse uint32_t data; 1532771fe6b9SJerome Glisse 1533771fe6b9SJerome Glisse WREG8(RADEON_CLOCK_CNTL_INDEX, reg & 0x3f); 1534771fe6b9SJerome Glisse r100_pll_errata_after_index(rdev); 1535771fe6b9SJerome Glisse data = RREG32(RADEON_CLOCK_CNTL_DATA); 1536771fe6b9SJerome Glisse r100_pll_errata_after_data(rdev); 1537771fe6b9SJerome Glisse return data; 1538771fe6b9SJerome Glisse } 1539771fe6b9SJerome Glisse 1540771fe6b9SJerome Glisse void r100_pll_wreg(struct radeon_device *rdev, uint32_t reg, uint32_t v) 1541771fe6b9SJerome Glisse { 1542771fe6b9SJerome Glisse WREG8(RADEON_CLOCK_CNTL_INDEX, ((reg & 0x3f) | RADEON_PLL_WR_EN)); 1543771fe6b9SJerome Glisse r100_pll_errata_after_index(rdev); 1544771fe6b9SJerome Glisse WREG32(RADEON_CLOCK_CNTL_DATA, v); 1545771fe6b9SJerome Glisse r100_pll_errata_after_data(rdev); 1546771fe6b9SJerome Glisse } 1547771fe6b9SJerome Glisse 1548771fe6b9SJerome Glisse uint32_t r100_mm_rreg(struct radeon_device *rdev, uint32_t reg) 1549771fe6b9SJerome Glisse { 1550771fe6b9SJerome Glisse if (reg < 0x10000) 1551771fe6b9SJerome Glisse return readl(((void __iomem *)rdev->rmmio) + reg); 1552771fe6b9SJerome Glisse else { 1553771fe6b9SJerome Glisse writel(reg, ((void __iomem *)rdev->rmmio) + RADEON_MM_INDEX); 1554771fe6b9SJerome Glisse return readl(((void __iomem *)rdev->rmmio) + RADEON_MM_DATA); 1555771fe6b9SJerome Glisse } 1556771fe6b9SJerome Glisse } 1557771fe6b9SJerome Glisse 1558771fe6b9SJerome Glisse void r100_mm_wreg(struct radeon_device *rdev, uint32_t reg, uint32_t v) 1559771fe6b9SJerome Glisse { 1560771fe6b9SJerome Glisse if (reg < 0x10000) 1561771fe6b9SJerome Glisse writel(v, ((void __iomem *)rdev->rmmio) + reg); 1562771fe6b9SJerome Glisse else { 1563771fe6b9SJerome Glisse writel(reg, ((void __iomem *)rdev->rmmio) + RADEON_MM_INDEX); 1564771fe6b9SJerome Glisse writel(v, ((void __iomem *)rdev->rmmio) + RADEON_MM_DATA); 1565771fe6b9SJerome Glisse } 1566771fe6b9SJerome Glisse } 1567771fe6b9SJerome Glisse 1568068a117cSJerome Glisse int r100_init(struct radeon_device *rdev) 1569068a117cSJerome Glisse { 1570068a117cSJerome Glisse return 0; 1571068a117cSJerome Glisse } 1572068a117cSJerome Glisse 1573771fe6b9SJerome Glisse /* 1574771fe6b9SJerome Glisse * Debugfs info 1575771fe6b9SJerome Glisse */ 1576771fe6b9SJerome Glisse #if defined(CONFIG_DEBUG_FS) 1577771fe6b9SJerome Glisse static int r100_debugfs_rbbm_info(struct seq_file *m, void *data) 1578771fe6b9SJerome Glisse { 1579771fe6b9SJerome Glisse struct drm_info_node *node = (struct drm_info_node *) m->private; 1580771fe6b9SJerome Glisse struct drm_device *dev = node->minor->dev; 1581771fe6b9SJerome Glisse struct radeon_device *rdev = dev->dev_private; 1582771fe6b9SJerome Glisse uint32_t reg, value; 1583771fe6b9SJerome Glisse unsigned i; 1584771fe6b9SJerome Glisse 1585771fe6b9SJerome Glisse seq_printf(m, "RBBM_STATUS 0x%08x\n", RREG32(RADEON_RBBM_STATUS)); 1586771fe6b9SJerome Glisse seq_printf(m, "RBBM_CMDFIFO_STAT 0x%08x\n", RREG32(0xE7C)); 1587771fe6b9SJerome Glisse seq_printf(m, "CP_STAT 0x%08x\n", RREG32(RADEON_CP_STAT)); 1588771fe6b9SJerome Glisse for (i = 0; i < 64; i++) { 1589771fe6b9SJerome Glisse WREG32(RADEON_RBBM_CMDFIFO_ADDR, i | 0x100); 1590771fe6b9SJerome Glisse reg = (RREG32(RADEON_RBBM_CMDFIFO_DATA) - 1) >> 2; 1591771fe6b9SJerome Glisse WREG32(RADEON_RBBM_CMDFIFO_ADDR, i); 1592771fe6b9SJerome Glisse value = RREG32(RADEON_RBBM_CMDFIFO_DATA); 1593771fe6b9SJerome Glisse seq_printf(m, "[0x%03X] 0x%04X=0x%08X\n", i, reg, value); 1594771fe6b9SJerome Glisse } 1595771fe6b9SJerome Glisse return 0; 1596771fe6b9SJerome Glisse } 1597771fe6b9SJerome Glisse 1598771fe6b9SJerome Glisse static int r100_debugfs_cp_ring_info(struct seq_file *m, void *data) 1599771fe6b9SJerome Glisse { 1600771fe6b9SJerome Glisse struct drm_info_node *node = (struct drm_info_node *) m->private; 1601771fe6b9SJerome Glisse struct drm_device *dev = node->minor->dev; 1602771fe6b9SJerome Glisse struct radeon_device *rdev = dev->dev_private; 1603771fe6b9SJerome Glisse uint32_t rdp, wdp; 1604771fe6b9SJerome Glisse unsigned count, i, j; 1605771fe6b9SJerome Glisse 1606771fe6b9SJerome Glisse radeon_ring_free_size(rdev); 1607771fe6b9SJerome Glisse rdp = RREG32(RADEON_CP_RB_RPTR); 1608771fe6b9SJerome Glisse wdp = RREG32(RADEON_CP_RB_WPTR); 1609771fe6b9SJerome Glisse count = (rdp + rdev->cp.ring_size - wdp) & rdev->cp.ptr_mask; 1610771fe6b9SJerome Glisse seq_printf(m, "CP_STAT 0x%08x\n", RREG32(RADEON_CP_STAT)); 1611771fe6b9SJerome Glisse seq_printf(m, "CP_RB_WPTR 0x%08x\n", wdp); 1612771fe6b9SJerome Glisse seq_printf(m, "CP_RB_RPTR 0x%08x\n", rdp); 1613771fe6b9SJerome Glisse seq_printf(m, "%u free dwords in ring\n", rdev->cp.ring_free_dw); 1614771fe6b9SJerome Glisse seq_printf(m, "%u dwords in ring\n", count); 1615771fe6b9SJerome Glisse for (j = 0; j <= count; j++) { 1616771fe6b9SJerome Glisse i = (rdp + j) & rdev->cp.ptr_mask; 1617771fe6b9SJerome Glisse seq_printf(m, "r[%04d]=0x%08x\n", i, rdev->cp.ring[i]); 1618771fe6b9SJerome Glisse } 1619771fe6b9SJerome Glisse return 0; 1620771fe6b9SJerome Glisse } 1621771fe6b9SJerome Glisse 1622771fe6b9SJerome Glisse 1623771fe6b9SJerome Glisse static int r100_debugfs_cp_csq_fifo(struct seq_file *m, void *data) 1624771fe6b9SJerome Glisse { 1625771fe6b9SJerome Glisse struct drm_info_node *node = (struct drm_info_node *) m->private; 1626771fe6b9SJerome Glisse struct drm_device *dev = node->minor->dev; 1627771fe6b9SJerome Glisse struct radeon_device *rdev = dev->dev_private; 1628771fe6b9SJerome Glisse uint32_t csq_stat, csq2_stat, tmp; 1629771fe6b9SJerome Glisse unsigned r_rptr, r_wptr, ib1_rptr, ib1_wptr, ib2_rptr, ib2_wptr; 1630771fe6b9SJerome Glisse unsigned i; 1631771fe6b9SJerome Glisse 1632771fe6b9SJerome Glisse seq_printf(m, "CP_STAT 0x%08x\n", RREG32(RADEON_CP_STAT)); 1633771fe6b9SJerome Glisse seq_printf(m, "CP_CSQ_MODE 0x%08x\n", RREG32(RADEON_CP_CSQ_MODE)); 1634771fe6b9SJerome Glisse csq_stat = RREG32(RADEON_CP_CSQ_STAT); 1635771fe6b9SJerome Glisse csq2_stat = RREG32(RADEON_CP_CSQ2_STAT); 1636771fe6b9SJerome Glisse r_rptr = (csq_stat >> 0) & 0x3ff; 1637771fe6b9SJerome Glisse r_wptr = (csq_stat >> 10) & 0x3ff; 1638771fe6b9SJerome Glisse ib1_rptr = (csq_stat >> 20) & 0x3ff; 1639771fe6b9SJerome Glisse ib1_wptr = (csq2_stat >> 0) & 0x3ff; 1640771fe6b9SJerome Glisse ib2_rptr = (csq2_stat >> 10) & 0x3ff; 1641771fe6b9SJerome Glisse ib2_wptr = (csq2_stat >> 20) & 0x3ff; 1642771fe6b9SJerome Glisse seq_printf(m, "CP_CSQ_STAT 0x%08x\n", csq_stat); 1643771fe6b9SJerome Glisse seq_printf(m, "CP_CSQ2_STAT 0x%08x\n", csq2_stat); 1644771fe6b9SJerome Glisse seq_printf(m, "Ring rptr %u\n", r_rptr); 1645771fe6b9SJerome Glisse seq_printf(m, "Ring wptr %u\n", r_wptr); 1646771fe6b9SJerome Glisse seq_printf(m, "Indirect1 rptr %u\n", ib1_rptr); 1647771fe6b9SJerome Glisse seq_printf(m, "Indirect1 wptr %u\n", ib1_wptr); 1648771fe6b9SJerome Glisse seq_printf(m, "Indirect2 rptr %u\n", ib2_rptr); 1649771fe6b9SJerome Glisse seq_printf(m, "Indirect2 wptr %u\n", ib2_wptr); 1650771fe6b9SJerome Glisse /* FIXME: 0, 128, 640 depends on fifo setup see cp_init_kms 1651771fe6b9SJerome Glisse * 128 = indirect1_start * 8 & 640 = indirect2_start * 8 */ 1652771fe6b9SJerome Glisse seq_printf(m, "Ring fifo:\n"); 1653771fe6b9SJerome Glisse for (i = 0; i < 256; i++) { 1654771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_ADDR, i << 2); 1655771fe6b9SJerome Glisse tmp = RREG32(RADEON_CP_CSQ_DATA); 1656771fe6b9SJerome Glisse seq_printf(m, "rfifo[%04d]=0x%08X\n", i, tmp); 1657771fe6b9SJerome Glisse } 1658771fe6b9SJerome Glisse seq_printf(m, "Indirect1 fifo:\n"); 1659771fe6b9SJerome Glisse for (i = 256; i <= 512; i++) { 1660771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_ADDR, i << 2); 1661771fe6b9SJerome Glisse tmp = RREG32(RADEON_CP_CSQ_DATA); 1662771fe6b9SJerome Glisse seq_printf(m, "ib1fifo[%04d]=0x%08X\n", i, tmp); 1663771fe6b9SJerome Glisse } 1664771fe6b9SJerome Glisse seq_printf(m, "Indirect2 fifo:\n"); 1665771fe6b9SJerome Glisse for (i = 640; i < ib1_wptr; i++) { 1666771fe6b9SJerome Glisse WREG32(RADEON_CP_CSQ_ADDR, i << 2); 1667771fe6b9SJerome Glisse tmp = RREG32(RADEON_CP_CSQ_DATA); 1668771fe6b9SJerome Glisse seq_printf(m, "ib2fifo[%04d]=0x%08X\n", i, tmp); 1669771fe6b9SJerome Glisse } 1670771fe6b9SJerome Glisse return 0; 1671771fe6b9SJerome Glisse } 1672771fe6b9SJerome Glisse 1673771fe6b9SJerome Glisse static int r100_debugfs_mc_info(struct seq_file *m, void *data) 1674771fe6b9SJerome Glisse { 1675771fe6b9SJerome Glisse struct drm_info_node *node = (struct drm_info_node *) m->private; 1676771fe6b9SJerome Glisse struct drm_device *dev = node->minor->dev; 1677771fe6b9SJerome Glisse struct radeon_device *rdev = dev->dev_private; 1678771fe6b9SJerome Glisse uint32_t tmp; 1679771fe6b9SJerome Glisse 1680771fe6b9SJerome Glisse tmp = RREG32(RADEON_CONFIG_MEMSIZE); 1681771fe6b9SJerome Glisse seq_printf(m, "CONFIG_MEMSIZE 0x%08x\n", tmp); 1682771fe6b9SJerome Glisse tmp = RREG32(RADEON_MC_FB_LOCATION); 1683771fe6b9SJerome Glisse seq_printf(m, "MC_FB_LOCATION 0x%08x\n", tmp); 1684771fe6b9SJerome Glisse tmp = RREG32(RADEON_BUS_CNTL); 1685771fe6b9SJerome Glisse seq_printf(m, "BUS_CNTL 0x%08x\n", tmp); 1686771fe6b9SJerome Glisse tmp = RREG32(RADEON_MC_AGP_LOCATION); 1687771fe6b9SJerome Glisse seq_printf(m, "MC_AGP_LOCATION 0x%08x\n", tmp); 1688771fe6b9SJerome Glisse tmp = RREG32(RADEON_AGP_BASE); 1689771fe6b9SJerome Glisse seq_printf(m, "AGP_BASE 0x%08x\n", tmp); 1690771fe6b9SJerome Glisse tmp = RREG32(RADEON_HOST_PATH_CNTL); 1691771fe6b9SJerome Glisse seq_printf(m, "HOST_PATH_CNTL 0x%08x\n", tmp); 1692771fe6b9SJerome Glisse tmp = RREG32(0x01D0); 1693771fe6b9SJerome Glisse seq_printf(m, "AIC_CTRL 0x%08x\n", tmp); 1694771fe6b9SJerome Glisse tmp = RREG32(RADEON_AIC_LO_ADDR); 1695771fe6b9SJerome Glisse seq_printf(m, "AIC_LO_ADDR 0x%08x\n", tmp); 1696771fe6b9SJerome Glisse tmp = RREG32(RADEON_AIC_HI_ADDR); 1697771fe6b9SJerome Glisse seq_printf(m, "AIC_HI_ADDR 0x%08x\n", tmp); 1698771fe6b9SJerome Glisse tmp = RREG32(0x01E4); 1699771fe6b9SJerome Glisse seq_printf(m, "AIC_TLB_ADDR 0x%08x\n", tmp); 1700771fe6b9SJerome Glisse return 0; 1701771fe6b9SJerome Glisse } 1702771fe6b9SJerome Glisse 1703771fe6b9SJerome Glisse static struct drm_info_list r100_debugfs_rbbm_list[] = { 1704771fe6b9SJerome Glisse {"r100_rbbm_info", r100_debugfs_rbbm_info, 0, NULL}, 1705771fe6b9SJerome Glisse }; 1706771fe6b9SJerome Glisse 1707771fe6b9SJerome Glisse static struct drm_info_list r100_debugfs_cp_list[] = { 1708771fe6b9SJerome Glisse {"r100_cp_ring_info", r100_debugfs_cp_ring_info, 0, NULL}, 1709771fe6b9SJerome Glisse {"r100_cp_csq_fifo", r100_debugfs_cp_csq_fifo, 0, NULL}, 1710771fe6b9SJerome Glisse }; 1711771fe6b9SJerome Glisse 1712771fe6b9SJerome Glisse static struct drm_info_list r100_debugfs_mc_info_list[] = { 1713771fe6b9SJerome Glisse {"r100_mc_info", r100_debugfs_mc_info, 0, NULL}, 1714771fe6b9SJerome Glisse }; 1715771fe6b9SJerome Glisse #endif 1716771fe6b9SJerome Glisse 1717771fe6b9SJerome Glisse int r100_debugfs_rbbm_init(struct radeon_device *rdev) 1718771fe6b9SJerome Glisse { 1719771fe6b9SJerome Glisse #if defined(CONFIG_DEBUG_FS) 1720771fe6b9SJerome Glisse return radeon_debugfs_add_files(rdev, r100_debugfs_rbbm_list, 1); 1721771fe6b9SJerome Glisse #else 1722771fe6b9SJerome Glisse return 0; 1723771fe6b9SJerome Glisse #endif 1724771fe6b9SJerome Glisse } 1725771fe6b9SJerome Glisse 1726771fe6b9SJerome Glisse int r100_debugfs_cp_init(struct radeon_device *rdev) 1727771fe6b9SJerome Glisse { 1728771fe6b9SJerome Glisse #if defined(CONFIG_DEBUG_FS) 1729771fe6b9SJerome Glisse return radeon_debugfs_add_files(rdev, r100_debugfs_cp_list, 2); 1730771fe6b9SJerome Glisse #else 1731771fe6b9SJerome Glisse return 0; 1732771fe6b9SJerome Glisse #endif 1733771fe6b9SJerome Glisse } 1734771fe6b9SJerome Glisse 1735771fe6b9SJerome Glisse int r100_debugfs_mc_info_init(struct radeon_device *rdev) 1736771fe6b9SJerome Glisse { 1737771fe6b9SJerome Glisse #if defined(CONFIG_DEBUG_FS) 1738771fe6b9SJerome Glisse return radeon_debugfs_add_files(rdev, r100_debugfs_mc_info_list, 1); 1739771fe6b9SJerome Glisse #else 1740771fe6b9SJerome Glisse return 0; 1741771fe6b9SJerome Glisse #endif 1742771fe6b9SJerome Glisse } 1743*e024e110SDave Airlie 1744*e024e110SDave Airlie int r100_set_surface_reg(struct radeon_device *rdev, int reg, 1745*e024e110SDave Airlie uint32_t tiling_flags, uint32_t pitch, 1746*e024e110SDave Airlie uint32_t offset, uint32_t obj_size) 1747*e024e110SDave Airlie { 1748*e024e110SDave Airlie int surf_index = reg * 16; 1749*e024e110SDave Airlie int flags = 0; 1750*e024e110SDave Airlie 1751*e024e110SDave Airlie /* r100/r200 divide by 16 */ 1752*e024e110SDave Airlie if (rdev->family < CHIP_R300) 1753*e024e110SDave Airlie flags = pitch / 16; 1754*e024e110SDave Airlie else 1755*e024e110SDave Airlie flags = pitch / 8; 1756*e024e110SDave Airlie 1757*e024e110SDave Airlie if (rdev->family <= CHIP_RS200) { 1758*e024e110SDave Airlie if ((tiling_flags & (RADEON_TILING_MACRO|RADEON_TILING_MICRO)) 1759*e024e110SDave Airlie == (RADEON_TILING_MACRO|RADEON_TILING_MICRO)) 1760*e024e110SDave Airlie flags |= RADEON_SURF_TILE_COLOR_BOTH; 1761*e024e110SDave Airlie if (tiling_flags & RADEON_TILING_MACRO) 1762*e024e110SDave Airlie flags |= RADEON_SURF_TILE_COLOR_MACRO; 1763*e024e110SDave Airlie } else if (rdev->family <= CHIP_RV280) { 1764*e024e110SDave Airlie if (tiling_flags & (RADEON_TILING_MACRO)) 1765*e024e110SDave Airlie flags |= R200_SURF_TILE_COLOR_MACRO; 1766*e024e110SDave Airlie if (tiling_flags & RADEON_TILING_MICRO) 1767*e024e110SDave Airlie flags |= R200_SURF_TILE_COLOR_MICRO; 1768*e024e110SDave Airlie } else { 1769*e024e110SDave Airlie if (tiling_flags & RADEON_TILING_MACRO) 1770*e024e110SDave Airlie flags |= R300_SURF_TILE_MACRO; 1771*e024e110SDave Airlie if (tiling_flags & RADEON_TILING_MICRO) 1772*e024e110SDave Airlie flags |= R300_SURF_TILE_MICRO; 1773*e024e110SDave Airlie } 1774*e024e110SDave Airlie 1775*e024e110SDave Airlie DRM_DEBUG("writing surface %d %d %x %x\n", reg, flags, offset, offset+obj_size-1); 1776*e024e110SDave Airlie WREG32(RADEON_SURFACE0_INFO + surf_index, flags); 1777*e024e110SDave Airlie WREG32(RADEON_SURFACE0_LOWER_BOUND + surf_index, offset); 1778*e024e110SDave Airlie WREG32(RADEON_SURFACE0_UPPER_BOUND + surf_index, offset + obj_size - 1); 1779*e024e110SDave Airlie return 0; 1780*e024e110SDave Airlie } 1781*e024e110SDave Airlie 1782*e024e110SDave Airlie void r100_clear_surface_reg(struct radeon_device *rdev, int reg) 1783*e024e110SDave Airlie { 1784*e024e110SDave Airlie int surf_index = reg * 16; 1785*e024e110SDave Airlie WREG32(RADEON_SURFACE0_INFO + surf_index, 0); 1786*e024e110SDave Airlie } 1787