Lines Matching +full:sync +full:- +full:update +full:- +full:mask

38  * sDMA - System DMA
55 * cik_sdma_get_rptr - get the current read pointer
67 if (rdev->wb.enabled) { in cik_sdma_get_rptr()
68 rptr = rdev->wb.wb[ring->rptr_offs/4]; in cik_sdma_get_rptr()
70 if (ring->idx == R600_RING_TYPE_DMA_INDEX) in cik_sdma_get_rptr()
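The pattern visible in cik_sdma_get_rptr() is: prefer the CPU-visible writeback slot when writeback is enabled, otherwise fall back to an MMIO register read. A minimal standalone sketch of that shape; the struct and the mmio_read() helper are illustrative stand-ins, not the driver's API:

    #include <stdint.h>

    struct wb_state {
        int enabled;        /* writeback active? */
        uint32_t *wb;       /* buffer the engine updates with its rptr */
    };

    /* hypothetical MMIO accessor standing in for RREG32() */
    static uint32_t mmio_read(uint32_t reg) { (void)reg; return 0; }

    static uint32_t get_rptr(const struct wb_state *s, uint32_t rptr_offs,
                             uint32_t rptr_reg)
    {
        if (s->enabled)
            return s->wb[rptr_offs / 4];    /* slot index in 32-bit words */
        /* the register holds a byte offset; convert to a dword index */
        return (mmio_read(rptr_reg) & 0x3fffc) >> 2;
    }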
82 * cik_sdma_get_wptr - get the current write pointer
94 if (ring->idx == R600_RING_TYPE_DMA_INDEX) in cik_sdma_get_wptr()
103 * cik_sdma_set_wptr - commit the write pointer
115 if (ring->idx == R600_RING_TYPE_DMA_INDEX) in cik_sdma_set_wptr()
120 WREG32(reg, (ring->wptr << 2) & 0x3fffc); in cik_sdma_set_wptr()
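The `(ring->wptr << 2) & 0x3fffc` commit is a dword-to-byte conversion clipped to the ring aperture: the wptr is tracked in dwords, the register takes a byte offset, and 0x3fffc keeps bits 2..17. A standalone model of that arithmetic (my reading of the mask, not driver code):

    #include <assert.h>
    #include <stdint.h>

    static uint32_t wptr_to_reg(uint32_t wptr_dw) { return (wptr_dw << 2) & 0x3fffc; }
    static uint32_t reg_to_wptr(uint32_t reg)     { return (reg & 0x3fffc) >> 2; }

    int main(void)
    {
        /* round-trips for any dword index inside the 64K-dword aperture */
        for (uint32_t w = 0; w < 0x10000; w++)
            assert(reg_to_wptr(wptr_to_reg(w)) == w);
        return 0;
    }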
125 * cik_sdma_ring_ib_execute - Schedule an IB on the DMA engine
135 struct radeon_ring *ring = &rdev->ring[ib->ring]; in cik_sdma_ring_ib_execute()
136 u32 extra_bits = (ib->vm ? ib->vm->ids[ib->ring].id : 0) & 0xf; in cik_sdma_ring_ib_execute()
138 if (rdev->wb.enabled) { in cik_sdma_ring_ib_execute()
139 u32 next_rptr = ring->wptr + 5; in cik_sdma_ring_ib_execute()
144 radeon_ring_write(ring, ring->next_rptr_gpu_addr & 0xfffffffc); in cik_sdma_ring_ib_execute()
145 radeon_ring_write(ring, upper_32_bits(ring->next_rptr_gpu_addr)); in cik_sdma_ring_ib_execute()
151 while ((ring->wptr & 7) != 4) in cik_sdma_ring_ib_execute()
154 radeon_ring_write(ring, ib->gpu_addr & 0xffffffe0); /* base must be 32 byte aligned */ in cik_sdma_ring_ib_execute()
155 radeon_ring_write(ring, upper_32_bits(ib->gpu_addr)); in cik_sdma_ring_ib_execute()
156 radeon_ring_write(ring, ib->length_dw); in cik_sdma_ring_ib_execute()
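Two alignment rules drive cik_sdma_ring_ib_execute(): the 4-dword INDIRECT_BUFFER packet must end on an 8-dword boundary, hence the NOP padding until `wptr % 8 == 4`, and the IB base must be 32-byte aligned, hence the `& 0xffffffe0`. A standalone sketch of the padding rule, with emit() and the header value standing in for radeon_ring_write() and the real SDMA_PACKET() encoding:

    #include <stdint.h>

    #define NOP_PACKET 0u              /* placeholder for the SDMA NOP encoding */

    static uint32_t ring[256];
    static uint32_t wptr;              /* write pointer, in dwords */

    static void emit(uint32_t dw) { ring[wptr % 256] = dw; wptr++; }

    static void emit_ib(uint64_t ib_addr, uint32_t len_dw, uint32_t header)
    {
        /* pad so the 4-dword packet below ends on an 8-dword boundary */
        while ((wptr & 7) != 4)
            emit(NOP_PACKET);
        emit(header);                         /* INDIRECT_BUFFER opcode + vm id */
        emit((uint32_t)ib_addr & 0xffffffe0); /* base, 32-byte aligned */
        emit((uint32_t)(ib_addr >> 32));
        emit(len_dw);
        /* (wptr & 7) == 0 here */
    }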
161 * cik_sdma_hdp_flush_ring_emit - emit an hdp flush on the DMA ring
171 struct radeon_ring *ring = &rdev->ring[ridx]; in cik_sdma_hdp_flush_ring_emit()
185 radeon_ring_write(ring, ref_and_mask); /* mask */ in cik_sdma_hdp_flush_ring_emit()
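The flush works by having the engine write to GPU_HDP_FLUSH_REQ and then poll GPU_HDP_FLUSH_DONE; the same `ref_and_mask` value (SDMA0 or SDMA1, depending on which instance owns the ring) goes in as both reference and mask, so the wait condition is `(done & mask) == ref`. A CPU-side model of that POLL_REG_MEM semantic; the loop below is illustrative, not the packet's actual microcode behavior:

    #include <stdint.h>

    /* model of the POLL_REG_MEM condition the packet encodes:
     * spin until (read(done_reg) & mask) == ref, bounded by a retry count */
    static int poll_reg(volatile const uint32_t *done_reg,
                        uint32_t ref, uint32_t mask, unsigned retries)
    {
        while (retries--) {
            if ((*done_reg & mask) == ref)
                return 0;   /* flush acknowledged */
        }
        return -1;          /* timed out */
    }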
190 * cik_sdma_fence_ring_emit - emit a fence on the DMA ring
202 struct radeon_ring *ring = &rdev->ring[fence->ring]; in cik_sdma_fence_ring_emit()
203 u64 addr = rdev->fence_drv[fence->ring].gpu_addr; in cik_sdma_fence_ring_emit()
209 radeon_ring_write(ring, fence->seq); in cik_sdma_fence_ring_emit()
213 cik_sdma_hdp_flush_ring_emit(rdev, fence->ring); in cik_sdma_fence_ring_emit()
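The fence emit stores fence->seq at the fence driver's GPU address for that ring, raises a trap interrupt, then emits the HDP flush above so the CPU sees the write promptly. A minimal model of the consumer-side check, assuming a monotonically increasing sequence counter written by the engine (an illustrative sketch, not the driver's fence path):

    #include <stdint.h>

    /* a fence is signaled once the engine has stored a sequence number at
     * least as new as the one we are waiting for */
    static int fence_signaled(const volatile uint32_t *fence_slot, uint32_t seq)
    {
        return (int32_t)(*fence_slot - seq) >= 0;   /* wrap-safe compare */
    }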
217 * cik_sdma_semaphore_ring_emit - emit a semaphore on the dma ring
232 u64 addr = semaphore->gpu_addr; in cik_sdma_semaphore_ring_emit()
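Semaphore packets carry a 64-bit GPU address that must be 8-byte aligned, so the emit masks the low bits when splitting it into two dwords. A sketch of that split (my reading of the alignment requirement, not the driver's emit path):

    #include <stdint.h>

    static void split_sem_addr(uint64_t addr, uint32_t *lo, uint32_t *hi)
    {
        *lo = (uint32_t)addr & 0xfffffff8;  /* 8-byte aligned low half */
        *hi = (uint32_t)(addr >> 32);
    }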
243 * cik_sdma_gfx_stop - stop the gfx async dma engines
254 if ((rdev->asic->copy.copy_ring_index == R600_RING_TYPE_DMA_INDEX) || in cik_sdma_gfx_stop()
255 (rdev->asic->copy.copy_ring_index == CAYMAN_RING_TYPE_DMA1_INDEX)) in cik_sdma_gfx_stop()
256 radeon_ttm_set_active_vram_size(rdev, rdev->mc.visible_vram_size); in cik_sdma_gfx_stop()
268 rdev->ring[R600_RING_TYPE_DMA_INDEX].ready = false; in cik_sdma_gfx_stop()
269 rdev->ring[CAYMAN_RING_TYPE_DMA1_INDEX].ready = false; in cik_sdma_gfx_stop()
284 * cik_sdma_rlc_stop - stop the compute async dma engines
296 * cik_sdma_ctx_switch_enable - enable/disable sdma engine preemption
323  * cik_sdma_enable - enable/disable the async dma engines
357 * cik_sdma_gfx_resume - setup and start the async dma engines
374 ring = &rdev->ring[R600_RING_TYPE_DMA_INDEX]; in cik_sdma_gfx_resume()
378 ring = &rdev->ring[CAYMAN_RING_TYPE_DMA1_INDEX]; in cik_sdma_gfx_resume()
387 rb_bufsz = order_base_2(ring->ring_size / 4); in cik_sdma_gfx_resume()
400 upper_32_bits(rdev->wb.gpu_addr + wb_offset) & 0xFFFFFFFF); in cik_sdma_gfx_resume()
402 ((rdev->wb.gpu_addr + wb_offset) & 0xFFFFFFFC)); in cik_sdma_gfx_resume()
404 if (rdev->wb.enabled) in cik_sdma_gfx_resume()
407 WREG32(SDMA0_GFX_RB_BASE + reg_offset, ring->gpu_addr >> 8); in cik_sdma_gfx_resume()
408 WREG32(SDMA0_GFX_RB_BASE_HI + reg_offset, ring->gpu_addr >> 40); in cik_sdma_gfx_resume()
410 ring->wptr = 0; in cik_sdma_gfx_resume()
411 WREG32(SDMA0_GFX_RB_WPTR + reg_offset, ring->wptr << 2); in cik_sdma_gfx_resume()
423 ring->ready = true; in cik_sdma_gfx_resume()
425 r = radeon_ring_test(rdev, ring->idx, ring); in cik_sdma_gfx_resume()
427 ring->ready = false; in cik_sdma_gfx_resume()
432 if ((rdev->asic->copy.copy_ring_index == R600_RING_TYPE_DMA_INDEX) || in cik_sdma_gfx_resume()
433 (rdev->asic->copy.copy_ring_index == CAYMAN_RING_TYPE_DMA1_INDEX)) in cik_sdma_gfx_resume()
434 radeon_ttm_set_active_vram_size(rdev, rdev->mc.real_vram_size); in cik_sdma_gfx_resume()
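Two encodings show up in the resume path: the RB size field wants log2 of the ring size in dwords (what order_base_2() computes), and the ring base registers take the GPU address shifted right by 8 and 40, i.e. a 256-byte-aligned base split into low and high halves. Standalone equivalents; order_base_2() is a real kernel helper, reimplemented here only for illustration:

    #include <stdint.h>

    /* ceil(log2(n)) for n >= 1, like the kernel's order_base_2() */
    static unsigned order_base_2(uint32_t n)
    {
        unsigned o = 0;
        while ((1u << o) < n)
            o++;
        return o;
    }

    /* ring_size is in bytes; the RB_CNTL field wants log2(size in dwords) */
    static unsigned rb_bufsz_field(uint32_t ring_size_bytes)
    {
        return order_base_2(ring_size_bytes / 4);
    }

    /* RB_BASE / RB_BASE_HI split of a 256-byte-aligned GPU address */
    static void split_rb_base(uint64_t gpu_addr, uint32_t *base, uint32_t *base_hi)
    {
        *base    = (uint32_t)(gpu_addr >> 8);
        *base_hi = (uint32_t)(gpu_addr >> 40);
    }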
440 * cik_sdma_rlc_resume - setup and start the async dma engines
454 * cik_sdma_load_microcode - load the sDMA ME ucode
459 * Returns 0 for success, -EINVAL if the ucode is not available.
465 if (!rdev->sdma_fw) in cik_sdma_load_microcode()
466 return -EINVAL; in cik_sdma_load_microcode()
471 if (rdev->new_fw) { in cik_sdma_load_microcode()
473 (const struct sdma_firmware_header_v1_0 *)rdev->sdma_fw->data; in cik_sdma_load_microcode()
477 radeon_ucode_print_sdma_hdr(&hdr->header); in cik_sdma_load_microcode()
481 (rdev->sdma_fw->data + le32_to_cpu(hdr->header.ucode_array_offset_bytes)); in cik_sdma_load_microcode()
482 fw_size = le32_to_cpu(hdr->header.ucode_size_bytes) / 4; in cik_sdma_load_microcode()
490 (rdev->sdma_fw->data + le32_to_cpu(hdr->header.ucode_array_offset_bytes)); in cik_sdma_load_microcode()
491 fw_size = le32_to_cpu(hdr->header.ucode_size_bytes) / 4; in cik_sdma_load_microcode()
500 fw_data = (const __be32 *)rdev->sdma_fw->data; in cik_sdma_load_microcode()
507 fw_data = (const __be32 *)rdev->sdma_fw->data; in cik_sdma_load_microcode()
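The two branches handle two firmware layouts: the new format carries a header giving the payload's byte offset and size (both little-endian), while the legacy format is a raw big-endian dword array. A hedged sketch of the new-format walk; the struct below only mirrors the two fields used here and is not the real sdma_firmware_header_v1_0 layout:

    #include <stddef.h>
    #include <stdint.h>

    /* simplified stand-in for the real firmware header */
    struct fw_header {
        uint32_t ucode_size_bytes;          /* payload size, little-endian */
        uint32_t ucode_array_offset_bytes;  /* payload offset, little-endian */
    };

    static uint32_t le32(uint32_t v) { return v; }  /* assumes an LE host */

    static const uint32_t *fw_payload(const uint8_t *blob, size_t *n_dwords)
    {
        const struct fw_header *hdr = (const struct fw_header *)blob;
        *n_dwords = le32(hdr->ucode_size_bytes) / 4;
        return (const uint32_t *)(blob + le32(hdr->ucode_array_offset_bytes));
    }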
520 * cik_sdma_resume - setup and start the async dma engines
550 * cik_sdma_fini - tear down the async dma engines
560 radeon_ring_fini(rdev, &rdev->ring[R600_RING_TYPE_DMA_INDEX]); in cik_sdma_fini()
561 radeon_ring_fini(rdev, &rdev->ring[CAYMAN_RING_TYPE_DMA1_INDEX]); in cik_sdma_fini()
562 /* XXX - compute dma queue tear down */ in cik_sdma_fini()
566 * cik_copy_dma - copy pages using the DMA engine
572 * @resv: reservation object to sync to
584 struct radeon_sync sync; in cik_copy_dma() local
585 int ring_index = rdev->asic->copy.dma_ring_index; in cik_copy_dma()
586 struct radeon_ring *ring = &rdev->ring[ring_index]; in cik_copy_dma()
591 radeon_sync_create(&sync); in cik_copy_dma()
598 radeon_sync_free(rdev, &sync, NULL); in cik_copy_dma()
602 radeon_sync_resv(rdev, &sync, resv, false); in cik_copy_dma()
603 radeon_sync_rings(rdev, &sync, ring->idx); in cik_copy_dma()
609 size_in_bytes -= cur_size_in_bytes; in cik_copy_dma()
621 r = radeon_fence_emit(rdev, &fence, ring->idx); in cik_copy_dma()
624 radeon_sync_free(rdev, &sync, NULL); in cik_copy_dma()
629 radeon_sync_free(rdev, &sync, fence); in cik_copy_dma()
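Around the sync-object bookkeeping (create, sync to the reservation object, sync rings, free with the resulting fence), the copy itself is split into chunks because one SDMA copy packet moves at most 0x1fffff bytes; the ring is locked up front for `num_loops` packets. The chunking arithmetic, standalone, with a callback standing in for the packet build:

    #include <stdint.h>

    #define SDMA_MAX_COPY 0x1fffffu    /* max bytes per copy packet */

    /* hypothetical per-chunk emit hook standing in for the ring writes */
    typedef void (*emit_copy_fn)(uint64_t src, uint64_t dst, uint32_t bytes);

    static unsigned copy_in_chunks(uint64_t src, uint64_t dst,
                                   uint64_t size, emit_copy_fn emit)
    {
        unsigned loops = 0;
        while (size) {
            uint32_t cur = size > SDMA_MAX_COPY ? SDMA_MAX_COPY : (uint32_t)size;
            emit(src, dst, cur);
            src  += cur;
            dst  += cur;
            size -= cur;
            loops++;
        }
        return loops;   /* matches DIV_ROUND_UP(size, 0x1fffff) */
    }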
635 * cik_sdma_ring_test - simple async dma engine test
653 if (ring->idx == R600_RING_TYPE_DMA_INDEX) in cik_sdma_ring_test()
658 gpu_addr = rdev->wb.gpu_addr + index; in cik_sdma_ring_test()
661 rdev->wb.wb[index/4] = cpu_to_le32(tmp); in cik_sdma_ring_test()
665 DRM_ERROR("radeon: dma failed to lock ring %d (%d).\n", ring->idx, r); in cik_sdma_ring_test()
675 for (i = 0; i < rdev->usec_timeout; i++) { in cik_sdma_ring_test()
676 tmp = le32_to_cpu(rdev->wb.wb[index/4]); in cik_sdma_ring_test()
682 if (i < rdev->usec_timeout) { in cik_sdma_ring_test()
683 DRM_INFO("ring test on %d succeeded in %d usecs\n", ring->idx, i); in cik_sdma_ring_test()
686 ring->idx, tmp); in cik_sdma_ring_test()
687 r = -EINVAL; in cik_sdma_ring_test()
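The test seeds a writeback slot with a known value, emits a packet that stores 0xDEADBEEF there, and polls with a microsecond-granular timeout. The poll shape, standalone (the real loop delays roughly 1us per iteration; the delay is omitted here):

    #include <stdint.h>

    /* poll a CPU-visible slot the engine is expected to overwrite;
     * returns the iteration it succeeded on, or -1 on timeout */
    static int poll_slot(const volatile uint32_t *slot,
                         uint32_t expect, int usec_timeout)
    {
        for (int i = 0; i < usec_timeout; i++) {
            if (*slot == expect)    /* le32_to_cpu() omitted; LE host assumed */
                return i;
        }
        return -1;
    }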
693 * cik_sdma_ib_test - test an IB on the DMA engine
710 if (ring->idx == R600_RING_TYPE_DMA_INDEX) in cik_sdma_ib_test()
715 gpu_addr = rdev->wb.gpu_addr + index; in cik_sdma_ib_test()
718 rdev->wb.wb[index/4] = cpu_to_le32(tmp); in cik_sdma_ib_test()
720 r = radeon_ib_get(rdev, ring->idx, &ib, NULL, 256); in cik_sdma_ib_test()
746 return -ETIMEDOUT; in cik_sdma_ib_test()
749 for (i = 0; i < rdev->usec_timeout; i++) { in cik_sdma_ib_test()
750 tmp = le32_to_cpu(rdev->wb.wb[index/4]); in cik_sdma_ib_test()
755 if (i < rdev->usec_timeout) { in cik_sdma_ib_test()
756 DRM_INFO("ib test on ring %d succeeded in %u usecs\n", ib.fence->ring, i); in cik_sdma_ib_test()
759 r = -EINVAL; in cik_sdma_ib_test()
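The IB body both tests rely on is the 5-dword SDMA linear WRITE: opcode header, destination low/high, a count of data dwords to follow, then the payload. Sketch of building it into an IB buffer; the header value is a placeholder for the real SDMA_PACKET() encoding:

    #include <stdint.h>

    #define SDMA_WRITE_HDR 0u   /* placeholder for SDMA_PACKET(WRITE, LINEAR, 0) */

    static uint32_t build_write_ib(uint32_t *ib, uint64_t dst, uint32_t value)
    {
        uint32_t n = 0;
        ib[n++] = SDMA_WRITE_HDR;
        ib[n++] = (uint32_t)dst;         /* destination, low 32 bits */
        ib[n++] = (uint32_t)(dst >> 32); /* destination, high 32 bits */
        ib[n++] = 1;                     /* one dword of data follows */
        ib[n++] = value;                 /* e.g. 0xDEADBEEF */
        return n;                        /* length_dw == 5 */
    }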
766 * cik_sdma_is_lockup - Check if the DMA engine is locked up
777 u32 mask; in cik_sdma_is_lockup() local
779 if (ring->idx == R600_RING_TYPE_DMA_INDEX) in cik_sdma_is_lockup()
780 mask = RADEON_RESET_DMA; in cik_sdma_is_lockup()
782 mask = RADEON_RESET_DMA1; in cik_sdma_is_lockup()
784 if (!(reset_mask & mask)) { in cik_sdma_is_lockup()
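Lockup detection picks the reset-mask bit for whichever SDMA instance owns the ring; if the soft-reset status does not flag that engine, the ring is considered alive and its lockup tracker is refreshed instead. The selection logic, standalone (the bit positions below are illustrative, not the real RADEON_RESET_* values):

    #include <stdbool.h>
    #include <stdint.h>

    #define RESET_DMA  (1u << 0)   /* illustrative bit positions */
    #define RESET_DMA1 (1u << 1)

    static bool engine_flagged(uint32_t reset_mask, bool is_first_instance)
    {
        uint32_t mask = is_first_instance ? RESET_DMA : RESET_DMA1;
        return (reset_mask & mask) != 0;   /* false => not locked up */
    }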
792 * cik_sdma_vm_copy_pages - update PTEs by copying them from the GART
798 * @count: number of page entries to update
800 * Update PTEs by copying them from the GART using sDMA (CIK).
812 ib->ptr[ib->length_dw++] = SDMA_PACKET(SDMA_OPCODE_COPY, in cik_sdma_vm_copy_pages()
814 ib->ptr[ib->length_dw++] = bytes; in cik_sdma_vm_copy_pages()
815 ib->ptr[ib->length_dw++] = 0; /* src/dst endian swap */ in cik_sdma_vm_copy_pages()
816 ib->ptr[ib->length_dw++] = lower_32_bits(src); in cik_sdma_vm_copy_pages()
817 ib->ptr[ib->length_dw++] = upper_32_bits(src); in cik_sdma_vm_copy_pages()
818 ib->ptr[ib->length_dw++] = lower_32_bits(pe); in cik_sdma_vm_copy_pages()
819 ib->ptr[ib->length_dw++] = upper_32_bits(pe); in cik_sdma_vm_copy_pages()
823 count -= bytes / 8; in cik_sdma_vm_copy_pages()
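Each COPY packet moves at most 0x1FFFF8 bytes of PTEs (a multiple of the 8-byte entry size), so the entry count is consumed in `bytes / 8` steps while the page-table address and GART source advance by `bytes`. The loop skeleton, standalone:

    #include <stdint.h>

    #define MAX_PTE_COPY_BYTES 0x1FFFF8u   /* per-packet limit, 8-byte multiple */

    static void copy_ptes(uint64_t pe, uint64_t src, unsigned count)
    {
        while (count) {
            uint32_t bytes = count * 8;
            if (bytes > MAX_PTE_COPY_BYTES)
                bytes = MAX_PTE_COPY_BYTES;
            /* ...emit one SDMA COPY packet for (src -> pe, bytes)... */
            pe    += bytes;
            src   += bytes;
            count -= bytes / 8;
        }
    }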
828 * cik_sdma_vm_write_pages - update PTEs by writing them manually
834 * @count: number of page entries to update
838 * Update PTEs by writing them manually using sDMA (CIK).
854 /* for non-physically contiguous pages (system) */ in cik_sdma_vm_write_pages()
855 ib->ptr[ib->length_dw++] = SDMA_PACKET(SDMA_OPCODE_WRITE, in cik_sdma_vm_write_pages()
857 ib->ptr[ib->length_dw++] = pe; in cik_sdma_vm_write_pages()
858 ib->ptr[ib->length_dw++] = upper_32_bits(pe); in cik_sdma_vm_write_pages()
859 ib->ptr[ib->length_dw++] = ndw; in cik_sdma_vm_write_pages()
860 for (; ndw > 0; ndw -= 2, --count, pe += 8) { in cik_sdma_vm_write_pages()
870 ib->ptr[ib->length_dw++] = value; in cik_sdma_vm_write_pages()
871 ib->ptr[ib->length_dw++] = upper_32_bits(value); in cik_sdma_vm_write_pages()
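Inside the loop each 64-bit PTE is the page address (GART-translated for system pages, used as-is for VRAM) OR'd with the flag bits, then emitted as two dwords. A sketch of the value assembly; radeon_vm_map_gart() is the real translation hook, modeled here as a callback, and the flag values are illustrative:

    #include <stdint.h>

    #define PTE_VALID  (1u << 0)   /* illustrative flag bits */
    #define PTE_SYSTEM (1u << 1)

    typedef uint64_t (*map_gart_fn)(uint64_t addr);  /* stand-in for radeon_vm_map_gart() */

    static uint64_t make_pte(uint64_t addr, uint32_t flags, map_gart_fn map_gart)
    {
        uint64_t value;
        if (flags & PTE_SYSTEM)
            value = map_gart(addr);     /* system page: translate via GART */
        else if (flags & PTE_VALID)
            value = addr;               /* VRAM page: address as-is */
        else
            value = 0;                  /* invalid entry */
        return value | flags;           /* low bits carry the flags */
    }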
877 * cik_sdma_vm_set_pages - update the page tables using sDMA
883 * @count: number of page entries to update
887 * Update the page tables using sDMA (CIK).
909 ib->ptr[ib->length_dw++] = SDMA_PACKET(SDMA_OPCODE_GENERATE_PTE_PDE, 0, 0); in cik_sdma_vm_set_pages()
910 ib->ptr[ib->length_dw++] = pe; /* dst addr */ in cik_sdma_vm_set_pages()
911 ib->ptr[ib->length_dw++] = upper_32_bits(pe); in cik_sdma_vm_set_pages()
912 ib->ptr[ib->length_dw++] = flags; /* mask */ in cik_sdma_vm_set_pages()
913 ib->ptr[ib->length_dw++] = 0; in cik_sdma_vm_set_pages()
914 ib->ptr[ib->length_dw++] = value; /* value */ in cik_sdma_vm_set_pages()
915 ib->ptr[ib->length_dw++] = upper_32_bits(value); in cik_sdma_vm_set_pages()
916 ib->ptr[ib->length_dw++] = incr; /* increment size */ in cik_sdma_vm_set_pages()
917 ib->ptr[ib->length_dw++] = 0; in cik_sdma_vm_set_pages()
918 ib->ptr[ib->length_dw++] = ndw; /* number of entries */ in cik_sdma_vm_set_pages()
922 count -= ndw; in cik_sdma_vm_set_pages()
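GENERATE_PTE_PDE lets the engine synthesize up to 0x7FFFF consecutive entries from one packet: a destination, a flags mask, a start value, a per-entry increment, and a count. Roughly, the hardware expands it like this CPU model (my reading of the packet fields above, not documented hardware behavior):

    #include <stdint.h>

    /* CPU model of one GENERATE_PTE_PDE packet: writes ndw entries where
     * entry k = (value + k * incr) combined with the flag mask */
    static void generate_ptes(uint64_t *pe, uint64_t value, uint64_t flags,
                              uint32_t incr, uint32_t ndw)
    {
        for (uint32_t k = 0; k < ndw; k++)
            pe[k] = (value + (uint64_t)k * incr) | flags;
    }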
927 * cik_sdma_vm_pad_ib - pad the IB to the required number of dw
934 while (ib->length_dw & 0x7) in cik_sdma_vm_pad_ib()
935 ib->ptr[ib->length_dw++] = SDMA_PACKET(SDMA_OPCODE_NOP, 0, 0); in cik_sdma_vm_pad_ib()
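Same 8-dword rule as the ring: VM update IBs are padded with NOPs until their length is a multiple of 8. Standalone, with the NOP value as a placeholder for the real encoding:

    #include <stdint.h>

    #define SDMA_NOP 0u   /* placeholder for SDMA_PACKET(NOP, 0, 0) */

    static uint32_t pad_ib(uint32_t *ib, uint32_t length_dw)
    {
        while (length_dw & 0x7)
            ib[length_dw++] = SDMA_NOP;
        return length_dw;   /* now a multiple of 8 */
    }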
939 * cik_dma_vm_flush - cik vm flush using sDMA
941 * Update the page table base and flush the VM TLB
954 radeon_ring_write(ring, (VM_CONTEXT8_PAGE_TABLE_BASE_ADDR + ((vm_id - 8) << 2)) >> 2); in cik_dma_vm_flush()
958 /* update SH_MEM_* regs */ in cik_dma_vm_flush()
984 cik_sdma_hdp_flush_ring_emit(rdev, ring->idx); in cik_dma_vm_flush()
995 radeon_ring_write(ring, 0); /* mask */ in cik_dma_vm_flush()
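VM contexts 0-7 and 8-15 live in two separate register banks, so the page-table base register is selected by vm_id at one dword per context; the trailing POLL_REG_MEM with reference and mask both zero always passes its compare, so it appears to act as a read-back that orders the invalidate write. Sketch of the register selection; the base offsets below are placeholders, not the real VM_CONTEXT*_PAGE_TABLE_BASE_ADDR values:

    #include <stdint.h>

    #define VM_CTX0_PT_BASE 0x1000u   /* placeholder register offsets */
    #define VM_CTX8_PT_BASE 0x2000u

    /* byte address of the page-table base register for a given VM id;
     * the SRBM_WRITE packet then takes this shifted right by 2 */
    static uint32_t pt_base_reg(unsigned vm_id)
    {
        if (vm_id < 8)
            return VM_CTX0_PT_BASE + (vm_id << 2);
        return VM_CTX8_PT_BASE + ((vm_id - 8) << 2);
    }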