11da177e4SLinus Torvalds /* $Id: io-unit.c,v 1.24 2001/12/17 07:05:09 davem Exp $ 21da177e4SLinus Torvalds * io-unit.c: IO-UNIT specific routines for memory management. 31da177e4SLinus Torvalds * 41da177e4SLinus Torvalds * Copyright (C) 1997,1998 Jakub Jelinek (jj@sunsite.mff.cuni.cz) 51da177e4SLinus Torvalds */ 61da177e4SLinus Torvalds 71da177e4SLinus Torvalds #include <linux/kernel.h> 81da177e4SLinus Torvalds #include <linux/init.h> 91da177e4SLinus Torvalds #include <linux/slab.h> 101da177e4SLinus Torvalds #include <linux/spinlock.h> 111da177e4SLinus Torvalds #include <linux/mm.h> 121da177e4SLinus Torvalds #include <linux/highmem.h> /* pte_offset_map => kmap_atomic */ 131da177e4SLinus Torvalds #include <linux/bitops.h> 141da177e4SLinus Torvalds 151da177e4SLinus Torvalds #include <asm/scatterlist.h> 161da177e4SLinus Torvalds #include <asm/pgalloc.h> 171da177e4SLinus Torvalds #include <asm/pgtable.h> 181da177e4SLinus Torvalds #include <asm/sbus.h> 191da177e4SLinus Torvalds #include <asm/io.h> 201da177e4SLinus Torvalds #include <asm/io-unit.h> 211da177e4SLinus Torvalds #include <asm/mxcc.h> 221da177e4SLinus Torvalds #include <asm/cacheflush.h> 231da177e4SLinus Torvalds #include <asm/tlbflush.h> 241da177e4SLinus Torvalds #include <asm/dma.h> 25d4accd60SDavid S. Miller #include <asm/oplib.h> 261da177e4SLinus Torvalds 271da177e4SLinus Torvalds /* #define IOUNIT_DEBUG */ 281da177e4SLinus Torvalds #ifdef IOUNIT_DEBUG 291da177e4SLinus Torvalds #define IOD(x) printk(x) 301da177e4SLinus Torvalds #else 311da177e4SLinus Torvalds #define IOD(x) do { } while (0) 321da177e4SLinus Torvalds #endif 331da177e4SLinus Torvalds 341da177e4SLinus Torvalds #define IOPERM (IOUPTE_CACHE | IOUPTE_WRITE | IOUPTE_VALID) 351da177e4SLinus Torvalds #define MKIOPTE(phys) __iopte((((phys)>>4) & IOUPTE_PAGE) | IOPERM) 361da177e4SLinus Torvalds 371da177e4SLinus Torvalds void __init 381da177e4SLinus Torvalds iounit_init(int sbi_node, int io_node, struct sbus_bus *sbus) 391da177e4SLinus Torvalds { 401da177e4SLinus Torvalds iopte_t *xpt, *xptend; 411da177e4SLinus Torvalds struct iounit_struct *iounit; 421da177e4SLinus Torvalds struct linux_prom_registers iommu_promregs[PROMREG_MAX]; 431da177e4SLinus Torvalds struct resource r; 441da177e4SLinus Torvalds 45c80892d1SYan Burman iounit = kzalloc(sizeof(struct iounit_struct), GFP_ATOMIC); 46d4accd60SDavid S. Miller if (!iounit) { 47d4accd60SDavid S. Miller prom_printf("SUN4D: Cannot alloc iounit, halting.\n"); 48d4accd60SDavid S. Miller prom_halt(); 49d4accd60SDavid S. Miller } 501da177e4SLinus Torvalds 511da177e4SLinus Torvalds iounit->limit[0] = IOUNIT_BMAP1_START; 521da177e4SLinus Torvalds iounit->limit[1] = IOUNIT_BMAP2_START; 531da177e4SLinus Torvalds iounit->limit[2] = IOUNIT_BMAPM_START; 541da177e4SLinus Torvalds iounit->limit[3] = IOUNIT_BMAPM_END; 551da177e4SLinus Torvalds iounit->rotor[1] = IOUNIT_BMAP2_START; 561da177e4SLinus Torvalds iounit->rotor[2] = IOUNIT_BMAPM_START; 571da177e4SLinus Torvalds 581da177e4SLinus Torvalds xpt = NULL; 591da177e4SLinus Torvalds if(prom_getproperty(sbi_node, "reg", (void *) iommu_promregs, 601da177e4SLinus Torvalds sizeof(iommu_promregs)) != -1) { 611da177e4SLinus Torvalds prom_apply_generic_ranges(io_node, 0, iommu_promregs, 3); 621da177e4SLinus Torvalds memset(&r, 0, sizeof(r)); 631da177e4SLinus Torvalds r.flags = iommu_promregs[2].which_io; 641da177e4SLinus Torvalds r.start = iommu_promregs[2].phys_addr; 651da177e4SLinus Torvalds xpt = (iopte_t *) sbus_ioremap(&r, 0, PAGE_SIZE * 16, "XPT"); 661da177e4SLinus Torvalds } 671da177e4SLinus Torvalds if(!xpt) panic("Cannot map External Page Table."); 681da177e4SLinus Torvalds 691da177e4SLinus Torvalds sbus->iommu = (struct iommu_struct *)iounit; 701da177e4SLinus Torvalds iounit->page_table = xpt; 712f72ba43SRaymond Burns spin_lock_init(&iounit->lock); 721da177e4SLinus Torvalds 731da177e4SLinus Torvalds for (xptend = iounit->page_table + (16 * PAGE_SIZE) / sizeof(iopte_t); 741da177e4SLinus Torvalds xpt < xptend;) 751da177e4SLinus Torvalds iopte_val(*xpt++) = 0; 761da177e4SLinus Torvalds } 771da177e4SLinus Torvalds 781da177e4SLinus Torvalds /* One has to hold iounit->lock to call this */ 791da177e4SLinus Torvalds static unsigned long iounit_get_area(struct iounit_struct *iounit, unsigned long vaddr, int size) 801da177e4SLinus Torvalds { 811da177e4SLinus Torvalds int i, j, k, npages; 821da177e4SLinus Torvalds unsigned long rotor, scan, limit; 831da177e4SLinus Torvalds iopte_t iopte; 841da177e4SLinus Torvalds 851da177e4SLinus Torvalds npages = ((vaddr & ~PAGE_MASK) + size + (PAGE_SIZE-1)) >> PAGE_SHIFT; 861da177e4SLinus Torvalds 871da177e4SLinus Torvalds /* A tiny bit of magic ingredience :) */ 881da177e4SLinus Torvalds switch (npages) { 891da177e4SLinus Torvalds case 1: i = 0x0231; break; 901da177e4SLinus Torvalds case 2: i = 0x0132; break; 911da177e4SLinus Torvalds default: i = 0x0213; break; 921da177e4SLinus Torvalds } 931da177e4SLinus Torvalds 941da177e4SLinus Torvalds IOD(("iounit_get_area(%08lx,%d[%d])=", vaddr, size, npages)); 951da177e4SLinus Torvalds 961da177e4SLinus Torvalds next: j = (i & 15); 971da177e4SLinus Torvalds rotor = iounit->rotor[j - 1]; 981da177e4SLinus Torvalds limit = iounit->limit[j]; 991da177e4SLinus Torvalds scan = rotor; 1001da177e4SLinus Torvalds nexti: scan = find_next_zero_bit(iounit->bmap, limit, scan); 1011da177e4SLinus Torvalds if (scan + npages > limit) { 1021da177e4SLinus Torvalds if (limit != rotor) { 1031da177e4SLinus Torvalds limit = rotor; 1041da177e4SLinus Torvalds scan = iounit->limit[j - 1]; 1051da177e4SLinus Torvalds goto nexti; 1061da177e4SLinus Torvalds } 1071da177e4SLinus Torvalds i >>= 4; 1081da177e4SLinus Torvalds if (!(i & 15)) 1091da177e4SLinus Torvalds panic("iounit_get_area: Couldn't find free iopte slots for (%08lx,%d)\n", vaddr, size); 1101da177e4SLinus Torvalds goto next; 1111da177e4SLinus Torvalds } 1121da177e4SLinus Torvalds for (k = 1, scan++; k < npages; k++) 1131da177e4SLinus Torvalds if (test_bit(scan++, iounit->bmap)) 1141da177e4SLinus Torvalds goto nexti; 1151da177e4SLinus Torvalds iounit->rotor[j - 1] = (scan < limit) ? scan : iounit->limit[j - 1]; 1161da177e4SLinus Torvalds scan -= npages; 1171da177e4SLinus Torvalds iopte = MKIOPTE(__pa(vaddr & PAGE_MASK)); 1181da177e4SLinus Torvalds vaddr = IOUNIT_DMA_BASE + (scan << PAGE_SHIFT) + (vaddr & ~PAGE_MASK); 1191da177e4SLinus Torvalds for (k = 0; k < npages; k++, iopte = __iopte(iopte_val(iopte) + 0x100), scan++) { 1201da177e4SLinus Torvalds set_bit(scan, iounit->bmap); 1211da177e4SLinus Torvalds iounit->page_table[scan] = iopte; 1221da177e4SLinus Torvalds } 1231da177e4SLinus Torvalds IOD(("%08lx\n", vaddr)); 1241da177e4SLinus Torvalds return vaddr; 1251da177e4SLinus Torvalds } 1261da177e4SLinus Torvalds 1271da177e4SLinus Torvalds static __u32 iounit_get_scsi_one(char *vaddr, unsigned long len, struct sbus_bus *sbus) 1281da177e4SLinus Torvalds { 1291da177e4SLinus Torvalds unsigned long ret, flags; 1301da177e4SLinus Torvalds struct iounit_struct *iounit = (struct iounit_struct *)sbus->iommu; 1311da177e4SLinus Torvalds 1321da177e4SLinus Torvalds spin_lock_irqsave(&iounit->lock, flags); 1331da177e4SLinus Torvalds ret = iounit_get_area(iounit, (unsigned long)vaddr, len); 1341da177e4SLinus Torvalds spin_unlock_irqrestore(&iounit->lock, flags); 1351da177e4SLinus Torvalds return ret; 1361da177e4SLinus Torvalds } 1371da177e4SLinus Torvalds 1381da177e4SLinus Torvalds static void iounit_get_scsi_sgl(struct scatterlist *sg, int sz, struct sbus_bus *sbus) 1391da177e4SLinus Torvalds { 1401da177e4SLinus Torvalds unsigned long flags; 1411da177e4SLinus Torvalds struct iounit_struct *iounit = (struct iounit_struct *)sbus->iommu; 1421da177e4SLinus Torvalds 1431da177e4SLinus Torvalds /* FIXME: Cache some resolved pages - often several sg entries are to the same page */ 1441da177e4SLinus Torvalds spin_lock_irqsave(&iounit->lock, flags); 1451da177e4SLinus Torvalds while (sz != 0) { 1461da177e4SLinus Torvalds --sz; 1471da177e4SLinus Torvalds sg[sz].dvma_address = iounit_get_area(iounit, (unsigned long)page_address(sg[sz].page) + sg[sz].offset, sg[sz].length); 1481da177e4SLinus Torvalds sg[sz].dvma_length = sg[sz].length; 1491da177e4SLinus Torvalds } 1501da177e4SLinus Torvalds spin_unlock_irqrestore(&iounit->lock, flags); 1511da177e4SLinus Torvalds } 1521da177e4SLinus Torvalds 1531da177e4SLinus Torvalds static void iounit_release_scsi_one(__u32 vaddr, unsigned long len, struct sbus_bus *sbus) 1541da177e4SLinus Torvalds { 1551da177e4SLinus Torvalds unsigned long flags; 1561da177e4SLinus Torvalds struct iounit_struct *iounit = (struct iounit_struct *)sbus->iommu; 1571da177e4SLinus Torvalds 1581da177e4SLinus Torvalds spin_lock_irqsave(&iounit->lock, flags); 1591da177e4SLinus Torvalds len = ((vaddr & ~PAGE_MASK) + len + (PAGE_SIZE-1)) >> PAGE_SHIFT; 1601da177e4SLinus Torvalds vaddr = (vaddr - IOUNIT_DMA_BASE) >> PAGE_SHIFT; 1611da177e4SLinus Torvalds IOD(("iounit_release %08lx-%08lx\n", (long)vaddr, (long)len+vaddr)); 1621da177e4SLinus Torvalds for (len += vaddr; vaddr < len; vaddr++) 1631da177e4SLinus Torvalds clear_bit(vaddr, iounit->bmap); 1641da177e4SLinus Torvalds spin_unlock_irqrestore(&iounit->lock, flags); 1651da177e4SLinus Torvalds } 1661da177e4SLinus Torvalds 1671da177e4SLinus Torvalds static void iounit_release_scsi_sgl(struct scatterlist *sg, int sz, struct sbus_bus *sbus) 1681da177e4SLinus Torvalds { 1691da177e4SLinus Torvalds unsigned long flags; 1701da177e4SLinus Torvalds unsigned long vaddr, len; 1711da177e4SLinus Torvalds struct iounit_struct *iounit = (struct iounit_struct *)sbus->iommu; 1721da177e4SLinus Torvalds 1731da177e4SLinus Torvalds spin_lock_irqsave(&iounit->lock, flags); 1741da177e4SLinus Torvalds while (sz != 0) { 1751da177e4SLinus Torvalds --sz; 1761da177e4SLinus Torvalds len = ((sg[sz].dvma_address & ~PAGE_MASK) + sg[sz].length + (PAGE_SIZE-1)) >> PAGE_SHIFT; 1771da177e4SLinus Torvalds vaddr = (sg[sz].dvma_address - IOUNIT_DMA_BASE) >> PAGE_SHIFT; 1781da177e4SLinus Torvalds IOD(("iounit_release %08lx-%08lx\n", (long)vaddr, (long)len+vaddr)); 1791da177e4SLinus Torvalds for (len += vaddr; vaddr < len; vaddr++) 1801da177e4SLinus Torvalds clear_bit(vaddr, iounit->bmap); 1811da177e4SLinus Torvalds } 1821da177e4SLinus Torvalds spin_unlock_irqrestore(&iounit->lock, flags); 1831da177e4SLinus Torvalds } 1841da177e4SLinus Torvalds 1851da177e4SLinus Torvalds #ifdef CONFIG_SBUS 1861da177e4SLinus Torvalds static int iounit_map_dma_area(dma_addr_t *pba, unsigned long va, __u32 addr, int len) 1871da177e4SLinus Torvalds { 1881da177e4SLinus Torvalds unsigned long page, end; 1891da177e4SLinus Torvalds pgprot_t dvma_prot; 1901da177e4SLinus Torvalds iopte_t *iopte; 1911da177e4SLinus Torvalds struct sbus_bus *sbus; 1921da177e4SLinus Torvalds 1931da177e4SLinus Torvalds *pba = addr; 1941da177e4SLinus Torvalds 1951da177e4SLinus Torvalds dvma_prot = __pgprot(SRMMU_CACHE | SRMMU_ET_PTE | SRMMU_PRIV); 1961da177e4SLinus Torvalds end = PAGE_ALIGN((addr + len)); 1971da177e4SLinus Torvalds while(addr < end) { 1981da177e4SLinus Torvalds page = va; 1991da177e4SLinus Torvalds { 2001da177e4SLinus Torvalds pgd_t *pgdp; 2011da177e4SLinus Torvalds pmd_t *pmdp; 2021da177e4SLinus Torvalds pte_t *ptep; 2031da177e4SLinus Torvalds long i; 2041da177e4SLinus Torvalds 2051da177e4SLinus Torvalds pgdp = pgd_offset(&init_mm, addr); 2061da177e4SLinus Torvalds pmdp = pmd_offset(pgdp, addr); 2071da177e4SLinus Torvalds ptep = pte_offset_map(pmdp, addr); 2081da177e4SLinus Torvalds 2091da177e4SLinus Torvalds set_pte(ptep, mk_pte(virt_to_page(page), dvma_prot)); 2101da177e4SLinus Torvalds 2111da177e4SLinus Torvalds i = ((addr - IOUNIT_DMA_BASE) >> PAGE_SHIFT); 2121da177e4SLinus Torvalds 2131da177e4SLinus Torvalds for_each_sbus(sbus) { 2141da177e4SLinus Torvalds struct iounit_struct *iounit = (struct iounit_struct *)sbus->iommu; 2151da177e4SLinus Torvalds 2161da177e4SLinus Torvalds iopte = (iopte_t *)(iounit->page_table + i); 2171da177e4SLinus Torvalds *iopte = MKIOPTE(__pa(page)); 2181da177e4SLinus Torvalds } 2191da177e4SLinus Torvalds } 2201da177e4SLinus Torvalds addr += PAGE_SIZE; 2211da177e4SLinus Torvalds va += PAGE_SIZE; 2221da177e4SLinus Torvalds } 2231da177e4SLinus Torvalds flush_cache_all(); 2241da177e4SLinus Torvalds flush_tlb_all(); 2251da177e4SLinus Torvalds 2261da177e4SLinus Torvalds return 0; 2271da177e4SLinus Torvalds } 2281da177e4SLinus Torvalds 2291da177e4SLinus Torvalds static void iounit_unmap_dma_area(unsigned long addr, int len) 2301da177e4SLinus Torvalds { 2311da177e4SLinus Torvalds /* XXX Somebody please fill this in */ 2321da177e4SLinus Torvalds } 2331da177e4SLinus Torvalds 2341da177e4SLinus Torvalds /* XXX We do not pass sbus device here, bad. */ 2351da177e4SLinus Torvalds static struct page *iounit_translate_dvma(unsigned long addr) 2361da177e4SLinus Torvalds { 2371da177e4SLinus Torvalds struct sbus_bus *sbus = sbus_root; /* They are all the same */ 2381da177e4SLinus Torvalds struct iounit_struct *iounit = (struct iounit_struct *)sbus->iommu; 2391da177e4SLinus Torvalds int i; 2401da177e4SLinus Torvalds iopte_t *iopte; 2411da177e4SLinus Torvalds 2421da177e4SLinus Torvalds i = ((addr - IOUNIT_DMA_BASE) >> PAGE_SHIFT); 2431da177e4SLinus Torvalds iopte = (iopte_t *)(iounit->page_table + i); 2441da177e4SLinus Torvalds return pfn_to_page(iopte_val(*iopte) >> (PAGE_SHIFT-4)); /* XXX sun4d guru, help */ 2451da177e4SLinus Torvalds } 2461da177e4SLinus Torvalds #endif 2471da177e4SLinus Torvalds 2481da177e4SLinus Torvalds static char *iounit_lockarea(char *vaddr, unsigned long len) 2491da177e4SLinus Torvalds { 2501da177e4SLinus Torvalds /* FIXME: Write this */ 2511da177e4SLinus Torvalds return vaddr; 2521da177e4SLinus Torvalds } 2531da177e4SLinus Torvalds 2541da177e4SLinus Torvalds static void iounit_unlockarea(char *vaddr, unsigned long len) 2551da177e4SLinus Torvalds { 2561da177e4SLinus Torvalds /* FIXME: Write this */ 2571da177e4SLinus Torvalds } 2581da177e4SLinus Torvalds 2591da177e4SLinus Torvalds void __init ld_mmu_iounit(void) 2601da177e4SLinus Torvalds { 2611da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_lockarea, iounit_lockarea, BTFIXUPCALL_RETO0); 2621da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_unlockarea, iounit_unlockarea, BTFIXUPCALL_NOP); 2631da177e4SLinus Torvalds 2641da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_get_scsi_one, iounit_get_scsi_one, BTFIXUPCALL_NORM); 2651da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_get_scsi_sgl, iounit_get_scsi_sgl, BTFIXUPCALL_NORM); 2661da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_release_scsi_one, iounit_release_scsi_one, BTFIXUPCALL_NORM); 2671da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_release_scsi_sgl, iounit_release_scsi_sgl, BTFIXUPCALL_NORM); 2681da177e4SLinus Torvalds 2691da177e4SLinus Torvalds #ifdef CONFIG_SBUS 2701da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_map_dma_area, iounit_map_dma_area, BTFIXUPCALL_NORM); 2711da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_unmap_dma_area, iounit_unmap_dma_area, BTFIXUPCALL_NORM); 2721da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_translate_dvma, iounit_translate_dvma, BTFIXUPCALL_NORM); 2731da177e4SLinus Torvalds #endif 2741da177e4SLinus Torvalds } 2751da177e4SLinus Torvalds 2761da177e4SLinus Torvalds __u32 iounit_map_dma_init(struct sbus_bus *sbus, int size) 2771da177e4SLinus Torvalds { 2781da177e4SLinus Torvalds int i, j, k, npages; 2791da177e4SLinus Torvalds unsigned long rotor, scan, limit; 2801da177e4SLinus Torvalds unsigned long flags; 2811da177e4SLinus Torvalds __u32 ret; 2821da177e4SLinus Torvalds struct iounit_struct *iounit = (struct iounit_struct *)sbus->iommu; 2831da177e4SLinus Torvalds 2841da177e4SLinus Torvalds npages = (size + (PAGE_SIZE-1)) >> PAGE_SHIFT; 2851da177e4SLinus Torvalds i = 0x0213; 2861da177e4SLinus Torvalds spin_lock_irqsave(&iounit->lock, flags); 2871da177e4SLinus Torvalds next: j = (i & 15); 2881da177e4SLinus Torvalds rotor = iounit->rotor[j - 1]; 2891da177e4SLinus Torvalds limit = iounit->limit[j]; 2901da177e4SLinus Torvalds scan = rotor; 2911da177e4SLinus Torvalds nexti: scan = find_next_zero_bit(iounit->bmap, limit, scan); 2921da177e4SLinus Torvalds if (scan + npages > limit) { 2931da177e4SLinus Torvalds if (limit != rotor) { 2941da177e4SLinus Torvalds limit = rotor; 2951da177e4SLinus Torvalds scan = iounit->limit[j - 1]; 2961da177e4SLinus Torvalds goto nexti; 2971da177e4SLinus Torvalds } 2981da177e4SLinus Torvalds i >>= 4; 2991da177e4SLinus Torvalds if (!(i & 15)) 3001da177e4SLinus Torvalds panic("iounit_map_dma_init: Couldn't find free iopte slots for %d bytes\n", size); 3011da177e4SLinus Torvalds goto next; 3021da177e4SLinus Torvalds } 3031da177e4SLinus Torvalds for (k = 1, scan++; k < npages; k++) 3041da177e4SLinus Torvalds if (test_bit(scan++, iounit->bmap)) 3051da177e4SLinus Torvalds goto nexti; 3061da177e4SLinus Torvalds iounit->rotor[j - 1] = (scan < limit) ? scan : iounit->limit[j - 1]; 3071da177e4SLinus Torvalds scan -= npages; 3081da177e4SLinus Torvalds ret = IOUNIT_DMA_BASE + (scan << PAGE_SHIFT); 3091da177e4SLinus Torvalds for (k = 0; k < npages; k++, scan++) 3101da177e4SLinus Torvalds set_bit(scan, iounit->bmap); 3111da177e4SLinus Torvalds spin_unlock_irqrestore(&iounit->lock, flags); 3121da177e4SLinus Torvalds return ret; 3131da177e4SLinus Torvalds } 3141da177e4SLinus Torvalds 3151da177e4SLinus Torvalds __u32 iounit_map_dma_page(__u32 vaddr, void *addr, struct sbus_bus *sbus) 3161da177e4SLinus Torvalds { 3171da177e4SLinus Torvalds int scan = (vaddr - IOUNIT_DMA_BASE) >> PAGE_SHIFT; 3181da177e4SLinus Torvalds struct iounit_struct *iounit = (struct iounit_struct *)sbus->iommu; 3191da177e4SLinus Torvalds 3201da177e4SLinus Torvalds iounit->page_table[scan] = MKIOPTE(__pa(((unsigned long)addr) & PAGE_MASK)); 3211da177e4SLinus Torvalds return vaddr + (((unsigned long)addr) & ~PAGE_MASK); 3221da177e4SLinus Torvalds } 323