188278ca2SAdrian Bunk /* 21da177e4SLinus Torvalds * io-unit.c: IO-UNIT specific routines for memory management. 31da177e4SLinus Torvalds * 41da177e4SLinus Torvalds * Copyright (C) 1997,1998 Jakub Jelinek (jj@sunsite.mff.cuni.cz) 51da177e4SLinus Torvalds */ 61da177e4SLinus Torvalds 71da177e4SLinus Torvalds #include <linux/kernel.h> 81da177e4SLinus Torvalds #include <linux/init.h> 91da177e4SLinus Torvalds #include <linux/slab.h> 101da177e4SLinus Torvalds #include <linux/spinlock.h> 111da177e4SLinus Torvalds #include <linux/mm.h> 121da177e4SLinus Torvalds #include <linux/highmem.h> /* pte_offset_map => kmap_atomic */ 131da177e4SLinus Torvalds #include <linux/bitops.h> 140912a5dbSJens Axboe #include <linux/scatterlist.h> 151da177e4SLinus Torvalds 161da177e4SLinus Torvalds #include <asm/pgalloc.h> 171da177e4SLinus Torvalds #include <asm/pgtable.h> 181da177e4SLinus Torvalds #include <asm/sbus.h> 191da177e4SLinus Torvalds #include <asm/io.h> 201da177e4SLinus Torvalds #include <asm/io-unit.h> 211da177e4SLinus Torvalds #include <asm/mxcc.h> 221da177e4SLinus Torvalds #include <asm/cacheflush.h> 231da177e4SLinus Torvalds #include <asm/tlbflush.h> 241da177e4SLinus Torvalds #include <asm/dma.h> 25d4accd60SDavid S. Miller #include <asm/oplib.h> 261da177e4SLinus Torvalds 271da177e4SLinus Torvalds /* #define IOUNIT_DEBUG */ 281da177e4SLinus Torvalds #ifdef IOUNIT_DEBUG 291da177e4SLinus Torvalds #define IOD(x) printk(x) 301da177e4SLinus Torvalds #else 311da177e4SLinus Torvalds #define IOD(x) do { } while (0) 321da177e4SLinus Torvalds #endif 331da177e4SLinus Torvalds 341da177e4SLinus Torvalds #define IOPERM (IOUPTE_CACHE | IOUPTE_WRITE | IOUPTE_VALID) 351da177e4SLinus Torvalds #define MKIOPTE(phys) __iopte((((phys)>>4) & IOUPTE_PAGE) | IOPERM) 361da177e4SLinus Torvalds 37e0039348SDavid S. Miller void __init iounit_init(struct sbus_bus *sbus) 381da177e4SLinus Torvalds { 39e0039348SDavid S. Miller struct device_node *dp = sbus->ofdev.node; 401da177e4SLinus Torvalds struct iounit_struct *iounit; 41e0039348SDavid S. Miller iopte_t *xpt, *xptend; 42e0039348SDavid S. Miller struct of_device *op; 43e0039348SDavid S. Miller 44e0039348SDavid S. Miller op = of_find_device_by_node(dp); 45e0039348SDavid S. Miller if (!op) { 46e0039348SDavid S. Miller prom_printf("SUN4D: Cannot find SBI of_device.\n"); 47e0039348SDavid S. Miller prom_halt(); 48e0039348SDavid S. Miller } 491da177e4SLinus Torvalds 50c80892d1SYan Burman iounit = kzalloc(sizeof(struct iounit_struct), GFP_ATOMIC); 51d4accd60SDavid S. Miller if (!iounit) { 52d4accd60SDavid S. Miller prom_printf("SUN4D: Cannot alloc iounit, halting.\n"); 53d4accd60SDavid S. Miller prom_halt(); 54d4accd60SDavid S. Miller } 551da177e4SLinus Torvalds 561da177e4SLinus Torvalds iounit->limit[0] = IOUNIT_BMAP1_START; 571da177e4SLinus Torvalds iounit->limit[1] = IOUNIT_BMAP2_START; 581da177e4SLinus Torvalds iounit->limit[2] = IOUNIT_BMAPM_START; 591da177e4SLinus Torvalds iounit->limit[3] = IOUNIT_BMAPM_END; 601da177e4SLinus Torvalds iounit->rotor[1] = IOUNIT_BMAP2_START; 611da177e4SLinus Torvalds iounit->rotor[2] = IOUNIT_BMAPM_START; 621da177e4SLinus Torvalds 63e0039348SDavid S. Miller xpt = of_ioremap(&op->resource[2], 0, PAGE_SIZE * 16, "XPT"); 64e0039348SDavid S. Miller if (!xpt) { 65e0039348SDavid S. Miller prom_printf("SUN4D: Cannot map External Page Table."); 66e0039348SDavid S. Miller prom_halt(); 671da177e4SLinus Torvalds } 681da177e4SLinus Torvalds 693ac4c949SRobert Reif sbus->ofdev.dev.archdata.iommu = iounit; 70e0039348SDavid S. Miller op->dev.archdata.iommu = iounit; 711da177e4SLinus Torvalds iounit->page_table = xpt; 722f72ba43SRaymond Burns spin_lock_init(&iounit->lock); 731da177e4SLinus Torvalds 741da177e4SLinus Torvalds for (xptend = iounit->page_table + (16 * PAGE_SIZE) / sizeof(iopte_t); 751da177e4SLinus Torvalds xpt < xptend;) 761da177e4SLinus Torvalds iopte_val(*xpt++) = 0; 771da177e4SLinus Torvalds } 781da177e4SLinus Torvalds 791da177e4SLinus Torvalds /* One has to hold iounit->lock to call this */ 801da177e4SLinus Torvalds static unsigned long iounit_get_area(struct iounit_struct *iounit, unsigned long vaddr, int size) 811da177e4SLinus Torvalds { 821da177e4SLinus Torvalds int i, j, k, npages; 831da177e4SLinus Torvalds unsigned long rotor, scan, limit; 841da177e4SLinus Torvalds iopte_t iopte; 851da177e4SLinus Torvalds 861da177e4SLinus Torvalds npages = ((vaddr & ~PAGE_MASK) + size + (PAGE_SIZE-1)) >> PAGE_SHIFT; 871da177e4SLinus Torvalds 881da177e4SLinus Torvalds /* A tiny bit of magic ingredience :) */ 891da177e4SLinus Torvalds switch (npages) { 901da177e4SLinus Torvalds case 1: i = 0x0231; break; 911da177e4SLinus Torvalds case 2: i = 0x0132; break; 921da177e4SLinus Torvalds default: i = 0x0213; break; 931da177e4SLinus Torvalds } 941da177e4SLinus Torvalds 951da177e4SLinus Torvalds IOD(("iounit_get_area(%08lx,%d[%d])=", vaddr, size, npages)); 961da177e4SLinus Torvalds 971da177e4SLinus Torvalds next: j = (i & 15); 981da177e4SLinus Torvalds rotor = iounit->rotor[j - 1]; 991da177e4SLinus Torvalds limit = iounit->limit[j]; 1001da177e4SLinus Torvalds scan = rotor; 1011da177e4SLinus Torvalds nexti: scan = find_next_zero_bit(iounit->bmap, limit, scan); 1021da177e4SLinus Torvalds if (scan + npages > limit) { 1031da177e4SLinus Torvalds if (limit != rotor) { 1041da177e4SLinus Torvalds limit = rotor; 1051da177e4SLinus Torvalds scan = iounit->limit[j - 1]; 1061da177e4SLinus Torvalds goto nexti; 1071da177e4SLinus Torvalds } 1081da177e4SLinus Torvalds i >>= 4; 1091da177e4SLinus Torvalds if (!(i & 15)) 1101da177e4SLinus Torvalds panic("iounit_get_area: Couldn't find free iopte slots for (%08lx,%d)\n", vaddr, size); 1111da177e4SLinus Torvalds goto next; 1121da177e4SLinus Torvalds } 1131da177e4SLinus Torvalds for (k = 1, scan++; k < npages; k++) 1141da177e4SLinus Torvalds if (test_bit(scan++, iounit->bmap)) 1151da177e4SLinus Torvalds goto nexti; 1161da177e4SLinus Torvalds iounit->rotor[j - 1] = (scan < limit) ? scan : iounit->limit[j - 1]; 1171da177e4SLinus Torvalds scan -= npages; 1181da177e4SLinus Torvalds iopte = MKIOPTE(__pa(vaddr & PAGE_MASK)); 1191da177e4SLinus Torvalds vaddr = IOUNIT_DMA_BASE + (scan << PAGE_SHIFT) + (vaddr & ~PAGE_MASK); 1201da177e4SLinus Torvalds for (k = 0; k < npages; k++, iopte = __iopte(iopte_val(iopte) + 0x100), scan++) { 1211da177e4SLinus Torvalds set_bit(scan, iounit->bmap); 1221da177e4SLinus Torvalds iounit->page_table[scan] = iopte; 1231da177e4SLinus Torvalds } 1241da177e4SLinus Torvalds IOD(("%08lx\n", vaddr)); 1251da177e4SLinus Torvalds return vaddr; 1261da177e4SLinus Torvalds } 1271da177e4SLinus Torvalds 1281da177e4SLinus Torvalds static __u32 iounit_get_scsi_one(char *vaddr, unsigned long len, struct sbus_bus *sbus) 1291da177e4SLinus Torvalds { 1301da177e4SLinus Torvalds unsigned long ret, flags; 1313ac4c949SRobert Reif struct iounit_struct *iounit = sbus->ofdev.dev.archdata.iommu; 1321da177e4SLinus Torvalds 1331da177e4SLinus Torvalds spin_lock_irqsave(&iounit->lock, flags); 1341da177e4SLinus Torvalds ret = iounit_get_area(iounit, (unsigned long)vaddr, len); 1351da177e4SLinus Torvalds spin_unlock_irqrestore(&iounit->lock, flags); 1361da177e4SLinus Torvalds return ret; 1371da177e4SLinus Torvalds } 1381da177e4SLinus Torvalds 1391da177e4SLinus Torvalds static void iounit_get_scsi_sgl(struct scatterlist *sg, int sz, struct sbus_bus *sbus) 1401da177e4SLinus Torvalds { 1411da177e4SLinus Torvalds unsigned long flags; 1423ac4c949SRobert Reif struct iounit_struct *iounit = sbus->ofdev.dev.archdata.iommu; 1431da177e4SLinus Torvalds 1441da177e4SLinus Torvalds /* FIXME: Cache some resolved pages - often several sg entries are to the same page */ 1451da177e4SLinus Torvalds spin_lock_irqsave(&iounit->lock, flags); 1461da177e4SLinus Torvalds while (sz != 0) { 1471da177e4SLinus Torvalds --sz; 1486ee4e28bSDavid S. Miller sg->dvma_address = iounit_get_area(iounit, (unsigned long) sg_virt(sg), sg->length); 1490912a5dbSJens Axboe sg->dvma_length = sg->length; 1500912a5dbSJens Axboe sg = sg_next(sg); 1511da177e4SLinus Torvalds } 1521da177e4SLinus Torvalds spin_unlock_irqrestore(&iounit->lock, flags); 1531da177e4SLinus Torvalds } 1541da177e4SLinus Torvalds 1551da177e4SLinus Torvalds static void iounit_release_scsi_one(__u32 vaddr, unsigned long len, struct sbus_bus *sbus) 1561da177e4SLinus Torvalds { 1571da177e4SLinus Torvalds unsigned long flags; 1583ac4c949SRobert Reif struct iounit_struct *iounit = sbus->ofdev.dev.archdata.iommu; 1591da177e4SLinus Torvalds 1601da177e4SLinus Torvalds spin_lock_irqsave(&iounit->lock, flags); 1611da177e4SLinus Torvalds len = ((vaddr & ~PAGE_MASK) + len + (PAGE_SIZE-1)) >> PAGE_SHIFT; 1621da177e4SLinus Torvalds vaddr = (vaddr - IOUNIT_DMA_BASE) >> PAGE_SHIFT; 1631da177e4SLinus Torvalds IOD(("iounit_release %08lx-%08lx\n", (long)vaddr, (long)len+vaddr)); 1641da177e4SLinus Torvalds for (len += vaddr; vaddr < len; vaddr++) 1651da177e4SLinus Torvalds clear_bit(vaddr, iounit->bmap); 1661da177e4SLinus Torvalds spin_unlock_irqrestore(&iounit->lock, flags); 1671da177e4SLinus Torvalds } 1681da177e4SLinus Torvalds 1691da177e4SLinus Torvalds static void iounit_release_scsi_sgl(struct scatterlist *sg, int sz, struct sbus_bus *sbus) 1701da177e4SLinus Torvalds { 1711da177e4SLinus Torvalds unsigned long flags; 1721da177e4SLinus Torvalds unsigned long vaddr, len; 1733ac4c949SRobert Reif struct iounit_struct *iounit = sbus->ofdev.dev.archdata.iommu; 1741da177e4SLinus Torvalds 1751da177e4SLinus Torvalds spin_lock_irqsave(&iounit->lock, flags); 1761da177e4SLinus Torvalds while (sz != 0) { 1771da177e4SLinus Torvalds --sz; 1780912a5dbSJens Axboe len = ((sg->dvma_address & ~PAGE_MASK) + sg->length + (PAGE_SIZE-1)) >> PAGE_SHIFT; 1790912a5dbSJens Axboe vaddr = (sg->dvma_address - IOUNIT_DMA_BASE) >> PAGE_SHIFT; 1801da177e4SLinus Torvalds IOD(("iounit_release %08lx-%08lx\n", (long)vaddr, (long)len+vaddr)); 1811da177e4SLinus Torvalds for (len += vaddr; vaddr < len; vaddr++) 1821da177e4SLinus Torvalds clear_bit(vaddr, iounit->bmap); 1830912a5dbSJens Axboe sg = sg_next(sg); 1841da177e4SLinus Torvalds } 1851da177e4SLinus Torvalds spin_unlock_irqrestore(&iounit->lock, flags); 1861da177e4SLinus Torvalds } 1871da177e4SLinus Torvalds 1881da177e4SLinus Torvalds #ifdef CONFIG_SBUS 1891da177e4SLinus Torvalds static int iounit_map_dma_area(dma_addr_t *pba, unsigned long va, __u32 addr, int len) 1901da177e4SLinus Torvalds { 1911da177e4SLinus Torvalds unsigned long page, end; 1921da177e4SLinus Torvalds pgprot_t dvma_prot; 1931da177e4SLinus Torvalds iopte_t *iopte; 1941da177e4SLinus Torvalds struct sbus_bus *sbus; 1951da177e4SLinus Torvalds 1961da177e4SLinus Torvalds *pba = addr; 1971da177e4SLinus Torvalds 1981da177e4SLinus Torvalds dvma_prot = __pgprot(SRMMU_CACHE | SRMMU_ET_PTE | SRMMU_PRIV); 1991da177e4SLinus Torvalds end = PAGE_ALIGN((addr + len)); 2001da177e4SLinus Torvalds while(addr < end) { 2011da177e4SLinus Torvalds page = va; 2021da177e4SLinus Torvalds { 2031da177e4SLinus Torvalds pgd_t *pgdp; 2041da177e4SLinus Torvalds pmd_t *pmdp; 2051da177e4SLinus Torvalds pte_t *ptep; 2061da177e4SLinus Torvalds long i; 2071da177e4SLinus Torvalds 2081da177e4SLinus Torvalds pgdp = pgd_offset(&init_mm, addr); 2091da177e4SLinus Torvalds pmdp = pmd_offset(pgdp, addr); 2101da177e4SLinus Torvalds ptep = pte_offset_map(pmdp, addr); 2111da177e4SLinus Torvalds 2121da177e4SLinus Torvalds set_pte(ptep, mk_pte(virt_to_page(page), dvma_prot)); 2131da177e4SLinus Torvalds 2141da177e4SLinus Torvalds i = ((addr - IOUNIT_DMA_BASE) >> PAGE_SHIFT); 2151da177e4SLinus Torvalds 2161da177e4SLinus Torvalds for_each_sbus(sbus) { 2173ac4c949SRobert Reif struct iounit_struct *iounit = sbus->ofdev.dev.archdata.iommu; 2181da177e4SLinus Torvalds 2191da177e4SLinus Torvalds iopte = (iopte_t *)(iounit->page_table + i); 2201da177e4SLinus Torvalds *iopte = MKIOPTE(__pa(page)); 2211da177e4SLinus Torvalds } 2221da177e4SLinus Torvalds } 2231da177e4SLinus Torvalds addr += PAGE_SIZE; 2241da177e4SLinus Torvalds va += PAGE_SIZE; 2251da177e4SLinus Torvalds } 2261da177e4SLinus Torvalds flush_cache_all(); 2271da177e4SLinus Torvalds flush_tlb_all(); 2281da177e4SLinus Torvalds 2291da177e4SLinus Torvalds return 0; 2301da177e4SLinus Torvalds } 2311da177e4SLinus Torvalds 2321da177e4SLinus Torvalds static void iounit_unmap_dma_area(unsigned long addr, int len) 2331da177e4SLinus Torvalds { 2341da177e4SLinus Torvalds /* XXX Somebody please fill this in */ 2351da177e4SLinus Torvalds } 2361da177e4SLinus Torvalds 2371da177e4SLinus Torvalds /* XXX We do not pass sbus device here, bad. */ 2381da177e4SLinus Torvalds static struct page *iounit_translate_dvma(unsigned long addr) 2391da177e4SLinus Torvalds { 2401da177e4SLinus Torvalds struct sbus_bus *sbus = sbus_root; /* They are all the same */ 2413ac4c949SRobert Reif struct iounit_struct *iounit = sbus->ofdev.dev.archdata.iommu; 2421da177e4SLinus Torvalds int i; 2431da177e4SLinus Torvalds iopte_t *iopte; 2441da177e4SLinus Torvalds 2451da177e4SLinus Torvalds i = ((addr - IOUNIT_DMA_BASE) >> PAGE_SHIFT); 2461da177e4SLinus Torvalds iopte = (iopte_t *)(iounit->page_table + i); 2471da177e4SLinus Torvalds return pfn_to_page(iopte_val(*iopte) >> (PAGE_SHIFT-4)); /* XXX sun4d guru, help */ 2481da177e4SLinus Torvalds } 2491da177e4SLinus Torvalds #endif 2501da177e4SLinus Torvalds 2511da177e4SLinus Torvalds static char *iounit_lockarea(char *vaddr, unsigned long len) 2521da177e4SLinus Torvalds { 2531da177e4SLinus Torvalds /* FIXME: Write this */ 2541da177e4SLinus Torvalds return vaddr; 2551da177e4SLinus Torvalds } 2561da177e4SLinus Torvalds 2571da177e4SLinus Torvalds static void iounit_unlockarea(char *vaddr, unsigned long len) 2581da177e4SLinus Torvalds { 2591da177e4SLinus Torvalds /* FIXME: Write this */ 2601da177e4SLinus Torvalds } 2611da177e4SLinus Torvalds 2621da177e4SLinus Torvalds void __init ld_mmu_iounit(void) 2631da177e4SLinus Torvalds { 2641da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_lockarea, iounit_lockarea, BTFIXUPCALL_RETO0); 2651da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_unlockarea, iounit_unlockarea, BTFIXUPCALL_NOP); 2661da177e4SLinus Torvalds 2671da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_get_scsi_one, iounit_get_scsi_one, BTFIXUPCALL_NORM); 2681da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_get_scsi_sgl, iounit_get_scsi_sgl, BTFIXUPCALL_NORM); 2691da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_release_scsi_one, iounit_release_scsi_one, BTFIXUPCALL_NORM); 2701da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_release_scsi_sgl, iounit_release_scsi_sgl, BTFIXUPCALL_NORM); 2711da177e4SLinus Torvalds 2721da177e4SLinus Torvalds #ifdef CONFIG_SBUS 2731da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_map_dma_area, iounit_map_dma_area, BTFIXUPCALL_NORM); 2741da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_unmap_dma_area, iounit_unmap_dma_area, BTFIXUPCALL_NORM); 2751da177e4SLinus Torvalds BTFIXUPSET_CALL(mmu_translate_dvma, iounit_translate_dvma, BTFIXUPCALL_NORM); 2761da177e4SLinus Torvalds #endif 2771da177e4SLinus Torvalds } 2781da177e4SLinus Torvalds 2791da177e4SLinus Torvalds __u32 iounit_map_dma_init(struct sbus_bus *sbus, int size) 2801da177e4SLinus Torvalds { 2811da177e4SLinus Torvalds int i, j, k, npages; 2821da177e4SLinus Torvalds unsigned long rotor, scan, limit; 2831da177e4SLinus Torvalds unsigned long flags; 2841da177e4SLinus Torvalds __u32 ret; 2853ac4c949SRobert Reif struct iounit_struct *iounit = sbus->ofdev.dev.archdata.iommu; 2861da177e4SLinus Torvalds 2871da177e4SLinus Torvalds npages = (size + (PAGE_SIZE-1)) >> PAGE_SHIFT; 2881da177e4SLinus Torvalds i = 0x0213; 2891da177e4SLinus Torvalds spin_lock_irqsave(&iounit->lock, flags); 2901da177e4SLinus Torvalds next: j = (i & 15); 2911da177e4SLinus Torvalds rotor = iounit->rotor[j - 1]; 2921da177e4SLinus Torvalds limit = iounit->limit[j]; 2931da177e4SLinus Torvalds scan = rotor; 2941da177e4SLinus Torvalds nexti: scan = find_next_zero_bit(iounit->bmap, limit, scan); 2951da177e4SLinus Torvalds if (scan + npages > limit) { 2961da177e4SLinus Torvalds if (limit != rotor) { 2971da177e4SLinus Torvalds limit = rotor; 2981da177e4SLinus Torvalds scan = iounit->limit[j - 1]; 2991da177e4SLinus Torvalds goto nexti; 3001da177e4SLinus Torvalds } 3011da177e4SLinus Torvalds i >>= 4; 3021da177e4SLinus Torvalds if (!(i & 15)) 3031da177e4SLinus Torvalds panic("iounit_map_dma_init: Couldn't find free iopte slots for %d bytes\n", size); 3041da177e4SLinus Torvalds goto next; 3051da177e4SLinus Torvalds } 3061da177e4SLinus Torvalds for (k = 1, scan++; k < npages; k++) 3071da177e4SLinus Torvalds if (test_bit(scan++, iounit->bmap)) 3081da177e4SLinus Torvalds goto nexti; 3091da177e4SLinus Torvalds iounit->rotor[j - 1] = (scan < limit) ? scan : iounit->limit[j - 1]; 3101da177e4SLinus Torvalds scan -= npages; 3111da177e4SLinus Torvalds ret = IOUNIT_DMA_BASE + (scan << PAGE_SHIFT); 3121da177e4SLinus Torvalds for (k = 0; k < npages; k++, scan++) 3131da177e4SLinus Torvalds set_bit(scan, iounit->bmap); 3141da177e4SLinus Torvalds spin_unlock_irqrestore(&iounit->lock, flags); 3151da177e4SLinus Torvalds return ret; 3161da177e4SLinus Torvalds } 3171da177e4SLinus Torvalds 3181da177e4SLinus Torvalds __u32 iounit_map_dma_page(__u32 vaddr, void *addr, struct sbus_bus *sbus) 3191da177e4SLinus Torvalds { 3201da177e4SLinus Torvalds int scan = (vaddr - IOUNIT_DMA_BASE) >> PAGE_SHIFT; 3213ac4c949SRobert Reif struct iounit_struct *iounit = sbus->ofdev.dev.archdata.iommu; 3221da177e4SLinus Torvalds 3231da177e4SLinus Torvalds iounit->page_table[scan] = MKIOPTE(__pa(((unsigned long)addr) & PAGE_MASK)); 3241da177e4SLinus Torvalds return vaddr + (((unsigned long)addr) & ~PAGE_MASK); 3251da177e4SLinus Torvalds } 326