127137e52SSam Ravnborg /* 227137e52SSam Ravnborg * SPARC64 Huge TLB page support. 327137e52SSam Ravnborg * 427137e52SSam Ravnborg * Copyright (C) 2002, 2003, 2006 David S. Miller (davem@davemloft.net) 527137e52SSam Ravnborg */ 627137e52SSam Ravnborg 727137e52SSam Ravnborg #include <linux/init.h> 827137e52SSam Ravnborg #include <linux/fs.h> 927137e52SSam Ravnborg #include <linux/mm.h> 1027137e52SSam Ravnborg #include <linux/hugetlb.h> 1127137e52SSam Ravnborg #include <linux/pagemap.h> 1227137e52SSam Ravnborg #include <linux/sysctl.h> 1327137e52SSam Ravnborg 1427137e52SSam Ravnborg #include <asm/mman.h> 1527137e52SSam Ravnborg #include <asm/pgalloc.h> 1627137e52SSam Ravnborg #include <asm/tlb.h> 1727137e52SSam Ravnborg #include <asm/tlbflush.h> 1827137e52SSam Ravnborg #include <asm/cacheflush.h> 1927137e52SSam Ravnborg #include <asm/mmu_context.h> 2027137e52SSam Ravnborg 2127137e52SSam Ravnborg /* Slightly simplified from the non-hugepage variant because by 2227137e52SSam Ravnborg * definition we don't have to worry about any page coloring stuff 2327137e52SSam Ravnborg */ 2427137e52SSam Ravnborg #define VA_EXCLUDE_START (0x0000080000000000UL - (1UL << 32UL)) 2527137e52SSam Ravnborg #define VA_EXCLUDE_END (0xfffff80000000000UL + (1UL << 32UL)) 2627137e52SSam Ravnborg 2727137e52SSam Ravnborg static unsigned long hugetlb_get_unmapped_area_bottomup(struct file *filp, 2827137e52SSam Ravnborg unsigned long addr, 2927137e52SSam Ravnborg unsigned long len, 3027137e52SSam Ravnborg unsigned long pgoff, 3127137e52SSam Ravnborg unsigned long flags) 3227137e52SSam Ravnborg { 3327137e52SSam Ravnborg unsigned long task_size = TASK_SIZE; 34*2aea28b9SMichel Lespinasse struct vm_unmapped_area_info info; 3527137e52SSam Ravnborg 3627137e52SSam Ravnborg if (test_thread_flag(TIF_32BIT)) 3727137e52SSam Ravnborg task_size = STACK_TOP32; 3827137e52SSam Ravnborg 39*2aea28b9SMichel Lespinasse info.flags = 0; 40*2aea28b9SMichel Lespinasse info.length = len; 41*2aea28b9SMichel Lespinasse info.low_limit = TASK_UNMAPPED_BASE; 42*2aea28b9SMichel Lespinasse info.high_limit = min(task_size, VA_EXCLUDE_START); 43*2aea28b9SMichel Lespinasse info.align_mask = PAGE_MASK & ~HPAGE_MASK; 44*2aea28b9SMichel Lespinasse info.align_offset = 0; 45*2aea28b9SMichel Lespinasse addr = vm_unmapped_area(&info); 46*2aea28b9SMichel Lespinasse 47*2aea28b9SMichel Lespinasse if ((addr & ~PAGE_MASK) && task_size > VA_EXCLUDE_END) { 48*2aea28b9SMichel Lespinasse VM_BUG_ON(addr != -ENOMEM); 49*2aea28b9SMichel Lespinasse info.low_limit = VA_EXCLUDE_END; 50*2aea28b9SMichel Lespinasse info.high_limit = task_size; 51*2aea28b9SMichel Lespinasse addr = vm_unmapped_area(&info); 5227137e52SSam Ravnborg } 5327137e52SSam Ravnborg 5427137e52SSam Ravnborg return addr; 5527137e52SSam Ravnborg } 5627137e52SSam Ravnborg 5727137e52SSam Ravnborg static unsigned long 5827137e52SSam Ravnborg hugetlb_get_unmapped_area_topdown(struct file *filp, const unsigned long addr0, 5927137e52SSam Ravnborg const unsigned long len, 6027137e52SSam Ravnborg const unsigned long pgoff, 6127137e52SSam Ravnborg const unsigned long flags) 6227137e52SSam Ravnborg { 6327137e52SSam Ravnborg struct mm_struct *mm = current->mm; 6427137e52SSam Ravnborg unsigned long addr = addr0; 65*2aea28b9SMichel Lespinasse struct vm_unmapped_area_info info; 6627137e52SSam Ravnborg 6727137e52SSam Ravnborg /* This should only ever run for 32-bit processes. */ 6827137e52SSam Ravnborg BUG_ON(!test_thread_flag(TIF_32BIT)); 6927137e52SSam Ravnborg 70*2aea28b9SMichel Lespinasse info.flags = VM_UNMAPPED_AREA_TOPDOWN; 71*2aea28b9SMichel Lespinasse info.length = len; 72*2aea28b9SMichel Lespinasse info.low_limit = PAGE_SIZE; 73*2aea28b9SMichel Lespinasse info.high_limit = mm->mmap_base; 74*2aea28b9SMichel Lespinasse info.align_mask = PAGE_MASK & ~HPAGE_MASK; 75*2aea28b9SMichel Lespinasse info.align_offset = 0; 76*2aea28b9SMichel Lespinasse addr = vm_unmapped_area(&info); 7727137e52SSam Ravnborg 7827137e52SSam Ravnborg /* 7927137e52SSam Ravnborg * A failed mmap() very likely causes application failure, 8027137e52SSam Ravnborg * so fall back to the bottom-up function here. This scenario 8127137e52SSam Ravnborg * can happen with large stack limits and large mmap() 8227137e52SSam Ravnborg * allocations. 8327137e52SSam Ravnborg */ 84*2aea28b9SMichel Lespinasse if (addr & ~PAGE_MASK) { 85*2aea28b9SMichel Lespinasse VM_BUG_ON(addr != -ENOMEM); 86*2aea28b9SMichel Lespinasse info.flags = 0; 87*2aea28b9SMichel Lespinasse info.low_limit = TASK_UNMAPPED_BASE; 88*2aea28b9SMichel Lespinasse info.high_limit = STACK_TOP32; 89*2aea28b9SMichel Lespinasse addr = vm_unmapped_area(&info); 90*2aea28b9SMichel Lespinasse } 9127137e52SSam Ravnborg 9227137e52SSam Ravnborg return addr; 9327137e52SSam Ravnborg } 9427137e52SSam Ravnborg 9527137e52SSam Ravnborg unsigned long 9627137e52SSam Ravnborg hugetlb_get_unmapped_area(struct file *file, unsigned long addr, 9727137e52SSam Ravnborg unsigned long len, unsigned long pgoff, unsigned long flags) 9827137e52SSam Ravnborg { 9927137e52SSam Ravnborg struct mm_struct *mm = current->mm; 10027137e52SSam Ravnborg struct vm_area_struct *vma; 10127137e52SSam Ravnborg unsigned long task_size = TASK_SIZE; 10227137e52SSam Ravnborg 10327137e52SSam Ravnborg if (test_thread_flag(TIF_32BIT)) 10427137e52SSam Ravnborg task_size = STACK_TOP32; 10527137e52SSam Ravnborg 10627137e52SSam Ravnborg if (len & ~HPAGE_MASK) 10727137e52SSam Ravnborg return -EINVAL; 10827137e52SSam Ravnborg if (len > task_size) 10927137e52SSam Ravnborg return -ENOMEM; 11027137e52SSam Ravnborg 11127137e52SSam Ravnborg if (flags & MAP_FIXED) { 11227137e52SSam Ravnborg if (prepare_hugepage_range(file, addr, len)) 11327137e52SSam Ravnborg return -EINVAL; 11427137e52SSam Ravnborg return addr; 11527137e52SSam Ravnborg } 11627137e52SSam Ravnborg 11727137e52SSam Ravnborg if (addr) { 11827137e52SSam Ravnborg addr = ALIGN(addr, HPAGE_SIZE); 11927137e52SSam Ravnborg vma = find_vma(mm, addr); 12027137e52SSam Ravnborg if (task_size - len >= addr && 12127137e52SSam Ravnborg (!vma || addr + len <= vma->vm_start)) 12227137e52SSam Ravnborg return addr; 12327137e52SSam Ravnborg } 12427137e52SSam Ravnborg if (mm->get_unmapped_area == arch_get_unmapped_area) 12527137e52SSam Ravnborg return hugetlb_get_unmapped_area_bottomup(file, addr, len, 12627137e52SSam Ravnborg pgoff, flags); 12727137e52SSam Ravnborg else 12827137e52SSam Ravnborg return hugetlb_get_unmapped_area_topdown(file, addr, len, 12927137e52SSam Ravnborg pgoff, flags); 13027137e52SSam Ravnborg } 13127137e52SSam Ravnborg 13227137e52SSam Ravnborg pte_t *huge_pte_alloc(struct mm_struct *mm, 13327137e52SSam Ravnborg unsigned long addr, unsigned long sz) 13427137e52SSam Ravnborg { 13527137e52SSam Ravnborg pgd_t *pgd; 13627137e52SSam Ravnborg pud_t *pud; 13727137e52SSam Ravnborg pmd_t *pmd; 13827137e52SSam Ravnborg pte_t *pte = NULL; 13927137e52SSam Ravnborg 14027137e52SSam Ravnborg /* We must align the address, because our caller will run 14127137e52SSam Ravnborg * set_huge_pte_at() on whatever we return, which writes out 14227137e52SSam Ravnborg * all of the sub-ptes for the hugepage range. So we have 14327137e52SSam Ravnborg * to give it the first such sub-pte. 14427137e52SSam Ravnborg */ 14527137e52SSam Ravnborg addr &= HPAGE_MASK; 14627137e52SSam Ravnborg 14727137e52SSam Ravnborg pgd = pgd_offset(mm, addr); 14827137e52SSam Ravnborg pud = pud_alloc(mm, pgd, addr); 14927137e52SSam Ravnborg if (pud) { 15027137e52SSam Ravnborg pmd = pmd_alloc(mm, pud, addr); 15127137e52SSam Ravnborg if (pmd) 1528ac1f832SAndrea Arcangeli pte = pte_alloc_map(mm, NULL, pmd, addr); 15327137e52SSam Ravnborg } 15427137e52SSam Ravnborg return pte; 15527137e52SSam Ravnborg } 15627137e52SSam Ravnborg 15727137e52SSam Ravnborg pte_t *huge_pte_offset(struct mm_struct *mm, unsigned long addr) 15827137e52SSam Ravnborg { 15927137e52SSam Ravnborg pgd_t *pgd; 16027137e52SSam Ravnborg pud_t *pud; 16127137e52SSam Ravnborg pmd_t *pmd; 16227137e52SSam Ravnborg pte_t *pte = NULL; 16327137e52SSam Ravnborg 16427137e52SSam Ravnborg addr &= HPAGE_MASK; 16527137e52SSam Ravnborg 16627137e52SSam Ravnborg pgd = pgd_offset(mm, addr); 16727137e52SSam Ravnborg if (!pgd_none(*pgd)) { 16827137e52SSam Ravnborg pud = pud_offset(pgd, addr); 16927137e52SSam Ravnborg if (!pud_none(*pud)) { 17027137e52SSam Ravnborg pmd = pmd_offset(pud, addr); 17127137e52SSam Ravnborg if (!pmd_none(*pmd)) 17227137e52SSam Ravnborg pte = pte_offset_map(pmd, addr); 17327137e52SSam Ravnborg } 17427137e52SSam Ravnborg } 17527137e52SSam Ravnborg return pte; 17627137e52SSam Ravnborg } 17727137e52SSam Ravnborg 17827137e52SSam Ravnborg int huge_pmd_unshare(struct mm_struct *mm, unsigned long *addr, pte_t *ptep) 17927137e52SSam Ravnborg { 18027137e52SSam Ravnborg return 0; 18127137e52SSam Ravnborg } 18227137e52SSam Ravnborg 18327137e52SSam Ravnborg void set_huge_pte_at(struct mm_struct *mm, unsigned long addr, 18427137e52SSam Ravnborg pte_t *ptep, pte_t entry) 18527137e52SSam Ravnborg { 18627137e52SSam Ravnborg int i; 18727137e52SSam Ravnborg 18827137e52SSam Ravnborg if (!pte_present(*ptep) && pte_present(entry)) 18927137e52SSam Ravnborg mm->context.huge_pte_count++; 19027137e52SSam Ravnborg 19127137e52SSam Ravnborg addr &= HPAGE_MASK; 19227137e52SSam Ravnborg for (i = 0; i < (1 << HUGETLB_PAGE_ORDER); i++) { 19327137e52SSam Ravnborg set_pte_at(mm, addr, ptep, entry); 19427137e52SSam Ravnborg ptep++; 19527137e52SSam Ravnborg addr += PAGE_SIZE; 19627137e52SSam Ravnborg pte_val(entry) += PAGE_SIZE; 19727137e52SSam Ravnborg } 19827137e52SSam Ravnborg } 19927137e52SSam Ravnborg 20027137e52SSam Ravnborg pte_t huge_ptep_get_and_clear(struct mm_struct *mm, unsigned long addr, 20127137e52SSam Ravnborg pte_t *ptep) 20227137e52SSam Ravnborg { 20327137e52SSam Ravnborg pte_t entry; 20427137e52SSam Ravnborg int i; 20527137e52SSam Ravnborg 20627137e52SSam Ravnborg entry = *ptep; 20727137e52SSam Ravnborg if (pte_present(entry)) 20827137e52SSam Ravnborg mm->context.huge_pte_count--; 20927137e52SSam Ravnborg 21027137e52SSam Ravnborg addr &= HPAGE_MASK; 21127137e52SSam Ravnborg 21227137e52SSam Ravnborg for (i = 0; i < (1 << HUGETLB_PAGE_ORDER); i++) { 21327137e52SSam Ravnborg pte_clear(mm, addr, ptep); 21427137e52SSam Ravnborg addr += PAGE_SIZE; 21527137e52SSam Ravnborg ptep++; 21627137e52SSam Ravnborg } 21727137e52SSam Ravnborg 21827137e52SSam Ravnborg return entry; 21927137e52SSam Ravnborg } 22027137e52SSam Ravnborg 22127137e52SSam Ravnborg struct page *follow_huge_addr(struct mm_struct *mm, 22227137e52SSam Ravnborg unsigned long address, int write) 22327137e52SSam Ravnborg { 22427137e52SSam Ravnborg return ERR_PTR(-EINVAL); 22527137e52SSam Ravnborg } 22627137e52SSam Ravnborg 22727137e52SSam Ravnborg int pmd_huge(pmd_t pmd) 22827137e52SSam Ravnborg { 22927137e52SSam Ravnborg return 0; 23027137e52SSam Ravnborg } 23127137e52SSam Ravnborg 23227137e52SSam Ravnborg int pud_huge(pud_t pud) 23327137e52SSam Ravnborg { 23427137e52SSam Ravnborg return 0; 23527137e52SSam Ravnborg } 23627137e52SSam Ravnborg 23727137e52SSam Ravnborg struct page *follow_huge_pmd(struct mm_struct *mm, unsigned long address, 23827137e52SSam Ravnborg pmd_t *pmd, int write) 23927137e52SSam Ravnborg { 24027137e52SSam Ravnborg return NULL; 24127137e52SSam Ravnborg } 242