127137e52SSam Ravnborg /* 227137e52SSam Ravnborg * SPARC64 Huge TLB page support. 327137e52SSam Ravnborg * 427137e52SSam Ravnborg * Copyright (C) 2002, 2003, 2006 David S. Miller (davem@davemloft.net) 527137e52SSam Ravnborg */ 627137e52SSam Ravnborg 727137e52SSam Ravnborg #include <linux/fs.h> 827137e52SSam Ravnborg #include <linux/mm.h> 927137e52SSam Ravnborg #include <linux/hugetlb.h> 1027137e52SSam Ravnborg #include <linux/pagemap.h> 1127137e52SSam Ravnborg #include <linux/sysctl.h> 1227137e52SSam Ravnborg 1327137e52SSam Ravnborg #include <asm/mman.h> 1427137e52SSam Ravnborg #include <asm/pgalloc.h> 1527137e52SSam Ravnborg #include <asm/tlb.h> 1627137e52SSam Ravnborg #include <asm/tlbflush.h> 1727137e52SSam Ravnborg #include <asm/cacheflush.h> 1827137e52SSam Ravnborg #include <asm/mmu_context.h> 1927137e52SSam Ravnborg 2027137e52SSam Ravnborg /* Slightly simplified from the non-hugepage variant because by 2127137e52SSam Ravnborg * definition we don't have to worry about any page coloring stuff 2227137e52SSam Ravnborg */ 2327137e52SSam Ravnborg 2427137e52SSam Ravnborg static unsigned long hugetlb_get_unmapped_area_bottomup(struct file *filp, 2527137e52SSam Ravnborg unsigned long addr, 2627137e52SSam Ravnborg unsigned long len, 2727137e52SSam Ravnborg unsigned long pgoff, 2827137e52SSam Ravnborg unsigned long flags) 2927137e52SSam Ravnborg { 3027137e52SSam Ravnborg unsigned long task_size = TASK_SIZE; 312aea28b9SMichel Lespinasse struct vm_unmapped_area_info info; 3227137e52SSam Ravnborg 3327137e52SSam Ravnborg if (test_thread_flag(TIF_32BIT)) 3427137e52SSam Ravnborg task_size = STACK_TOP32; 3527137e52SSam Ravnborg 362aea28b9SMichel Lespinasse info.flags = 0; 372aea28b9SMichel Lespinasse info.length = len; 382aea28b9SMichel Lespinasse info.low_limit = TASK_UNMAPPED_BASE; 392aea28b9SMichel Lespinasse info.high_limit = min(task_size, VA_EXCLUDE_START); 402aea28b9SMichel Lespinasse info.align_mask = PAGE_MASK & ~HPAGE_MASK; 412aea28b9SMichel Lespinasse info.align_offset = 0; 422aea28b9SMichel Lespinasse addr = vm_unmapped_area(&info); 432aea28b9SMichel Lespinasse 442aea28b9SMichel Lespinasse if ((addr & ~PAGE_MASK) && task_size > VA_EXCLUDE_END) { 452aea28b9SMichel Lespinasse VM_BUG_ON(addr != -ENOMEM); 462aea28b9SMichel Lespinasse info.low_limit = VA_EXCLUDE_END; 472aea28b9SMichel Lespinasse info.high_limit = task_size; 482aea28b9SMichel Lespinasse addr = vm_unmapped_area(&info); 4927137e52SSam Ravnborg } 5027137e52SSam Ravnborg 5127137e52SSam Ravnborg return addr; 5227137e52SSam Ravnborg } 5327137e52SSam Ravnborg 5427137e52SSam Ravnborg static unsigned long 5527137e52SSam Ravnborg hugetlb_get_unmapped_area_topdown(struct file *filp, const unsigned long addr0, 5627137e52SSam Ravnborg const unsigned long len, 5727137e52SSam Ravnborg const unsigned long pgoff, 5827137e52SSam Ravnborg const unsigned long flags) 5927137e52SSam Ravnborg { 6027137e52SSam Ravnborg struct mm_struct *mm = current->mm; 6127137e52SSam Ravnborg unsigned long addr = addr0; 622aea28b9SMichel Lespinasse struct vm_unmapped_area_info info; 6327137e52SSam Ravnborg 6427137e52SSam Ravnborg /* This should only ever run for 32-bit processes. */ 6527137e52SSam Ravnborg BUG_ON(!test_thread_flag(TIF_32BIT)); 6627137e52SSam Ravnborg 672aea28b9SMichel Lespinasse info.flags = VM_UNMAPPED_AREA_TOPDOWN; 682aea28b9SMichel Lespinasse info.length = len; 692aea28b9SMichel Lespinasse info.low_limit = PAGE_SIZE; 702aea28b9SMichel Lespinasse info.high_limit = mm->mmap_base; 712aea28b9SMichel Lespinasse info.align_mask = PAGE_MASK & ~HPAGE_MASK; 722aea28b9SMichel Lespinasse info.align_offset = 0; 732aea28b9SMichel Lespinasse addr = vm_unmapped_area(&info); 7427137e52SSam Ravnborg 7527137e52SSam Ravnborg /* 7627137e52SSam Ravnborg * A failed mmap() very likely causes application failure, 7727137e52SSam Ravnborg * so fall back to the bottom-up function here. This scenario 7827137e52SSam Ravnborg * can happen with large stack limits and large mmap() 7927137e52SSam Ravnborg * allocations. 8027137e52SSam Ravnborg */ 812aea28b9SMichel Lespinasse if (addr & ~PAGE_MASK) { 822aea28b9SMichel Lespinasse VM_BUG_ON(addr != -ENOMEM); 832aea28b9SMichel Lespinasse info.flags = 0; 842aea28b9SMichel Lespinasse info.low_limit = TASK_UNMAPPED_BASE; 852aea28b9SMichel Lespinasse info.high_limit = STACK_TOP32; 862aea28b9SMichel Lespinasse addr = vm_unmapped_area(&info); 872aea28b9SMichel Lespinasse } 8827137e52SSam Ravnborg 8927137e52SSam Ravnborg return addr; 9027137e52SSam Ravnborg } 9127137e52SSam Ravnborg 9227137e52SSam Ravnborg unsigned long 9327137e52SSam Ravnborg hugetlb_get_unmapped_area(struct file *file, unsigned long addr, 9427137e52SSam Ravnborg unsigned long len, unsigned long pgoff, unsigned long flags) 9527137e52SSam Ravnborg { 9627137e52SSam Ravnborg struct mm_struct *mm = current->mm; 9727137e52SSam Ravnborg struct vm_area_struct *vma; 9827137e52SSam Ravnborg unsigned long task_size = TASK_SIZE; 9927137e52SSam Ravnborg 10027137e52SSam Ravnborg if (test_thread_flag(TIF_32BIT)) 10127137e52SSam Ravnborg task_size = STACK_TOP32; 10227137e52SSam Ravnborg 10327137e52SSam Ravnborg if (len & ~HPAGE_MASK) 10427137e52SSam Ravnborg return -EINVAL; 10527137e52SSam Ravnborg if (len > task_size) 10627137e52SSam Ravnborg return -ENOMEM; 10727137e52SSam Ravnborg 10827137e52SSam Ravnborg if (flags & MAP_FIXED) { 10927137e52SSam Ravnborg if (prepare_hugepage_range(file, addr, len)) 11027137e52SSam Ravnborg return -EINVAL; 11127137e52SSam Ravnborg return addr; 11227137e52SSam Ravnborg } 11327137e52SSam Ravnborg 11427137e52SSam Ravnborg if (addr) { 11527137e52SSam Ravnborg addr = ALIGN(addr, HPAGE_SIZE); 11627137e52SSam Ravnborg vma = find_vma(mm, addr); 11727137e52SSam Ravnborg if (task_size - len >= addr && 11827137e52SSam Ravnborg (!vma || addr + len <= vma->vm_start)) 11927137e52SSam Ravnborg return addr; 12027137e52SSam Ravnborg } 12127137e52SSam Ravnborg if (mm->get_unmapped_area == arch_get_unmapped_area) 12227137e52SSam Ravnborg return hugetlb_get_unmapped_area_bottomup(file, addr, len, 12327137e52SSam Ravnborg pgoff, flags); 12427137e52SSam Ravnborg else 12527137e52SSam Ravnborg return hugetlb_get_unmapped_area_topdown(file, addr, len, 12627137e52SSam Ravnborg pgoff, flags); 12727137e52SSam Ravnborg } 12827137e52SSam Ravnborg 12927137e52SSam Ravnborg pte_t *huge_pte_alloc(struct mm_struct *mm, 13027137e52SSam Ravnborg unsigned long addr, unsigned long sz) 13127137e52SSam Ravnborg { 13227137e52SSam Ravnborg pgd_t *pgd; 13327137e52SSam Ravnborg pud_t *pud; 13427137e52SSam Ravnborg pmd_t *pmd; 13527137e52SSam Ravnborg pte_t *pte = NULL; 13627137e52SSam Ravnborg 13727137e52SSam Ravnborg /* We must align the address, because our caller will run 13827137e52SSam Ravnborg * set_huge_pte_at() on whatever we return, which writes out 13927137e52SSam Ravnborg * all of the sub-ptes for the hugepage range. So we have 14027137e52SSam Ravnborg * to give it the first such sub-pte. 14127137e52SSam Ravnborg */ 14227137e52SSam Ravnborg addr &= HPAGE_MASK; 14327137e52SSam Ravnborg 14427137e52SSam Ravnborg pgd = pgd_offset(mm, addr); 14527137e52SSam Ravnborg pud = pud_alloc(mm, pgd, addr); 14627137e52SSam Ravnborg if (pud) { 14727137e52SSam Ravnborg pmd = pmd_alloc(mm, pud, addr); 14827137e52SSam Ravnborg if (pmd) 1493ed3a4f0SKirill A. Shutemov pte = pte_alloc_map(mm, pmd, addr); 15027137e52SSam Ravnborg } 15127137e52SSam Ravnborg return pte; 15227137e52SSam Ravnborg } 15327137e52SSam Ravnborg 15427137e52SSam Ravnborg pte_t *huge_pte_offset(struct mm_struct *mm, unsigned long addr) 15527137e52SSam Ravnborg { 15627137e52SSam Ravnborg pgd_t *pgd; 15727137e52SSam Ravnborg pud_t *pud; 15827137e52SSam Ravnborg pmd_t *pmd; 15927137e52SSam Ravnborg pte_t *pte = NULL; 16027137e52SSam Ravnborg 16127137e52SSam Ravnborg addr &= HPAGE_MASK; 16227137e52SSam Ravnborg 16327137e52SSam Ravnborg pgd = pgd_offset(mm, addr); 16427137e52SSam Ravnborg if (!pgd_none(*pgd)) { 16527137e52SSam Ravnborg pud = pud_offset(pgd, addr); 16627137e52SSam Ravnborg if (!pud_none(*pud)) { 16727137e52SSam Ravnborg pmd = pmd_offset(pud, addr); 16827137e52SSam Ravnborg if (!pmd_none(*pmd)) 16927137e52SSam Ravnborg pte = pte_offset_map(pmd, addr); 17027137e52SSam Ravnborg } 17127137e52SSam Ravnborg } 17227137e52SSam Ravnborg return pte; 17327137e52SSam Ravnborg } 17427137e52SSam Ravnborg 17527137e52SSam Ravnborg void set_huge_pte_at(struct mm_struct *mm, unsigned long addr, 17627137e52SSam Ravnborg pte_t *ptep, pte_t entry) 17727137e52SSam Ravnborg { 17827137e52SSam Ravnborg int i; 179*24e49ee3SNitin Gupta pte_t orig[2]; 180*24e49ee3SNitin Gupta unsigned long nptes; 18127137e52SSam Ravnborg 18227137e52SSam Ravnborg if (!pte_present(*ptep) && pte_present(entry)) 18327137e52SSam Ravnborg mm->context.huge_pte_count++; 18427137e52SSam Ravnborg 18527137e52SSam Ravnborg addr &= HPAGE_MASK; 186*24e49ee3SNitin Gupta 187*24e49ee3SNitin Gupta nptes = 1 << HUGETLB_PAGE_ORDER; 188*24e49ee3SNitin Gupta orig[0] = *ptep; 189*24e49ee3SNitin Gupta orig[1] = *(ptep + nptes / 2); 190*24e49ee3SNitin Gupta for (i = 0; i < nptes; i++) { 191*24e49ee3SNitin Gupta *ptep = entry; 19227137e52SSam Ravnborg ptep++; 19327137e52SSam Ravnborg addr += PAGE_SIZE; 19427137e52SSam Ravnborg pte_val(entry) += PAGE_SIZE; 19527137e52SSam Ravnborg } 196*24e49ee3SNitin Gupta 197*24e49ee3SNitin Gupta /* Issue TLB flush at REAL_HPAGE_SIZE boundaries */ 198*24e49ee3SNitin Gupta addr -= REAL_HPAGE_SIZE; 199*24e49ee3SNitin Gupta ptep -= nptes / 2; 200*24e49ee3SNitin Gupta maybe_tlb_batch_add(mm, addr, ptep, orig[1], 0); 201*24e49ee3SNitin Gupta addr -= REAL_HPAGE_SIZE; 202*24e49ee3SNitin Gupta ptep -= nptes / 2; 203*24e49ee3SNitin Gupta maybe_tlb_batch_add(mm, addr, ptep, orig[0], 0); 20427137e52SSam Ravnborg } 20527137e52SSam Ravnborg 20627137e52SSam Ravnborg pte_t huge_ptep_get_and_clear(struct mm_struct *mm, unsigned long addr, 20727137e52SSam Ravnborg pte_t *ptep) 20827137e52SSam Ravnborg { 20927137e52SSam Ravnborg pte_t entry; 21027137e52SSam Ravnborg int i; 211*24e49ee3SNitin Gupta unsigned long nptes; 21227137e52SSam Ravnborg 21327137e52SSam Ravnborg entry = *ptep; 21427137e52SSam Ravnborg if (pte_present(entry)) 21527137e52SSam Ravnborg mm->context.huge_pte_count--; 21627137e52SSam Ravnborg 21727137e52SSam Ravnborg addr &= HPAGE_MASK; 218*24e49ee3SNitin Gupta nptes = 1 << HUGETLB_PAGE_ORDER; 219*24e49ee3SNitin Gupta for (i = 0; i < nptes; i++) { 220*24e49ee3SNitin Gupta *ptep = __pte(0UL); 22127137e52SSam Ravnborg addr += PAGE_SIZE; 22227137e52SSam Ravnborg ptep++; 22327137e52SSam Ravnborg } 22427137e52SSam Ravnborg 225*24e49ee3SNitin Gupta /* Issue TLB flush at REAL_HPAGE_SIZE boundaries */ 226*24e49ee3SNitin Gupta addr -= REAL_HPAGE_SIZE; 227*24e49ee3SNitin Gupta ptep -= nptes / 2; 228*24e49ee3SNitin Gupta maybe_tlb_batch_add(mm, addr, ptep, entry, 0); 229*24e49ee3SNitin Gupta addr -= REAL_HPAGE_SIZE; 230*24e49ee3SNitin Gupta ptep -= nptes / 2; 231*24e49ee3SNitin Gupta maybe_tlb_batch_add(mm, addr, ptep, entry, 0); 232*24e49ee3SNitin Gupta 23327137e52SSam Ravnborg return entry; 23427137e52SSam Ravnborg } 23527137e52SSam Ravnborg 23627137e52SSam Ravnborg int pmd_huge(pmd_t pmd) 23727137e52SSam Ravnborg { 23827137e52SSam Ravnborg return 0; 23927137e52SSam Ravnborg } 24027137e52SSam Ravnborg 24127137e52SSam Ravnborg int pud_huge(pud_t pud) 24227137e52SSam Ravnborg { 24327137e52SSam Ravnborg return 0; 24427137e52SSam Ravnborg } 245