xref: /openbmc/linux/arch/sparc/mm/hugetlbpage.c (revision 24e49ee3d76b70853a96520e46b8837e5eae65b2)
/*
 * SPARC64 Huge TLB page support.
 *
 * Copyright (C) 2002, 2003, 2006 David S. Miller (davem@davemloft.net)
 */
627137e52SSam Ravnborg 
727137e52SSam Ravnborg #include <linux/fs.h>
827137e52SSam Ravnborg #include <linux/mm.h>
927137e52SSam Ravnborg #include <linux/hugetlb.h>
1027137e52SSam Ravnborg #include <linux/pagemap.h>
1127137e52SSam Ravnborg #include <linux/sysctl.h>
1227137e52SSam Ravnborg 
1327137e52SSam Ravnborg #include <asm/mman.h>
1427137e52SSam Ravnborg #include <asm/pgalloc.h>
1527137e52SSam Ravnborg #include <asm/tlb.h>
1627137e52SSam Ravnborg #include <asm/tlbflush.h>
1727137e52SSam Ravnborg #include <asm/cacheflush.h>
1827137e52SSam Ravnborg #include <asm/mmu_context.h>
1927137e52SSam Ravnborg 
/* Slightly simplified from the non-hugepage variant because, by
 * definition, we don't have to worry about any page coloring stuff.
 */
2327137e52SSam Ravnborg 
2427137e52SSam Ravnborg static unsigned long hugetlb_get_unmapped_area_bottomup(struct file *filp,
2527137e52SSam Ravnborg 							unsigned long addr,
2627137e52SSam Ravnborg 							unsigned long len,
2727137e52SSam Ravnborg 							unsigned long pgoff,
2827137e52SSam Ravnborg 							unsigned long flags)
2927137e52SSam Ravnborg {
3027137e52SSam Ravnborg 	unsigned long task_size = TASK_SIZE;
312aea28b9SMichel Lespinasse 	struct vm_unmapped_area_info info;
3227137e52SSam Ravnborg 
3327137e52SSam Ravnborg 	if (test_thread_flag(TIF_32BIT))
3427137e52SSam Ravnborg 		task_size = STACK_TOP32;
3527137e52SSam Ravnborg 
362aea28b9SMichel Lespinasse 	info.flags = 0;
372aea28b9SMichel Lespinasse 	info.length = len;
382aea28b9SMichel Lespinasse 	info.low_limit = TASK_UNMAPPED_BASE;
392aea28b9SMichel Lespinasse 	info.high_limit = min(task_size, VA_EXCLUDE_START);
402aea28b9SMichel Lespinasse 	info.align_mask = PAGE_MASK & ~HPAGE_MASK;
412aea28b9SMichel Lespinasse 	info.align_offset = 0;
422aea28b9SMichel Lespinasse 	addr = vm_unmapped_area(&info);
432aea28b9SMichel Lespinasse 
442aea28b9SMichel Lespinasse 	if ((addr & ~PAGE_MASK) && task_size > VA_EXCLUDE_END) {
452aea28b9SMichel Lespinasse 		VM_BUG_ON(addr != -ENOMEM);
462aea28b9SMichel Lespinasse 		info.low_limit = VA_EXCLUDE_END;
472aea28b9SMichel Lespinasse 		info.high_limit = task_size;
482aea28b9SMichel Lespinasse 		addr = vm_unmapped_area(&info);
4927137e52SSam Ravnborg 	}
5027137e52SSam Ravnborg 
5127137e52SSam Ravnborg 	return addr;
5227137e52SSam Ravnborg }
5327137e52SSam Ravnborg 
5427137e52SSam Ravnborg static unsigned long
5527137e52SSam Ravnborg hugetlb_get_unmapped_area_topdown(struct file *filp, const unsigned long addr0,
5627137e52SSam Ravnborg 				  const unsigned long len,
5727137e52SSam Ravnborg 				  const unsigned long pgoff,
5827137e52SSam Ravnborg 				  const unsigned long flags)
5927137e52SSam Ravnborg {
6027137e52SSam Ravnborg 	struct mm_struct *mm = current->mm;
6127137e52SSam Ravnborg 	unsigned long addr = addr0;
622aea28b9SMichel Lespinasse 	struct vm_unmapped_area_info info;
6327137e52SSam Ravnborg 
6427137e52SSam Ravnborg 	/* This should only ever run for 32-bit processes.  */
6527137e52SSam Ravnborg 	BUG_ON(!test_thread_flag(TIF_32BIT));
6627137e52SSam Ravnborg 
672aea28b9SMichel Lespinasse 	info.flags = VM_UNMAPPED_AREA_TOPDOWN;
682aea28b9SMichel Lespinasse 	info.length = len;
692aea28b9SMichel Lespinasse 	info.low_limit = PAGE_SIZE;
702aea28b9SMichel Lespinasse 	info.high_limit = mm->mmap_base;
712aea28b9SMichel Lespinasse 	info.align_mask = PAGE_MASK & ~HPAGE_MASK;
722aea28b9SMichel Lespinasse 	info.align_offset = 0;
732aea28b9SMichel Lespinasse 	addr = vm_unmapped_area(&info);
7427137e52SSam Ravnborg 
7527137e52SSam Ravnborg 	/*
7627137e52SSam Ravnborg 	 * A failed mmap() very likely causes application failure,
7727137e52SSam Ravnborg 	 * so fall back to the bottom-up function here. This scenario
7827137e52SSam Ravnborg 	 * can happen with large stack limits and large mmap()
7927137e52SSam Ravnborg 	 * allocations.
8027137e52SSam Ravnborg 	 */
812aea28b9SMichel Lespinasse 	if (addr & ~PAGE_MASK) {
822aea28b9SMichel Lespinasse 		VM_BUG_ON(addr != -ENOMEM);
832aea28b9SMichel Lespinasse 		info.flags = 0;
842aea28b9SMichel Lespinasse 		info.low_limit = TASK_UNMAPPED_BASE;
852aea28b9SMichel Lespinasse 		info.high_limit = STACK_TOP32;
862aea28b9SMichel Lespinasse 		addr = vm_unmapped_area(&info);
872aea28b9SMichel Lespinasse 	}
8827137e52SSam Ravnborg 
8927137e52SSam Ravnborg 	return addr;
9027137e52SSam Ravnborg }
9127137e52SSam Ravnborg 
9227137e52SSam Ravnborg unsigned long
9327137e52SSam Ravnborg hugetlb_get_unmapped_area(struct file *file, unsigned long addr,
9427137e52SSam Ravnborg 		unsigned long len, unsigned long pgoff, unsigned long flags)
9527137e52SSam Ravnborg {
9627137e52SSam Ravnborg 	struct mm_struct *mm = current->mm;
9727137e52SSam Ravnborg 	struct vm_area_struct *vma;
9827137e52SSam Ravnborg 	unsigned long task_size = TASK_SIZE;
9927137e52SSam Ravnborg 
10027137e52SSam Ravnborg 	if (test_thread_flag(TIF_32BIT))
10127137e52SSam Ravnborg 		task_size = STACK_TOP32;
10227137e52SSam Ravnborg 
10327137e52SSam Ravnborg 	if (len & ~HPAGE_MASK)
10427137e52SSam Ravnborg 		return -EINVAL;
10527137e52SSam Ravnborg 	if (len > task_size)
10627137e52SSam Ravnborg 		return -ENOMEM;
10727137e52SSam Ravnborg 
10827137e52SSam Ravnborg 	if (flags & MAP_FIXED) {
10927137e52SSam Ravnborg 		if (prepare_hugepage_range(file, addr, len))
11027137e52SSam Ravnborg 			return -EINVAL;
11127137e52SSam Ravnborg 		return addr;
11227137e52SSam Ravnborg 	}
11327137e52SSam Ravnborg 
11427137e52SSam Ravnborg 	if (addr) {
11527137e52SSam Ravnborg 		addr = ALIGN(addr, HPAGE_SIZE);
11627137e52SSam Ravnborg 		vma = find_vma(mm, addr);
11727137e52SSam Ravnborg 		if (task_size - len >= addr &&
11827137e52SSam Ravnborg 		    (!vma || addr + len <= vma->vm_start))
11927137e52SSam Ravnborg 			return addr;
12027137e52SSam Ravnborg 	}
12127137e52SSam Ravnborg 	if (mm->get_unmapped_area == arch_get_unmapped_area)
12227137e52SSam Ravnborg 		return hugetlb_get_unmapped_area_bottomup(file, addr, len,
12327137e52SSam Ravnborg 				pgoff, flags);
12427137e52SSam Ravnborg 	else
12527137e52SSam Ravnborg 		return hugetlb_get_unmapped_area_topdown(file, addr, len,
12627137e52SSam Ravnborg 				pgoff, flags);
12727137e52SSam Ravnborg }
12827137e52SSam Ravnborg 
12927137e52SSam Ravnborg pte_t *huge_pte_alloc(struct mm_struct *mm,
13027137e52SSam Ravnborg 			unsigned long addr, unsigned long sz)
13127137e52SSam Ravnborg {
13227137e52SSam Ravnborg 	pgd_t *pgd;
13327137e52SSam Ravnborg 	pud_t *pud;
13427137e52SSam Ravnborg 	pmd_t *pmd;
13527137e52SSam Ravnborg 	pte_t *pte = NULL;
13627137e52SSam Ravnborg 
13727137e52SSam Ravnborg 	/* We must align the address, because our caller will run
13827137e52SSam Ravnborg 	 * set_huge_pte_at() on whatever we return, which writes out
13927137e52SSam Ravnborg 	 * all of the sub-ptes for the hugepage range.  So we have
14027137e52SSam Ravnborg 	 * to give it the first such sub-pte.
14127137e52SSam Ravnborg 	 */
14227137e52SSam Ravnborg 	addr &= HPAGE_MASK;
14327137e52SSam Ravnborg 
14427137e52SSam Ravnborg 	pgd = pgd_offset(mm, addr);
14527137e52SSam Ravnborg 	pud = pud_alloc(mm, pgd, addr);
14627137e52SSam Ravnborg 	if (pud) {
14727137e52SSam Ravnborg 		pmd = pmd_alloc(mm, pud, addr);
14827137e52SSam Ravnborg 		if (pmd)
1493ed3a4f0SKirill A. Shutemov 			pte = pte_alloc_map(mm, pmd, addr);
15027137e52SSam Ravnborg 	}
15127137e52SSam Ravnborg 	return pte;
15227137e52SSam Ravnborg }
15327137e52SSam Ravnborg 
15427137e52SSam Ravnborg pte_t *huge_pte_offset(struct mm_struct *mm, unsigned long addr)
15527137e52SSam Ravnborg {
15627137e52SSam Ravnborg 	pgd_t *pgd;
15727137e52SSam Ravnborg 	pud_t *pud;
15827137e52SSam Ravnborg 	pmd_t *pmd;
15927137e52SSam Ravnborg 	pte_t *pte = NULL;
16027137e52SSam Ravnborg 
16127137e52SSam Ravnborg 	addr &= HPAGE_MASK;
16227137e52SSam Ravnborg 
16327137e52SSam Ravnborg 	pgd = pgd_offset(mm, addr);
16427137e52SSam Ravnborg 	if (!pgd_none(*pgd)) {
16527137e52SSam Ravnborg 		pud = pud_offset(pgd, addr);
16627137e52SSam Ravnborg 		if (!pud_none(*pud)) {
16727137e52SSam Ravnborg 			pmd = pmd_offset(pud, addr);
16827137e52SSam Ravnborg 			if (!pmd_none(*pmd))
16927137e52SSam Ravnborg 				pte = pte_offset_map(pmd, addr);
17027137e52SSam Ravnborg 		}
17127137e52SSam Ravnborg 	}
17227137e52SSam Ravnborg 	return pte;
17327137e52SSam Ravnborg }
17427137e52SSam Ravnborg 
17527137e52SSam Ravnborg void set_huge_pte_at(struct mm_struct *mm, unsigned long addr,
17627137e52SSam Ravnborg 		     pte_t *ptep, pte_t entry)
17727137e52SSam Ravnborg {
17827137e52SSam Ravnborg 	int i;
179*24e49ee3SNitin Gupta 	pte_t orig[2];
180*24e49ee3SNitin Gupta 	unsigned long nptes;
18127137e52SSam Ravnborg 
18227137e52SSam Ravnborg 	if (!pte_present(*ptep) && pte_present(entry))
18327137e52SSam Ravnborg 		mm->context.huge_pte_count++;
18427137e52SSam Ravnborg 
18527137e52SSam Ravnborg 	addr &= HPAGE_MASK;
186*24e49ee3SNitin Gupta 
187*24e49ee3SNitin Gupta 	nptes = 1 << HUGETLB_PAGE_ORDER;
188*24e49ee3SNitin Gupta 	orig[0] = *ptep;
189*24e49ee3SNitin Gupta 	orig[1] = *(ptep + nptes / 2);
190*24e49ee3SNitin Gupta 	for (i = 0; i < nptes; i++) {
191*24e49ee3SNitin Gupta 		*ptep = entry;
19227137e52SSam Ravnborg 		ptep++;
19327137e52SSam Ravnborg 		addr += PAGE_SIZE;
19427137e52SSam Ravnborg 		pte_val(entry) += PAGE_SIZE;
19527137e52SSam Ravnborg 	}
196*24e49ee3SNitin Gupta 
197*24e49ee3SNitin Gupta 	/* Issue TLB flush at REAL_HPAGE_SIZE boundaries */
198*24e49ee3SNitin Gupta 	addr -= REAL_HPAGE_SIZE;
199*24e49ee3SNitin Gupta 	ptep -= nptes / 2;
200*24e49ee3SNitin Gupta 	maybe_tlb_batch_add(mm, addr, ptep, orig[1], 0);
201*24e49ee3SNitin Gupta 	addr -= REAL_HPAGE_SIZE;
202*24e49ee3SNitin Gupta 	ptep -= nptes / 2;
203*24e49ee3SNitin Gupta 	maybe_tlb_batch_add(mm, addr, ptep, orig[0], 0);
20427137e52SSam Ravnborg }
20527137e52SSam Ravnborg 
20627137e52SSam Ravnborg pte_t huge_ptep_get_and_clear(struct mm_struct *mm, unsigned long addr,
20727137e52SSam Ravnborg 			      pte_t *ptep)
20827137e52SSam Ravnborg {
20927137e52SSam Ravnborg 	pte_t entry;
21027137e52SSam Ravnborg 	int i;
211*24e49ee3SNitin Gupta 	unsigned long nptes;
21227137e52SSam Ravnborg 
21327137e52SSam Ravnborg 	entry = *ptep;
21427137e52SSam Ravnborg 	if (pte_present(entry))
21527137e52SSam Ravnborg 		mm->context.huge_pte_count--;
21627137e52SSam Ravnborg 
21727137e52SSam Ravnborg 	addr &= HPAGE_MASK;
218*24e49ee3SNitin Gupta 	nptes = 1 << HUGETLB_PAGE_ORDER;
219*24e49ee3SNitin Gupta 	for (i = 0; i < nptes; i++) {
220*24e49ee3SNitin Gupta 		*ptep = __pte(0UL);
22127137e52SSam Ravnborg 		addr += PAGE_SIZE;
22227137e52SSam Ravnborg 		ptep++;
22327137e52SSam Ravnborg 	}
22427137e52SSam Ravnborg 
225*24e49ee3SNitin Gupta 	/* Issue TLB flush at REAL_HPAGE_SIZE boundaries */
226*24e49ee3SNitin Gupta 	addr -= REAL_HPAGE_SIZE;
227*24e49ee3SNitin Gupta 	ptep -= nptes / 2;
228*24e49ee3SNitin Gupta 	maybe_tlb_batch_add(mm, addr, ptep, entry, 0);
229*24e49ee3SNitin Gupta 	addr -= REAL_HPAGE_SIZE;
230*24e49ee3SNitin Gupta 	ptep -= nptes / 2;
231*24e49ee3SNitin Gupta 	maybe_tlb_batch_add(mm, addr, ptep, entry, 0);
232*24e49ee3SNitin Gupta 
23327137e52SSam Ravnborg 	return entry;
23427137e52SSam Ravnborg }
23527137e52SSam Ravnborg 
23627137e52SSam Ravnborg int pmd_huge(pmd_t pmd)
23727137e52SSam Ravnborg {
23827137e52SSam Ravnborg 	return 0;
23927137e52SSam Ravnborg }
24027137e52SSam Ravnborg 
24127137e52SSam Ravnborg int pud_huge(pud_t pud)
24227137e52SSam Ravnborg {
24327137e52SSam Ravnborg 	return 0;
24427137e52SSam Ravnborg }
245