xref: /openbmc/linux/mm/mprotect.c (revision 8f860591ffb29738cf5539b6fbf27f50dcdeb380)
11da177e4SLinus Torvalds /*
21da177e4SLinus Torvalds  *  mm/mprotect.c
31da177e4SLinus Torvalds  *
41da177e4SLinus Torvalds  *  (C) Copyright 1994 Linus Torvalds
51da177e4SLinus Torvalds  *  (C) Copyright 2002 Christoph Hellwig
61da177e4SLinus Torvalds  *
71da177e4SLinus Torvalds  *  Address space accounting code	<alan@redhat.com>
81da177e4SLinus Torvalds  *  (C) Copyright 2002 Red Hat Inc, All Rights Reserved
91da177e4SLinus Torvalds  */
101da177e4SLinus Torvalds 
111da177e4SLinus Torvalds #include <linux/mm.h>
121da177e4SLinus Torvalds #include <linux/hugetlb.h>
131da177e4SLinus Torvalds #include <linux/slab.h>
141da177e4SLinus Torvalds #include <linux/shm.h>
151da177e4SLinus Torvalds #include <linux/mman.h>
161da177e4SLinus Torvalds #include <linux/fs.h>
171da177e4SLinus Torvalds #include <linux/highmem.h>
181da177e4SLinus Torvalds #include <linux/security.h>
191da177e4SLinus Torvalds #include <linux/mempolicy.h>
201da177e4SLinus Torvalds #include <linux/personality.h>
211da177e4SLinus Torvalds #include <linux/syscalls.h>
221da177e4SLinus Torvalds 
231da177e4SLinus Torvalds #include <asm/uaccess.h>
241da177e4SLinus Torvalds #include <asm/pgtable.h>
251da177e4SLinus Torvalds #include <asm/cacheflush.h>
261da177e4SLinus Torvalds #include <asm/tlbflush.h>
271da177e4SLinus Torvalds 
281da177e4SLinus Torvalds static void change_pte_range(struct mm_struct *mm, pmd_t *pmd,
291da177e4SLinus Torvalds 		unsigned long addr, unsigned long end, pgprot_t newprot)
301da177e4SLinus Torvalds {
311da177e4SLinus Torvalds 	pte_t *pte;
32705e87c0SHugh Dickins 	spinlock_t *ptl;
331da177e4SLinus Torvalds 
34705e87c0SHugh Dickins 	pte = pte_offset_map_lock(mm, pmd, addr, &ptl);
351da177e4SLinus Torvalds 	do {
361da177e4SLinus Torvalds 		if (pte_present(*pte)) {
371da177e4SLinus Torvalds 			pte_t ptent;
381da177e4SLinus Torvalds 
391da177e4SLinus Torvalds 			/* Avoid an SMP race with hardware updated dirty/clean
401da177e4SLinus Torvalds 			 * bits by wiping the pte and then setting the new pte
411da177e4SLinus Torvalds 			 * into place.
421da177e4SLinus Torvalds 			 */
431da177e4SLinus Torvalds 			ptent = pte_modify(ptep_get_and_clear(mm, addr, pte), newprot);
441da177e4SLinus Torvalds 			set_pte_at(mm, addr, pte, ptent);
451da177e4SLinus Torvalds 			lazy_mmu_prot_update(ptent);
461da177e4SLinus Torvalds 		}
471da177e4SLinus Torvalds 	} while (pte++, addr += PAGE_SIZE, addr != end);
48705e87c0SHugh Dickins 	pte_unmap_unlock(pte - 1, ptl);
491da177e4SLinus Torvalds }
501da177e4SLinus Torvalds 
511da177e4SLinus Torvalds static inline void change_pmd_range(struct mm_struct *mm, pud_t *pud,
521da177e4SLinus Torvalds 		unsigned long addr, unsigned long end, pgprot_t newprot)
531da177e4SLinus Torvalds {
541da177e4SLinus Torvalds 	pmd_t *pmd;
551da177e4SLinus Torvalds 	unsigned long next;
561da177e4SLinus Torvalds 
571da177e4SLinus Torvalds 	pmd = pmd_offset(pud, addr);
581da177e4SLinus Torvalds 	do {
591da177e4SLinus Torvalds 		next = pmd_addr_end(addr, end);
601da177e4SLinus Torvalds 		if (pmd_none_or_clear_bad(pmd))
611da177e4SLinus Torvalds 			continue;
621da177e4SLinus Torvalds 		change_pte_range(mm, pmd, addr, next, newprot);
631da177e4SLinus Torvalds 	} while (pmd++, addr = next, addr != end);
641da177e4SLinus Torvalds }
651da177e4SLinus Torvalds 
661da177e4SLinus Torvalds static inline void change_pud_range(struct mm_struct *mm, pgd_t *pgd,
671da177e4SLinus Torvalds 		unsigned long addr, unsigned long end, pgprot_t newprot)
681da177e4SLinus Torvalds {
691da177e4SLinus Torvalds 	pud_t *pud;
701da177e4SLinus Torvalds 	unsigned long next;
711da177e4SLinus Torvalds 
721da177e4SLinus Torvalds 	pud = pud_offset(pgd, addr);
731da177e4SLinus Torvalds 	do {
741da177e4SLinus Torvalds 		next = pud_addr_end(addr, end);
751da177e4SLinus Torvalds 		if (pud_none_or_clear_bad(pud))
761da177e4SLinus Torvalds 			continue;
771da177e4SLinus Torvalds 		change_pmd_range(mm, pud, addr, next, newprot);
781da177e4SLinus Torvalds 	} while (pud++, addr = next, addr != end);
791da177e4SLinus Torvalds }
801da177e4SLinus Torvalds 
811da177e4SLinus Torvalds static void change_protection(struct vm_area_struct *vma,
821da177e4SLinus Torvalds 		unsigned long addr, unsigned long end, pgprot_t newprot)
831da177e4SLinus Torvalds {
841da177e4SLinus Torvalds 	struct mm_struct *mm = vma->vm_mm;
851da177e4SLinus Torvalds 	pgd_t *pgd;
861da177e4SLinus Torvalds 	unsigned long next;
871da177e4SLinus Torvalds 	unsigned long start = addr;
881da177e4SLinus Torvalds 
891da177e4SLinus Torvalds 	BUG_ON(addr >= end);
901da177e4SLinus Torvalds 	pgd = pgd_offset(mm, addr);
911da177e4SLinus Torvalds 	flush_cache_range(vma, addr, end);
921da177e4SLinus Torvalds 	do {
931da177e4SLinus Torvalds 		next = pgd_addr_end(addr, end);
941da177e4SLinus Torvalds 		if (pgd_none_or_clear_bad(pgd))
951da177e4SLinus Torvalds 			continue;
961da177e4SLinus Torvalds 		change_pud_range(mm, pgd, addr, next, newprot);
971da177e4SLinus Torvalds 	} while (pgd++, addr = next, addr != end);
981da177e4SLinus Torvalds 	flush_tlb_range(vma, start, end);
991da177e4SLinus Torvalds }
1001da177e4SLinus Torvalds 
1011da177e4SLinus Torvalds static int
1021da177e4SLinus Torvalds mprotect_fixup(struct vm_area_struct *vma, struct vm_area_struct **pprev,
1031da177e4SLinus Torvalds 	unsigned long start, unsigned long end, unsigned long newflags)
1041da177e4SLinus Torvalds {
1051da177e4SLinus Torvalds 	struct mm_struct *mm = vma->vm_mm;
1061da177e4SLinus Torvalds 	unsigned long oldflags = vma->vm_flags;
1071da177e4SLinus Torvalds 	long nrpages = (end - start) >> PAGE_SHIFT;
1081da177e4SLinus Torvalds 	unsigned long charged = 0;
1091da177e4SLinus Torvalds 	pgprot_t newprot;
1101da177e4SLinus Torvalds 	pgoff_t pgoff;
1111da177e4SLinus Torvalds 	int error;
1121da177e4SLinus Torvalds 
1131da177e4SLinus Torvalds 	if (newflags == oldflags) {
1141da177e4SLinus Torvalds 		*pprev = vma;
1151da177e4SLinus Torvalds 		return 0;
1161da177e4SLinus Torvalds 	}
1171da177e4SLinus Torvalds 
1181da177e4SLinus Torvalds 	/*
1191da177e4SLinus Torvalds 	 * If we make a private mapping writable we increase our commit;
1201da177e4SLinus Torvalds 	 * but (without finer accounting) cannot reduce our commit if we
1211da177e4SLinus Torvalds 	 * make it unwritable again.
1221da177e4SLinus Torvalds 	 *
1231da177e4SLinus Torvalds 	 * FIXME? We haven't defined a VM_NORESERVE flag, so mprotecting
1241da177e4SLinus Torvalds 	 * a MAP_NORESERVE private mapping to writable will now reserve.
1251da177e4SLinus Torvalds 	 */
1261da177e4SLinus Torvalds 	if (newflags & VM_WRITE) {
127*8f860591SZhang, Yanmin 		if (!(oldflags & (VM_ACCOUNT|VM_WRITE|VM_SHARED))) {
1281da177e4SLinus Torvalds 			charged = nrpages;
1291da177e4SLinus Torvalds 			if (security_vm_enough_memory(charged))
1301da177e4SLinus Torvalds 				return -ENOMEM;
1311da177e4SLinus Torvalds 			newflags |= VM_ACCOUNT;
1321da177e4SLinus Torvalds 		}
1331da177e4SLinus Torvalds 	}
1341da177e4SLinus Torvalds 
1351da177e4SLinus Torvalds 	newprot = protection_map[newflags & 0xf];
1361da177e4SLinus Torvalds 
1371da177e4SLinus Torvalds 	/*
1381da177e4SLinus Torvalds 	 * First try to merge with previous and/or next vma.
1391da177e4SLinus Torvalds 	 */
1401da177e4SLinus Torvalds 	pgoff = vma->vm_pgoff + ((start - vma->vm_start) >> PAGE_SHIFT);
1411da177e4SLinus Torvalds 	*pprev = vma_merge(mm, *pprev, start, end, newflags,
1421da177e4SLinus Torvalds 			vma->anon_vma, vma->vm_file, pgoff, vma_policy(vma));
1431da177e4SLinus Torvalds 	if (*pprev) {
1441da177e4SLinus Torvalds 		vma = *pprev;
1451da177e4SLinus Torvalds 		goto success;
1461da177e4SLinus Torvalds 	}
1471da177e4SLinus Torvalds 
1481da177e4SLinus Torvalds 	*pprev = vma;
1491da177e4SLinus Torvalds 
1501da177e4SLinus Torvalds 	if (start != vma->vm_start) {
1511da177e4SLinus Torvalds 		error = split_vma(mm, vma, start, 1);
1521da177e4SLinus Torvalds 		if (error)
1531da177e4SLinus Torvalds 			goto fail;
1541da177e4SLinus Torvalds 	}
1551da177e4SLinus Torvalds 
1561da177e4SLinus Torvalds 	if (end != vma->vm_end) {
1571da177e4SLinus Torvalds 		error = split_vma(mm, vma, end, 0);
1581da177e4SLinus Torvalds 		if (error)
1591da177e4SLinus Torvalds 			goto fail;
1601da177e4SLinus Torvalds 	}
1611da177e4SLinus Torvalds 
1621da177e4SLinus Torvalds success:
1631da177e4SLinus Torvalds 	/*
1641da177e4SLinus Torvalds 	 * vm_flags and vm_page_prot are protected by the mmap_sem
1651da177e4SLinus Torvalds 	 * held in write mode.
1661da177e4SLinus Torvalds 	 */
1671da177e4SLinus Torvalds 	vma->vm_flags = newflags;
1681da177e4SLinus Torvalds 	vma->vm_page_prot = newprot;
169*8f860591SZhang, Yanmin 	if (is_vm_hugetlb_page(vma))
170*8f860591SZhang, Yanmin 		hugetlb_change_protection(vma, start, end, newprot);
171*8f860591SZhang, Yanmin 	else
1721da177e4SLinus Torvalds 		change_protection(vma, start, end, newprot);
173ab50b8edSHugh Dickins 	vm_stat_account(mm, oldflags, vma->vm_file, -nrpages);
174ab50b8edSHugh Dickins 	vm_stat_account(mm, newflags, vma->vm_file, nrpages);
1751da177e4SLinus Torvalds 	return 0;
1761da177e4SLinus Torvalds 
1771da177e4SLinus Torvalds fail:
1781da177e4SLinus Torvalds 	vm_unacct_memory(charged);
1791da177e4SLinus Torvalds 	return error;
1801da177e4SLinus Torvalds }
1811da177e4SLinus Torvalds 
1821da177e4SLinus Torvalds asmlinkage long
1831da177e4SLinus Torvalds sys_mprotect(unsigned long start, size_t len, unsigned long prot)
1841da177e4SLinus Torvalds {
1851da177e4SLinus Torvalds 	unsigned long vm_flags, nstart, end, tmp, reqprot;
1861da177e4SLinus Torvalds 	struct vm_area_struct *vma, *prev;
1871da177e4SLinus Torvalds 	int error = -EINVAL;
1881da177e4SLinus Torvalds 	const int grows = prot & (PROT_GROWSDOWN|PROT_GROWSUP);
1891da177e4SLinus Torvalds 	prot &= ~(PROT_GROWSDOWN|PROT_GROWSUP);
1901da177e4SLinus Torvalds 	if (grows == (PROT_GROWSDOWN|PROT_GROWSUP)) /* can't be both */
1911da177e4SLinus Torvalds 		return -EINVAL;
1921da177e4SLinus Torvalds 
1931da177e4SLinus Torvalds 	if (start & ~PAGE_MASK)
1941da177e4SLinus Torvalds 		return -EINVAL;
1951da177e4SLinus Torvalds 	if (!len)
1961da177e4SLinus Torvalds 		return 0;
1971da177e4SLinus Torvalds 	len = PAGE_ALIGN(len);
1981da177e4SLinus Torvalds 	end = start + len;
1991da177e4SLinus Torvalds 	if (end <= start)
2001da177e4SLinus Torvalds 		return -ENOMEM;
2011da177e4SLinus Torvalds 	if (prot & ~(PROT_READ | PROT_WRITE | PROT_EXEC | PROT_SEM))
2021da177e4SLinus Torvalds 		return -EINVAL;
2031da177e4SLinus Torvalds 
2041da177e4SLinus Torvalds 	reqprot = prot;
2051da177e4SLinus Torvalds 	/*
2061da177e4SLinus Torvalds 	 * Does the application expect PROT_READ to imply PROT_EXEC:
2071da177e4SLinus Torvalds 	 */
2081da177e4SLinus Torvalds 	if (unlikely((prot & PROT_READ) &&
2091da177e4SLinus Torvalds 			(current->personality & READ_IMPLIES_EXEC)))
2101da177e4SLinus Torvalds 		prot |= PROT_EXEC;
2111da177e4SLinus Torvalds 
2121da177e4SLinus Torvalds 	vm_flags = calc_vm_prot_bits(prot);
2131da177e4SLinus Torvalds 
2141da177e4SLinus Torvalds 	down_write(&current->mm->mmap_sem);
2151da177e4SLinus Torvalds 
2161da177e4SLinus Torvalds 	vma = find_vma_prev(current->mm, start, &prev);
2171da177e4SLinus Torvalds 	error = -ENOMEM;
2181da177e4SLinus Torvalds 	if (!vma)
2191da177e4SLinus Torvalds 		goto out;
2201da177e4SLinus Torvalds 	if (unlikely(grows & PROT_GROWSDOWN)) {
2211da177e4SLinus Torvalds 		if (vma->vm_start >= end)
2221da177e4SLinus Torvalds 			goto out;
2231da177e4SLinus Torvalds 		start = vma->vm_start;
2241da177e4SLinus Torvalds 		error = -EINVAL;
2251da177e4SLinus Torvalds 		if (!(vma->vm_flags & VM_GROWSDOWN))
2261da177e4SLinus Torvalds 			goto out;
2271da177e4SLinus Torvalds 	}
2281da177e4SLinus Torvalds 	else {
2291da177e4SLinus Torvalds 		if (vma->vm_start > start)
2301da177e4SLinus Torvalds 			goto out;
2311da177e4SLinus Torvalds 		if (unlikely(grows & PROT_GROWSUP)) {
2321da177e4SLinus Torvalds 			end = vma->vm_end;
2331da177e4SLinus Torvalds 			error = -EINVAL;
2341da177e4SLinus Torvalds 			if (!(vma->vm_flags & VM_GROWSUP))
2351da177e4SLinus Torvalds 				goto out;
2361da177e4SLinus Torvalds 		}
2371da177e4SLinus Torvalds 	}
2381da177e4SLinus Torvalds 	if (start > vma->vm_start)
2391da177e4SLinus Torvalds 		prev = vma;
2401da177e4SLinus Torvalds 
2411da177e4SLinus Torvalds 	for (nstart = start ; ; ) {
2421da177e4SLinus Torvalds 		unsigned long newflags;
2431da177e4SLinus Torvalds 
2441da177e4SLinus Torvalds 		/* Here we know that  vma->vm_start <= nstart < vma->vm_end. */
2451da177e4SLinus Torvalds 
2461da177e4SLinus Torvalds 		newflags = vm_flags | (vma->vm_flags & ~(VM_READ | VM_WRITE | VM_EXEC));
2471da177e4SLinus Torvalds 
2487e2cff42SPaolo 'Blaisorblade' Giarrusso 		/* newflags >> 4 shift VM_MAY% in place of VM_% */
2497e2cff42SPaolo 'Blaisorblade' Giarrusso 		if ((newflags & ~(newflags >> 4)) & (VM_READ | VM_WRITE | VM_EXEC)) {
2501da177e4SLinus Torvalds 			error = -EACCES;
2511da177e4SLinus Torvalds 			goto out;
2521da177e4SLinus Torvalds 		}
2531da177e4SLinus Torvalds 
2541da177e4SLinus Torvalds 		error = security_file_mprotect(vma, reqprot, prot);
2551da177e4SLinus Torvalds 		if (error)
2561da177e4SLinus Torvalds 			goto out;
2571da177e4SLinus Torvalds 
2581da177e4SLinus Torvalds 		tmp = vma->vm_end;
2591da177e4SLinus Torvalds 		if (tmp > end)
2601da177e4SLinus Torvalds 			tmp = end;
2611da177e4SLinus Torvalds 		error = mprotect_fixup(vma, &prev, nstart, tmp, newflags);
2621da177e4SLinus Torvalds 		if (error)
2631da177e4SLinus Torvalds 			goto out;
2641da177e4SLinus Torvalds 		nstart = tmp;
2651da177e4SLinus Torvalds 
2661da177e4SLinus Torvalds 		if (nstart < prev->vm_end)
2671da177e4SLinus Torvalds 			nstart = prev->vm_end;
2681da177e4SLinus Torvalds 		if (nstart >= end)
2691da177e4SLinus Torvalds 			goto out;
2701da177e4SLinus Torvalds 
2711da177e4SLinus Torvalds 		vma = prev->vm_next;
2721da177e4SLinus Torvalds 		if (!vma || vma->vm_start != nstart) {
2731da177e4SLinus Torvalds 			error = -ENOMEM;
2741da177e4SLinus Torvalds 			goto out;
2751da177e4SLinus Torvalds 		}
2761da177e4SLinus Torvalds 	}
2771da177e4SLinus Torvalds out:
2781da177e4SLinus Torvalds 	up_write(&current->mm->mmap_sem);
2791da177e4SLinus Torvalds 	return error;
2801da177e4SLinus Torvalds }
281