xref: /openbmc/linux/mm/mprotect.c (revision 6606c3e0da5360799e07ae24b05080cc85c68e72)
/*
 *  mm/mprotect.c
 *
 *  (C) Copyright 1994 Linus Torvalds
 *  (C) Copyright 2002 Christoph Hellwig
 *
 *  Address space accounting code	<alan@redhat.com>
 *  (C) Copyright 2002 Red Hat Inc, All Rights Reserved
 */
101da177e4SLinus Torvalds 
111da177e4SLinus Torvalds #include <linux/mm.h>
121da177e4SLinus Torvalds #include <linux/hugetlb.h>
131da177e4SLinus Torvalds #include <linux/slab.h>
141da177e4SLinus Torvalds #include <linux/shm.h>
151da177e4SLinus Torvalds #include <linux/mman.h>
161da177e4SLinus Torvalds #include <linux/fs.h>
171da177e4SLinus Torvalds #include <linux/highmem.h>
181da177e4SLinus Torvalds #include <linux/security.h>
191da177e4SLinus Torvalds #include <linux/mempolicy.h>
201da177e4SLinus Torvalds #include <linux/personality.h>
211da177e4SLinus Torvalds #include <linux/syscalls.h>
220697212aSChristoph Lameter #include <linux/swap.h>
230697212aSChristoph Lameter #include <linux/swapops.h>
241da177e4SLinus Torvalds #include <asm/uaccess.h>
251da177e4SLinus Torvalds #include <asm/pgtable.h>
261da177e4SLinus Torvalds #include <asm/cacheflush.h>
271da177e4SLinus Torvalds #include <asm/tlbflush.h>
281da177e4SLinus Torvalds 
291da177e4SLinus Torvalds static void change_pte_range(struct mm_struct *mm, pmd_t *pmd,
30c1e6098bSPeter Zijlstra 		unsigned long addr, unsigned long end, pgprot_t newprot,
31c1e6098bSPeter Zijlstra 		int dirty_accountable)
321da177e4SLinus Torvalds {
330697212aSChristoph Lameter 	pte_t *pte, oldpte;
34705e87c0SHugh Dickins 	spinlock_t *ptl;
351da177e4SLinus Torvalds 
36705e87c0SHugh Dickins 	pte = pte_offset_map_lock(mm, pmd, addr, &ptl);
37*6606c3e0SZachary Amsden 	arch_enter_lazy_mmu_mode();
381da177e4SLinus Torvalds 	do {
390697212aSChristoph Lameter 		oldpte = *pte;
400697212aSChristoph Lameter 		if (pte_present(oldpte)) {
411da177e4SLinus Torvalds 			pte_t ptent;
421da177e4SLinus Torvalds 
431da177e4SLinus Torvalds 			/* Avoid an SMP race with hardware updated dirty/clean
441da177e4SLinus Torvalds 			 * bits by wiping the pte and then setting the new pte
451da177e4SLinus Torvalds 			 * into place.
461da177e4SLinus Torvalds 			 */
47c1e6098bSPeter Zijlstra 			ptent = ptep_get_and_clear(mm, addr, pte);
48c1e6098bSPeter Zijlstra 			ptent = pte_modify(ptent, newprot);
49c1e6098bSPeter Zijlstra 			/*
50c1e6098bSPeter Zijlstra 			 * Avoid taking write faults for pages we know to be
51c1e6098bSPeter Zijlstra 			 * dirty.
52c1e6098bSPeter Zijlstra 			 */
53c1e6098bSPeter Zijlstra 			if (dirty_accountable && pte_dirty(ptent))
54c1e6098bSPeter Zijlstra 				ptent = pte_mkwrite(ptent);
551da177e4SLinus Torvalds 			set_pte_at(mm, addr, pte, ptent);
561da177e4SLinus Torvalds 			lazy_mmu_prot_update(ptent);
570697212aSChristoph Lameter #ifdef CONFIG_MIGRATION
580697212aSChristoph Lameter 		} else if (!pte_file(oldpte)) {
590697212aSChristoph Lameter 			swp_entry_t entry = pte_to_swp_entry(oldpte);
600697212aSChristoph Lameter 
610697212aSChristoph Lameter 			if (is_write_migration_entry(entry)) {
620697212aSChristoph Lameter 				/*
630697212aSChristoph Lameter 				 * A protection check is difficult so
640697212aSChristoph Lameter 				 * just be safe and disable write
650697212aSChristoph Lameter 				 */
660697212aSChristoph Lameter 				make_migration_entry_read(&entry);
670697212aSChristoph Lameter 				set_pte_at(mm, addr, pte,
680697212aSChristoph Lameter 					swp_entry_to_pte(entry));
691da177e4SLinus Torvalds 			}
700697212aSChristoph Lameter #endif
710697212aSChristoph Lameter 		}
720697212aSChristoph Lameter 
731da177e4SLinus Torvalds 	} while (pte++, addr += PAGE_SIZE, addr != end);
74*6606c3e0SZachary Amsden 	arch_leave_lazy_mmu_mode();
75705e87c0SHugh Dickins 	pte_unmap_unlock(pte - 1, ptl);
761da177e4SLinus Torvalds }
771da177e4SLinus Torvalds 
781da177e4SLinus Torvalds static inline void change_pmd_range(struct mm_struct *mm, pud_t *pud,
79c1e6098bSPeter Zijlstra 		unsigned long addr, unsigned long end, pgprot_t newprot,
80c1e6098bSPeter Zijlstra 		int dirty_accountable)
811da177e4SLinus Torvalds {
821da177e4SLinus Torvalds 	pmd_t *pmd;
831da177e4SLinus Torvalds 	unsigned long next;
841da177e4SLinus Torvalds 
851da177e4SLinus Torvalds 	pmd = pmd_offset(pud, addr);
861da177e4SLinus Torvalds 	do {
871da177e4SLinus Torvalds 		next = pmd_addr_end(addr, end);
881da177e4SLinus Torvalds 		if (pmd_none_or_clear_bad(pmd))
891da177e4SLinus Torvalds 			continue;
90c1e6098bSPeter Zijlstra 		change_pte_range(mm, pmd, addr, next, newprot, dirty_accountable);
911da177e4SLinus Torvalds 	} while (pmd++, addr = next, addr != end);
921da177e4SLinus Torvalds }
931da177e4SLinus Torvalds 
941da177e4SLinus Torvalds static inline void change_pud_range(struct mm_struct *mm, pgd_t *pgd,
95c1e6098bSPeter Zijlstra 		unsigned long addr, unsigned long end, pgprot_t newprot,
96c1e6098bSPeter Zijlstra 		int dirty_accountable)
971da177e4SLinus Torvalds {
981da177e4SLinus Torvalds 	pud_t *pud;
991da177e4SLinus Torvalds 	unsigned long next;
1001da177e4SLinus Torvalds 
1011da177e4SLinus Torvalds 	pud = pud_offset(pgd, addr);
1021da177e4SLinus Torvalds 	do {
1031da177e4SLinus Torvalds 		next = pud_addr_end(addr, end);
1041da177e4SLinus Torvalds 		if (pud_none_or_clear_bad(pud))
1051da177e4SLinus Torvalds 			continue;
106c1e6098bSPeter Zijlstra 		change_pmd_range(mm, pud, addr, next, newprot, dirty_accountable);
1071da177e4SLinus Torvalds 	} while (pud++, addr = next, addr != end);
1081da177e4SLinus Torvalds }
1091da177e4SLinus Torvalds 
1101da177e4SLinus Torvalds static void change_protection(struct vm_area_struct *vma,
111c1e6098bSPeter Zijlstra 		unsigned long addr, unsigned long end, pgprot_t newprot,
112c1e6098bSPeter Zijlstra 		int dirty_accountable)
1131da177e4SLinus Torvalds {
1141da177e4SLinus Torvalds 	struct mm_struct *mm = vma->vm_mm;
1151da177e4SLinus Torvalds 	pgd_t *pgd;
1161da177e4SLinus Torvalds 	unsigned long next;
1171da177e4SLinus Torvalds 	unsigned long start = addr;
1181da177e4SLinus Torvalds 
1191da177e4SLinus Torvalds 	BUG_ON(addr >= end);
1201da177e4SLinus Torvalds 	pgd = pgd_offset(mm, addr);
1211da177e4SLinus Torvalds 	flush_cache_range(vma, addr, end);
1221da177e4SLinus Torvalds 	do {
1231da177e4SLinus Torvalds 		next = pgd_addr_end(addr, end);
1241da177e4SLinus Torvalds 		if (pgd_none_or_clear_bad(pgd))
1251da177e4SLinus Torvalds 			continue;
126c1e6098bSPeter Zijlstra 		change_pud_range(mm, pgd, addr, next, newprot, dirty_accountable);
1271da177e4SLinus Torvalds 	} while (pgd++, addr = next, addr != end);
1281da177e4SLinus Torvalds 	flush_tlb_range(vma, start, end);
1291da177e4SLinus Torvalds }
1301da177e4SLinus Torvalds 
1311da177e4SLinus Torvalds static int
1321da177e4SLinus Torvalds mprotect_fixup(struct vm_area_struct *vma, struct vm_area_struct **pprev,
1331da177e4SLinus Torvalds 	unsigned long start, unsigned long end, unsigned long newflags)
1341da177e4SLinus Torvalds {
1351da177e4SLinus Torvalds 	struct mm_struct *mm = vma->vm_mm;
1361da177e4SLinus Torvalds 	unsigned long oldflags = vma->vm_flags;
1371da177e4SLinus Torvalds 	long nrpages = (end - start) >> PAGE_SHIFT;
1381da177e4SLinus Torvalds 	unsigned long charged = 0;
1391da177e4SLinus Torvalds 	pgoff_t pgoff;
1401da177e4SLinus Torvalds 	int error;
141c1e6098bSPeter Zijlstra 	int dirty_accountable = 0;
1421da177e4SLinus Torvalds 
1431da177e4SLinus Torvalds 	if (newflags == oldflags) {
1441da177e4SLinus Torvalds 		*pprev = vma;
1451da177e4SLinus Torvalds 		return 0;
1461da177e4SLinus Torvalds 	}
1471da177e4SLinus Torvalds 
1481da177e4SLinus Torvalds 	/*
1491da177e4SLinus Torvalds 	 * If we make a private mapping writable we increase our commit;
1501da177e4SLinus Torvalds 	 * but (without finer accounting) cannot reduce our commit if we
1511da177e4SLinus Torvalds 	 * make it unwritable again.
1521da177e4SLinus Torvalds 	 *
1531da177e4SLinus Torvalds 	 * FIXME? We haven't defined a VM_NORESERVE flag, so mprotecting
1541da177e4SLinus Torvalds 	 * a MAP_NORESERVE private mapping to writable will now reserve.
1551da177e4SLinus Torvalds 	 */
1561da177e4SLinus Torvalds 	if (newflags & VM_WRITE) {
1578f860591SZhang, Yanmin 		if (!(oldflags & (VM_ACCOUNT|VM_WRITE|VM_SHARED))) {
1581da177e4SLinus Torvalds 			charged = nrpages;
1591da177e4SLinus Torvalds 			if (security_vm_enough_memory(charged))
1601da177e4SLinus Torvalds 				return -ENOMEM;
1611da177e4SLinus Torvalds 			newflags |= VM_ACCOUNT;
1621da177e4SLinus Torvalds 		}
1631da177e4SLinus Torvalds 	}
1641da177e4SLinus Torvalds 
1651da177e4SLinus Torvalds 	/*
1661da177e4SLinus Torvalds 	 * First try to merge with previous and/or next vma.
1671da177e4SLinus Torvalds 	 */
1681da177e4SLinus Torvalds 	pgoff = vma->vm_pgoff + ((start - vma->vm_start) >> PAGE_SHIFT);
1691da177e4SLinus Torvalds 	*pprev = vma_merge(mm, *pprev, start, end, newflags,
1701da177e4SLinus Torvalds 			vma->anon_vma, vma->vm_file, pgoff, vma_policy(vma));
1711da177e4SLinus Torvalds 	if (*pprev) {
1721da177e4SLinus Torvalds 		vma = *pprev;
1731da177e4SLinus Torvalds 		goto success;
1741da177e4SLinus Torvalds 	}
1751da177e4SLinus Torvalds 
1761da177e4SLinus Torvalds 	*pprev = vma;
1771da177e4SLinus Torvalds 
1781da177e4SLinus Torvalds 	if (start != vma->vm_start) {
1791da177e4SLinus Torvalds 		error = split_vma(mm, vma, start, 1);
1801da177e4SLinus Torvalds 		if (error)
1811da177e4SLinus Torvalds 			goto fail;
1821da177e4SLinus Torvalds 	}
1831da177e4SLinus Torvalds 
1841da177e4SLinus Torvalds 	if (end != vma->vm_end) {
1851da177e4SLinus Torvalds 		error = split_vma(mm, vma, end, 0);
1861da177e4SLinus Torvalds 		if (error)
1871da177e4SLinus Torvalds 			goto fail;
1881da177e4SLinus Torvalds 	}
1891da177e4SLinus Torvalds 
1901da177e4SLinus Torvalds success:
1911da177e4SLinus Torvalds 	/*
1921da177e4SLinus Torvalds 	 * vm_flags and vm_page_prot are protected by the mmap_sem
1931da177e4SLinus Torvalds 	 * held in write mode.
1941da177e4SLinus Torvalds 	 */
1951da177e4SLinus Torvalds 	vma->vm_flags = newflags;
196d08b3851SPeter Zijlstra 	vma->vm_page_prot = protection_map[newflags &
197d08b3851SPeter Zijlstra 		(VM_READ|VM_WRITE|VM_EXEC|VM_SHARED)];
198c1e6098bSPeter Zijlstra 	if (vma_wants_writenotify(vma)) {
199d08b3851SPeter Zijlstra 		vma->vm_page_prot = protection_map[newflags &
200d08b3851SPeter Zijlstra 			(VM_READ|VM_WRITE|VM_EXEC)];
201c1e6098bSPeter Zijlstra 		dirty_accountable = 1;
202c1e6098bSPeter Zijlstra 	}
203d08b3851SPeter Zijlstra 
2048f860591SZhang, Yanmin 	if (is_vm_hugetlb_page(vma))
205d08b3851SPeter Zijlstra 		hugetlb_change_protection(vma, start, end, vma->vm_page_prot);
2068f860591SZhang, Yanmin 	else
207c1e6098bSPeter Zijlstra 		change_protection(vma, start, end, vma->vm_page_prot, dirty_accountable);
208ab50b8edSHugh Dickins 	vm_stat_account(mm, oldflags, vma->vm_file, -nrpages);
209ab50b8edSHugh Dickins 	vm_stat_account(mm, newflags, vma->vm_file, nrpages);
2101da177e4SLinus Torvalds 	return 0;
2111da177e4SLinus Torvalds 
2121da177e4SLinus Torvalds fail:
2131da177e4SLinus Torvalds 	vm_unacct_memory(charged);
2141da177e4SLinus Torvalds 	return error;
2151da177e4SLinus Torvalds }
2161da177e4SLinus Torvalds 
2171da177e4SLinus Torvalds asmlinkage long
2181da177e4SLinus Torvalds sys_mprotect(unsigned long start, size_t len, unsigned long prot)
2191da177e4SLinus Torvalds {
2201da177e4SLinus Torvalds 	unsigned long vm_flags, nstart, end, tmp, reqprot;
2211da177e4SLinus Torvalds 	struct vm_area_struct *vma, *prev;
2221da177e4SLinus Torvalds 	int error = -EINVAL;
2231da177e4SLinus Torvalds 	const int grows = prot & (PROT_GROWSDOWN|PROT_GROWSUP);
2241da177e4SLinus Torvalds 	prot &= ~(PROT_GROWSDOWN|PROT_GROWSUP);
2251da177e4SLinus Torvalds 	if (grows == (PROT_GROWSDOWN|PROT_GROWSUP)) /* can't be both */
2261da177e4SLinus Torvalds 		return -EINVAL;
2271da177e4SLinus Torvalds 
2281da177e4SLinus Torvalds 	if (start & ~PAGE_MASK)
2291da177e4SLinus Torvalds 		return -EINVAL;
2301da177e4SLinus Torvalds 	if (!len)
2311da177e4SLinus Torvalds 		return 0;
2321da177e4SLinus Torvalds 	len = PAGE_ALIGN(len);
2331da177e4SLinus Torvalds 	end = start + len;
2341da177e4SLinus Torvalds 	if (end <= start)
2351da177e4SLinus Torvalds 		return -ENOMEM;
2361da177e4SLinus Torvalds 	if (prot & ~(PROT_READ | PROT_WRITE | PROT_EXEC | PROT_SEM))
2371da177e4SLinus Torvalds 		return -EINVAL;
2381da177e4SLinus Torvalds 
2391da177e4SLinus Torvalds 	reqprot = prot;
2401da177e4SLinus Torvalds 	/*
2411da177e4SLinus Torvalds 	 * Does the application expect PROT_READ to imply PROT_EXEC:
2421da177e4SLinus Torvalds 	 */
243b344e05cSHua Zhong 	if ((prot & PROT_READ) && (current->personality & READ_IMPLIES_EXEC))
2441da177e4SLinus Torvalds 		prot |= PROT_EXEC;
2451da177e4SLinus Torvalds 
2461da177e4SLinus Torvalds 	vm_flags = calc_vm_prot_bits(prot);
2471da177e4SLinus Torvalds 
2481da177e4SLinus Torvalds 	down_write(&current->mm->mmap_sem);
2491da177e4SLinus Torvalds 
2501da177e4SLinus Torvalds 	vma = find_vma_prev(current->mm, start, &prev);
2511da177e4SLinus Torvalds 	error = -ENOMEM;
2521da177e4SLinus Torvalds 	if (!vma)
2531da177e4SLinus Torvalds 		goto out;
2541da177e4SLinus Torvalds 	if (unlikely(grows & PROT_GROWSDOWN)) {
2551da177e4SLinus Torvalds 		if (vma->vm_start >= end)
2561da177e4SLinus Torvalds 			goto out;
2571da177e4SLinus Torvalds 		start = vma->vm_start;
2581da177e4SLinus Torvalds 		error = -EINVAL;
2591da177e4SLinus Torvalds 		if (!(vma->vm_flags & VM_GROWSDOWN))
2601da177e4SLinus Torvalds 			goto out;
2611da177e4SLinus Torvalds 	}
2621da177e4SLinus Torvalds 	else {
2631da177e4SLinus Torvalds 		if (vma->vm_start > start)
2641da177e4SLinus Torvalds 			goto out;
2651da177e4SLinus Torvalds 		if (unlikely(grows & PROT_GROWSUP)) {
2661da177e4SLinus Torvalds 			end = vma->vm_end;
2671da177e4SLinus Torvalds 			error = -EINVAL;
2681da177e4SLinus Torvalds 			if (!(vma->vm_flags & VM_GROWSUP))
2691da177e4SLinus Torvalds 				goto out;
2701da177e4SLinus Torvalds 		}
2711da177e4SLinus Torvalds 	}
2721da177e4SLinus Torvalds 	if (start > vma->vm_start)
2731da177e4SLinus Torvalds 		prev = vma;
2741da177e4SLinus Torvalds 
2751da177e4SLinus Torvalds 	for (nstart = start ; ; ) {
2761da177e4SLinus Torvalds 		unsigned long newflags;
2771da177e4SLinus Torvalds 
2781da177e4SLinus Torvalds 		/* Here we know that  vma->vm_start <= nstart < vma->vm_end. */
2791da177e4SLinus Torvalds 
2801da177e4SLinus Torvalds 		newflags = vm_flags | (vma->vm_flags & ~(VM_READ | VM_WRITE | VM_EXEC));
2811da177e4SLinus Torvalds 
2827e2cff42SPaolo 'Blaisorblade' Giarrusso 		/* newflags >> 4 shift VM_MAY% in place of VM_% */
2837e2cff42SPaolo 'Blaisorblade' Giarrusso 		if ((newflags & ~(newflags >> 4)) & (VM_READ | VM_WRITE | VM_EXEC)) {
2841da177e4SLinus Torvalds 			error = -EACCES;
2851da177e4SLinus Torvalds 			goto out;
2861da177e4SLinus Torvalds 		}
2871da177e4SLinus Torvalds 
2881da177e4SLinus Torvalds 		error = security_file_mprotect(vma, reqprot, prot);
2891da177e4SLinus Torvalds 		if (error)
2901da177e4SLinus Torvalds 			goto out;
2911da177e4SLinus Torvalds 
2921da177e4SLinus Torvalds 		tmp = vma->vm_end;
2931da177e4SLinus Torvalds 		if (tmp > end)
2941da177e4SLinus Torvalds 			tmp = end;
2951da177e4SLinus Torvalds 		error = mprotect_fixup(vma, &prev, nstart, tmp, newflags);
2961da177e4SLinus Torvalds 		if (error)
2971da177e4SLinus Torvalds 			goto out;
2981da177e4SLinus Torvalds 		nstart = tmp;
2991da177e4SLinus Torvalds 
3001da177e4SLinus Torvalds 		if (nstart < prev->vm_end)
3011da177e4SLinus Torvalds 			nstart = prev->vm_end;
3021da177e4SLinus Torvalds 		if (nstart >= end)
3031da177e4SLinus Torvalds 			goto out;
3041da177e4SLinus Torvalds 
3051da177e4SLinus Torvalds 		vma = prev->vm_next;
3061da177e4SLinus Torvalds 		if (!vma || vma->vm_start != nstart) {
3071da177e4SLinus Torvalds 			error = -ENOMEM;
3081da177e4SLinus Torvalds 			goto out;
3091da177e4SLinus Torvalds 		}
3101da177e4SLinus Torvalds 	}
3111da177e4SLinus Torvalds out:
3121da177e4SLinus Torvalds 	up_write(&current->mm->mmap_sem);
3131da177e4SLinus Torvalds 	return error;
3141da177e4SLinus Torvalds }
315