xref: /openbmc/linux/mm/mprotect.c (revision 1ddd439ef987c9f0209e6ce824b67518f2afe67b)
/*
 *  mm/mprotect.c
 *
 *  (C) Copyright 1994 Linus Torvalds
 *  (C) Copyright 2002 Christoph Hellwig
 *
 *  Address space accounting code	<alan@redhat.com>
 *  (C) Copyright 2002 Red Hat Inc, All Rights Reserved
 */
101da177e4SLinus Torvalds 
111da177e4SLinus Torvalds #include <linux/mm.h>
121da177e4SLinus Torvalds #include <linux/hugetlb.h>
131da177e4SLinus Torvalds #include <linux/slab.h>
141da177e4SLinus Torvalds #include <linux/shm.h>
151da177e4SLinus Torvalds #include <linux/mman.h>
161da177e4SLinus Torvalds #include <linux/fs.h>
171da177e4SLinus Torvalds #include <linux/highmem.h>
181da177e4SLinus Torvalds #include <linux/security.h>
191da177e4SLinus Torvalds #include <linux/mempolicy.h>
201da177e4SLinus Torvalds #include <linux/personality.h>
211da177e4SLinus Torvalds #include <linux/syscalls.h>
220697212aSChristoph Lameter #include <linux/swap.h>
230697212aSChristoph Lameter #include <linux/swapops.h>
241da177e4SLinus Torvalds #include <asm/uaccess.h>
251da177e4SLinus Torvalds #include <asm/pgtable.h>
261da177e4SLinus Torvalds #include <asm/cacheflush.h>
271da177e4SLinus Torvalds #include <asm/tlbflush.h>
281da177e4SLinus Torvalds 
291da177e4SLinus Torvalds static void change_pte_range(struct mm_struct *mm, pmd_t *pmd,
30c1e6098bSPeter Zijlstra 		unsigned long addr, unsigned long end, pgprot_t newprot,
31c1e6098bSPeter Zijlstra 		int dirty_accountable)
321da177e4SLinus Torvalds {
330697212aSChristoph Lameter 	pte_t *pte, oldpte;
34705e87c0SHugh Dickins 	spinlock_t *ptl;
351da177e4SLinus Torvalds 
36705e87c0SHugh Dickins 	pte = pte_offset_map_lock(mm, pmd, addr, &ptl);
376606c3e0SZachary Amsden 	arch_enter_lazy_mmu_mode();
381da177e4SLinus Torvalds 	do {
390697212aSChristoph Lameter 		oldpte = *pte;
400697212aSChristoph Lameter 		if (pte_present(oldpte)) {
411da177e4SLinus Torvalds 			pte_t ptent;
421da177e4SLinus Torvalds 
431da177e4SLinus Torvalds 			/* Avoid an SMP race with hardware updated dirty/clean
441da177e4SLinus Torvalds 			 * bits by wiping the pte and then setting the new pte
451da177e4SLinus Torvalds 			 * into place.
461da177e4SLinus Torvalds 			 */
47c1e6098bSPeter Zijlstra 			ptent = ptep_get_and_clear(mm, addr, pte);
48c1e6098bSPeter Zijlstra 			ptent = pte_modify(ptent, newprot);
49c1e6098bSPeter Zijlstra 			/*
50c1e6098bSPeter Zijlstra 			 * Avoid taking write faults for pages we know to be
51c1e6098bSPeter Zijlstra 			 * dirty.
52c1e6098bSPeter Zijlstra 			 */
53c1e6098bSPeter Zijlstra 			if (dirty_accountable && pte_dirty(ptent))
54c1e6098bSPeter Zijlstra 				ptent = pte_mkwrite(ptent);
551da177e4SLinus Torvalds 			set_pte_at(mm, addr, pte, ptent);
560697212aSChristoph Lameter #ifdef CONFIG_MIGRATION
570697212aSChristoph Lameter 		} else if (!pte_file(oldpte)) {
580697212aSChristoph Lameter 			swp_entry_t entry = pte_to_swp_entry(oldpte);
590697212aSChristoph Lameter 
600697212aSChristoph Lameter 			if (is_write_migration_entry(entry)) {
610697212aSChristoph Lameter 				/*
620697212aSChristoph Lameter 				 * A protection check is difficult so
630697212aSChristoph Lameter 				 * just be safe and disable write
640697212aSChristoph Lameter 				 */
650697212aSChristoph Lameter 				make_migration_entry_read(&entry);
660697212aSChristoph Lameter 				set_pte_at(mm, addr, pte,
670697212aSChristoph Lameter 					swp_entry_to_pte(entry));
681da177e4SLinus Torvalds 			}
690697212aSChristoph Lameter #endif
700697212aSChristoph Lameter 		}
710697212aSChristoph Lameter 
721da177e4SLinus Torvalds 	} while (pte++, addr += PAGE_SIZE, addr != end);
736606c3e0SZachary Amsden 	arch_leave_lazy_mmu_mode();
74705e87c0SHugh Dickins 	pte_unmap_unlock(pte - 1, ptl);
751da177e4SLinus Torvalds }
761da177e4SLinus Torvalds 
771da177e4SLinus Torvalds static inline void change_pmd_range(struct mm_struct *mm, pud_t *pud,
78c1e6098bSPeter Zijlstra 		unsigned long addr, unsigned long end, pgprot_t newprot,
79c1e6098bSPeter Zijlstra 		int dirty_accountable)
801da177e4SLinus Torvalds {
811da177e4SLinus Torvalds 	pmd_t *pmd;
821da177e4SLinus Torvalds 	unsigned long next;
831da177e4SLinus Torvalds 
841da177e4SLinus Torvalds 	pmd = pmd_offset(pud, addr);
851da177e4SLinus Torvalds 	do {
861da177e4SLinus Torvalds 		next = pmd_addr_end(addr, end);
871da177e4SLinus Torvalds 		if (pmd_none_or_clear_bad(pmd))
881da177e4SLinus Torvalds 			continue;
89c1e6098bSPeter Zijlstra 		change_pte_range(mm, pmd, addr, next, newprot, dirty_accountable);
901da177e4SLinus Torvalds 	} while (pmd++, addr = next, addr != end);
911da177e4SLinus Torvalds }
921da177e4SLinus Torvalds 
931da177e4SLinus Torvalds static inline void change_pud_range(struct mm_struct *mm, pgd_t *pgd,
94c1e6098bSPeter Zijlstra 		unsigned long addr, unsigned long end, pgprot_t newprot,
95c1e6098bSPeter Zijlstra 		int dirty_accountable)
961da177e4SLinus Torvalds {
971da177e4SLinus Torvalds 	pud_t *pud;
981da177e4SLinus Torvalds 	unsigned long next;
991da177e4SLinus Torvalds 
1001da177e4SLinus Torvalds 	pud = pud_offset(pgd, addr);
1011da177e4SLinus Torvalds 	do {
1021da177e4SLinus Torvalds 		next = pud_addr_end(addr, end);
1031da177e4SLinus Torvalds 		if (pud_none_or_clear_bad(pud))
1041da177e4SLinus Torvalds 			continue;
105c1e6098bSPeter Zijlstra 		change_pmd_range(mm, pud, addr, next, newprot, dirty_accountable);
1061da177e4SLinus Torvalds 	} while (pud++, addr = next, addr != end);
1071da177e4SLinus Torvalds }
1081da177e4SLinus Torvalds 
1091da177e4SLinus Torvalds static void change_protection(struct vm_area_struct *vma,
110c1e6098bSPeter Zijlstra 		unsigned long addr, unsigned long end, pgprot_t newprot,
111c1e6098bSPeter Zijlstra 		int dirty_accountable)
1121da177e4SLinus Torvalds {
1131da177e4SLinus Torvalds 	struct mm_struct *mm = vma->vm_mm;
1141da177e4SLinus Torvalds 	pgd_t *pgd;
1151da177e4SLinus Torvalds 	unsigned long next;
1161da177e4SLinus Torvalds 	unsigned long start = addr;
1171da177e4SLinus Torvalds 
1181da177e4SLinus Torvalds 	BUG_ON(addr >= end);
1191da177e4SLinus Torvalds 	pgd = pgd_offset(mm, addr);
1201da177e4SLinus Torvalds 	flush_cache_range(vma, addr, end);
1211da177e4SLinus Torvalds 	do {
1221da177e4SLinus Torvalds 		next = pgd_addr_end(addr, end);
1231da177e4SLinus Torvalds 		if (pgd_none_or_clear_bad(pgd))
1241da177e4SLinus Torvalds 			continue;
125c1e6098bSPeter Zijlstra 		change_pud_range(mm, pgd, addr, next, newprot, dirty_accountable);
1261da177e4SLinus Torvalds 	} while (pgd++, addr = next, addr != end);
1271da177e4SLinus Torvalds 	flush_tlb_range(vma, start, end);
1281da177e4SLinus Torvalds }
1291da177e4SLinus Torvalds 
130b6a2fea3SOllie Wild int
1311da177e4SLinus Torvalds mprotect_fixup(struct vm_area_struct *vma, struct vm_area_struct **pprev,
1321da177e4SLinus Torvalds 	unsigned long start, unsigned long end, unsigned long newflags)
1331da177e4SLinus Torvalds {
1341da177e4SLinus Torvalds 	struct mm_struct *mm = vma->vm_mm;
1351da177e4SLinus Torvalds 	unsigned long oldflags = vma->vm_flags;
1361da177e4SLinus Torvalds 	long nrpages = (end - start) >> PAGE_SHIFT;
1371da177e4SLinus Torvalds 	unsigned long charged = 0;
1381da177e4SLinus Torvalds 	pgoff_t pgoff;
1391da177e4SLinus Torvalds 	int error;
140c1e6098bSPeter Zijlstra 	int dirty_accountable = 0;
1411da177e4SLinus Torvalds 
1421da177e4SLinus Torvalds 	if (newflags == oldflags) {
1431da177e4SLinus Torvalds 		*pprev = vma;
1441da177e4SLinus Torvalds 		return 0;
1451da177e4SLinus Torvalds 	}
1461da177e4SLinus Torvalds 
1471da177e4SLinus Torvalds 	/*
1481da177e4SLinus Torvalds 	 * If we make a private mapping writable we increase our commit;
1491da177e4SLinus Torvalds 	 * but (without finer accounting) cannot reduce our commit if we
1501da177e4SLinus Torvalds 	 * make it unwritable again.
1511da177e4SLinus Torvalds 	 *
1521da177e4SLinus Torvalds 	 * FIXME? We haven't defined a VM_NORESERVE flag, so mprotecting
1531da177e4SLinus Torvalds 	 * a MAP_NORESERVE private mapping to writable will now reserve.
1541da177e4SLinus Torvalds 	 */
1551da177e4SLinus Torvalds 	if (newflags & VM_WRITE) {
1568f860591SZhang, Yanmin 		if (!(oldflags & (VM_ACCOUNT|VM_WRITE|VM_SHARED))) {
1571da177e4SLinus Torvalds 			charged = nrpages;
1581da177e4SLinus Torvalds 			if (security_vm_enough_memory(charged))
1591da177e4SLinus Torvalds 				return -ENOMEM;
1601da177e4SLinus Torvalds 			newflags |= VM_ACCOUNT;
1611da177e4SLinus Torvalds 		}
1621da177e4SLinus Torvalds 	}
1631da177e4SLinus Torvalds 
1641da177e4SLinus Torvalds 	/*
1651da177e4SLinus Torvalds 	 * First try to merge with previous and/or next vma.
1661da177e4SLinus Torvalds 	 */
1671da177e4SLinus Torvalds 	pgoff = vma->vm_pgoff + ((start - vma->vm_start) >> PAGE_SHIFT);
1681da177e4SLinus Torvalds 	*pprev = vma_merge(mm, *pprev, start, end, newflags,
1691da177e4SLinus Torvalds 			vma->anon_vma, vma->vm_file, pgoff, vma_policy(vma));
1701da177e4SLinus Torvalds 	if (*pprev) {
1711da177e4SLinus Torvalds 		vma = *pprev;
1721da177e4SLinus Torvalds 		goto success;
1731da177e4SLinus Torvalds 	}
1741da177e4SLinus Torvalds 
1751da177e4SLinus Torvalds 	*pprev = vma;
1761da177e4SLinus Torvalds 
1771da177e4SLinus Torvalds 	if (start != vma->vm_start) {
1781da177e4SLinus Torvalds 		error = split_vma(mm, vma, start, 1);
1791da177e4SLinus Torvalds 		if (error)
1801da177e4SLinus Torvalds 			goto fail;
1811da177e4SLinus Torvalds 	}
1821da177e4SLinus Torvalds 
1831da177e4SLinus Torvalds 	if (end != vma->vm_end) {
1841da177e4SLinus Torvalds 		error = split_vma(mm, vma, end, 0);
1851da177e4SLinus Torvalds 		if (error)
1861da177e4SLinus Torvalds 			goto fail;
1871da177e4SLinus Torvalds 	}
1881da177e4SLinus Torvalds 
1891da177e4SLinus Torvalds success:
1901da177e4SLinus Torvalds 	/*
1911da177e4SLinus Torvalds 	 * vm_flags and vm_page_prot are protected by the mmap_sem
1921da177e4SLinus Torvalds 	 * held in write mode.
1931da177e4SLinus Torvalds 	 */
1941da177e4SLinus Torvalds 	vma->vm_flags = newflags;
1953ed75eb8SColy Li 	vma->vm_page_prot = vm_get_page_prot(newflags);
196c1e6098bSPeter Zijlstra 	if (vma_wants_writenotify(vma)) {
197*1ddd439eSHugh Dickins 		vma->vm_page_prot = vm_get_page_prot(newflags & ~VM_SHARED);
198c1e6098bSPeter Zijlstra 		dirty_accountable = 1;
199c1e6098bSPeter Zijlstra 	}
200d08b3851SPeter Zijlstra 
2018f860591SZhang, Yanmin 	if (is_vm_hugetlb_page(vma))
202d08b3851SPeter Zijlstra 		hugetlb_change_protection(vma, start, end, vma->vm_page_prot);
2038f860591SZhang, Yanmin 	else
204c1e6098bSPeter Zijlstra 		change_protection(vma, start, end, vma->vm_page_prot, dirty_accountable);
205ab50b8edSHugh Dickins 	vm_stat_account(mm, oldflags, vma->vm_file, -nrpages);
206ab50b8edSHugh Dickins 	vm_stat_account(mm, newflags, vma->vm_file, nrpages);
2071da177e4SLinus Torvalds 	return 0;
2081da177e4SLinus Torvalds 
2091da177e4SLinus Torvalds fail:
2101da177e4SLinus Torvalds 	vm_unacct_memory(charged);
2111da177e4SLinus Torvalds 	return error;
2121da177e4SLinus Torvalds }
2131da177e4SLinus Torvalds 
2141da177e4SLinus Torvalds asmlinkage long
2151da177e4SLinus Torvalds sys_mprotect(unsigned long start, size_t len, unsigned long prot)
2161da177e4SLinus Torvalds {
2171da177e4SLinus Torvalds 	unsigned long vm_flags, nstart, end, tmp, reqprot;
2181da177e4SLinus Torvalds 	struct vm_area_struct *vma, *prev;
2191da177e4SLinus Torvalds 	int error = -EINVAL;
2201da177e4SLinus Torvalds 	const int grows = prot & (PROT_GROWSDOWN|PROT_GROWSUP);
2211da177e4SLinus Torvalds 	prot &= ~(PROT_GROWSDOWN|PROT_GROWSUP);
2221da177e4SLinus Torvalds 	if (grows == (PROT_GROWSDOWN|PROT_GROWSUP)) /* can't be both */
2231da177e4SLinus Torvalds 		return -EINVAL;
2241da177e4SLinus Torvalds 
2251da177e4SLinus Torvalds 	if (start & ~PAGE_MASK)
2261da177e4SLinus Torvalds 		return -EINVAL;
2271da177e4SLinus Torvalds 	if (!len)
2281da177e4SLinus Torvalds 		return 0;
2291da177e4SLinus Torvalds 	len = PAGE_ALIGN(len);
2301da177e4SLinus Torvalds 	end = start + len;
2311da177e4SLinus Torvalds 	if (end <= start)
2321da177e4SLinus Torvalds 		return -ENOMEM;
2331da177e4SLinus Torvalds 	if (prot & ~(PROT_READ | PROT_WRITE | PROT_EXEC | PROT_SEM))
2341da177e4SLinus Torvalds 		return -EINVAL;
2351da177e4SLinus Torvalds 
2361da177e4SLinus Torvalds 	reqprot = prot;
2371da177e4SLinus Torvalds 	/*
2381da177e4SLinus Torvalds 	 * Does the application expect PROT_READ to imply PROT_EXEC:
2391da177e4SLinus Torvalds 	 */
240b344e05cSHua Zhong 	if ((prot & PROT_READ) && (current->personality & READ_IMPLIES_EXEC))
2411da177e4SLinus Torvalds 		prot |= PROT_EXEC;
2421da177e4SLinus Torvalds 
2431da177e4SLinus Torvalds 	vm_flags = calc_vm_prot_bits(prot);
2441da177e4SLinus Torvalds 
2451da177e4SLinus Torvalds 	down_write(&current->mm->mmap_sem);
2461da177e4SLinus Torvalds 
2471da177e4SLinus Torvalds 	vma = find_vma_prev(current->mm, start, &prev);
2481da177e4SLinus Torvalds 	error = -ENOMEM;
2491da177e4SLinus Torvalds 	if (!vma)
2501da177e4SLinus Torvalds 		goto out;
2511da177e4SLinus Torvalds 	if (unlikely(grows & PROT_GROWSDOWN)) {
2521da177e4SLinus Torvalds 		if (vma->vm_start >= end)
2531da177e4SLinus Torvalds 			goto out;
2541da177e4SLinus Torvalds 		start = vma->vm_start;
2551da177e4SLinus Torvalds 		error = -EINVAL;
2561da177e4SLinus Torvalds 		if (!(vma->vm_flags & VM_GROWSDOWN))
2571da177e4SLinus Torvalds 			goto out;
2581da177e4SLinus Torvalds 	}
2591da177e4SLinus Torvalds 	else {
2601da177e4SLinus Torvalds 		if (vma->vm_start > start)
2611da177e4SLinus Torvalds 			goto out;
2621da177e4SLinus Torvalds 		if (unlikely(grows & PROT_GROWSUP)) {
2631da177e4SLinus Torvalds 			end = vma->vm_end;
2641da177e4SLinus Torvalds 			error = -EINVAL;
2651da177e4SLinus Torvalds 			if (!(vma->vm_flags & VM_GROWSUP))
2661da177e4SLinus Torvalds 				goto out;
2671da177e4SLinus Torvalds 		}
2681da177e4SLinus Torvalds 	}
2691da177e4SLinus Torvalds 	if (start > vma->vm_start)
2701da177e4SLinus Torvalds 		prev = vma;
2711da177e4SLinus Torvalds 
2721da177e4SLinus Torvalds 	for (nstart = start ; ; ) {
2731da177e4SLinus Torvalds 		unsigned long newflags;
2741da177e4SLinus Torvalds 
2751da177e4SLinus Torvalds 		/* Here we know that  vma->vm_start <= nstart < vma->vm_end. */
2761da177e4SLinus Torvalds 
2771da177e4SLinus Torvalds 		newflags = vm_flags | (vma->vm_flags & ~(VM_READ | VM_WRITE | VM_EXEC));
2781da177e4SLinus Torvalds 
2797e2cff42SPaolo 'Blaisorblade' Giarrusso 		/* newflags >> 4 shift VM_MAY% in place of VM_% */
2807e2cff42SPaolo 'Blaisorblade' Giarrusso 		if ((newflags & ~(newflags >> 4)) & (VM_READ | VM_WRITE | VM_EXEC)) {
2811da177e4SLinus Torvalds 			error = -EACCES;
2821da177e4SLinus Torvalds 			goto out;
2831da177e4SLinus Torvalds 		}
2841da177e4SLinus Torvalds 
2851da177e4SLinus Torvalds 		error = security_file_mprotect(vma, reqprot, prot);
2861da177e4SLinus Torvalds 		if (error)
2871da177e4SLinus Torvalds 			goto out;
2881da177e4SLinus Torvalds 
2891da177e4SLinus Torvalds 		tmp = vma->vm_end;
2901da177e4SLinus Torvalds 		if (tmp > end)
2911da177e4SLinus Torvalds 			tmp = end;
2921da177e4SLinus Torvalds 		error = mprotect_fixup(vma, &prev, nstart, tmp, newflags);
2931da177e4SLinus Torvalds 		if (error)
2941da177e4SLinus Torvalds 			goto out;
2951da177e4SLinus Torvalds 		nstart = tmp;
2961da177e4SLinus Torvalds 
2971da177e4SLinus Torvalds 		if (nstart < prev->vm_end)
2981da177e4SLinus Torvalds 			nstart = prev->vm_end;
2991da177e4SLinus Torvalds 		if (nstart >= end)
3001da177e4SLinus Torvalds 			goto out;
3011da177e4SLinus Torvalds 
3021da177e4SLinus Torvalds 		vma = prev->vm_next;
3031da177e4SLinus Torvalds 		if (!vma || vma->vm_start != nstart) {
3041da177e4SLinus Torvalds 			error = -ENOMEM;
3051da177e4SLinus Torvalds 			goto out;
3061da177e4SLinus Torvalds 		}
3071da177e4SLinus Torvalds 	}
3081da177e4SLinus Torvalds out:
3091da177e4SLinus Torvalds 	up_write(&current->mm->mmap_sem);
3101da177e4SLinus Torvalds 	return error;
3111da177e4SLinus Torvalds }
312