11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * mm/mprotect.c 31da177e4SLinus Torvalds * 41da177e4SLinus Torvalds * (C) Copyright 1994 Linus Torvalds 51da177e4SLinus Torvalds * (C) Copyright 2002 Christoph Hellwig 61da177e4SLinus Torvalds * 71da177e4SLinus Torvalds * Address space accounting code <alan@redhat.com> 81da177e4SLinus Torvalds * (C) Copyright 2002 Red Hat Inc, All Rights Reserved 91da177e4SLinus Torvalds */ 101da177e4SLinus Torvalds 111da177e4SLinus Torvalds #include <linux/mm.h> 121da177e4SLinus Torvalds #include <linux/hugetlb.h> 131da177e4SLinus Torvalds #include <linux/slab.h> 141da177e4SLinus Torvalds #include <linux/shm.h> 151da177e4SLinus Torvalds #include <linux/mman.h> 161da177e4SLinus Torvalds #include <linux/fs.h> 171da177e4SLinus Torvalds #include <linux/highmem.h> 181da177e4SLinus Torvalds #include <linux/security.h> 191da177e4SLinus Torvalds #include <linux/mempolicy.h> 201da177e4SLinus Torvalds #include <linux/personality.h> 211da177e4SLinus Torvalds #include <linux/syscalls.h> 221da177e4SLinus Torvalds 231da177e4SLinus Torvalds #include <asm/uaccess.h> 241da177e4SLinus Torvalds #include <asm/pgtable.h> 251da177e4SLinus Torvalds #include <asm/cacheflush.h> 261da177e4SLinus Torvalds #include <asm/tlbflush.h> 271da177e4SLinus Torvalds 281da177e4SLinus Torvalds static void change_pte_range(struct mm_struct *mm, pmd_t *pmd, 291da177e4SLinus Torvalds unsigned long addr, unsigned long end, pgprot_t newprot) 301da177e4SLinus Torvalds { 311da177e4SLinus Torvalds pte_t *pte; 321da177e4SLinus Torvalds 331da177e4SLinus Torvalds pte = pte_offset_map(pmd, addr); 341da177e4SLinus Torvalds do { 351da177e4SLinus Torvalds if (pte_present(*pte)) { 361da177e4SLinus Torvalds pte_t ptent; 371da177e4SLinus Torvalds 381da177e4SLinus Torvalds /* Avoid an SMP race with hardware updated dirty/clean 391da177e4SLinus Torvalds * bits by wiping the pte and then setting the new pte 401da177e4SLinus Torvalds * into place. 411da177e4SLinus Torvalds */ 421da177e4SLinus Torvalds ptent = pte_modify(ptep_get_and_clear(mm, addr, pte), newprot); 431da177e4SLinus Torvalds set_pte_at(mm, addr, pte, ptent); 441da177e4SLinus Torvalds lazy_mmu_prot_update(ptent); 451da177e4SLinus Torvalds } 461da177e4SLinus Torvalds } while (pte++, addr += PAGE_SIZE, addr != end); 471da177e4SLinus Torvalds pte_unmap(pte - 1); 481da177e4SLinus Torvalds } 491da177e4SLinus Torvalds 501da177e4SLinus Torvalds static inline void change_pmd_range(struct mm_struct *mm, pud_t *pud, 511da177e4SLinus Torvalds unsigned long addr, unsigned long end, pgprot_t newprot) 521da177e4SLinus Torvalds { 531da177e4SLinus Torvalds pmd_t *pmd; 541da177e4SLinus Torvalds unsigned long next; 551da177e4SLinus Torvalds 561da177e4SLinus Torvalds pmd = pmd_offset(pud, addr); 571da177e4SLinus Torvalds do { 581da177e4SLinus Torvalds next = pmd_addr_end(addr, end); 591da177e4SLinus Torvalds if (pmd_none_or_clear_bad(pmd)) 601da177e4SLinus Torvalds continue; 611da177e4SLinus Torvalds change_pte_range(mm, pmd, addr, next, newprot); 621da177e4SLinus Torvalds } while (pmd++, addr = next, addr != end); 631da177e4SLinus Torvalds } 641da177e4SLinus Torvalds 651da177e4SLinus Torvalds static inline void change_pud_range(struct mm_struct *mm, pgd_t *pgd, 661da177e4SLinus Torvalds unsigned long addr, unsigned long end, pgprot_t newprot) 671da177e4SLinus Torvalds { 681da177e4SLinus Torvalds pud_t *pud; 691da177e4SLinus Torvalds unsigned long next; 701da177e4SLinus Torvalds 711da177e4SLinus Torvalds pud = pud_offset(pgd, addr); 721da177e4SLinus Torvalds do { 731da177e4SLinus Torvalds next = pud_addr_end(addr, end); 741da177e4SLinus Torvalds if (pud_none_or_clear_bad(pud)) 751da177e4SLinus Torvalds continue; 761da177e4SLinus Torvalds change_pmd_range(mm, pud, addr, next, newprot); 771da177e4SLinus Torvalds } while (pud++, addr = next, addr != end); 781da177e4SLinus Torvalds } 791da177e4SLinus Torvalds 801da177e4SLinus Torvalds static void change_protection(struct vm_area_struct *vma, 811da177e4SLinus Torvalds unsigned long addr, unsigned long end, pgprot_t newprot) 821da177e4SLinus Torvalds { 831da177e4SLinus Torvalds struct mm_struct *mm = vma->vm_mm; 841da177e4SLinus Torvalds pgd_t *pgd; 851da177e4SLinus Torvalds unsigned long next; 861da177e4SLinus Torvalds unsigned long start = addr; 871da177e4SLinus Torvalds 881da177e4SLinus Torvalds BUG_ON(addr >= end); 891da177e4SLinus Torvalds pgd = pgd_offset(mm, addr); 901da177e4SLinus Torvalds flush_cache_range(vma, addr, end); 911da177e4SLinus Torvalds spin_lock(&mm->page_table_lock); 921da177e4SLinus Torvalds do { 931da177e4SLinus Torvalds next = pgd_addr_end(addr, end); 941da177e4SLinus Torvalds if (pgd_none_or_clear_bad(pgd)) 951da177e4SLinus Torvalds continue; 961da177e4SLinus Torvalds change_pud_range(mm, pgd, addr, next, newprot); 971da177e4SLinus Torvalds } while (pgd++, addr = next, addr != end); 981da177e4SLinus Torvalds flush_tlb_range(vma, start, end); 991da177e4SLinus Torvalds spin_unlock(&mm->page_table_lock); 1001da177e4SLinus Torvalds } 1011da177e4SLinus Torvalds 1021da177e4SLinus Torvalds static int 1031da177e4SLinus Torvalds mprotect_fixup(struct vm_area_struct *vma, struct vm_area_struct **pprev, 1041da177e4SLinus Torvalds unsigned long start, unsigned long end, unsigned long newflags) 1051da177e4SLinus Torvalds { 1061da177e4SLinus Torvalds struct mm_struct *mm = vma->vm_mm; 1071da177e4SLinus Torvalds unsigned long oldflags = vma->vm_flags; 1081da177e4SLinus Torvalds long nrpages = (end - start) >> PAGE_SHIFT; 1091da177e4SLinus Torvalds unsigned long charged = 0; 1101da177e4SLinus Torvalds pgprot_t newprot; 1111da177e4SLinus Torvalds pgoff_t pgoff; 1121da177e4SLinus Torvalds int error; 1131da177e4SLinus Torvalds 1141da177e4SLinus Torvalds if (newflags == oldflags) { 1151da177e4SLinus Torvalds *pprev = vma; 1161da177e4SLinus Torvalds return 0; 1171da177e4SLinus Torvalds } 1181da177e4SLinus Torvalds 1191da177e4SLinus Torvalds /* 1201da177e4SLinus Torvalds * If we make a private mapping writable we increase our commit; 1211da177e4SLinus Torvalds * but (without finer accounting) cannot reduce our commit if we 1221da177e4SLinus Torvalds * make it unwritable again. 1231da177e4SLinus Torvalds * 1241da177e4SLinus Torvalds * FIXME? We haven't defined a VM_NORESERVE flag, so mprotecting 1251da177e4SLinus Torvalds * a MAP_NORESERVE private mapping to writable will now reserve. 1261da177e4SLinus Torvalds */ 1271da177e4SLinus Torvalds if (newflags & VM_WRITE) { 1281da177e4SLinus Torvalds if (!(oldflags & (VM_ACCOUNT|VM_WRITE|VM_SHARED|VM_HUGETLB))) { 1291da177e4SLinus Torvalds charged = nrpages; 1301da177e4SLinus Torvalds if (security_vm_enough_memory(charged)) 1311da177e4SLinus Torvalds return -ENOMEM; 1321da177e4SLinus Torvalds newflags |= VM_ACCOUNT; 1331da177e4SLinus Torvalds } 1341da177e4SLinus Torvalds } 1351da177e4SLinus Torvalds 1361da177e4SLinus Torvalds newprot = protection_map[newflags & 0xf]; 1371da177e4SLinus Torvalds 1381da177e4SLinus Torvalds /* 1391da177e4SLinus Torvalds * First try to merge with previous and/or next vma. 1401da177e4SLinus Torvalds */ 1411da177e4SLinus Torvalds pgoff = vma->vm_pgoff + ((start - vma->vm_start) >> PAGE_SHIFT); 1421da177e4SLinus Torvalds *pprev = vma_merge(mm, *pprev, start, end, newflags, 1431da177e4SLinus Torvalds vma->anon_vma, vma->vm_file, pgoff, vma_policy(vma)); 1441da177e4SLinus Torvalds if (*pprev) { 1451da177e4SLinus Torvalds vma = *pprev; 1461da177e4SLinus Torvalds goto success; 1471da177e4SLinus Torvalds } 1481da177e4SLinus Torvalds 1491da177e4SLinus Torvalds *pprev = vma; 1501da177e4SLinus Torvalds 1511da177e4SLinus Torvalds if (start != vma->vm_start) { 1521da177e4SLinus Torvalds error = split_vma(mm, vma, start, 1); 1531da177e4SLinus Torvalds if (error) 1541da177e4SLinus Torvalds goto fail; 1551da177e4SLinus Torvalds } 1561da177e4SLinus Torvalds 1571da177e4SLinus Torvalds if (end != vma->vm_end) { 1581da177e4SLinus Torvalds error = split_vma(mm, vma, end, 0); 1591da177e4SLinus Torvalds if (error) 1601da177e4SLinus Torvalds goto fail; 1611da177e4SLinus Torvalds } 1621da177e4SLinus Torvalds 1631da177e4SLinus Torvalds success: 1641da177e4SLinus Torvalds /* 1651da177e4SLinus Torvalds * vm_flags and vm_page_prot are protected by the mmap_sem 1661da177e4SLinus Torvalds * held in write mode. 1671da177e4SLinus Torvalds */ 1681da177e4SLinus Torvalds vma->vm_flags = newflags; 1691da177e4SLinus Torvalds vma->vm_page_prot = newprot; 1701da177e4SLinus Torvalds change_protection(vma, start, end, newprot); 171*ab50b8edSHugh Dickins vm_stat_account(mm, oldflags, vma->vm_file, -nrpages); 172*ab50b8edSHugh Dickins vm_stat_account(mm, newflags, vma->vm_file, nrpages); 1731da177e4SLinus Torvalds return 0; 1741da177e4SLinus Torvalds 1751da177e4SLinus Torvalds fail: 1761da177e4SLinus Torvalds vm_unacct_memory(charged); 1771da177e4SLinus Torvalds return error; 1781da177e4SLinus Torvalds } 1791da177e4SLinus Torvalds 1801da177e4SLinus Torvalds asmlinkage long 1811da177e4SLinus Torvalds sys_mprotect(unsigned long start, size_t len, unsigned long prot) 1821da177e4SLinus Torvalds { 1831da177e4SLinus Torvalds unsigned long vm_flags, nstart, end, tmp, reqprot; 1841da177e4SLinus Torvalds struct vm_area_struct *vma, *prev; 1851da177e4SLinus Torvalds int error = -EINVAL; 1861da177e4SLinus Torvalds const int grows = prot & (PROT_GROWSDOWN|PROT_GROWSUP); 1871da177e4SLinus Torvalds prot &= ~(PROT_GROWSDOWN|PROT_GROWSUP); 1881da177e4SLinus Torvalds if (grows == (PROT_GROWSDOWN|PROT_GROWSUP)) /* can't be both */ 1891da177e4SLinus Torvalds return -EINVAL; 1901da177e4SLinus Torvalds 1911da177e4SLinus Torvalds if (start & ~PAGE_MASK) 1921da177e4SLinus Torvalds return -EINVAL; 1931da177e4SLinus Torvalds if (!len) 1941da177e4SLinus Torvalds return 0; 1951da177e4SLinus Torvalds len = PAGE_ALIGN(len); 1961da177e4SLinus Torvalds end = start + len; 1971da177e4SLinus Torvalds if (end <= start) 1981da177e4SLinus Torvalds return -ENOMEM; 1991da177e4SLinus Torvalds if (prot & ~(PROT_READ | PROT_WRITE | PROT_EXEC | PROT_SEM)) 2001da177e4SLinus Torvalds return -EINVAL; 2011da177e4SLinus Torvalds 2021da177e4SLinus Torvalds reqprot = prot; 2031da177e4SLinus Torvalds /* 2041da177e4SLinus Torvalds * Does the application expect PROT_READ to imply PROT_EXEC: 2051da177e4SLinus Torvalds */ 2061da177e4SLinus Torvalds if (unlikely((prot & PROT_READ) && 2071da177e4SLinus Torvalds (current->personality & READ_IMPLIES_EXEC))) 2081da177e4SLinus Torvalds prot |= PROT_EXEC; 2091da177e4SLinus Torvalds 2101da177e4SLinus Torvalds vm_flags = calc_vm_prot_bits(prot); 2111da177e4SLinus Torvalds 2121da177e4SLinus Torvalds down_write(¤t->mm->mmap_sem); 2131da177e4SLinus Torvalds 2141da177e4SLinus Torvalds vma = find_vma_prev(current->mm, start, &prev); 2151da177e4SLinus Torvalds error = -ENOMEM; 2161da177e4SLinus Torvalds if (!vma) 2171da177e4SLinus Torvalds goto out; 2181da177e4SLinus Torvalds if (unlikely(grows & PROT_GROWSDOWN)) { 2191da177e4SLinus Torvalds if (vma->vm_start >= end) 2201da177e4SLinus Torvalds goto out; 2211da177e4SLinus Torvalds start = vma->vm_start; 2221da177e4SLinus Torvalds error = -EINVAL; 2231da177e4SLinus Torvalds if (!(vma->vm_flags & VM_GROWSDOWN)) 2241da177e4SLinus Torvalds goto out; 2251da177e4SLinus Torvalds } 2261da177e4SLinus Torvalds else { 2271da177e4SLinus Torvalds if (vma->vm_start > start) 2281da177e4SLinus Torvalds goto out; 2291da177e4SLinus Torvalds if (unlikely(grows & PROT_GROWSUP)) { 2301da177e4SLinus Torvalds end = vma->vm_end; 2311da177e4SLinus Torvalds error = -EINVAL; 2321da177e4SLinus Torvalds if (!(vma->vm_flags & VM_GROWSUP)) 2331da177e4SLinus Torvalds goto out; 2341da177e4SLinus Torvalds } 2351da177e4SLinus Torvalds } 2361da177e4SLinus Torvalds if (start > vma->vm_start) 2371da177e4SLinus Torvalds prev = vma; 2381da177e4SLinus Torvalds 2391da177e4SLinus Torvalds for (nstart = start ; ; ) { 2401da177e4SLinus Torvalds unsigned long newflags; 2411da177e4SLinus Torvalds 2421da177e4SLinus Torvalds /* Here we know that vma->vm_start <= nstart < vma->vm_end. */ 2431da177e4SLinus Torvalds 2441da177e4SLinus Torvalds if (is_vm_hugetlb_page(vma)) { 2451da177e4SLinus Torvalds error = -EACCES; 2461da177e4SLinus Torvalds goto out; 2471da177e4SLinus Torvalds } 2481da177e4SLinus Torvalds 2491da177e4SLinus Torvalds newflags = vm_flags | (vma->vm_flags & ~(VM_READ | VM_WRITE | VM_EXEC)); 2501da177e4SLinus Torvalds 2517e2cff42SPaolo 'Blaisorblade' Giarrusso /* newflags >> 4 shift VM_MAY% in place of VM_% */ 2527e2cff42SPaolo 'Blaisorblade' Giarrusso if ((newflags & ~(newflags >> 4)) & (VM_READ | VM_WRITE | VM_EXEC)) { 2531da177e4SLinus Torvalds error = -EACCES; 2541da177e4SLinus Torvalds goto out; 2551da177e4SLinus Torvalds } 2561da177e4SLinus Torvalds 2571da177e4SLinus Torvalds error = security_file_mprotect(vma, reqprot, prot); 2581da177e4SLinus Torvalds if (error) 2591da177e4SLinus Torvalds goto out; 2601da177e4SLinus Torvalds 2611da177e4SLinus Torvalds tmp = vma->vm_end; 2621da177e4SLinus Torvalds if (tmp > end) 2631da177e4SLinus Torvalds tmp = end; 2641da177e4SLinus Torvalds error = mprotect_fixup(vma, &prev, nstart, tmp, newflags); 2651da177e4SLinus Torvalds if (error) 2661da177e4SLinus Torvalds goto out; 2671da177e4SLinus Torvalds nstart = tmp; 2681da177e4SLinus Torvalds 2691da177e4SLinus Torvalds if (nstart < prev->vm_end) 2701da177e4SLinus Torvalds nstart = prev->vm_end; 2711da177e4SLinus Torvalds if (nstart >= end) 2721da177e4SLinus Torvalds goto out; 2731da177e4SLinus Torvalds 2741da177e4SLinus Torvalds vma = prev->vm_next; 2751da177e4SLinus Torvalds if (!vma || vma->vm_start != nstart) { 2761da177e4SLinus Torvalds error = -ENOMEM; 2771da177e4SLinus Torvalds goto out; 2781da177e4SLinus Torvalds } 2791da177e4SLinus Torvalds } 2801da177e4SLinus Torvalds out: 2811da177e4SLinus Torvalds up_write(¤t->mm->mmap_sem); 2821da177e4SLinus Torvalds return error; 2831da177e4SLinus Torvalds } 284