11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * mm/mprotect.c 31da177e4SLinus Torvalds * 41da177e4SLinus Torvalds * (C) Copyright 1994 Linus Torvalds 51da177e4SLinus Torvalds * (C) Copyright 2002 Christoph Hellwig 61da177e4SLinus Torvalds * 7046c6884SAlan Cox * Address space accounting code <alan@lxorguk.ukuu.org.uk> 81da177e4SLinus Torvalds * (C) Copyright 2002 Red Hat Inc, All Rights Reserved 91da177e4SLinus Torvalds */ 101da177e4SLinus Torvalds 111da177e4SLinus Torvalds #include <linux/mm.h> 121da177e4SLinus Torvalds #include <linux/hugetlb.h> 131da177e4SLinus Torvalds #include <linux/shm.h> 141da177e4SLinus Torvalds #include <linux/mman.h> 151da177e4SLinus Torvalds #include <linux/fs.h> 161da177e4SLinus Torvalds #include <linux/highmem.h> 171da177e4SLinus Torvalds #include <linux/security.h> 181da177e4SLinus Torvalds #include <linux/mempolicy.h> 191da177e4SLinus Torvalds #include <linux/personality.h> 201da177e4SLinus Torvalds #include <linux/syscalls.h> 210697212aSChristoph Lameter #include <linux/swap.h> 220697212aSChristoph Lameter #include <linux/swapops.h> 23cddb8a5cSAndrea Arcangeli #include <linux/mmu_notifier.h> 2464cdd548SKOSAKI Motohiro #include <linux/migrate.h> 25cdd6c482SIngo Molnar #include <linux/perf_event.h> 261da177e4SLinus Torvalds #include <asm/uaccess.h> 271da177e4SLinus Torvalds #include <asm/pgtable.h> 281da177e4SLinus Torvalds #include <asm/cacheflush.h> 291da177e4SLinus Torvalds #include <asm/tlbflush.h> 301da177e4SLinus Torvalds 311c12c4cfSVenki Pallipadi #ifndef pgprot_modify 321c12c4cfSVenki Pallipadi static inline pgprot_t pgprot_modify(pgprot_t oldprot, pgprot_t newprot) 331c12c4cfSVenki Pallipadi { 341c12c4cfSVenki Pallipadi return newprot; 351c12c4cfSVenki Pallipadi } 361c12c4cfSVenki Pallipadi #endif 371c12c4cfSVenki Pallipadi 38*7da4d641SPeter Zijlstra static unsigned long change_pte_range(struct mm_struct *mm, pmd_t *pmd, 39c1e6098bSPeter Zijlstra unsigned long addr, unsigned long end, pgprot_t newprot, 40c1e6098bSPeter Zijlstra int dirty_accountable) 411da177e4SLinus Torvalds { 420697212aSChristoph Lameter pte_t *pte, oldpte; 43705e87c0SHugh Dickins spinlock_t *ptl; 44*7da4d641SPeter Zijlstra unsigned long pages = 0; 451da177e4SLinus Torvalds 46705e87c0SHugh Dickins pte = pte_offset_map_lock(mm, pmd, addr, &ptl); 476606c3e0SZachary Amsden arch_enter_lazy_mmu_mode(); 481da177e4SLinus Torvalds do { 490697212aSChristoph Lameter oldpte = *pte; 500697212aSChristoph Lameter if (pte_present(oldpte)) { 511da177e4SLinus Torvalds pte_t ptent; 521da177e4SLinus Torvalds 531ea0704eSJeremy Fitzhardinge ptent = ptep_modify_prot_start(mm, addr, pte); 54c1e6098bSPeter Zijlstra ptent = pte_modify(ptent, newprot); 551ea0704eSJeremy Fitzhardinge 56c1e6098bSPeter Zijlstra /* 57c1e6098bSPeter Zijlstra * Avoid taking write faults for pages we know to be 58c1e6098bSPeter Zijlstra * dirty. 59c1e6098bSPeter Zijlstra */ 60c1e6098bSPeter Zijlstra if (dirty_accountable && pte_dirty(ptent)) 61c1e6098bSPeter Zijlstra ptent = pte_mkwrite(ptent); 621ea0704eSJeremy Fitzhardinge 631ea0704eSJeremy Fitzhardinge ptep_modify_prot_commit(mm, addr, pte, ptent); 64*7da4d641SPeter Zijlstra pages++; 65ce1744f4SKonstantin Khlebnikov } else if (IS_ENABLED(CONFIG_MIGRATION) && !pte_file(oldpte)) { 660697212aSChristoph Lameter swp_entry_t entry = pte_to_swp_entry(oldpte); 670697212aSChristoph Lameter 680697212aSChristoph Lameter if (is_write_migration_entry(entry)) { 690697212aSChristoph Lameter /* 700697212aSChristoph Lameter * A protection check is difficult so 710697212aSChristoph Lameter * just be safe and disable write 720697212aSChristoph Lameter */ 730697212aSChristoph Lameter make_migration_entry_read(&entry); 740697212aSChristoph Lameter set_pte_at(mm, addr, pte, 750697212aSChristoph Lameter swp_entry_to_pte(entry)); 761da177e4SLinus Torvalds } 77*7da4d641SPeter Zijlstra pages++; 780697212aSChristoph Lameter } 791da177e4SLinus Torvalds } while (pte++, addr += PAGE_SIZE, addr != end); 806606c3e0SZachary Amsden arch_leave_lazy_mmu_mode(); 81705e87c0SHugh Dickins pte_unmap_unlock(pte - 1, ptl); 82*7da4d641SPeter Zijlstra 83*7da4d641SPeter Zijlstra return pages; 841da177e4SLinus Torvalds } 851da177e4SLinus Torvalds 86*7da4d641SPeter Zijlstra static inline unsigned long change_pmd_range(struct vm_area_struct *vma, pud_t *pud, 87c1e6098bSPeter Zijlstra unsigned long addr, unsigned long end, pgprot_t newprot, 88c1e6098bSPeter Zijlstra int dirty_accountable) 891da177e4SLinus Torvalds { 901da177e4SLinus Torvalds pmd_t *pmd; 911da177e4SLinus Torvalds unsigned long next; 92*7da4d641SPeter Zijlstra unsigned long pages = 0; 931da177e4SLinus Torvalds 941da177e4SLinus Torvalds pmd = pmd_offset(pud, addr); 951da177e4SLinus Torvalds do { 961da177e4SLinus Torvalds next = pmd_addr_end(addr, end); 97cd7548abSJohannes Weiner if (pmd_trans_huge(*pmd)) { 98cd7548abSJohannes Weiner if (next - addr != HPAGE_PMD_SIZE) 99b36f5b07SJohannes Weiner split_huge_page_pmd(vma->vm_mm, pmd); 100*7da4d641SPeter Zijlstra else if (change_huge_pmd(vma, pmd, addr, newprot)) { 101*7da4d641SPeter Zijlstra pages += HPAGE_PMD_NR; 102cd7548abSJohannes Weiner continue; 103*7da4d641SPeter Zijlstra } 104cd7548abSJohannes Weiner /* fall through */ 105cd7548abSJohannes Weiner } 1061da177e4SLinus Torvalds if (pmd_none_or_clear_bad(pmd)) 1071da177e4SLinus Torvalds continue; 108*7da4d641SPeter Zijlstra pages += change_pte_range(vma->vm_mm, pmd, addr, next, newprot, 109b36f5b07SJohannes Weiner dirty_accountable); 1101da177e4SLinus Torvalds } while (pmd++, addr = next, addr != end); 111*7da4d641SPeter Zijlstra 112*7da4d641SPeter Zijlstra return pages; 1131da177e4SLinus Torvalds } 1141da177e4SLinus Torvalds 115*7da4d641SPeter Zijlstra static inline unsigned long change_pud_range(struct vm_area_struct *vma, pgd_t *pgd, 116c1e6098bSPeter Zijlstra unsigned long addr, unsigned long end, pgprot_t newprot, 117c1e6098bSPeter Zijlstra int dirty_accountable) 1181da177e4SLinus Torvalds { 1191da177e4SLinus Torvalds pud_t *pud; 1201da177e4SLinus Torvalds unsigned long next; 121*7da4d641SPeter Zijlstra unsigned long pages = 0; 1221da177e4SLinus Torvalds 1231da177e4SLinus Torvalds pud = pud_offset(pgd, addr); 1241da177e4SLinus Torvalds do { 1251da177e4SLinus Torvalds next = pud_addr_end(addr, end); 1261da177e4SLinus Torvalds if (pud_none_or_clear_bad(pud)) 1271da177e4SLinus Torvalds continue; 128*7da4d641SPeter Zijlstra pages += change_pmd_range(vma, pud, addr, next, newprot, 129b36f5b07SJohannes Weiner dirty_accountable); 1301da177e4SLinus Torvalds } while (pud++, addr = next, addr != end); 131*7da4d641SPeter Zijlstra 132*7da4d641SPeter Zijlstra return pages; 1331da177e4SLinus Torvalds } 1341da177e4SLinus Torvalds 135*7da4d641SPeter Zijlstra static unsigned long change_protection_range(struct vm_area_struct *vma, 136c1e6098bSPeter Zijlstra unsigned long addr, unsigned long end, pgprot_t newprot, 137c1e6098bSPeter Zijlstra int dirty_accountable) 1381da177e4SLinus Torvalds { 1391da177e4SLinus Torvalds struct mm_struct *mm = vma->vm_mm; 1401da177e4SLinus Torvalds pgd_t *pgd; 1411da177e4SLinus Torvalds unsigned long next; 1421da177e4SLinus Torvalds unsigned long start = addr; 143*7da4d641SPeter Zijlstra unsigned long pages = 0; 1441da177e4SLinus Torvalds 1451da177e4SLinus Torvalds BUG_ON(addr >= end); 1461da177e4SLinus Torvalds pgd = pgd_offset(mm, addr); 1471da177e4SLinus Torvalds flush_cache_range(vma, addr, end); 1481da177e4SLinus Torvalds do { 1491da177e4SLinus Torvalds next = pgd_addr_end(addr, end); 1501da177e4SLinus Torvalds if (pgd_none_or_clear_bad(pgd)) 1511da177e4SLinus Torvalds continue; 152*7da4d641SPeter Zijlstra pages += change_pud_range(vma, pgd, addr, next, newprot, 153b36f5b07SJohannes Weiner dirty_accountable); 1541da177e4SLinus Torvalds } while (pgd++, addr = next, addr != end); 155*7da4d641SPeter Zijlstra 1561da177e4SLinus Torvalds flush_tlb_range(vma, start, end); 157*7da4d641SPeter Zijlstra 158*7da4d641SPeter Zijlstra return pages; 159*7da4d641SPeter Zijlstra } 160*7da4d641SPeter Zijlstra 161*7da4d641SPeter Zijlstra unsigned long change_protection(struct vm_area_struct *vma, unsigned long start, 162*7da4d641SPeter Zijlstra unsigned long end, pgprot_t newprot, 163*7da4d641SPeter Zijlstra int dirty_accountable) 164*7da4d641SPeter Zijlstra { 165*7da4d641SPeter Zijlstra struct mm_struct *mm = vma->vm_mm; 166*7da4d641SPeter Zijlstra unsigned long pages; 167*7da4d641SPeter Zijlstra 168*7da4d641SPeter Zijlstra mmu_notifier_invalidate_range_start(mm, start, end); 169*7da4d641SPeter Zijlstra if (is_vm_hugetlb_page(vma)) 170*7da4d641SPeter Zijlstra pages = hugetlb_change_protection(vma, start, end, newprot); 171*7da4d641SPeter Zijlstra else 172*7da4d641SPeter Zijlstra pages = change_protection_range(vma, start, end, newprot, dirty_accountable); 173*7da4d641SPeter Zijlstra mmu_notifier_invalidate_range_end(mm, start, end); 174*7da4d641SPeter Zijlstra 175*7da4d641SPeter Zijlstra return pages; 1761da177e4SLinus Torvalds } 1771da177e4SLinus Torvalds 178b6a2fea3SOllie Wild int 1791da177e4SLinus Torvalds mprotect_fixup(struct vm_area_struct *vma, struct vm_area_struct **pprev, 1801da177e4SLinus Torvalds unsigned long start, unsigned long end, unsigned long newflags) 1811da177e4SLinus Torvalds { 1821da177e4SLinus Torvalds struct mm_struct *mm = vma->vm_mm; 1831da177e4SLinus Torvalds unsigned long oldflags = vma->vm_flags; 1841da177e4SLinus Torvalds long nrpages = (end - start) >> PAGE_SHIFT; 1851da177e4SLinus Torvalds unsigned long charged = 0; 1861da177e4SLinus Torvalds pgoff_t pgoff; 1871da177e4SLinus Torvalds int error; 188c1e6098bSPeter Zijlstra int dirty_accountable = 0; 1891da177e4SLinus Torvalds 1901da177e4SLinus Torvalds if (newflags == oldflags) { 1911da177e4SLinus Torvalds *pprev = vma; 1921da177e4SLinus Torvalds return 0; 1931da177e4SLinus Torvalds } 1941da177e4SLinus Torvalds 1951da177e4SLinus Torvalds /* 1961da177e4SLinus Torvalds * If we make a private mapping writable we increase our commit; 1971da177e4SLinus Torvalds * but (without finer accounting) cannot reduce our commit if we 1985a6fe125SMel Gorman * make it unwritable again. hugetlb mapping were accounted for 1995a6fe125SMel Gorman * even if read-only so there is no need to account for them here 2001da177e4SLinus Torvalds */ 2011da177e4SLinus Torvalds if (newflags & VM_WRITE) { 2025a6fe125SMel Gorman if (!(oldflags & (VM_ACCOUNT|VM_WRITE|VM_HUGETLB| 203cdfd4325SAndy Whitcroft VM_SHARED|VM_NORESERVE))) { 2041da177e4SLinus Torvalds charged = nrpages; 205191c5424SAl Viro if (security_vm_enough_memory_mm(mm, charged)) 2061da177e4SLinus Torvalds return -ENOMEM; 2071da177e4SLinus Torvalds newflags |= VM_ACCOUNT; 2081da177e4SLinus Torvalds } 2091da177e4SLinus Torvalds } 2101da177e4SLinus Torvalds 2111da177e4SLinus Torvalds /* 2121da177e4SLinus Torvalds * First try to merge with previous and/or next vma. 2131da177e4SLinus Torvalds */ 2141da177e4SLinus Torvalds pgoff = vma->vm_pgoff + ((start - vma->vm_start) >> PAGE_SHIFT); 2151da177e4SLinus Torvalds *pprev = vma_merge(mm, *pprev, start, end, newflags, 2161da177e4SLinus Torvalds vma->anon_vma, vma->vm_file, pgoff, vma_policy(vma)); 2171da177e4SLinus Torvalds if (*pprev) { 2181da177e4SLinus Torvalds vma = *pprev; 2191da177e4SLinus Torvalds goto success; 2201da177e4SLinus Torvalds } 2211da177e4SLinus Torvalds 2221da177e4SLinus Torvalds *pprev = vma; 2231da177e4SLinus Torvalds 2241da177e4SLinus Torvalds if (start != vma->vm_start) { 2251da177e4SLinus Torvalds error = split_vma(mm, vma, start, 1); 2261da177e4SLinus Torvalds if (error) 2271da177e4SLinus Torvalds goto fail; 2281da177e4SLinus Torvalds } 2291da177e4SLinus Torvalds 2301da177e4SLinus Torvalds if (end != vma->vm_end) { 2311da177e4SLinus Torvalds error = split_vma(mm, vma, end, 0); 2321da177e4SLinus Torvalds if (error) 2331da177e4SLinus Torvalds goto fail; 2341da177e4SLinus Torvalds } 2351da177e4SLinus Torvalds 2361da177e4SLinus Torvalds success: 2371da177e4SLinus Torvalds /* 2381da177e4SLinus Torvalds * vm_flags and vm_page_prot are protected by the mmap_sem 2391da177e4SLinus Torvalds * held in write mode. 2401da177e4SLinus Torvalds */ 2411da177e4SLinus Torvalds vma->vm_flags = newflags; 2421c12c4cfSVenki Pallipadi vma->vm_page_prot = pgprot_modify(vma->vm_page_prot, 2431c12c4cfSVenki Pallipadi vm_get_page_prot(newflags)); 2441c12c4cfSVenki Pallipadi 245c1e6098bSPeter Zijlstra if (vma_wants_writenotify(vma)) { 2461ddd439eSHugh Dickins vma->vm_page_prot = vm_get_page_prot(newflags & ~VM_SHARED); 247c1e6098bSPeter Zijlstra dirty_accountable = 1; 248c1e6098bSPeter Zijlstra } 249d08b3851SPeter Zijlstra 250c1e6098bSPeter Zijlstra change_protection(vma, start, end, vma->vm_page_prot, dirty_accountable); 251*7da4d641SPeter Zijlstra 252ab50b8edSHugh Dickins vm_stat_account(mm, oldflags, vma->vm_file, -nrpages); 253ab50b8edSHugh Dickins vm_stat_account(mm, newflags, vma->vm_file, nrpages); 25463bfd738SPekka Enberg perf_event_mmap(vma); 2551da177e4SLinus Torvalds return 0; 2561da177e4SLinus Torvalds 2571da177e4SLinus Torvalds fail: 2581da177e4SLinus Torvalds vm_unacct_memory(charged); 2591da177e4SLinus Torvalds return error; 2601da177e4SLinus Torvalds } 2611da177e4SLinus Torvalds 2626a6160a7SHeiko Carstens SYSCALL_DEFINE3(mprotect, unsigned long, start, size_t, len, 2636a6160a7SHeiko Carstens unsigned long, prot) 2641da177e4SLinus Torvalds { 2651da177e4SLinus Torvalds unsigned long vm_flags, nstart, end, tmp, reqprot; 2661da177e4SLinus Torvalds struct vm_area_struct *vma, *prev; 2671da177e4SLinus Torvalds int error = -EINVAL; 2681da177e4SLinus Torvalds const int grows = prot & (PROT_GROWSDOWN|PROT_GROWSUP); 2691da177e4SLinus Torvalds prot &= ~(PROT_GROWSDOWN|PROT_GROWSUP); 2701da177e4SLinus Torvalds if (grows == (PROT_GROWSDOWN|PROT_GROWSUP)) /* can't be both */ 2711da177e4SLinus Torvalds return -EINVAL; 2721da177e4SLinus Torvalds 2731da177e4SLinus Torvalds if (start & ~PAGE_MASK) 2741da177e4SLinus Torvalds return -EINVAL; 2751da177e4SLinus Torvalds if (!len) 2761da177e4SLinus Torvalds return 0; 2771da177e4SLinus Torvalds len = PAGE_ALIGN(len); 2781da177e4SLinus Torvalds end = start + len; 2791da177e4SLinus Torvalds if (end <= start) 2801da177e4SLinus Torvalds return -ENOMEM; 281b845f313SDave Kleikamp if (!arch_validate_prot(prot)) 2821da177e4SLinus Torvalds return -EINVAL; 2831da177e4SLinus Torvalds 2841da177e4SLinus Torvalds reqprot = prot; 2851da177e4SLinus Torvalds /* 2861da177e4SLinus Torvalds * Does the application expect PROT_READ to imply PROT_EXEC: 2871da177e4SLinus Torvalds */ 288b344e05cSHua Zhong if ((prot & PROT_READ) && (current->personality & READ_IMPLIES_EXEC)) 2891da177e4SLinus Torvalds prot |= PROT_EXEC; 2901da177e4SLinus Torvalds 2911da177e4SLinus Torvalds vm_flags = calc_vm_prot_bits(prot); 2921da177e4SLinus Torvalds 2931da177e4SLinus Torvalds down_write(¤t->mm->mmap_sem); 2941da177e4SLinus Torvalds 295097d5910SLinus Torvalds vma = find_vma(current->mm, start); 2961da177e4SLinus Torvalds error = -ENOMEM; 2971da177e4SLinus Torvalds if (!vma) 2981da177e4SLinus Torvalds goto out; 299097d5910SLinus Torvalds prev = vma->vm_prev; 3001da177e4SLinus Torvalds if (unlikely(grows & PROT_GROWSDOWN)) { 3011da177e4SLinus Torvalds if (vma->vm_start >= end) 3021da177e4SLinus Torvalds goto out; 3031da177e4SLinus Torvalds start = vma->vm_start; 3041da177e4SLinus Torvalds error = -EINVAL; 3051da177e4SLinus Torvalds if (!(vma->vm_flags & VM_GROWSDOWN)) 3061da177e4SLinus Torvalds goto out; 3071da177e4SLinus Torvalds } 3081da177e4SLinus Torvalds else { 3091da177e4SLinus Torvalds if (vma->vm_start > start) 3101da177e4SLinus Torvalds goto out; 3111da177e4SLinus Torvalds if (unlikely(grows & PROT_GROWSUP)) { 3121da177e4SLinus Torvalds end = vma->vm_end; 3131da177e4SLinus Torvalds error = -EINVAL; 3141da177e4SLinus Torvalds if (!(vma->vm_flags & VM_GROWSUP)) 3151da177e4SLinus Torvalds goto out; 3161da177e4SLinus Torvalds } 3171da177e4SLinus Torvalds } 3181da177e4SLinus Torvalds if (start > vma->vm_start) 3191da177e4SLinus Torvalds prev = vma; 3201da177e4SLinus Torvalds 3211da177e4SLinus Torvalds for (nstart = start ; ; ) { 3221da177e4SLinus Torvalds unsigned long newflags; 3231da177e4SLinus Torvalds 3241da177e4SLinus Torvalds /* Here we know that vma->vm_start <= nstart < vma->vm_end. */ 3251da177e4SLinus Torvalds 3261da177e4SLinus Torvalds newflags = vm_flags | (vma->vm_flags & ~(VM_READ | VM_WRITE | VM_EXEC)); 3271da177e4SLinus Torvalds 3287e2cff42SPaolo 'Blaisorblade' Giarrusso /* newflags >> 4 shift VM_MAY% in place of VM_% */ 3297e2cff42SPaolo 'Blaisorblade' Giarrusso if ((newflags & ~(newflags >> 4)) & (VM_READ | VM_WRITE | VM_EXEC)) { 3301da177e4SLinus Torvalds error = -EACCES; 3311da177e4SLinus Torvalds goto out; 3321da177e4SLinus Torvalds } 3331da177e4SLinus Torvalds 3341da177e4SLinus Torvalds error = security_file_mprotect(vma, reqprot, prot); 3351da177e4SLinus Torvalds if (error) 3361da177e4SLinus Torvalds goto out; 3371da177e4SLinus Torvalds 3381da177e4SLinus Torvalds tmp = vma->vm_end; 3391da177e4SLinus Torvalds if (tmp > end) 3401da177e4SLinus Torvalds tmp = end; 3411da177e4SLinus Torvalds error = mprotect_fixup(vma, &prev, nstart, tmp, newflags); 3421da177e4SLinus Torvalds if (error) 3431da177e4SLinus Torvalds goto out; 3441da177e4SLinus Torvalds nstart = tmp; 3451da177e4SLinus Torvalds 3461da177e4SLinus Torvalds if (nstart < prev->vm_end) 3471da177e4SLinus Torvalds nstart = prev->vm_end; 3481da177e4SLinus Torvalds if (nstart >= end) 3491da177e4SLinus Torvalds goto out; 3501da177e4SLinus Torvalds 3511da177e4SLinus Torvalds vma = prev->vm_next; 3521da177e4SLinus Torvalds if (!vma || vma->vm_start != nstart) { 3531da177e4SLinus Torvalds error = -ENOMEM; 3541da177e4SLinus Torvalds goto out; 3551da177e4SLinus Torvalds } 3561da177e4SLinus Torvalds } 3571da177e4SLinus Torvalds out: 3581da177e4SLinus Torvalds up_write(¤t->mm->mmap_sem); 3591da177e4SLinus Torvalds return error; 3601da177e4SLinus Torvalds } 361