11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * Copyright (C) 2000 - 2003 Jeff Dike (jdike@addtoit.com) 31da177e4SLinus Torvalds * Licensed under the GPL 41da177e4SLinus Torvalds */ 51da177e4SLinus Torvalds 61da177e4SLinus Torvalds #include "linux/stddef.h" 71da177e4SLinus Torvalds #include "linux/kernel.h" 81da177e4SLinus Torvalds #include "linux/mm.h" 91da177e4SLinus Torvalds #include "linux/bootmem.h" 101da177e4SLinus Torvalds #include "linux/swap.h" 111da177e4SLinus Torvalds #include "linux/highmem.h" 121da177e4SLinus Torvalds #include "linux/gfp.h" 131da177e4SLinus Torvalds #include "asm/page.h" 141da177e4SLinus Torvalds #include "asm/fixmap.h" 151da177e4SLinus Torvalds #include "asm/pgalloc.h" 161da177e4SLinus Torvalds #include "kern_util.h" 174ff83ce1SJeff Dike #include "as-layout.h" 181da177e4SLinus Torvalds #include "kern.h" 191da177e4SLinus Torvalds #include "mem_user.h" 20fab95c55SJeff Dike #include "um_uaccess.h" 211da177e4SLinus Torvalds #include "os.h" 22114069f7SJeff Dike #include "linux/types.h" 23114069f7SJeff Dike #include "linux/string.h" 24114069f7SJeff Dike #include "init.h" 25114069f7SJeff Dike #include "kern_constants.h" 261da177e4SLinus Torvalds 276bf79482SJeff Dike /* allocated in paging_init, zeroed in mem_init, and unchanged thereafter */ 281da177e4SLinus Torvalds unsigned long *empty_zero_page = NULL; 296bf79482SJeff Dike /* allocated in paging_init and unchanged thereafter */ 301da177e4SLinus Torvalds unsigned long *empty_bad_page = NULL; 311da177e4SLinus Torvalds pgd_t swapper_pg_dir[PTRS_PER_PGD]; 329902abd7SJeff Dike unsigned long long highmem; 331da177e4SLinus Torvalds int kmalloc_ok = 0; 341da177e4SLinus Torvalds 351da177e4SLinus Torvalds static unsigned long brk_end; 361da177e4SLinus Torvalds 371da177e4SLinus Torvalds void unmap_physmem(void) 381da177e4SLinus Torvalds { 391da177e4SLinus Torvalds os_unmap_memory((void *) brk_end, uml_reserved - brk_end); 401da177e4SLinus Torvalds } 411da177e4SLinus Torvalds 421da177e4SLinus Torvalds static void map_cb(void *unused) 431da177e4SLinus Torvalds { 441da177e4SLinus Torvalds map_memory(brk_end, __pa(brk_end), uml_reserved - brk_end, 1, 1, 0); 451da177e4SLinus Torvalds } 461da177e4SLinus Torvalds 471da177e4SLinus Torvalds #ifdef CONFIG_HIGHMEM 481da177e4SLinus Torvalds static void setup_highmem(unsigned long highmem_start, 491da177e4SLinus Torvalds unsigned long highmem_len) 501da177e4SLinus Torvalds { 511da177e4SLinus Torvalds struct page *page; 521da177e4SLinus Torvalds unsigned long highmem_pfn; 531da177e4SLinus Torvalds int i; 541da177e4SLinus Torvalds 551da177e4SLinus Torvalds highmem_pfn = __pa(highmem_start) >> PAGE_SHIFT; 561da177e4SLinus Torvalds for(i = 0; i < highmem_len >> PAGE_SHIFT; i++){ 571da177e4SLinus Torvalds page = &mem_map[highmem_pfn + i]; 581da177e4SLinus Torvalds ClearPageReserved(page); 597835e98bSNick Piggin init_page_count(page); 601da177e4SLinus Torvalds __free_page(page); 611da177e4SLinus Torvalds } 621da177e4SLinus Torvalds } 631da177e4SLinus Torvalds #endif 641da177e4SLinus Torvalds 6597a1fcbbSJeff Dike void __init mem_init(void) 661da177e4SLinus Torvalds { 671da177e4SLinus Torvalds /* clear the zero-page */ 681da177e4SLinus Torvalds memset((void *) empty_zero_page, 0, PAGE_SIZE); 691da177e4SLinus Torvalds 701da177e4SLinus Torvalds /* Map in the area just after the brk now that kmalloc is about 711da177e4SLinus Torvalds * to be turned on. 721da177e4SLinus Torvalds */ 731da177e4SLinus Torvalds brk_end = (unsigned long) UML_ROUND_UP(sbrk(0)); 741da177e4SLinus Torvalds map_cb(NULL); 751da177e4SLinus Torvalds initial_thread_cb(map_cb, NULL); 761da177e4SLinus Torvalds free_bootmem(__pa(brk_end), uml_reserved - brk_end); 771da177e4SLinus Torvalds uml_reserved = brk_end; 781da177e4SLinus Torvalds 791da177e4SLinus Torvalds /* this will put all low memory onto the freelists */ 801da177e4SLinus Torvalds totalram_pages = free_all_bootmem(); 81af84eab2SJason Lunz max_low_pfn = totalram_pages; 82c1f60a5aSChristoph Lameter #ifdef CONFIG_HIGHMEM 831da177e4SLinus Torvalds totalhigh_pages = highmem >> PAGE_SHIFT; 841da177e4SLinus Torvalds totalram_pages += totalhigh_pages; 85c1f60a5aSChristoph Lameter #endif 861da177e4SLinus Torvalds num_physpages = totalram_pages; 871da177e4SLinus Torvalds max_pfn = totalram_pages; 881da177e4SLinus Torvalds printk(KERN_INFO "Memory: %luk available\n", 891da177e4SLinus Torvalds (unsigned long) nr_free_pages() << (PAGE_SHIFT-10)); 901da177e4SLinus Torvalds kmalloc_ok = 1; 911da177e4SLinus Torvalds 921da177e4SLinus Torvalds #ifdef CONFIG_HIGHMEM 931da177e4SLinus Torvalds setup_highmem(end_iomem, highmem); 941da177e4SLinus Torvalds #endif 951da177e4SLinus Torvalds } 961da177e4SLinus Torvalds 9712f49643SJeff Dike /* 9812f49643SJeff Dike * Create a page table and place a pointer to it in a middle page 9912f49643SJeff Dike * directory entry. 10012f49643SJeff Dike */ 10112f49643SJeff Dike static void __init one_page_table_init(pmd_t *pmd) 10212f49643SJeff Dike { 10312f49643SJeff Dike if (pmd_none(*pmd)) { 10412f49643SJeff Dike pte_t *pte = (pte_t *) alloc_bootmem_low_pages(PAGE_SIZE); 10512f49643SJeff Dike set_pmd(pmd, __pmd(_KERNPG_TABLE + 10612f49643SJeff Dike (unsigned long) __pa(pte))); 10712f49643SJeff Dike if (pte != pte_offset_kernel(pmd, 0)) 10812f49643SJeff Dike BUG(); 10912f49643SJeff Dike } 11012f49643SJeff Dike } 11112f49643SJeff Dike 11212f49643SJeff Dike static void __init one_md_table_init(pud_t *pud) 11312f49643SJeff Dike { 11412f49643SJeff Dike #ifdef CONFIG_3_LEVEL_PGTABLES 11512f49643SJeff Dike pmd_t *pmd_table = (pmd_t *) alloc_bootmem_low_pages(PAGE_SIZE); 11612f49643SJeff Dike set_pud(pud, __pud(_KERNPG_TABLE + (unsigned long) __pa(pmd_table))); 11712f49643SJeff Dike if (pmd_table != pmd_offset(pud, 0)) 11812f49643SJeff Dike BUG(); 11912f49643SJeff Dike #endif 12012f49643SJeff Dike } 12112f49643SJeff Dike 1221da177e4SLinus Torvalds static void __init fixrange_init(unsigned long start, unsigned long end, 1231da177e4SLinus Torvalds pgd_t *pgd_base) 1241da177e4SLinus Torvalds { 1251da177e4SLinus Torvalds pgd_t *pgd; 12612f49643SJeff Dike pud_t *pud; 1271da177e4SLinus Torvalds pmd_t *pmd; 1281da177e4SLinus Torvalds int i, j; 1291da177e4SLinus Torvalds unsigned long vaddr; 1301da177e4SLinus Torvalds 1311da177e4SLinus Torvalds vaddr = start; 1321da177e4SLinus Torvalds i = pgd_index(vaddr); 1331da177e4SLinus Torvalds j = pmd_index(vaddr); 1341da177e4SLinus Torvalds pgd = pgd_base + i; 1351da177e4SLinus Torvalds 1361da177e4SLinus Torvalds for ( ; (i < PTRS_PER_PGD) && (vaddr < end); pgd++, i++) { 13712f49643SJeff Dike pud = pud_offset(pgd, vaddr); 13812f49643SJeff Dike if (pud_none(*pud)) 13912f49643SJeff Dike one_md_table_init(pud); 14012f49643SJeff Dike pmd = pmd_offset(pud, vaddr); 1411da177e4SLinus Torvalds for (; (j < PTRS_PER_PMD) && (vaddr != end); pmd++, j++) { 14212f49643SJeff Dike one_page_table_init(pmd); 1431da177e4SLinus Torvalds vaddr += PMD_SIZE; 1441da177e4SLinus Torvalds } 1451da177e4SLinus Torvalds j = 0; 1461da177e4SLinus Torvalds } 1471da177e4SLinus Torvalds } 1481da177e4SLinus Torvalds 1491da177e4SLinus Torvalds #ifdef CONFIG_HIGHMEM 1501da177e4SLinus Torvalds pte_t *kmap_pte; 1511da177e4SLinus Torvalds pgprot_t kmap_prot; 1521da177e4SLinus Torvalds 1531da177e4SLinus Torvalds #define kmap_get_fixmap_pte(vaddr) \ 1541da177e4SLinus Torvalds pte_offset_kernel(pmd_offset(pud_offset(pgd_offset_k(vaddr), (vaddr)),\ 1551da177e4SLinus Torvalds (vaddr)), (vaddr)) 1561da177e4SLinus Torvalds 1571da177e4SLinus Torvalds static void __init kmap_init(void) 1581da177e4SLinus Torvalds { 1591da177e4SLinus Torvalds unsigned long kmap_vstart; 1601da177e4SLinus Torvalds 1611da177e4SLinus Torvalds /* cache the first kmap pte */ 1621da177e4SLinus Torvalds kmap_vstart = __fix_to_virt(FIX_KMAP_BEGIN); 1631da177e4SLinus Torvalds kmap_pte = kmap_get_fixmap_pte(kmap_vstart); 1641da177e4SLinus Torvalds 1651da177e4SLinus Torvalds kmap_prot = PAGE_KERNEL; 1661da177e4SLinus Torvalds } 1671da177e4SLinus Torvalds 168b4a08a10SAl Viro static void __init init_highmem(void) 1691da177e4SLinus Torvalds { 1701da177e4SLinus Torvalds pgd_t *pgd; 1711da177e4SLinus Torvalds pud_t *pud; 1721da177e4SLinus Torvalds pmd_t *pmd; 1731da177e4SLinus Torvalds pte_t *pte; 1741da177e4SLinus Torvalds unsigned long vaddr; 1751da177e4SLinus Torvalds 1761da177e4SLinus Torvalds /* 1771da177e4SLinus Torvalds * Permanent kmaps: 1781da177e4SLinus Torvalds */ 1791da177e4SLinus Torvalds vaddr = PKMAP_BASE; 1801da177e4SLinus Torvalds fixrange_init(vaddr, vaddr + PAGE_SIZE*LAST_PKMAP, swapper_pg_dir); 1811da177e4SLinus Torvalds 1821da177e4SLinus Torvalds pgd = swapper_pg_dir + pgd_index(vaddr); 1831da177e4SLinus Torvalds pud = pud_offset(pgd, vaddr); 1841da177e4SLinus Torvalds pmd = pmd_offset(pud, vaddr); 1851da177e4SLinus Torvalds pte = pte_offset_kernel(pmd, vaddr); 1861da177e4SLinus Torvalds pkmap_page_table = pte; 1871da177e4SLinus Torvalds 1881da177e4SLinus Torvalds kmap_init(); 1891da177e4SLinus Torvalds } 1901da177e4SLinus Torvalds #endif /* CONFIG_HIGHMEM */ 1911da177e4SLinus Torvalds 1921da177e4SLinus Torvalds static void __init fixaddr_user_init( void) 1931da177e4SLinus Torvalds { 1949a0b3869Sviro@ZenIV.linux.org.uk #ifdef CONFIG_ARCH_REUSE_HOST_VSYSCALL_AREA 1951da177e4SLinus Torvalds long size = FIXADDR_USER_END - FIXADDR_USER_START; 1961da177e4SLinus Torvalds pgd_t *pgd; 1971da177e4SLinus Torvalds pud_t *pud; 1981da177e4SLinus Torvalds pmd_t *pmd; 1991da177e4SLinus Torvalds pte_t *pte; 2001da177e4SLinus Torvalds unsigned long paddr, vaddr = FIXADDR_USER_START; 2011da177e4SLinus Torvalds 2021da177e4SLinus Torvalds if ( ! size ) 2031da177e4SLinus Torvalds return; 2041da177e4SLinus Torvalds 2051da177e4SLinus Torvalds fixrange_init( FIXADDR_USER_START, FIXADDR_USER_END, swapper_pg_dir); 2061da177e4SLinus Torvalds paddr = (unsigned long)alloc_bootmem_low_pages( size); 2071da177e4SLinus Torvalds memcpy( (void *)paddr, (void *)FIXADDR_USER_START, size); 2081da177e4SLinus Torvalds paddr = __pa(paddr); 2091da177e4SLinus Torvalds for ( ; size > 0; size-=PAGE_SIZE, vaddr+=PAGE_SIZE, paddr+=PAGE_SIZE){ 2101da177e4SLinus Torvalds pgd = swapper_pg_dir + pgd_index(vaddr); 2111da177e4SLinus Torvalds pud = pud_offset(pgd, vaddr); 2121da177e4SLinus Torvalds pmd = pmd_offset(pud, vaddr); 2131da177e4SLinus Torvalds pte = pte_offset_kernel(pmd, vaddr); 2141da177e4SLinus Torvalds pte_set_val( (*pte), paddr, PAGE_READONLY); 2151da177e4SLinus Torvalds } 2161da177e4SLinus Torvalds #endif 2171da177e4SLinus Torvalds } 2181da177e4SLinus Torvalds 21936e45463SJeff Dike void __init paging_init(void) 2201da177e4SLinus Torvalds { 2211da177e4SLinus Torvalds unsigned long zones_size[MAX_NR_ZONES], vaddr; 2221da177e4SLinus Torvalds int i; 2231da177e4SLinus Torvalds 2241da177e4SLinus Torvalds empty_zero_page = (unsigned long *) alloc_bootmem_low_pages(PAGE_SIZE); 2251da177e4SLinus Torvalds empty_bad_page = (unsigned long *) alloc_bootmem_low_pages(PAGE_SIZE); 22691b165c0SJeff Dike for(i = 0; i < ARRAY_SIZE(zones_size); i++) 2271da177e4SLinus Torvalds zones_size[i] = 0; 22891b165c0SJeff Dike 2290715501bSJeff Dike zones_size[ZONE_NORMAL] = (end_iomem >> PAGE_SHIFT) - 2300715501bSJeff Dike (uml_physmem >> PAGE_SHIFT); 231e53ef38dSChristoph Lameter #ifdef CONFIG_HIGHMEM 232353f8d1cSPaolo 'Blaisorblade' Giarrusso zones_size[ZONE_HIGHMEM] = highmem >> PAGE_SHIFT; 233e53ef38dSChristoph Lameter #endif 2341da177e4SLinus Torvalds free_area_init(zones_size); 2351da177e4SLinus Torvalds 2361da177e4SLinus Torvalds /* 2371da177e4SLinus Torvalds * Fixed mappings, only the page table structure has to be 2381da177e4SLinus Torvalds * created - mappings will be set by set_fixmap(): 2391da177e4SLinus Torvalds */ 2401da177e4SLinus Torvalds vaddr = __fix_to_virt(__end_of_fixed_addresses - 1) & PMD_MASK; 2411da177e4SLinus Torvalds fixrange_init(vaddr, FIXADDR_TOP, swapper_pg_dir); 2421da177e4SLinus Torvalds 2431da177e4SLinus Torvalds fixaddr_user_init(); 2441da177e4SLinus Torvalds 2451da177e4SLinus Torvalds #ifdef CONFIG_HIGHMEM 2461da177e4SLinus Torvalds init_highmem(); 2471da177e4SLinus Torvalds #endif 2481da177e4SLinus Torvalds } 2491da177e4SLinus Torvalds 25053f9fc93SAl Viro struct page *arch_validate(struct page *page, gfp_t mask, int order) 2511da177e4SLinus Torvalds { 2521da177e4SLinus Torvalds unsigned long addr, zero = 0; 2531da177e4SLinus Torvalds int i; 2541da177e4SLinus Torvalds 2551da177e4SLinus Torvalds again: 25660678bbcSJeff Dike if(page == NULL) 25760678bbcSJeff Dike return page; 25860678bbcSJeff Dike if(PageHighMem(page)) 25960678bbcSJeff Dike return page; 2601da177e4SLinus Torvalds 2611da177e4SLinus Torvalds addr = (unsigned long) page_address(page); 2621da177e4SLinus Torvalds for(i = 0; i < (1 << order); i++){ 2631da177e4SLinus Torvalds current->thread.fault_addr = (void *) addr; 2641da177e4SLinus Torvalds if(__do_copy_to_user((void __user *) addr, &zero, 2651da177e4SLinus Torvalds sizeof(zero), 2661da177e4SLinus Torvalds ¤t->thread.fault_addr, 2671da177e4SLinus Torvalds ¤t->thread.fault_catcher)){ 26860678bbcSJeff Dike if(!(mask & __GFP_WAIT)) 26960678bbcSJeff Dike return NULL; 2701da177e4SLinus Torvalds else break; 2711da177e4SLinus Torvalds } 2721da177e4SLinus Torvalds addr += PAGE_SIZE; 2731da177e4SLinus Torvalds } 2741da177e4SLinus Torvalds 27560678bbcSJeff Dike if(i == (1 << order)) 27660678bbcSJeff Dike return page; 2771da177e4SLinus Torvalds page = alloc_pages(mask, order); 2781da177e4SLinus Torvalds goto again; 2791da177e4SLinus Torvalds } 2801da177e4SLinus Torvalds 2811da177e4SLinus Torvalds /* This can't do anything because nothing in the kernel image can be freed 2821da177e4SLinus Torvalds * since it's not in kernel physical memory. 2831da177e4SLinus Torvalds */ 2841da177e4SLinus Torvalds 2851da177e4SLinus Torvalds void free_initmem(void) 2861da177e4SLinus Torvalds { 2871da177e4SLinus Torvalds } 2881da177e4SLinus Torvalds 2891da177e4SLinus Torvalds #ifdef CONFIG_BLK_DEV_INITRD 2901da177e4SLinus Torvalds void free_initrd_mem(unsigned long start, unsigned long end) 2911da177e4SLinus Torvalds { 2921da177e4SLinus Torvalds if (start < end) 2931da177e4SLinus Torvalds printk ("Freeing initrd memory: %ldk freed\n", 2941da177e4SLinus Torvalds (end - start) >> 10); 2951da177e4SLinus Torvalds for (; start < end; start += PAGE_SIZE) { 2961da177e4SLinus Torvalds ClearPageReserved(virt_to_page(start)); 2977835e98bSNick Piggin init_page_count(virt_to_page(start)); 2981da177e4SLinus Torvalds free_page(start); 2991da177e4SLinus Torvalds totalram_pages++; 3001da177e4SLinus Torvalds } 3011da177e4SLinus Torvalds } 3021da177e4SLinus Torvalds #endif 3031da177e4SLinus Torvalds 3041da177e4SLinus Torvalds void show_mem(void) 3051da177e4SLinus Torvalds { 3061da177e4SLinus Torvalds int pfn, total = 0, reserved = 0; 3071da177e4SLinus Torvalds int shared = 0, cached = 0; 3081da177e4SLinus Torvalds int highmem = 0; 3091da177e4SLinus Torvalds struct page *page; 3101da177e4SLinus Torvalds 3111da177e4SLinus Torvalds printk("Mem-info:\n"); 3121da177e4SLinus Torvalds show_free_areas(); 3131da177e4SLinus Torvalds printk("Free swap: %6ldkB\n", nr_swap_pages<<(PAGE_SHIFT-10)); 3141da177e4SLinus Torvalds pfn = max_mapnr; 3151da177e4SLinus Torvalds while(pfn-- > 0) { 3161da177e4SLinus Torvalds page = pfn_to_page(pfn); 3171da177e4SLinus Torvalds total++; 3181da177e4SLinus Torvalds if(PageHighMem(page)) 3191da177e4SLinus Torvalds highmem++; 3201da177e4SLinus Torvalds if(PageReserved(page)) 3211da177e4SLinus Torvalds reserved++; 3221da177e4SLinus Torvalds else if(PageSwapCache(page)) 3231da177e4SLinus Torvalds cached++; 3241da177e4SLinus Torvalds else if(page_count(page)) 3251da177e4SLinus Torvalds shared += page_count(page) - 1; 3261da177e4SLinus Torvalds } 3271da177e4SLinus Torvalds printk("%d pages of RAM\n", total); 3281da177e4SLinus Torvalds printk("%d pages of HIGHMEM\n", highmem); 3291da177e4SLinus Torvalds printk("%d reserved pages\n", reserved); 3301da177e4SLinus Torvalds printk("%d pages shared\n", shared); 3311da177e4SLinus Torvalds printk("%d pages swap cached\n", cached); 3321da177e4SLinus Torvalds } 3331da177e4SLinus Torvalds 3341da177e4SLinus Torvalds /* 3351da177e4SLinus Torvalds * Allocate and free page tables. 3361da177e4SLinus Torvalds */ 3371da177e4SLinus Torvalds 3381da177e4SLinus Torvalds pgd_t *pgd_alloc(struct mm_struct *mm) 3391da177e4SLinus Torvalds { 3401da177e4SLinus Torvalds pgd_t *pgd = (pgd_t *)__get_free_page(GFP_KERNEL); 3411da177e4SLinus Torvalds 3421da177e4SLinus Torvalds if (pgd) { 3431da177e4SLinus Torvalds memset(pgd, 0, USER_PTRS_PER_PGD * sizeof(pgd_t)); 3441da177e4SLinus Torvalds memcpy(pgd + USER_PTRS_PER_PGD, 3451da177e4SLinus Torvalds swapper_pg_dir + USER_PTRS_PER_PGD, 3461da177e4SLinus Torvalds (PTRS_PER_PGD - USER_PTRS_PER_PGD) * sizeof(pgd_t)); 3471da177e4SLinus Torvalds } 3481da177e4SLinus Torvalds return pgd; 3491da177e4SLinus Torvalds } 3501da177e4SLinus Torvalds 351*5e541973SBenjamin Herrenschmidt void pgd_free(struct mm_struct *mm, pgd_t *pgd) 3521da177e4SLinus Torvalds { 3531da177e4SLinus Torvalds free_page((unsigned long) pgd); 3541da177e4SLinus Torvalds } 3551da177e4SLinus Torvalds 3561da177e4SLinus Torvalds pte_t *pte_alloc_one_kernel(struct mm_struct *mm, unsigned long address) 3571da177e4SLinus Torvalds { 3581da177e4SLinus Torvalds pte_t *pte; 3591da177e4SLinus Torvalds 3601da177e4SLinus Torvalds pte = (pte_t *)__get_free_page(GFP_KERNEL|__GFP_REPEAT|__GFP_ZERO); 3611da177e4SLinus Torvalds return pte; 3621da177e4SLinus Torvalds } 3631da177e4SLinus Torvalds 3641da177e4SLinus Torvalds struct page *pte_alloc_one(struct mm_struct *mm, unsigned long address) 3651da177e4SLinus Torvalds { 3661da177e4SLinus Torvalds struct page *pte; 3671da177e4SLinus Torvalds 3681da177e4SLinus Torvalds pte = alloc_page(GFP_KERNEL|__GFP_REPEAT|__GFP_ZERO); 3691da177e4SLinus Torvalds return pte; 3701da177e4SLinus Torvalds } 371