11da177e4SLinus Torvalds /* 2009ec2a9SJeff Dike * Copyright (C) 2000 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com) 31da177e4SLinus Torvalds * Licensed under the GPL 41da177e4SLinus Torvalds */ 51da177e4SLinus Torvalds 6009ec2a9SJeff Dike #include <linux/stddef.h> 7*73395a00SAl Viro #include <linux/module.h> 8009ec2a9SJeff Dike #include <linux/bootmem.h> 9009ec2a9SJeff Dike #include <linux/highmem.h> 10009ec2a9SJeff Dike #include <linux/mm.h> 11009ec2a9SJeff Dike #include <linux/swap.h> 125a0e3ad6STejun Heo #include <linux/slab.h> 13009ec2a9SJeff Dike #include <asm/fixmap.h> 14009ec2a9SJeff Dike #include <asm/page.h> 154ff83ce1SJeff Dike #include "as-layout.h" 16114069f7SJeff Dike #include "init.h" 17009ec2a9SJeff Dike #include "kern.h" 18009ec2a9SJeff Dike #include "kern_util.h" 19009ec2a9SJeff Dike #include "mem_user.h" 20009ec2a9SJeff Dike #include "os.h" 211da177e4SLinus Torvalds 226bf79482SJeff Dike /* allocated in paging_init, zeroed in mem_init, and unchanged thereafter */ 231da177e4SLinus Torvalds unsigned long *empty_zero_page = NULL; 24*73395a00SAl Viro EXPORT_SYMBOL(empty_zero_page); 256bf79482SJeff Dike /* allocated in paging_init and unchanged thereafter */ 264a567582SWANG Cong static unsigned long *empty_bad_page = NULL; 2780e39311SJeff Dike 2880e39311SJeff Dike /* 2980e39311SJeff Dike * Initialized during boot, and readonly for initializing page tables 3080e39311SJeff Dike * afterwards 3180e39311SJeff Dike */ 321da177e4SLinus Torvalds pgd_t swapper_pg_dir[PTRS_PER_PGD]; 3380e39311SJeff Dike 3480e39311SJeff Dike /* Initialized at boot time, and readonly after that */ 359902abd7SJeff Dike unsigned long long highmem; 361da177e4SLinus Torvalds int kmalloc_ok = 0; 371da177e4SLinus Torvalds 3880e39311SJeff Dike /* Used during early boot */ 391da177e4SLinus Torvalds static unsigned long brk_end; 401da177e4SLinus Torvalds 411da177e4SLinus Torvalds #ifdef CONFIG_HIGHMEM 421da177e4SLinus Torvalds static void setup_highmem(unsigned long highmem_start, 431da177e4SLinus Torvalds unsigned long highmem_len) 441da177e4SLinus Torvalds { 451da177e4SLinus Torvalds struct page *page; 461da177e4SLinus Torvalds unsigned long highmem_pfn; 471da177e4SLinus Torvalds int i; 481da177e4SLinus Torvalds 491da177e4SLinus Torvalds highmem_pfn = __pa(highmem_start) >> PAGE_SHIFT; 501da177e4SLinus Torvalds for (i = 0; i < highmem_len >> PAGE_SHIFT; i++) { 511da177e4SLinus Torvalds page = &mem_map[highmem_pfn + i]; 521da177e4SLinus Torvalds ClearPageReserved(page); 537835e98bSNick Piggin init_page_count(page); 541da177e4SLinus Torvalds __free_page(page); 551da177e4SLinus Torvalds } 561da177e4SLinus Torvalds } 571da177e4SLinus Torvalds #endif 581da177e4SLinus Torvalds 5997a1fcbbSJeff Dike void __init mem_init(void) 601da177e4SLinus Torvalds { 611da177e4SLinus Torvalds /* clear the zero-page */ 62c0a9290eSWANG Cong memset(empty_zero_page, 0, PAGE_SIZE); 631da177e4SLinus Torvalds 641da177e4SLinus Torvalds /* Map in the area just after the brk now that kmalloc is about 651da177e4SLinus Torvalds * to be turned on. 661da177e4SLinus Torvalds */ 671da177e4SLinus Torvalds brk_end = (unsigned long) UML_ROUND_UP(sbrk(0)); 68ab26a527SJeff Dike map_memory(brk_end, __pa(brk_end), uml_reserved - brk_end, 1, 1, 0); 691da177e4SLinus Torvalds free_bootmem(__pa(brk_end), uml_reserved - brk_end); 701da177e4SLinus Torvalds uml_reserved = brk_end; 711da177e4SLinus Torvalds 721da177e4SLinus Torvalds /* this will put all low memory onto the freelists */ 731da177e4SLinus Torvalds totalram_pages = free_all_bootmem(); 74af84eab2SJason Lunz max_low_pfn = totalram_pages; 75c1f60a5aSChristoph Lameter #ifdef CONFIG_HIGHMEM 761da177e4SLinus Torvalds totalhigh_pages = highmem >> PAGE_SHIFT; 771da177e4SLinus Torvalds totalram_pages += totalhigh_pages; 78c1f60a5aSChristoph Lameter #endif 791da177e4SLinus Torvalds num_physpages = totalram_pages; 801da177e4SLinus Torvalds max_pfn = totalram_pages; 811da177e4SLinus Torvalds printk(KERN_INFO "Memory: %luk available\n", 82cc013a88SGeert Uytterhoeven nr_free_pages() << (PAGE_SHIFT-10)); 831da177e4SLinus Torvalds kmalloc_ok = 1; 841da177e4SLinus Torvalds 851da177e4SLinus Torvalds #ifdef CONFIG_HIGHMEM 861da177e4SLinus Torvalds setup_highmem(end_iomem, highmem); 871da177e4SLinus Torvalds #endif 881da177e4SLinus Torvalds } 891da177e4SLinus Torvalds 9012f49643SJeff Dike /* 9112f49643SJeff Dike * Create a page table and place a pointer to it in a middle page 9212f49643SJeff Dike * directory entry. 9312f49643SJeff Dike */ 9412f49643SJeff Dike static void __init one_page_table_init(pmd_t *pmd) 9512f49643SJeff Dike { 9612f49643SJeff Dike if (pmd_none(*pmd)) { 9712f49643SJeff Dike pte_t *pte = (pte_t *) alloc_bootmem_low_pages(PAGE_SIZE); 9812f49643SJeff Dike set_pmd(pmd, __pmd(_KERNPG_TABLE + 9912f49643SJeff Dike (unsigned long) __pa(pte))); 10012f49643SJeff Dike if (pte != pte_offset_kernel(pmd, 0)) 10112f49643SJeff Dike BUG(); 10212f49643SJeff Dike } 10312f49643SJeff Dike } 10412f49643SJeff Dike 10512f49643SJeff Dike static void __init one_md_table_init(pud_t *pud) 10612f49643SJeff Dike { 10712f49643SJeff Dike #ifdef CONFIG_3_LEVEL_PGTABLES 10812f49643SJeff Dike pmd_t *pmd_table = (pmd_t *) alloc_bootmem_low_pages(PAGE_SIZE); 10912f49643SJeff Dike set_pud(pud, __pud(_KERNPG_TABLE + (unsigned long) __pa(pmd_table))); 11012f49643SJeff Dike if (pmd_table != pmd_offset(pud, 0)) 11112f49643SJeff Dike BUG(); 11212f49643SJeff Dike #endif 11312f49643SJeff Dike } 11412f49643SJeff Dike 1151da177e4SLinus Torvalds static void __init fixrange_init(unsigned long start, unsigned long end, 1161da177e4SLinus Torvalds pgd_t *pgd_base) 1171da177e4SLinus Torvalds { 1181da177e4SLinus Torvalds pgd_t *pgd; 11912f49643SJeff Dike pud_t *pud; 1201da177e4SLinus Torvalds pmd_t *pmd; 1211da177e4SLinus Torvalds int i, j; 1221da177e4SLinus Torvalds unsigned long vaddr; 1231da177e4SLinus Torvalds 1241da177e4SLinus Torvalds vaddr = start; 1251da177e4SLinus Torvalds i = pgd_index(vaddr); 1261da177e4SLinus Torvalds j = pmd_index(vaddr); 1271da177e4SLinus Torvalds pgd = pgd_base + i; 1281da177e4SLinus Torvalds 1291da177e4SLinus Torvalds for ( ; (i < PTRS_PER_PGD) && (vaddr < end); pgd++, i++) { 13012f49643SJeff Dike pud = pud_offset(pgd, vaddr); 13112f49643SJeff Dike if (pud_none(*pud)) 13212f49643SJeff Dike one_md_table_init(pud); 13312f49643SJeff Dike pmd = pmd_offset(pud, vaddr); 134655e4ed0SJeff Dike for (; (j < PTRS_PER_PMD) && (vaddr < end); pmd++, j++) { 13512f49643SJeff Dike one_page_table_init(pmd); 1361da177e4SLinus Torvalds vaddr += PMD_SIZE; 1371da177e4SLinus Torvalds } 1381da177e4SLinus Torvalds j = 0; 1391da177e4SLinus Torvalds } 1401da177e4SLinus Torvalds } 1411da177e4SLinus Torvalds 1421da177e4SLinus Torvalds #ifdef CONFIG_HIGHMEM 1431da177e4SLinus Torvalds pte_t *kmap_pte; 1441da177e4SLinus Torvalds pgprot_t kmap_prot; 1451da177e4SLinus Torvalds 1461da177e4SLinus Torvalds #define kmap_get_fixmap_pte(vaddr) \ 1471da177e4SLinus Torvalds pte_offset_kernel(pmd_offset(pud_offset(pgd_offset_k(vaddr), (vaddr)),\ 1481da177e4SLinus Torvalds (vaddr)), (vaddr)) 1491da177e4SLinus Torvalds 1501da177e4SLinus Torvalds static void __init kmap_init(void) 1511da177e4SLinus Torvalds { 1521da177e4SLinus Torvalds unsigned long kmap_vstart; 1531da177e4SLinus Torvalds 1541da177e4SLinus Torvalds /* cache the first kmap pte */ 1551da177e4SLinus Torvalds kmap_vstart = __fix_to_virt(FIX_KMAP_BEGIN); 1561da177e4SLinus Torvalds kmap_pte = kmap_get_fixmap_pte(kmap_vstart); 1571da177e4SLinus Torvalds 1581da177e4SLinus Torvalds kmap_prot = PAGE_KERNEL; 1591da177e4SLinus Torvalds } 1601da177e4SLinus Torvalds 161b4a08a10SAl Viro static void __init init_highmem(void) 1621da177e4SLinus Torvalds { 1631da177e4SLinus Torvalds pgd_t *pgd; 1641da177e4SLinus Torvalds pud_t *pud; 1651da177e4SLinus Torvalds pmd_t *pmd; 1661da177e4SLinus Torvalds pte_t *pte; 1671da177e4SLinus Torvalds unsigned long vaddr; 1681da177e4SLinus Torvalds 1691da177e4SLinus Torvalds /* 1701da177e4SLinus Torvalds * Permanent kmaps: 1711da177e4SLinus Torvalds */ 1721da177e4SLinus Torvalds vaddr = PKMAP_BASE; 1731da177e4SLinus Torvalds fixrange_init(vaddr, vaddr + PAGE_SIZE*LAST_PKMAP, swapper_pg_dir); 1741da177e4SLinus Torvalds 1751da177e4SLinus Torvalds pgd = swapper_pg_dir + pgd_index(vaddr); 1761da177e4SLinus Torvalds pud = pud_offset(pgd, vaddr); 1771da177e4SLinus Torvalds pmd = pmd_offset(pud, vaddr); 1781da177e4SLinus Torvalds pte = pte_offset_kernel(pmd, vaddr); 1791da177e4SLinus Torvalds pkmap_page_table = pte; 1801da177e4SLinus Torvalds 1811da177e4SLinus Torvalds kmap_init(); 1821da177e4SLinus Torvalds } 1831da177e4SLinus Torvalds #endif /* CONFIG_HIGHMEM */ 1841da177e4SLinus Torvalds 1851da177e4SLinus Torvalds static void __init fixaddr_user_init( void) 1861da177e4SLinus Torvalds { 1879a0b3869Sviro@ZenIV.linux.org.uk #ifdef CONFIG_ARCH_REUSE_HOST_VSYSCALL_AREA 1881da177e4SLinus Torvalds long size = FIXADDR_USER_END - FIXADDR_USER_START; 1891da177e4SLinus Torvalds pgd_t *pgd; 1901da177e4SLinus Torvalds pud_t *pud; 1911da177e4SLinus Torvalds pmd_t *pmd; 1921da177e4SLinus Torvalds pte_t *pte; 193655e4ed0SJeff Dike phys_t p; 194655e4ed0SJeff Dike unsigned long v, vaddr = FIXADDR_USER_START; 1951da177e4SLinus Torvalds 1961da177e4SLinus Torvalds if (!size) 1971da177e4SLinus Torvalds return; 1981da177e4SLinus Torvalds 1991da177e4SLinus Torvalds fixrange_init( FIXADDR_USER_START, FIXADDR_USER_END, swapper_pg_dir); 200655e4ed0SJeff Dike v = (unsigned long) alloc_bootmem_low_pages(size); 201655e4ed0SJeff Dike memcpy((void *) v , (void *) FIXADDR_USER_START, size); 202655e4ed0SJeff Dike p = __pa(v); 203009ec2a9SJeff Dike for ( ; size > 0; size -= PAGE_SIZE, vaddr += PAGE_SIZE, 204655e4ed0SJeff Dike p += PAGE_SIZE) { 2051da177e4SLinus Torvalds pgd = swapper_pg_dir + pgd_index(vaddr); 2061da177e4SLinus Torvalds pud = pud_offset(pgd, vaddr); 2071da177e4SLinus Torvalds pmd = pmd_offset(pud, vaddr); 2081da177e4SLinus Torvalds pte = pte_offset_kernel(pmd, vaddr); 209655e4ed0SJeff Dike pte_set_val(*pte, p, PAGE_READONLY); 2101da177e4SLinus Torvalds } 2111da177e4SLinus Torvalds #endif 2121da177e4SLinus Torvalds } 2131da177e4SLinus Torvalds 21436e45463SJeff Dike void __init paging_init(void) 2151da177e4SLinus Torvalds { 2161da177e4SLinus Torvalds unsigned long zones_size[MAX_NR_ZONES], vaddr; 2171da177e4SLinus Torvalds int i; 2181da177e4SLinus Torvalds 2191da177e4SLinus Torvalds empty_zero_page = (unsigned long *) alloc_bootmem_low_pages(PAGE_SIZE); 2201da177e4SLinus Torvalds empty_bad_page = (unsigned long *) alloc_bootmem_low_pages(PAGE_SIZE); 22191b165c0SJeff Dike for (i = 0; i < ARRAY_SIZE(zones_size); i++) 2221da177e4SLinus Torvalds zones_size[i] = 0; 22391b165c0SJeff Dike 2240715501bSJeff Dike zones_size[ZONE_NORMAL] = (end_iomem >> PAGE_SHIFT) - 2250715501bSJeff Dike (uml_physmem >> PAGE_SHIFT); 226e53ef38dSChristoph Lameter #ifdef CONFIG_HIGHMEM 227353f8d1cSPaolo 'Blaisorblade' Giarrusso zones_size[ZONE_HIGHMEM] = highmem >> PAGE_SHIFT; 228e53ef38dSChristoph Lameter #endif 2291da177e4SLinus Torvalds free_area_init(zones_size); 2301da177e4SLinus Torvalds 2311da177e4SLinus Torvalds /* 2321da177e4SLinus Torvalds * Fixed mappings, only the page table structure has to be 2331da177e4SLinus Torvalds * created - mappings will be set by set_fixmap(): 2341da177e4SLinus Torvalds */ 2351da177e4SLinus Torvalds vaddr = __fix_to_virt(__end_of_fixed_addresses - 1) & PMD_MASK; 2361da177e4SLinus Torvalds fixrange_init(vaddr, FIXADDR_TOP, swapper_pg_dir); 2371da177e4SLinus Torvalds 2381da177e4SLinus Torvalds fixaddr_user_init(); 2391da177e4SLinus Torvalds 2401da177e4SLinus Torvalds #ifdef CONFIG_HIGHMEM 2411da177e4SLinus Torvalds init_highmem(); 2421da177e4SLinus Torvalds #endif 2431da177e4SLinus Torvalds } 2441da177e4SLinus Torvalds 2458192ab42SJeff Dike /* 2468192ab42SJeff Dike * This can't do anything because nothing in the kernel image can be freed 2471da177e4SLinus Torvalds * since it's not in kernel physical memory. 2481da177e4SLinus Torvalds */ 2491da177e4SLinus Torvalds 2501da177e4SLinus Torvalds void free_initmem(void) 2511da177e4SLinus Torvalds { 2521da177e4SLinus Torvalds } 2531da177e4SLinus Torvalds 2541da177e4SLinus Torvalds #ifdef CONFIG_BLK_DEV_INITRD 2551da177e4SLinus Torvalds void free_initrd_mem(unsigned long start, unsigned long end) 2561da177e4SLinus Torvalds { 2571da177e4SLinus Torvalds if (start < end) 258009ec2a9SJeff Dike printk(KERN_INFO "Freeing initrd memory: %ldk freed\n", 2591da177e4SLinus Torvalds (end - start) >> 10); 2601da177e4SLinus Torvalds for (; start < end; start += PAGE_SIZE) { 2611da177e4SLinus Torvalds ClearPageReserved(virt_to_page(start)); 2627835e98bSNick Piggin init_page_count(virt_to_page(start)); 2631da177e4SLinus Torvalds free_page(start); 2641da177e4SLinus Torvalds totalram_pages++; 2651da177e4SLinus Torvalds } 2661da177e4SLinus Torvalds } 2671da177e4SLinus Torvalds #endif 2681da177e4SLinus Torvalds 2698192ab42SJeff Dike /* Allocate and free page tables. */ 2701da177e4SLinus Torvalds 2711da177e4SLinus Torvalds pgd_t *pgd_alloc(struct mm_struct *mm) 2721da177e4SLinus Torvalds { 2731da177e4SLinus Torvalds pgd_t *pgd = (pgd_t *)__get_free_page(GFP_KERNEL); 2741da177e4SLinus Torvalds 2751da177e4SLinus Torvalds if (pgd) { 2761da177e4SLinus Torvalds memset(pgd, 0, USER_PTRS_PER_PGD * sizeof(pgd_t)); 2771da177e4SLinus Torvalds memcpy(pgd + USER_PTRS_PER_PGD, 2781da177e4SLinus Torvalds swapper_pg_dir + USER_PTRS_PER_PGD, 2791da177e4SLinus Torvalds (PTRS_PER_PGD - USER_PTRS_PER_PGD) * sizeof(pgd_t)); 2801da177e4SLinus Torvalds } 2811da177e4SLinus Torvalds return pgd; 2821da177e4SLinus Torvalds } 2831da177e4SLinus Torvalds 2845e541973SBenjamin Herrenschmidt void pgd_free(struct mm_struct *mm, pgd_t *pgd) 2851da177e4SLinus Torvalds { 2861da177e4SLinus Torvalds free_page((unsigned long) pgd); 2871da177e4SLinus Torvalds } 2881da177e4SLinus Torvalds 2891da177e4SLinus Torvalds pte_t *pte_alloc_one_kernel(struct mm_struct *mm, unsigned long address) 2901da177e4SLinus Torvalds { 2911da177e4SLinus Torvalds pte_t *pte; 2921da177e4SLinus Torvalds 2931da177e4SLinus Torvalds pte = (pte_t *)__get_free_page(GFP_KERNEL|__GFP_REPEAT|__GFP_ZERO); 2941da177e4SLinus Torvalds return pte; 2951da177e4SLinus Torvalds } 2961da177e4SLinus Torvalds 2972f569afdSMartin Schwidefsky pgtable_t pte_alloc_one(struct mm_struct *mm, unsigned long address) 2981da177e4SLinus Torvalds { 2991da177e4SLinus Torvalds struct page *pte; 3001da177e4SLinus Torvalds 3011da177e4SLinus Torvalds pte = alloc_page(GFP_KERNEL|__GFP_REPEAT|__GFP_ZERO); 3022f569afdSMartin Schwidefsky if (pte) 3032f569afdSMartin Schwidefsky pgtable_page_ctor(pte); 3041da177e4SLinus Torvalds return pte; 3051da177e4SLinus Torvalds } 3068192ab42SJeff Dike 3078192ab42SJeff Dike #ifdef CONFIG_3_LEVEL_PGTABLES 3088192ab42SJeff Dike pmd_t *pmd_alloc_one(struct mm_struct *mm, unsigned long address) 3098192ab42SJeff Dike { 3108192ab42SJeff Dike pmd_t *pmd = (pmd_t *) __get_free_page(GFP_KERNEL); 3118192ab42SJeff Dike 3128192ab42SJeff Dike if (pmd) 3138192ab42SJeff Dike memset(pmd, 0, PAGE_SIZE); 3148192ab42SJeff Dike 3158192ab42SJeff Dike return pmd; 3168192ab42SJeff Dike } 3178192ab42SJeff Dike #endif 31843f5b308SJeff Dike 31943f5b308SJeff Dike void *uml_kmalloc(int size, int flags) 32043f5b308SJeff Dike { 32143f5b308SJeff Dike return kmalloc(size, flags); 32243f5b308SJeff Dike } 323