11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * linux/arch/arm/mm/init.c 31da177e4SLinus Torvalds * 490072059SRussell King * Copyright (C) 1995-2005 Russell King 51da177e4SLinus Torvalds * 61da177e4SLinus Torvalds * This program is free software; you can redistribute it and/or modify 71da177e4SLinus Torvalds * it under the terms of the GNU General Public License version 2 as 81da177e4SLinus Torvalds * published by the Free Software Foundation. 91da177e4SLinus Torvalds */ 101da177e4SLinus Torvalds #include <linux/config.h> 111da177e4SLinus Torvalds #include <linux/kernel.h> 121da177e4SLinus Torvalds #include <linux/errno.h> 131da177e4SLinus Torvalds #include <linux/ptrace.h> 141da177e4SLinus Torvalds #include <linux/swap.h> 151da177e4SLinus Torvalds #include <linux/init.h> 161da177e4SLinus Torvalds #include <linux/bootmem.h> 171da177e4SLinus Torvalds #include <linux/mman.h> 181da177e4SLinus Torvalds #include <linux/nodemask.h> 191da177e4SLinus Torvalds #include <linux/initrd.h> 201da177e4SLinus Torvalds 211da177e4SLinus Torvalds #include <asm/mach-types.h> 221da177e4SLinus Torvalds #include <asm/hardware.h> 231da177e4SLinus Torvalds #include <asm/setup.h> 241da177e4SLinus Torvalds #include <asm/tlb.h> 251da177e4SLinus Torvalds 261da177e4SLinus Torvalds #include <asm/mach/arch.h> 271da177e4SLinus Torvalds #include <asm/mach/map.h> 281da177e4SLinus Torvalds 291da177e4SLinus Torvalds #define TABLE_SIZE (2 * PTRS_PER_PTE * sizeof(pte_t)) 301da177e4SLinus Torvalds 311da177e4SLinus Torvalds DEFINE_PER_CPU(struct mmu_gather, mmu_gathers); 321da177e4SLinus Torvalds 331da177e4SLinus Torvalds extern pgd_t swapper_pg_dir[PTRS_PER_PGD]; 341da177e4SLinus Torvalds extern void _stext, _text, _etext, __data_start, _end, __init_begin, __init_end; 351da177e4SLinus Torvalds extern unsigned long phys_initrd_start; 361da177e4SLinus Torvalds extern unsigned long phys_initrd_size; 371da177e4SLinus Torvalds 381da177e4SLinus Torvalds /* 391da177e4SLinus Torvalds * The sole use of this is to pass memory configuration 401da177e4SLinus Torvalds * data from paging_init to mem_init. 411da177e4SLinus Torvalds */ 421da177e4SLinus Torvalds static struct meminfo meminfo __initdata = { 0, }; 431da177e4SLinus Torvalds 441da177e4SLinus Torvalds /* 451da177e4SLinus Torvalds * empty_zero_page is a special page that is used for 461da177e4SLinus Torvalds * zero-initialized data and COW. 471da177e4SLinus Torvalds */ 481da177e4SLinus Torvalds struct page *empty_zero_page; 491da177e4SLinus Torvalds 501da177e4SLinus Torvalds void show_mem(void) 511da177e4SLinus Torvalds { 521da177e4SLinus Torvalds int free = 0, total = 0, reserved = 0; 531da177e4SLinus Torvalds int shared = 0, cached = 0, slab = 0, node; 541da177e4SLinus Torvalds 551da177e4SLinus Torvalds printk("Mem-info:\n"); 561da177e4SLinus Torvalds show_free_areas(); 571da177e4SLinus Torvalds printk("Free swap: %6ldkB\n", nr_swap_pages<<(PAGE_SHIFT-10)); 581da177e4SLinus Torvalds 591da177e4SLinus Torvalds for_each_online_node(node) { 601da177e4SLinus Torvalds struct page *page, *end; 611da177e4SLinus Torvalds 621da177e4SLinus Torvalds page = NODE_MEM_MAP(node); 631da177e4SLinus Torvalds end = page + NODE_DATA(node)->node_spanned_pages; 641da177e4SLinus Torvalds 651da177e4SLinus Torvalds do { 661da177e4SLinus Torvalds total++; 671da177e4SLinus Torvalds if (PageReserved(page)) 681da177e4SLinus Torvalds reserved++; 691da177e4SLinus Torvalds else if (PageSwapCache(page)) 701da177e4SLinus Torvalds cached++; 711da177e4SLinus Torvalds else if (PageSlab(page)) 721da177e4SLinus Torvalds slab++; 731da177e4SLinus Torvalds else if (!page_count(page)) 741da177e4SLinus Torvalds free++; 751da177e4SLinus Torvalds else 761da177e4SLinus Torvalds shared += page_count(page) - 1; 771da177e4SLinus Torvalds page++; 781da177e4SLinus Torvalds } while (page < end); 791da177e4SLinus Torvalds } 801da177e4SLinus Torvalds 811da177e4SLinus Torvalds printk("%d pages of RAM\n", total); 821da177e4SLinus Torvalds printk("%d free pages\n", free); 831da177e4SLinus Torvalds printk("%d reserved pages\n", reserved); 841da177e4SLinus Torvalds printk("%d slab pages\n", slab); 851da177e4SLinus Torvalds printk("%d pages shared\n", shared); 861da177e4SLinus Torvalds printk("%d pages swap cached\n", cached); 871da177e4SLinus Torvalds } 881da177e4SLinus Torvalds 8990072059SRussell King static inline pmd_t *pmd_off(pgd_t *pgd, unsigned long virt) 9090072059SRussell King { 9190072059SRussell King return pmd_offset(pgd, virt); 9290072059SRussell King } 931da177e4SLinus Torvalds 9490072059SRussell King static inline pmd_t *pmd_off_k(unsigned long virt) 9590072059SRussell King { 9690072059SRussell King return pmd_off(pgd_offset_k(virt), virt); 9790072059SRussell King } 9890072059SRussell King 9990072059SRussell King #define for_each_nodebank(iter,mi,no) \ 10090072059SRussell King for (iter = 0; iter < mi->nr_banks; iter++) \ 10190072059SRussell King if (mi->bank[iter].node == no) 1021da177e4SLinus Torvalds 1031da177e4SLinus Torvalds /* 1041da177e4SLinus Torvalds * FIXME: We really want to avoid allocating the bootmap bitmap 1051da177e4SLinus Torvalds * over the top of the initrd. Hopefully, this is located towards 1061da177e4SLinus Torvalds * the start of a bank, so if we allocate the bootmap bitmap at 1071da177e4SLinus Torvalds * the end, we won't clash. 1081da177e4SLinus Torvalds */ 1091da177e4SLinus Torvalds static unsigned int __init 1101da177e4SLinus Torvalds find_bootmap_pfn(int node, struct meminfo *mi, unsigned int bootmap_pages) 1111da177e4SLinus Torvalds { 1121da177e4SLinus Torvalds unsigned int start_pfn, bank, bootmap_pfn; 1131da177e4SLinus Torvalds 11490072059SRussell King start_pfn = PAGE_ALIGN(__pa(&_end)) >> PAGE_SHIFT; 1151da177e4SLinus Torvalds bootmap_pfn = 0; 1161da177e4SLinus Torvalds 11790072059SRussell King for_each_nodebank(bank, mi, node) { 1181da177e4SLinus Torvalds unsigned int start, end; 1191da177e4SLinus Torvalds 12092a8cbedSRussell King start = mi->bank[bank].start >> PAGE_SHIFT; 12192a8cbedSRussell King end = (mi->bank[bank].size + 12292a8cbedSRussell King mi->bank[bank].start) >> PAGE_SHIFT; 1231da177e4SLinus Torvalds 1241da177e4SLinus Torvalds if (end < start_pfn) 1251da177e4SLinus Torvalds continue; 1261da177e4SLinus Torvalds 1271da177e4SLinus Torvalds if (start < start_pfn) 1281da177e4SLinus Torvalds start = start_pfn; 1291da177e4SLinus Torvalds 1301da177e4SLinus Torvalds if (end <= start) 1311da177e4SLinus Torvalds continue; 1321da177e4SLinus Torvalds 1331da177e4SLinus Torvalds if (end - start >= bootmap_pages) { 1341da177e4SLinus Torvalds bootmap_pfn = start; 1351da177e4SLinus Torvalds break; 1361da177e4SLinus Torvalds } 1371da177e4SLinus Torvalds } 1381da177e4SLinus Torvalds 1391da177e4SLinus Torvalds if (bootmap_pfn == 0) 1401da177e4SLinus Torvalds BUG(); 1411da177e4SLinus Torvalds 1421da177e4SLinus Torvalds return bootmap_pfn; 1431da177e4SLinus Torvalds } 1441da177e4SLinus Torvalds 1451da177e4SLinus Torvalds static int __init check_initrd(struct meminfo *mi) 1461da177e4SLinus Torvalds { 1471da177e4SLinus Torvalds int initrd_node = -2; 1481da177e4SLinus Torvalds #ifdef CONFIG_BLK_DEV_INITRD 1491da177e4SLinus Torvalds unsigned long end = phys_initrd_start + phys_initrd_size; 1501da177e4SLinus Torvalds 1511da177e4SLinus Torvalds /* 1521da177e4SLinus Torvalds * Make sure that the initrd is within a valid area of 1531da177e4SLinus Torvalds * memory. 1541da177e4SLinus Torvalds */ 1551da177e4SLinus Torvalds if (phys_initrd_size) { 1561da177e4SLinus Torvalds unsigned int i; 1571da177e4SLinus Torvalds 1581da177e4SLinus Torvalds initrd_node = -1; 1591da177e4SLinus Torvalds 1601da177e4SLinus Torvalds for (i = 0; i < mi->nr_banks; i++) { 1611da177e4SLinus Torvalds unsigned long bank_end; 1621da177e4SLinus Torvalds 1631da177e4SLinus Torvalds bank_end = mi->bank[i].start + mi->bank[i].size; 1641da177e4SLinus Torvalds 1651da177e4SLinus Torvalds if (mi->bank[i].start <= phys_initrd_start && 1661da177e4SLinus Torvalds end <= bank_end) 1671da177e4SLinus Torvalds initrd_node = mi->bank[i].node; 1681da177e4SLinus Torvalds } 1691da177e4SLinus Torvalds } 1701da177e4SLinus Torvalds 1711da177e4SLinus Torvalds if (initrd_node == -1) { 1721da177e4SLinus Torvalds printk(KERN_ERR "initrd (0x%08lx - 0x%08lx) extends beyond " 1731da177e4SLinus Torvalds "physical memory - disabling initrd\n", 1741da177e4SLinus Torvalds phys_initrd_start, end); 1751da177e4SLinus Torvalds phys_initrd_start = phys_initrd_size = 0; 1761da177e4SLinus Torvalds } 1771da177e4SLinus Torvalds #endif 1781da177e4SLinus Torvalds 1791da177e4SLinus Torvalds return initrd_node; 1801da177e4SLinus Torvalds } 1811da177e4SLinus Torvalds 1821da177e4SLinus Torvalds /* 1831da177e4SLinus Torvalds * Reserve the various regions of node 0 1841da177e4SLinus Torvalds */ 18590072059SRussell King static __init void reserve_node_zero(pg_data_t *pgdat) 1861da177e4SLinus Torvalds { 1871da177e4SLinus Torvalds unsigned long res_size = 0; 1881da177e4SLinus Torvalds 1891da177e4SLinus Torvalds /* 1901da177e4SLinus Torvalds * Register the kernel text and data with bootmem. 1911da177e4SLinus Torvalds * Note that this can only be in node 0. 1921da177e4SLinus Torvalds */ 1931da177e4SLinus Torvalds #ifdef CONFIG_XIP_KERNEL 1941da177e4SLinus Torvalds reserve_bootmem_node(pgdat, __pa(&__data_start), &_end - &__data_start); 1951da177e4SLinus Torvalds #else 1961da177e4SLinus Torvalds reserve_bootmem_node(pgdat, __pa(&_stext), &_end - &_stext); 1971da177e4SLinus Torvalds #endif 1981da177e4SLinus Torvalds 1991da177e4SLinus Torvalds /* 2001da177e4SLinus Torvalds * Reserve the page tables. These are already in use, 2011da177e4SLinus Torvalds * and can only be in node 0. 2021da177e4SLinus Torvalds */ 2031da177e4SLinus Torvalds reserve_bootmem_node(pgdat, __pa(swapper_pg_dir), 2041da177e4SLinus Torvalds PTRS_PER_PGD * sizeof(pgd_t)); 2051da177e4SLinus Torvalds 2061da177e4SLinus Torvalds /* 2071da177e4SLinus Torvalds * Hmm... This should go elsewhere, but we really really need to 2081da177e4SLinus Torvalds * stop things allocating the low memory; ideally we need a better 2091da177e4SLinus Torvalds * implementation of GFP_DMA which does not assume that DMA-able 2101da177e4SLinus Torvalds * memory starts at zero. 2111da177e4SLinus Torvalds */ 2121da177e4SLinus Torvalds if (machine_is_integrator() || machine_is_cintegrator()) 2131da177e4SLinus Torvalds res_size = __pa(swapper_pg_dir) - PHYS_OFFSET; 2141da177e4SLinus Torvalds 2151da177e4SLinus Torvalds /* 2161da177e4SLinus Torvalds * These should likewise go elsewhere. They pre-reserve the 2171da177e4SLinus Torvalds * screen memory region at the start of main system memory. 2181da177e4SLinus Torvalds */ 2191da177e4SLinus Torvalds if (machine_is_edb7211()) 2201da177e4SLinus Torvalds res_size = 0x00020000; 2211da177e4SLinus Torvalds if (machine_is_p720t()) 2221da177e4SLinus Torvalds res_size = 0x00014000; 2231da177e4SLinus Torvalds 2241da177e4SLinus Torvalds #ifdef CONFIG_SA1111 2251da177e4SLinus Torvalds /* 2261da177e4SLinus Torvalds * Because of the SA1111 DMA bug, we want to preserve our 2271da177e4SLinus Torvalds * precious DMA-able memory... 2281da177e4SLinus Torvalds */ 2291da177e4SLinus Torvalds res_size = __pa(swapper_pg_dir) - PHYS_OFFSET; 2301da177e4SLinus Torvalds #endif 2311da177e4SLinus Torvalds if (res_size) 2321da177e4SLinus Torvalds reserve_bootmem_node(pgdat, PHYS_OFFSET, res_size); 2331da177e4SLinus Torvalds } 2341da177e4SLinus Torvalds 23590072059SRussell King void __init build_mem_type_table(void); 23690072059SRussell King void __init create_mapping(struct map_desc *md); 23790072059SRussell King 23890072059SRussell King static unsigned long __init 23990072059SRussell King bootmem_init_node(int node, int initrd_node, struct meminfo *mi) 2401da177e4SLinus Torvalds { 24190072059SRussell King unsigned long zone_size[MAX_NR_ZONES], zhole_size[MAX_NR_ZONES]; 24290072059SRussell King unsigned long start_pfn, end_pfn, boot_pfn; 24390072059SRussell King unsigned int boot_pages; 24490072059SRussell King pg_data_t *pgdat; 24590072059SRussell King int i; 2461da177e4SLinus Torvalds 24790072059SRussell King start_pfn = -1UL; 24890072059SRussell King end_pfn = 0; 24990072059SRussell King 25090072059SRussell King /* 25190072059SRussell King * Calculate the pfn range, and map the memory banks for this node. 25290072059SRussell King */ 25390072059SRussell King for_each_nodebank(i, mi, node) { 25490072059SRussell King unsigned long start, end; 25590072059SRussell King struct map_desc map; 25690072059SRussell King 25790072059SRussell King start = mi->bank[i].start >> PAGE_SHIFT; 25890072059SRussell King end = (mi->bank[i].start + mi->bank[i].size) >> PAGE_SHIFT; 25990072059SRussell King 26090072059SRussell King if (start_pfn > start) 26190072059SRussell King start_pfn = start; 26290072059SRussell King if (end_pfn < end) 26390072059SRussell King end_pfn = end; 26490072059SRussell King 2659769c246SDeepak Saxena map.pfn = __phys_to_pfn(mi->bank[i].start); 2669769c246SDeepak Saxena map.virtual = __phys_to_virt(mi->bank[i].start); 26790072059SRussell King map.length = mi->bank[i].size; 26890072059SRussell King map.type = MT_MEMORY; 26990072059SRussell King 27090072059SRussell King create_mapping(&map); 2711da177e4SLinus Torvalds } 2721da177e4SLinus Torvalds 2731da177e4SLinus Torvalds /* 27490072059SRussell King * If there is no memory in this node, ignore it. 2751da177e4SLinus Torvalds */ 27690072059SRussell King if (end_pfn == 0) 27790072059SRussell King return end_pfn; 2781da177e4SLinus Torvalds 2791da177e4SLinus Torvalds /* 28090072059SRussell King * Allocate the bootmem bitmap page. 2811da177e4SLinus Torvalds */ 28290072059SRussell King boot_pages = bootmem_bootmap_pages(end_pfn - start_pfn); 28390072059SRussell King boot_pfn = find_bootmap_pfn(node, mi, boot_pages); 2841da177e4SLinus Torvalds 2851da177e4SLinus Torvalds /* 28690072059SRussell King * Initialise the bootmem allocator for this node, handing the 28790072059SRussell King * memory banks over to bootmem. 2881da177e4SLinus Torvalds */ 28990072059SRussell King node_set_online(node); 29090072059SRussell King pgdat = NODE_DATA(node); 29190072059SRussell King init_bootmem_node(pgdat, boot_pfn, start_pfn, end_pfn); 29290072059SRussell King 29390072059SRussell King for_each_nodebank(i, mi, node) 29490072059SRussell King free_bootmem_node(pgdat, mi->bank[i].start, mi->bank[i].size); 2951da177e4SLinus Torvalds 2961da177e4SLinus Torvalds /* 29790072059SRussell King * Reserve the bootmem bitmap for this node. 2981da177e4SLinus Torvalds */ 29990072059SRussell King reserve_bootmem_node(pgdat, boot_pfn << PAGE_SHIFT, 30090072059SRussell King boot_pages << PAGE_SHIFT); 3011da177e4SLinus Torvalds 3021da177e4SLinus Torvalds #ifdef CONFIG_BLK_DEV_INITRD 30390072059SRussell King /* 30490072059SRussell King * If the initrd is in this node, reserve its memory. 30590072059SRussell King */ 30690072059SRussell King if (node == initrd_node) { 30790072059SRussell King reserve_bootmem_node(pgdat, phys_initrd_start, 3081da177e4SLinus Torvalds phys_initrd_size); 3091da177e4SLinus Torvalds initrd_start = __phys_to_virt(phys_initrd_start); 3101da177e4SLinus Torvalds initrd_end = initrd_start + phys_initrd_size; 3111da177e4SLinus Torvalds } 3121da177e4SLinus Torvalds #endif 3131da177e4SLinus Torvalds 31490072059SRussell King /* 31590072059SRussell King * Finally, reserve any node zero regions. 31690072059SRussell King */ 31790072059SRussell King if (node == 0) 31890072059SRussell King reserve_node_zero(pgdat); 31990072059SRussell King 32090072059SRussell King /* 32190072059SRussell King * initialise the zones within this node. 32290072059SRussell King */ 32390072059SRussell King memset(zone_size, 0, sizeof(zone_size)); 32490072059SRussell King memset(zhole_size, 0, sizeof(zhole_size)); 32590072059SRussell King 32690072059SRussell King /* 32790072059SRussell King * The size of this node has already been determined. If we need 32890072059SRussell King * to do anything fancy with the allocation of this memory to the 32990072059SRussell King * zones, now is the time to do it. 33090072059SRussell King */ 33190072059SRussell King zone_size[0] = end_pfn - start_pfn; 33290072059SRussell King 33390072059SRussell King /* 33490072059SRussell King * For each bank in this node, calculate the size of the holes. 33590072059SRussell King * holes = node_size - sum(bank_sizes_in_node) 33690072059SRussell King */ 33790072059SRussell King zhole_size[0] = zone_size[0]; 33890072059SRussell King for_each_nodebank(i, mi, node) 33990072059SRussell King zhole_size[0] -= mi->bank[i].size >> PAGE_SHIFT; 34090072059SRussell King 34190072059SRussell King /* 34290072059SRussell King * Adjust the sizes according to any special requirements for 34390072059SRussell King * this machine type. 34490072059SRussell King */ 34590072059SRussell King arch_adjust_zones(node, zone_size, zhole_size); 34690072059SRussell King 34790072059SRussell King free_area_init_node(node, pgdat, zone_size, start_pfn, zhole_size); 34890072059SRussell King 34990072059SRussell King return end_pfn; 35090072059SRussell King } 35190072059SRussell King 35290072059SRussell King static void __init bootmem_init(struct meminfo *mi) 35390072059SRussell King { 35490072059SRussell King unsigned long addr, memend_pfn = 0; 35590072059SRussell King int node, initrd_node, i; 35690072059SRussell King 35790072059SRussell King /* 35890072059SRussell King * Invalidate the node number for empty or invalid memory banks 35990072059SRussell King */ 36090072059SRussell King for (i = 0; i < mi->nr_banks; i++) 36190072059SRussell King if (mi->bank[i].size == 0 || mi->bank[i].node >= MAX_NUMNODES) 36290072059SRussell King mi->bank[i].node = -1; 36390072059SRussell King 36490072059SRussell King memcpy(&meminfo, mi, sizeof(meminfo)); 36590072059SRussell King 36690072059SRussell King /* 36790072059SRussell King * Clear out all the mappings below the kernel image. 36890072059SRussell King */ 3691a47ebc0SNicolas Pitre for (addr = 0; addr < MODULE_START; addr += PGDIR_SIZE) 3701a47ebc0SNicolas Pitre pmd_clear(pmd_off_k(addr)); 3711a47ebc0SNicolas Pitre #ifdef CONFIG_XIP_KERNEL 3721a47ebc0SNicolas Pitre /* The XIP kernel is mapped in the module area -- skip over it */ 3731a47ebc0SNicolas Pitre addr = ((unsigned long)&_etext + PGDIR_SIZE - 1) & PGDIR_MASK; 3741a47ebc0SNicolas Pitre #endif 3751a47ebc0SNicolas Pitre for ( ; addr < PAGE_OFFSET; addr += PGDIR_SIZE) 37690072059SRussell King pmd_clear(pmd_off_k(addr)); 37790072059SRussell King 37890072059SRussell King /* 37990072059SRussell King * Clear out all the kernel space mappings, except for the first 38090072059SRussell King * memory bank, up to the end of the vmalloc region. 38190072059SRussell King */ 38290072059SRussell King for (addr = __phys_to_virt(mi->bank[0].start + mi->bank[0].size); 38390072059SRussell King addr < VMALLOC_END; addr += PGDIR_SIZE) 38490072059SRussell King pmd_clear(pmd_off_k(addr)); 38590072059SRussell King 38690072059SRussell King /* 38790072059SRussell King * Locate which node contains the ramdisk image, if any. 38890072059SRussell King */ 38990072059SRussell King initrd_node = check_initrd(mi); 39090072059SRussell King 39190072059SRussell King /* 39290072059SRussell King * Run through each node initialising the bootmem allocator. 39390072059SRussell King */ 39490072059SRussell King for_each_node(node) { 39590072059SRussell King unsigned long end_pfn; 39690072059SRussell King 39790072059SRussell King end_pfn = bootmem_init_node(node, initrd_node, mi); 39890072059SRussell King 39990072059SRussell King /* 40090072059SRussell King * Remember the highest memory PFN. 40190072059SRussell King */ 40290072059SRussell King if (end_pfn > memend_pfn) 40390072059SRussell King memend_pfn = end_pfn; 40490072059SRussell King } 40590072059SRussell King 40690072059SRussell King high_memory = __va(memend_pfn << PAGE_SHIFT); 40790072059SRussell King 40890072059SRussell King /* 40990072059SRussell King * This doesn't seem to be used by the Linux memory manager any 41090072059SRussell King * more, but is used by ll_rw_block. If we can get rid of it, we 41190072059SRussell King * also get rid of some of the stuff above as well. 41290072059SRussell King * 41390072059SRussell King * Note: max_low_pfn and max_pfn reflect the number of _pages_ in 41490072059SRussell King * the system, not the maximum PFN. 41590072059SRussell King */ 41690072059SRussell King max_pfn = max_low_pfn = memend_pfn - PHYS_PFN_OFFSET; 41790072059SRussell King } 41890072059SRussell King 41990072059SRussell King /* 42090072059SRussell King * Set up device the mappings. Since we clear out the page tables for all 42190072059SRussell King * mappings above VMALLOC_END, we will remove any debug device mappings. 42290072059SRussell King * This means you have to be careful how you debug this function, or any 42302b30839SRussell King * called function. This means you can't use any function or debugging 42402b30839SRussell King * method which may touch any device, otherwise the kernel _will_ crash. 42590072059SRussell King */ 42690072059SRussell King static void __init devicemaps_init(struct machine_desc *mdesc) 42790072059SRussell King { 42890072059SRussell King struct map_desc map; 42990072059SRussell King unsigned long addr; 43090072059SRussell King void *vectors; 43190072059SRussell King 43202b30839SRussell King /* 43302b30839SRussell King * Allocate the vector page early. 43402b30839SRussell King */ 43502b30839SRussell King vectors = alloc_bootmem_low_pages(PAGE_SIZE); 43602b30839SRussell King BUG_ON(!vectors); 43702b30839SRussell King 43890072059SRussell King for (addr = VMALLOC_END; addr; addr += PGDIR_SIZE) 43990072059SRussell King pmd_clear(pmd_off_k(addr)); 44090072059SRussell King 44190072059SRussell King /* 4421a47ebc0SNicolas Pitre * Map the kernel if it is XIP. 4431a47ebc0SNicolas Pitre * It is always first in the modulearea. 4441a47ebc0SNicolas Pitre */ 4451a47ebc0SNicolas Pitre #ifdef CONFIG_XIP_KERNEL 4461a47ebc0SNicolas Pitre map.pfn = __phys_to_pfn(CONFIG_XIP_PHYS_ADDR & PGDIR_MASK); 4471a47ebc0SNicolas Pitre map.virtual = MODULE_START; 4481a47ebc0SNicolas Pitre map.length = ((unsigned long)&_etext - map.virtual + ~PGDIR_MASK) & PGDIR_MASK; 4491a47ebc0SNicolas Pitre map.type = MT_ROM; 4501a47ebc0SNicolas Pitre create_mapping(&map); 4511a47ebc0SNicolas Pitre #endif 4521a47ebc0SNicolas Pitre 4531a47ebc0SNicolas Pitre /* 45490072059SRussell King * Map the cache flushing regions. 45590072059SRussell King */ 45690072059SRussell King #ifdef FLUSH_BASE 4579769c246SDeepak Saxena map.pfn = __phys_to_pfn(FLUSH_BASE_PHYS); 45890072059SRussell King map.virtual = FLUSH_BASE; 45990072059SRussell King map.length = PGDIR_SIZE; 46090072059SRussell King map.type = MT_CACHECLEAN; 46190072059SRussell King create_mapping(&map); 46290072059SRussell King #endif 46390072059SRussell King #ifdef FLUSH_BASE_MINICACHE 4649769c246SDeepak Saxena map.pfn = __phys_to_pfn(FLUSH_BASE_PHYS + PGDIR_SIZE); 46590072059SRussell King map.virtual = FLUSH_BASE_MINICACHE; 46690072059SRussell King map.length = PGDIR_SIZE; 46790072059SRussell King map.type = MT_MINICLEAN; 46890072059SRussell King create_mapping(&map); 46990072059SRussell King #endif 47090072059SRussell King 47190072059SRussell King /* 47290072059SRussell King * Create a mapping for the machine vectors at the high-vectors 47390072059SRussell King * location (0xffff0000). If we aren't using high-vectors, also 47490072059SRussell King * create a mapping at the low-vectors virtual address. 47590072059SRussell King */ 4769769c246SDeepak Saxena map.pfn = __phys_to_pfn(virt_to_phys(vectors)); 47790072059SRussell King map.virtual = 0xffff0000; 47890072059SRussell King map.length = PAGE_SIZE; 47990072059SRussell King map.type = MT_HIGH_VECTORS; 48090072059SRussell King create_mapping(&map); 48190072059SRussell King 48290072059SRussell King if (!vectors_high()) { 48390072059SRussell King map.virtual = 0; 48490072059SRussell King map.type = MT_LOW_VECTORS; 48590072059SRussell King create_mapping(&map); 48690072059SRussell King } 48790072059SRussell King 48890072059SRussell King /* 48990072059SRussell King * Ask the machine support to map in the statically mapped devices. 49090072059SRussell King */ 49190072059SRussell King if (mdesc->map_io) 49290072059SRussell King mdesc->map_io(); 4936bf7bd69SRussell King 4946bf7bd69SRussell King /* 49502b30839SRussell King * Finally flush the caches and tlb to ensure that we're in a 49602b30839SRussell King * consistent state wrt the writebuffer. This also ensures that 49702b30839SRussell King * any write-allocated cache lines in the vector page are written 49802b30839SRussell King * back. After this point, we can start to touch devices again. 4996bf7bd69SRussell King */ 5006bf7bd69SRussell King local_flush_tlb_all(); 50102b30839SRussell King flush_cache_all(); 5021da177e4SLinus Torvalds } 5031da177e4SLinus Torvalds 5041da177e4SLinus Torvalds /* 5051da177e4SLinus Torvalds * paging_init() sets up the page tables, initialises the zone memory 5061da177e4SLinus Torvalds * maps, and sets up the zero page, bad page and bad page tables. 5071da177e4SLinus Torvalds */ 5081da177e4SLinus Torvalds void __init paging_init(struct meminfo *mi, struct machine_desc *mdesc) 5091da177e4SLinus Torvalds { 5101da177e4SLinus Torvalds void *zero_page; 5111da177e4SLinus Torvalds 51290072059SRussell King build_mem_type_table(); 5131da177e4SLinus Torvalds bootmem_init(mi); 51490072059SRussell King devicemaps_init(mdesc); 5151da177e4SLinus Torvalds 51690072059SRussell King top_pmd = pmd_off_k(0xffff0000); 5171da177e4SLinus Torvalds 5181da177e4SLinus Torvalds /* 5191da177e4SLinus Torvalds * allocate the zero page. Note that we count on this going ok. 5201da177e4SLinus Torvalds */ 5211da177e4SLinus Torvalds zero_page = alloc_bootmem_low_pages(PAGE_SIZE); 5221da177e4SLinus Torvalds memzero(zero_page, PAGE_SIZE); 5231da177e4SLinus Torvalds empty_zero_page = virt_to_page(zero_page); 5241da177e4SLinus Torvalds flush_dcache_page(empty_zero_page); 5251da177e4SLinus Torvalds } 5261da177e4SLinus Torvalds 5271da177e4SLinus Torvalds static inline void free_area(unsigned long addr, unsigned long end, char *s) 5281da177e4SLinus Torvalds { 5291da177e4SLinus Torvalds unsigned int size = (end - addr) >> 10; 5301da177e4SLinus Torvalds 5311da177e4SLinus Torvalds for (; addr < end; addr += PAGE_SIZE) { 5321da177e4SLinus Torvalds struct page *page = virt_to_page(addr); 5331da177e4SLinus Torvalds ClearPageReserved(page); 534*7835e98bSNick Piggin init_page_count(page); 5351da177e4SLinus Torvalds free_page(addr); 5361da177e4SLinus Torvalds totalram_pages++; 5371da177e4SLinus Torvalds } 5381da177e4SLinus Torvalds 5391da177e4SLinus Torvalds if (size && s) 5401da177e4SLinus Torvalds printk(KERN_INFO "Freeing %s memory: %dK\n", s, size); 5411da177e4SLinus Torvalds } 5421da177e4SLinus Torvalds 543a013053dSRussell King static inline void 544a013053dSRussell King free_memmap(int node, unsigned long start_pfn, unsigned long end_pfn) 545a013053dSRussell King { 546a013053dSRussell King struct page *start_pg, *end_pg; 547a013053dSRussell King unsigned long pg, pgend; 548a013053dSRussell King 549a013053dSRussell King /* 550a013053dSRussell King * Convert start_pfn/end_pfn to a struct page pointer. 551a013053dSRussell King */ 552a013053dSRussell King start_pg = pfn_to_page(start_pfn); 553a013053dSRussell King end_pg = pfn_to_page(end_pfn); 554a013053dSRussell King 555a013053dSRussell King /* 556a013053dSRussell King * Convert to physical addresses, and 557a013053dSRussell King * round start upwards and end downwards. 558a013053dSRussell King */ 559a013053dSRussell King pg = PAGE_ALIGN(__pa(start_pg)); 560a013053dSRussell King pgend = __pa(end_pg) & PAGE_MASK; 561a013053dSRussell King 562a013053dSRussell King /* 563a013053dSRussell King * If there are free pages between these, 564a013053dSRussell King * free the section of the memmap array. 565a013053dSRussell King */ 566a013053dSRussell King if (pg < pgend) 567a013053dSRussell King free_bootmem_node(NODE_DATA(node), pg, pgend - pg); 568a013053dSRussell King } 569a013053dSRussell King 570a013053dSRussell King /* 571a013053dSRussell King * The mem_map array can get very big. Free the unused area of the memory map. 572a013053dSRussell King */ 573a013053dSRussell King static void __init free_unused_memmap_node(int node, struct meminfo *mi) 574a013053dSRussell King { 575a013053dSRussell King unsigned long bank_start, prev_bank_end = 0; 576a013053dSRussell King unsigned int i; 577a013053dSRussell King 578a013053dSRussell King /* 579a013053dSRussell King * [FIXME] This relies on each bank being in address order. This 580a013053dSRussell King * may not be the case, especially if the user has provided the 581a013053dSRussell King * information on the command line. 582a013053dSRussell King */ 58390072059SRussell King for_each_nodebank(i, mi, node) { 584a013053dSRussell King bank_start = mi->bank[i].start >> PAGE_SHIFT; 585a013053dSRussell King if (bank_start < prev_bank_end) { 586a013053dSRussell King printk(KERN_ERR "MEM: unordered memory banks. " 587a013053dSRussell King "Not freeing memmap.\n"); 588a013053dSRussell King break; 589a013053dSRussell King } 590a013053dSRussell King 591a013053dSRussell King /* 592a013053dSRussell King * If we had a previous bank, and there is a space 593a013053dSRussell King * between the current bank and the previous, free it. 594a013053dSRussell King */ 595a013053dSRussell King if (prev_bank_end && prev_bank_end != bank_start) 596a013053dSRussell King free_memmap(node, prev_bank_end, bank_start); 597a013053dSRussell King 598a013053dSRussell King prev_bank_end = (mi->bank[i].start + 599a013053dSRussell King mi->bank[i].size) >> PAGE_SHIFT; 600a013053dSRussell King } 601a013053dSRussell King } 602a013053dSRussell King 6031da177e4SLinus Torvalds /* 6041da177e4SLinus Torvalds * mem_init() marks the free areas in the mem_map and tells us how much 6051da177e4SLinus Torvalds * memory is free. This is done after various parts of the system have 6061da177e4SLinus Torvalds * claimed their memory after the kernel image. 6071da177e4SLinus Torvalds */ 6081da177e4SLinus Torvalds void __init mem_init(void) 6091da177e4SLinus Torvalds { 6101da177e4SLinus Torvalds unsigned int codepages, datapages, initpages; 6111da177e4SLinus Torvalds int i, node; 6121da177e4SLinus Torvalds 6131da177e4SLinus Torvalds codepages = &_etext - &_text; 6141da177e4SLinus Torvalds datapages = &_end - &__data_start; 6151da177e4SLinus Torvalds initpages = &__init_end - &__init_begin; 6161da177e4SLinus Torvalds 6171da177e4SLinus Torvalds #ifndef CONFIG_DISCONTIGMEM 6181da177e4SLinus Torvalds max_mapnr = virt_to_page(high_memory) - mem_map; 6191da177e4SLinus Torvalds #endif 6201da177e4SLinus Torvalds 6211da177e4SLinus Torvalds /* this will put all unused low memory onto the freelists */ 6221da177e4SLinus Torvalds for_each_online_node(node) { 6231da177e4SLinus Torvalds pg_data_t *pgdat = NODE_DATA(node); 6241da177e4SLinus Torvalds 625a013053dSRussell King free_unused_memmap_node(node, &meminfo); 626a013053dSRussell King 6271da177e4SLinus Torvalds if (pgdat->node_spanned_pages != 0) 6281da177e4SLinus Torvalds totalram_pages += free_all_bootmem_node(pgdat); 6291da177e4SLinus Torvalds } 6301da177e4SLinus Torvalds 6311da177e4SLinus Torvalds #ifdef CONFIG_SA1111 6321da177e4SLinus Torvalds /* now that our DMA memory is actually so designated, we can free it */ 6331da177e4SLinus Torvalds free_area(PAGE_OFFSET, (unsigned long)swapper_pg_dir, NULL); 6341da177e4SLinus Torvalds #endif 6351da177e4SLinus Torvalds 6361da177e4SLinus Torvalds /* 6371da177e4SLinus Torvalds * Since our memory may not be contiguous, calculate the 6381da177e4SLinus Torvalds * real number of pages we have in this system 6391da177e4SLinus Torvalds */ 6401da177e4SLinus Torvalds printk(KERN_INFO "Memory:"); 6411da177e4SLinus Torvalds 6421da177e4SLinus Torvalds num_physpages = 0; 6431da177e4SLinus Torvalds for (i = 0; i < meminfo.nr_banks; i++) { 6441da177e4SLinus Torvalds num_physpages += meminfo.bank[i].size >> PAGE_SHIFT; 6451da177e4SLinus Torvalds printk(" %ldMB", meminfo.bank[i].size >> 20); 6461da177e4SLinus Torvalds } 6471da177e4SLinus Torvalds 6481da177e4SLinus Torvalds printk(" = %luMB total\n", num_physpages >> (20 - PAGE_SHIFT)); 6491da177e4SLinus Torvalds printk(KERN_NOTICE "Memory: %luKB available (%dK code, " 6501da177e4SLinus Torvalds "%dK data, %dK init)\n", 6511da177e4SLinus Torvalds (unsigned long) nr_free_pages() << (PAGE_SHIFT-10), 6521da177e4SLinus Torvalds codepages >> 10, datapages >> 10, initpages >> 10); 6531da177e4SLinus Torvalds 6541da177e4SLinus Torvalds if (PAGE_SIZE >= 16384 && num_physpages <= 128) { 6551da177e4SLinus Torvalds extern int sysctl_overcommit_memory; 6561da177e4SLinus Torvalds /* 6571da177e4SLinus Torvalds * On a machine this small we won't get 6581da177e4SLinus Torvalds * anywhere without overcommit, so turn 6591da177e4SLinus Torvalds * it on by default. 6601da177e4SLinus Torvalds */ 6611da177e4SLinus Torvalds sysctl_overcommit_memory = OVERCOMMIT_ALWAYS; 6621da177e4SLinus Torvalds } 6631da177e4SLinus Torvalds } 6641da177e4SLinus Torvalds 6651da177e4SLinus Torvalds void free_initmem(void) 6661da177e4SLinus Torvalds { 6671da177e4SLinus Torvalds if (!machine_is_integrator() && !machine_is_cintegrator()) { 6681da177e4SLinus Torvalds free_area((unsigned long)(&__init_begin), 6691da177e4SLinus Torvalds (unsigned long)(&__init_end), 6701da177e4SLinus Torvalds "init"); 6711da177e4SLinus Torvalds } 6721da177e4SLinus Torvalds } 6731da177e4SLinus Torvalds 6741da177e4SLinus Torvalds #ifdef CONFIG_BLK_DEV_INITRD 6751da177e4SLinus Torvalds 6761da177e4SLinus Torvalds static int keep_initrd; 6771da177e4SLinus Torvalds 6781da177e4SLinus Torvalds void free_initrd_mem(unsigned long start, unsigned long end) 6791da177e4SLinus Torvalds { 6801da177e4SLinus Torvalds if (!keep_initrd) 6811da177e4SLinus Torvalds free_area(start, end, "initrd"); 6821da177e4SLinus Torvalds } 6831da177e4SLinus Torvalds 6841da177e4SLinus Torvalds static int __init keepinitrd_setup(char *__unused) 6851da177e4SLinus Torvalds { 6861da177e4SLinus Torvalds keep_initrd = 1; 6871da177e4SLinus Torvalds return 1; 6881da177e4SLinus Torvalds } 6891da177e4SLinus Torvalds 6901da177e4SLinus Torvalds __setup("keepinitrd", keepinitrd_setup); 6911da177e4SLinus Torvalds #endif 692