1 /* 2 * This file is subject to the terms and conditions of the GNU General Public 3 * License. See the file "COPYING" in the main directory of this archive 4 * for more details. 5 * 6 * Copyright (C) 1994 - 2000 Ralf Baechle 7 * Copyright (C) 1999, 2000 Silicon Graphics, Inc. 8 * Kevin D. Kissell, kevink@mips.com and Carsten Langgaard, carstenl@mips.com 9 * Copyright (C) 2000 MIPS Technologies, Inc. All rights reserved. 10 */ 11 #include <linux/bug.h> 12 #include <linux/init.h> 13 #include <linux/export.h> 14 #include <linux/signal.h> 15 #include <linux/sched.h> 16 #include <linux/smp.h> 17 #include <linux/kernel.h> 18 #include <linux/errno.h> 19 #include <linux/string.h> 20 #include <linux/types.h> 21 #include <linux/pagemap.h> 22 #include <linux/ptrace.h> 23 #include <linux/mman.h> 24 #include <linux/mm.h> 25 #include <linux/memblock.h> 26 #include <linux/highmem.h> 27 #include <linux/swap.h> 28 #include <linux/proc_fs.h> 29 #include <linux/pfn.h> 30 #include <linux/hardirq.h> 31 #include <linux/gfp.h> 32 #include <linux/kcore.h> 33 #include <linux/initrd.h> 34 35 #include <asm/bootinfo.h> 36 #include <asm/cachectl.h> 37 #include <asm/cpu.h> 38 #include <asm/dma.h> 39 #include <asm/kmap_types.h> 40 #include <asm/maar.h> 41 #include <asm/mmu_context.h> 42 #include <asm/sections.h> 43 #include <asm/pgtable.h> 44 #include <asm/pgalloc.h> 45 #include <asm/tlb.h> 46 #include <asm/fixmap.h> 47 48 /* 49 * We have up to 8 empty zeroed pages so we can map one of the right colour 50 * when needed. This is necessary only on R4000 / R4400 SC and MC versions 51 * where we have to avoid VCED / VECI exceptions for good performance at 52 * any price. Since page is never written to after the initialization we 53 * don't have to care about aliases on other CPUs. 54 */ 55 unsigned long empty_zero_page, zero_page_mask; 56 EXPORT_SYMBOL_GPL(empty_zero_page); 57 EXPORT_SYMBOL(zero_page_mask); 58 59 /* 60 * Not static inline because used by IP27 special magic initialization code 61 */ 62 void setup_zero_pages(void) 63 { 64 unsigned int order, i; 65 struct page *page; 66 67 if (cpu_has_vce) 68 order = 3; 69 else 70 order = 0; 71 72 empty_zero_page = __get_free_pages(GFP_KERNEL | __GFP_ZERO, order); 73 if (!empty_zero_page) 74 panic("Oh boy, that early out of memory?"); 75 76 page = virt_to_page((void *)empty_zero_page); 77 split_page(page, order); 78 for (i = 0; i < (1 << order); i++, page++) 79 mark_page_reserved(page); 80 81 zero_page_mask = ((PAGE_SIZE << order) - 1) & PAGE_MASK; 82 } 83 84 static void *__kmap_pgprot(struct page *page, unsigned long addr, pgprot_t prot) 85 { 86 enum fixed_addresses idx; 87 unsigned int uninitialized_var(old_mmid); 88 unsigned long vaddr, flags, entrylo; 89 unsigned long old_ctx; 90 pte_t pte; 91 int tlbidx; 92 93 BUG_ON(Page_dcache_dirty(page)); 94 95 preempt_disable(); 96 pagefault_disable(); 97 idx = (addr >> PAGE_SHIFT) & (FIX_N_COLOURS - 1); 98 idx += in_interrupt() ? FIX_N_COLOURS : 0; 99 vaddr = __fix_to_virt(FIX_CMAP_END - idx); 100 pte = mk_pte(page, prot); 101 #if defined(CONFIG_XPA) 102 entrylo = pte_to_entrylo(pte.pte_high); 103 #elif defined(CONFIG_PHYS_ADDR_T_64BIT) && defined(CONFIG_CPU_MIPS32) 104 entrylo = pte.pte_high; 105 #else 106 entrylo = pte_to_entrylo(pte_val(pte)); 107 #endif 108 109 local_irq_save(flags); 110 old_ctx = read_c0_entryhi(); 111 write_c0_entryhi(vaddr & (PAGE_MASK << 1)); 112 write_c0_entrylo0(entrylo); 113 write_c0_entrylo1(entrylo); 114 if (cpu_has_mmid) { 115 old_mmid = read_c0_memorymapid(); 116 write_c0_memorymapid(MMID_KERNEL_WIRED); 117 } 118 #ifdef CONFIG_XPA 119 if (cpu_has_xpa) { 120 entrylo = (pte.pte_low & _PFNX_MASK); 121 writex_c0_entrylo0(entrylo); 122 writex_c0_entrylo1(entrylo); 123 } 124 #endif 125 tlbidx = num_wired_entries(); 126 write_c0_wired(tlbidx + 1); 127 write_c0_index(tlbidx); 128 mtc0_tlbw_hazard(); 129 tlb_write_indexed(); 130 tlbw_use_hazard(); 131 write_c0_entryhi(old_ctx); 132 if (cpu_has_mmid) 133 write_c0_memorymapid(old_mmid); 134 local_irq_restore(flags); 135 136 return (void*) vaddr; 137 } 138 139 void *kmap_coherent(struct page *page, unsigned long addr) 140 { 141 return __kmap_pgprot(page, addr, PAGE_KERNEL); 142 } 143 144 void *kmap_noncoherent(struct page *page, unsigned long addr) 145 { 146 return __kmap_pgprot(page, addr, PAGE_KERNEL_NC); 147 } 148 149 void kunmap_coherent(void) 150 { 151 unsigned int wired; 152 unsigned long flags, old_ctx; 153 154 local_irq_save(flags); 155 old_ctx = read_c0_entryhi(); 156 wired = num_wired_entries() - 1; 157 write_c0_wired(wired); 158 write_c0_index(wired); 159 write_c0_entryhi(UNIQUE_ENTRYHI(wired)); 160 write_c0_entrylo0(0); 161 write_c0_entrylo1(0); 162 mtc0_tlbw_hazard(); 163 tlb_write_indexed(); 164 tlbw_use_hazard(); 165 write_c0_entryhi(old_ctx); 166 local_irq_restore(flags); 167 pagefault_enable(); 168 preempt_enable(); 169 } 170 171 void copy_user_highpage(struct page *to, struct page *from, 172 unsigned long vaddr, struct vm_area_struct *vma) 173 { 174 void *vfrom, *vto; 175 176 vto = kmap_atomic(to); 177 if (cpu_has_dc_aliases && 178 page_mapcount(from) && !Page_dcache_dirty(from)) { 179 vfrom = kmap_coherent(from, vaddr); 180 copy_page(vto, vfrom); 181 kunmap_coherent(); 182 } else { 183 vfrom = kmap_atomic(from); 184 copy_page(vto, vfrom); 185 kunmap_atomic(vfrom); 186 } 187 if ((!cpu_has_ic_fills_f_dc) || 188 pages_do_alias((unsigned long)vto, vaddr & PAGE_MASK)) 189 flush_data_cache_page((unsigned long)vto); 190 kunmap_atomic(vto); 191 /* Make sure this page is cleared on other CPU's too before using it */ 192 smp_wmb(); 193 } 194 195 void copy_to_user_page(struct vm_area_struct *vma, 196 struct page *page, unsigned long vaddr, void *dst, const void *src, 197 unsigned long len) 198 { 199 if (cpu_has_dc_aliases && 200 page_mapcount(page) && !Page_dcache_dirty(page)) { 201 void *vto = kmap_coherent(page, vaddr) + (vaddr & ~PAGE_MASK); 202 memcpy(vto, src, len); 203 kunmap_coherent(); 204 } else { 205 memcpy(dst, src, len); 206 if (cpu_has_dc_aliases) 207 SetPageDcacheDirty(page); 208 } 209 if (vma->vm_flags & VM_EXEC) 210 flush_cache_page(vma, vaddr, page_to_pfn(page)); 211 } 212 213 void copy_from_user_page(struct vm_area_struct *vma, 214 struct page *page, unsigned long vaddr, void *dst, const void *src, 215 unsigned long len) 216 { 217 if (cpu_has_dc_aliases && 218 page_mapcount(page) && !Page_dcache_dirty(page)) { 219 void *vfrom = kmap_coherent(page, vaddr) + (vaddr & ~PAGE_MASK); 220 memcpy(dst, vfrom, len); 221 kunmap_coherent(); 222 } else { 223 memcpy(dst, src, len); 224 if (cpu_has_dc_aliases) 225 SetPageDcacheDirty(page); 226 } 227 } 228 EXPORT_SYMBOL_GPL(copy_from_user_page); 229 230 void __init fixrange_init(unsigned long start, unsigned long end, 231 pgd_t *pgd_base) 232 { 233 #ifdef CONFIG_HIGHMEM 234 pgd_t *pgd; 235 pud_t *pud; 236 pmd_t *pmd; 237 pte_t *pte; 238 int i, j, k; 239 unsigned long vaddr; 240 241 vaddr = start; 242 i = pgd_index(vaddr); 243 j = pud_index(vaddr); 244 k = pmd_index(vaddr); 245 pgd = pgd_base + i; 246 247 for ( ; (i < PTRS_PER_PGD) && (vaddr < end); pgd++, i++) { 248 pud = (pud_t *)pgd; 249 for ( ; (j < PTRS_PER_PUD) && (vaddr < end); pud++, j++) { 250 pmd = (pmd_t *)pud; 251 for (; (k < PTRS_PER_PMD) && (vaddr < end); pmd++, k++) { 252 if (pmd_none(*pmd)) { 253 pte = (pte_t *) memblock_alloc_low(PAGE_SIZE, 254 PAGE_SIZE); 255 if (!pte) 256 panic("%s: Failed to allocate %lu bytes align=%lx\n", 257 __func__, PAGE_SIZE, 258 PAGE_SIZE); 259 260 set_pmd(pmd, __pmd((unsigned long)pte)); 261 BUG_ON(pte != pte_offset_kernel(pmd, 0)); 262 } 263 vaddr += PMD_SIZE; 264 } 265 k = 0; 266 } 267 j = 0; 268 } 269 #endif 270 } 271 272 struct maar_walk_info { 273 struct maar_config cfg[16]; 274 unsigned int num_cfg; 275 }; 276 277 static int maar_res_walk(unsigned long start_pfn, unsigned long nr_pages, 278 void *data) 279 { 280 struct maar_walk_info *wi = data; 281 struct maar_config *cfg = &wi->cfg[wi->num_cfg]; 282 unsigned int maar_align; 283 284 /* MAAR registers hold physical addresses right shifted by 4 bits */ 285 maar_align = BIT(MIPS_MAAR_ADDR_SHIFT + 4); 286 287 /* Fill in the MAAR config entry */ 288 cfg->lower = ALIGN(PFN_PHYS(start_pfn), maar_align); 289 cfg->upper = ALIGN_DOWN(PFN_PHYS(start_pfn + nr_pages), maar_align) - 1; 290 cfg->attrs = MIPS_MAAR_S; 291 292 /* Ensure we don't overflow the cfg array */ 293 if (!WARN_ON(wi->num_cfg >= ARRAY_SIZE(wi->cfg))) 294 wi->num_cfg++; 295 296 return 0; 297 } 298 299 300 unsigned __weak platform_maar_init(unsigned num_pairs) 301 { 302 unsigned int num_configured; 303 struct maar_walk_info wi; 304 305 wi.num_cfg = 0; 306 walk_system_ram_range(0, max_pfn, &wi, maar_res_walk); 307 308 num_configured = maar_config(wi.cfg, wi.num_cfg, num_pairs); 309 if (num_configured < wi.num_cfg) 310 pr_warn("Not enough MAAR pairs (%u) for all memory regions (%u)\n", 311 num_pairs, wi.num_cfg); 312 313 return num_configured; 314 } 315 316 void maar_init(void) 317 { 318 unsigned num_maars, used, i; 319 phys_addr_t lower, upper, attr; 320 static struct { 321 struct maar_config cfgs[3]; 322 unsigned used; 323 } recorded = { { { 0 } }, 0 }; 324 325 if (!cpu_has_maar) 326 return; 327 328 /* Detect the number of MAARs */ 329 write_c0_maari(~0); 330 back_to_back_c0_hazard(); 331 num_maars = read_c0_maari() + 1; 332 333 /* MAARs should be in pairs */ 334 WARN_ON(num_maars % 2); 335 336 /* Set MAARs using values we recorded already */ 337 if (recorded.used) { 338 used = maar_config(recorded.cfgs, recorded.used, num_maars / 2); 339 BUG_ON(used != recorded.used); 340 } else { 341 /* Configure the required MAARs */ 342 used = platform_maar_init(num_maars / 2); 343 } 344 345 /* Disable any further MAARs */ 346 for (i = (used * 2); i < num_maars; i++) { 347 write_c0_maari(i); 348 back_to_back_c0_hazard(); 349 write_c0_maar(0); 350 back_to_back_c0_hazard(); 351 } 352 353 if (recorded.used) 354 return; 355 356 pr_info("MAAR configuration:\n"); 357 for (i = 0; i < num_maars; i += 2) { 358 write_c0_maari(i); 359 back_to_back_c0_hazard(); 360 upper = read_c0_maar(); 361 #ifdef CONFIG_XPA 362 upper |= (phys_addr_t)readx_c0_maar() << MIPS_MAARX_ADDR_SHIFT; 363 #endif 364 365 write_c0_maari(i + 1); 366 back_to_back_c0_hazard(); 367 lower = read_c0_maar(); 368 #ifdef CONFIG_XPA 369 lower |= (phys_addr_t)readx_c0_maar() << MIPS_MAARX_ADDR_SHIFT; 370 #endif 371 372 attr = lower & upper; 373 lower = (lower & MIPS_MAAR_ADDR) << 4; 374 upper = ((upper & MIPS_MAAR_ADDR) << 4) | 0xffff; 375 376 pr_info(" [%d]: ", i / 2); 377 if ((attr & MIPS_MAAR_V) != MIPS_MAAR_V) { 378 pr_cont("disabled\n"); 379 continue; 380 } 381 382 pr_cont("%pa-%pa", &lower, &upper); 383 384 if (attr & MIPS_MAAR_S) 385 pr_cont(" speculate"); 386 387 pr_cont("\n"); 388 389 /* Record the setup for use on secondary CPUs */ 390 if (used <= ARRAY_SIZE(recorded.cfgs)) { 391 recorded.cfgs[recorded.used].lower = lower; 392 recorded.cfgs[recorded.used].upper = upper; 393 recorded.cfgs[recorded.used].attrs = attr; 394 recorded.used++; 395 } 396 } 397 } 398 399 #ifndef CONFIG_NEED_MULTIPLE_NODES 400 void __init paging_init(void) 401 { 402 unsigned long max_zone_pfns[MAX_NR_ZONES]; 403 404 pagetable_init(); 405 406 #ifdef CONFIG_HIGHMEM 407 kmap_init(); 408 #endif 409 #ifdef CONFIG_ZONE_DMA 410 max_zone_pfns[ZONE_DMA] = MAX_DMA_PFN; 411 #endif 412 #ifdef CONFIG_ZONE_DMA32 413 max_zone_pfns[ZONE_DMA32] = MAX_DMA32_PFN; 414 #endif 415 max_zone_pfns[ZONE_NORMAL] = max_low_pfn; 416 #ifdef CONFIG_HIGHMEM 417 max_zone_pfns[ZONE_HIGHMEM] = highend_pfn; 418 419 if (cpu_has_dc_aliases && max_low_pfn != highend_pfn) { 420 printk(KERN_WARNING "This processor doesn't support highmem." 421 " %ldk highmem ignored\n", 422 (highend_pfn - max_low_pfn) << (PAGE_SHIFT - 10)); 423 max_zone_pfns[ZONE_HIGHMEM] = max_low_pfn; 424 } 425 #endif 426 427 free_area_init(max_zone_pfns); 428 } 429 430 #ifdef CONFIG_64BIT 431 static struct kcore_list kcore_kseg0; 432 #endif 433 434 static inline void __init mem_init_free_highmem(void) 435 { 436 #ifdef CONFIG_HIGHMEM 437 unsigned long tmp; 438 439 if (cpu_has_dc_aliases) 440 return; 441 442 for (tmp = highstart_pfn; tmp < highend_pfn; tmp++) { 443 struct page *page = pfn_to_page(tmp); 444 445 if (!memblock_is_memory(PFN_PHYS(tmp))) 446 SetPageReserved(page); 447 else 448 free_highmem_page(page); 449 } 450 #endif 451 } 452 453 void __init mem_init(void) 454 { 455 /* 456 * When _PFN_SHIFT is greater than PAGE_SHIFT we won't have enough PTE 457 * bits to hold a full 32b physical address on MIPS32 systems. 458 */ 459 BUILD_BUG_ON(IS_ENABLED(CONFIG_32BIT) && (_PFN_SHIFT > PAGE_SHIFT)); 460 461 #ifdef CONFIG_HIGHMEM 462 #ifdef CONFIG_DISCONTIGMEM 463 #error "CONFIG_HIGHMEM and CONFIG_DISCONTIGMEM dont work together yet" 464 #endif 465 max_mapnr = highend_pfn ? highend_pfn : max_low_pfn; 466 #else 467 max_mapnr = max_low_pfn; 468 #endif 469 high_memory = (void *) __va(max_low_pfn << PAGE_SHIFT); 470 471 maar_init(); 472 memblock_free_all(); 473 setup_zero_pages(); /* Setup zeroed pages. */ 474 mem_init_free_highmem(); 475 mem_init_print_info(NULL); 476 477 #ifdef CONFIG_64BIT 478 if ((unsigned long) &_text > (unsigned long) CKSEG0) 479 /* The -4 is a hack so that user tools don't have to handle 480 the overflow. */ 481 kclist_add(&kcore_kseg0, (void *) CKSEG0, 482 0x80000000 - 4, KCORE_TEXT); 483 #endif 484 } 485 #endif /* !CONFIG_NEED_MULTIPLE_NODES */ 486 487 void free_init_pages(const char *what, unsigned long begin, unsigned long end) 488 { 489 unsigned long pfn; 490 491 for (pfn = PFN_UP(begin); pfn < PFN_DOWN(end); pfn++) { 492 struct page *page = pfn_to_page(pfn); 493 void *addr = phys_to_virt(PFN_PHYS(pfn)); 494 495 memset(addr, POISON_FREE_INITMEM, PAGE_SIZE); 496 free_reserved_page(page); 497 } 498 printk(KERN_INFO "Freeing %s: %ldk freed\n", what, (end - begin) >> 10); 499 } 500 501 void (*free_init_pages_eva)(void *begin, void *end) = NULL; 502 503 void __ref free_initmem(void) 504 { 505 prom_free_prom_memory(); 506 /* 507 * Let the platform define a specific function to free the 508 * init section since EVA may have used any possible mapping 509 * between virtual and physical addresses. 510 */ 511 if (free_init_pages_eva) 512 free_init_pages_eva((void *)&__init_begin, (void *)&__init_end); 513 else 514 free_initmem_default(POISON_FREE_INITMEM); 515 } 516 517 #ifdef CONFIG_HAVE_SETUP_PER_CPU_AREA 518 unsigned long __per_cpu_offset[NR_CPUS] __read_mostly; 519 EXPORT_SYMBOL(__per_cpu_offset); 520 521 static int __init pcpu_cpu_distance(unsigned int from, unsigned int to) 522 { 523 return node_distance(cpu_to_node(from), cpu_to_node(to)); 524 } 525 526 static void * __init pcpu_fc_alloc(unsigned int cpu, size_t size, 527 size_t align) 528 { 529 return memblock_alloc_try_nid(size, align, __pa(MAX_DMA_ADDRESS), 530 MEMBLOCK_ALLOC_ACCESSIBLE, 531 cpu_to_node(cpu)); 532 } 533 534 static void __init pcpu_fc_free(void *ptr, size_t size) 535 { 536 memblock_free_early(__pa(ptr), size); 537 } 538 539 void __init setup_per_cpu_areas(void) 540 { 541 unsigned long delta; 542 unsigned int cpu; 543 int rc; 544 545 /* 546 * Always reserve area for module percpu variables. That's 547 * what the legacy allocator did. 548 */ 549 rc = pcpu_embed_first_chunk(PERCPU_MODULE_RESERVE, 550 PERCPU_DYNAMIC_RESERVE, PAGE_SIZE, 551 pcpu_cpu_distance, 552 pcpu_fc_alloc, pcpu_fc_free); 553 if (rc < 0) 554 panic("Failed to initialize percpu areas."); 555 556 delta = (unsigned long)pcpu_base_addr - (unsigned long)__per_cpu_start; 557 for_each_possible_cpu(cpu) 558 __per_cpu_offset[cpu] = delta + pcpu_unit_offsets[cpu]; 559 } 560 #endif 561 562 #ifndef CONFIG_MIPS_PGD_C0_CONTEXT 563 unsigned long pgd_current[NR_CPUS]; 564 #endif 565 566 /* 567 * Align swapper_pg_dir in to 64K, allows its address to be loaded 568 * with a single LUI instruction in the TLB handlers. If we used 569 * __aligned(64K), its size would get rounded up to the alignment 570 * size, and waste space. So we place it in its own section and align 571 * it in the linker script. 572 */ 573 pgd_t swapper_pg_dir[PTRS_PER_PGD] __section(.bss..swapper_pg_dir); 574 #ifndef __PAGETABLE_PUD_FOLDED 575 pud_t invalid_pud_table[PTRS_PER_PUD] __page_aligned_bss; 576 #endif 577 #ifndef __PAGETABLE_PMD_FOLDED 578 pmd_t invalid_pmd_table[PTRS_PER_PMD] __page_aligned_bss; 579 EXPORT_SYMBOL_GPL(invalid_pmd_table); 580 #endif 581 pte_t invalid_pte_table[PTRS_PER_PTE] __page_aligned_bss; 582 EXPORT_SYMBOL(invalid_pte_table); 583