xref: /openbmc/linux/arch/mips/mm/init.c (revision f4c3b83b)
1 /*
2  * This file is subject to the terms and conditions of the GNU General Public
3  * License.  See the file "COPYING" in the main directory of this archive
4  * for more details.
5  *
6  * Copyright (C) 1994 - 2000 Ralf Baechle
7  * Copyright (C) 1999, 2000 Silicon Graphics, Inc.
8  * Kevin D. Kissell, kevink@mips.com and Carsten Langgaard, carstenl@mips.com
9  * Copyright (C) 2000 MIPS Technologies, Inc.  All rights reserved.
10  */
11 #include <linux/bug.h>
12 #include <linux/init.h>
13 #include <linux/export.h>
14 #include <linux/signal.h>
15 #include <linux/sched.h>
16 #include <linux/smp.h>
17 #include <linux/kernel.h>
18 #include <linux/errno.h>
19 #include <linux/string.h>
20 #include <linux/types.h>
21 #include <linux/pagemap.h>
22 #include <linux/ptrace.h>
23 #include <linux/mman.h>
24 #include <linux/mm.h>
25 #include <linux/memblock.h>
26 #include <linux/highmem.h>
27 #include <linux/swap.h>
28 #include <linux/proc_fs.h>
29 #include <linux/pfn.h>
30 #include <linux/hardirq.h>
31 #include <linux/gfp.h>
32 #include <linux/kcore.h>
33 #include <linux/initrd.h>
34 
35 #include <asm/bootinfo.h>
36 #include <asm/cachectl.h>
37 #include <asm/cpu.h>
38 #include <asm/dma.h>
39 #include <asm/maar.h>
40 #include <asm/mmu_context.h>
41 #include <asm/sections.h>
42 #include <asm/pgalloc.h>
43 #include <asm/tlb.h>
44 #include <asm/fixmap.h>
45 
46 /*
47  * We have up to 8 empty zeroed pages so we can map one of the right colour
48  * when needed.	 This is necessary only on R4000 / R4400 SC and MC versions
49  * where we have to avoid VCED / VECI exceptions for good performance at
50  * any price.  Since page is never written to after the initialization we
51  * don't have to care about aliases on other CPUs.
52  */
53 unsigned long empty_zero_page, zero_page_mask;
54 EXPORT_SYMBOL_GPL(empty_zero_page);
55 EXPORT_SYMBOL(zero_page_mask);
56 
57 /*
58  * Not static inline because used by IP27 special magic initialization code
59  */
60 void setup_zero_pages(void)
61 {
62 	unsigned int order, i;
63 	struct page *page;
64 
65 	if (cpu_has_vce)
66 		order = 3;
67 	else
68 		order = 0;
69 
70 	empty_zero_page = __get_free_pages(GFP_KERNEL | __GFP_ZERO, order);
71 	if (!empty_zero_page)
72 		panic("Oh boy, that early out of memory?");
73 
74 	page = virt_to_page((void *)empty_zero_page);
75 	split_page(page, order);
76 	for (i = 0; i < (1 << order); i++, page++)
77 		mark_page_reserved(page);
78 
79 	zero_page_mask = ((PAGE_SIZE << order) - 1) & PAGE_MASK;
80 }
81 
82 static void *__kmap_pgprot(struct page *page, unsigned long addr, pgprot_t prot)
83 {
84 	enum fixed_addresses idx;
85 	unsigned int old_mmid;
86 	unsigned long vaddr, flags, entrylo;
87 	unsigned long old_ctx;
88 	pte_t pte;
89 	int tlbidx;
90 
91 	BUG_ON(Page_dcache_dirty(page));
92 
93 	preempt_disable();
94 	pagefault_disable();
95 	idx = (addr >> PAGE_SHIFT) & (FIX_N_COLOURS - 1);
96 	idx += in_interrupt() ? FIX_N_COLOURS : 0;
97 	vaddr = __fix_to_virt(FIX_CMAP_END - idx);
98 	pte = mk_pte(page, prot);
99 #if defined(CONFIG_XPA)
100 	entrylo = pte_to_entrylo(pte.pte_high);
101 #elif defined(CONFIG_PHYS_ADDR_T_64BIT) && defined(CONFIG_CPU_MIPS32)
102 	entrylo = pte.pte_high;
103 #else
104 	entrylo = pte_to_entrylo(pte_val(pte));
105 #endif
106 
107 	local_irq_save(flags);
108 	old_ctx = read_c0_entryhi();
109 	write_c0_entryhi(vaddr & (PAGE_MASK << 1));
110 	write_c0_entrylo0(entrylo);
111 	write_c0_entrylo1(entrylo);
112 	if (cpu_has_mmid) {
113 		old_mmid = read_c0_memorymapid();
114 		write_c0_memorymapid(MMID_KERNEL_WIRED);
115 	}
116 #ifdef CONFIG_XPA
117 	if (cpu_has_xpa) {
118 		entrylo = (pte.pte_low & _PFNX_MASK);
119 		writex_c0_entrylo0(entrylo);
120 		writex_c0_entrylo1(entrylo);
121 	}
122 #endif
123 	tlbidx = num_wired_entries();
124 	write_c0_wired(tlbidx + 1);
125 	write_c0_index(tlbidx);
126 	mtc0_tlbw_hazard();
127 	tlb_write_indexed();
128 	tlbw_use_hazard();
129 	write_c0_entryhi(old_ctx);
130 	if (cpu_has_mmid)
131 		write_c0_memorymapid(old_mmid);
132 	local_irq_restore(flags);
133 
134 	return (void*) vaddr;
135 }
136 
137 void *kmap_coherent(struct page *page, unsigned long addr)
138 {
139 	return __kmap_pgprot(page, addr, PAGE_KERNEL);
140 }
141 
142 void *kmap_noncoherent(struct page *page, unsigned long addr)
143 {
144 	return __kmap_pgprot(page, addr, PAGE_KERNEL_NC);
145 }
146 
147 void kunmap_coherent(void)
148 {
149 	unsigned int wired;
150 	unsigned long flags, old_ctx;
151 
152 	local_irq_save(flags);
153 	old_ctx = read_c0_entryhi();
154 	wired = num_wired_entries() - 1;
155 	write_c0_wired(wired);
156 	write_c0_index(wired);
157 	write_c0_entryhi(UNIQUE_ENTRYHI(wired));
158 	write_c0_entrylo0(0);
159 	write_c0_entrylo1(0);
160 	mtc0_tlbw_hazard();
161 	tlb_write_indexed();
162 	tlbw_use_hazard();
163 	write_c0_entryhi(old_ctx);
164 	local_irq_restore(flags);
165 	pagefault_enable();
166 	preempt_enable();
167 }
168 
169 void copy_user_highpage(struct page *to, struct page *from,
170 	unsigned long vaddr, struct vm_area_struct *vma)
171 {
172 	void *vfrom, *vto;
173 
174 	vto = kmap_atomic(to);
175 	if (cpu_has_dc_aliases &&
176 	    page_mapcount(from) && !Page_dcache_dirty(from)) {
177 		vfrom = kmap_coherent(from, vaddr);
178 		copy_page(vto, vfrom);
179 		kunmap_coherent();
180 	} else {
181 		vfrom = kmap_atomic(from);
182 		copy_page(vto, vfrom);
183 		kunmap_atomic(vfrom);
184 	}
185 	if ((!cpu_has_ic_fills_f_dc) ||
186 	    pages_do_alias((unsigned long)vto, vaddr & PAGE_MASK))
187 		flush_data_cache_page((unsigned long)vto);
188 	kunmap_atomic(vto);
189 	/* Make sure this page is cleared on other CPU's too before using it */
190 	smp_wmb();
191 }
192 
193 void copy_to_user_page(struct vm_area_struct *vma,
194 	struct page *page, unsigned long vaddr, void *dst, const void *src,
195 	unsigned long len)
196 {
197 	if (cpu_has_dc_aliases &&
198 	    page_mapcount(page) && !Page_dcache_dirty(page)) {
199 		void *vto = kmap_coherent(page, vaddr) + (vaddr & ~PAGE_MASK);
200 		memcpy(vto, src, len);
201 		kunmap_coherent();
202 	} else {
203 		memcpy(dst, src, len);
204 		if (cpu_has_dc_aliases)
205 			SetPageDcacheDirty(page);
206 	}
207 	if (vma->vm_flags & VM_EXEC)
208 		flush_cache_page(vma, vaddr, page_to_pfn(page));
209 }
210 
211 void copy_from_user_page(struct vm_area_struct *vma,
212 	struct page *page, unsigned long vaddr, void *dst, const void *src,
213 	unsigned long len)
214 {
215 	if (cpu_has_dc_aliases &&
216 	    page_mapcount(page) && !Page_dcache_dirty(page)) {
217 		void *vfrom = kmap_coherent(page, vaddr) + (vaddr & ~PAGE_MASK);
218 		memcpy(dst, vfrom, len);
219 		kunmap_coherent();
220 	} else {
221 		memcpy(dst, src, len);
222 		if (cpu_has_dc_aliases)
223 			SetPageDcacheDirty(page);
224 	}
225 }
226 EXPORT_SYMBOL_GPL(copy_from_user_page);
227 
228 void __init fixrange_init(unsigned long start, unsigned long end,
229 	pgd_t *pgd_base)
230 {
231 #ifdef CONFIG_HIGHMEM
232 	pgd_t *pgd;
233 	pud_t *pud;
234 	pmd_t *pmd;
235 	pte_t *pte;
236 	int i, j, k;
237 	unsigned long vaddr;
238 
239 	vaddr = start;
240 	i = pgd_index(vaddr);
241 	j = pud_index(vaddr);
242 	k = pmd_index(vaddr);
243 	pgd = pgd_base + i;
244 
245 	for ( ; (i < PTRS_PER_PGD) && (vaddr < end); pgd++, i++) {
246 		pud = (pud_t *)pgd;
247 		for ( ; (j < PTRS_PER_PUD) && (vaddr < end); pud++, j++) {
248 			pmd = (pmd_t *)pud;
249 			for (; (k < PTRS_PER_PMD) && (vaddr < end); pmd++, k++) {
250 				if (pmd_none(*pmd)) {
251 					pte = (pte_t *) memblock_alloc_low(PAGE_SIZE,
252 									   PAGE_SIZE);
253 					if (!pte)
254 						panic("%s: Failed to allocate %lu bytes align=%lx\n",
255 						      __func__, PAGE_SIZE,
256 						      PAGE_SIZE);
257 
258 					set_pmd(pmd, __pmd((unsigned long)pte));
259 					BUG_ON(pte != pte_offset_kernel(pmd, 0));
260 				}
261 				vaddr += PMD_SIZE;
262 			}
263 			k = 0;
264 		}
265 		j = 0;
266 	}
267 #endif
268 }
269 
270 struct maar_walk_info {
271 	struct maar_config cfg[16];
272 	unsigned int num_cfg;
273 };
274 
275 static int maar_res_walk(unsigned long start_pfn, unsigned long nr_pages,
276 			 void *data)
277 {
278 	struct maar_walk_info *wi = data;
279 	struct maar_config *cfg = &wi->cfg[wi->num_cfg];
280 	unsigned int maar_align;
281 
282 	/* MAAR registers hold physical addresses right shifted by 4 bits */
283 	maar_align = BIT(MIPS_MAAR_ADDR_SHIFT + 4);
284 
285 	/* Fill in the MAAR config entry */
286 	cfg->lower = ALIGN(PFN_PHYS(start_pfn), maar_align);
287 	cfg->upper = ALIGN_DOWN(PFN_PHYS(start_pfn + nr_pages), maar_align) - 1;
288 	cfg->attrs = MIPS_MAAR_S;
289 
290 	/* Ensure we don't overflow the cfg array */
291 	if (!WARN_ON(wi->num_cfg >= ARRAY_SIZE(wi->cfg)))
292 		wi->num_cfg++;
293 
294 	return 0;
295 }
296 
297 
298 unsigned __weak platform_maar_init(unsigned num_pairs)
299 {
300 	unsigned int num_configured;
301 	struct maar_walk_info wi;
302 
303 	wi.num_cfg = 0;
304 	walk_system_ram_range(0, max_pfn, &wi, maar_res_walk);
305 
306 	num_configured = maar_config(wi.cfg, wi.num_cfg, num_pairs);
307 	if (num_configured < wi.num_cfg)
308 		pr_warn("Not enough MAAR pairs (%u) for all memory regions (%u)\n",
309 			num_pairs, wi.num_cfg);
310 
311 	return num_configured;
312 }
313 
314 void maar_init(void)
315 {
316 	unsigned num_maars, used, i;
317 	phys_addr_t lower, upper, attr;
318 	static struct {
319 		struct maar_config cfgs[3];
320 		unsigned used;
321 	} recorded = { { { 0 } }, 0 };
322 
323 	if (!cpu_has_maar)
324 		return;
325 
326 	/* Detect the number of MAARs */
327 	write_c0_maari(~0);
328 	back_to_back_c0_hazard();
329 	num_maars = read_c0_maari() + 1;
330 
331 	/* MAARs should be in pairs */
332 	WARN_ON(num_maars % 2);
333 
334 	/* Set MAARs using values we recorded already */
335 	if (recorded.used) {
336 		used = maar_config(recorded.cfgs, recorded.used, num_maars / 2);
337 		BUG_ON(used != recorded.used);
338 	} else {
339 		/* Configure the required MAARs */
340 		used = platform_maar_init(num_maars / 2);
341 	}
342 
343 	/* Disable any further MAARs */
344 	for (i = (used * 2); i < num_maars; i++) {
345 		write_c0_maari(i);
346 		back_to_back_c0_hazard();
347 		write_c0_maar(0);
348 		back_to_back_c0_hazard();
349 	}
350 
351 	if (recorded.used)
352 		return;
353 
354 	pr_info("MAAR configuration:\n");
355 	for (i = 0; i < num_maars; i += 2) {
356 		write_c0_maari(i);
357 		back_to_back_c0_hazard();
358 		upper = read_c0_maar();
359 #ifdef CONFIG_XPA
360 		upper |= (phys_addr_t)readx_c0_maar() << MIPS_MAARX_ADDR_SHIFT;
361 #endif
362 
363 		write_c0_maari(i + 1);
364 		back_to_back_c0_hazard();
365 		lower = read_c0_maar();
366 #ifdef CONFIG_XPA
367 		lower |= (phys_addr_t)readx_c0_maar() << MIPS_MAARX_ADDR_SHIFT;
368 #endif
369 
370 		attr = lower & upper;
371 		lower = (lower & MIPS_MAAR_ADDR) << 4;
372 		upper = ((upper & MIPS_MAAR_ADDR) << 4) | 0xffff;
373 
374 		pr_info("  [%d]: ", i / 2);
375 		if ((attr & MIPS_MAAR_V) != MIPS_MAAR_V) {
376 			pr_cont("disabled\n");
377 			continue;
378 		}
379 
380 		pr_cont("%pa-%pa", &lower, &upper);
381 
382 		if (attr & MIPS_MAAR_S)
383 			pr_cont(" speculate");
384 
385 		pr_cont("\n");
386 
387 		/* Record the setup for use on secondary CPUs */
388 		if (used <= ARRAY_SIZE(recorded.cfgs)) {
389 			recorded.cfgs[recorded.used].lower = lower;
390 			recorded.cfgs[recorded.used].upper = upper;
391 			recorded.cfgs[recorded.used].attrs = attr;
392 			recorded.used++;
393 		}
394 	}
395 }
396 
397 #ifndef CONFIG_NEED_MULTIPLE_NODES
398 void __init paging_init(void)
399 {
400 	unsigned long max_zone_pfns[MAX_NR_ZONES];
401 
402 	pagetable_init();
403 
404 #ifdef CONFIG_ZONE_DMA
405 	max_zone_pfns[ZONE_DMA] = MAX_DMA_PFN;
406 #endif
407 #ifdef CONFIG_ZONE_DMA32
408 	max_zone_pfns[ZONE_DMA32] = MAX_DMA32_PFN;
409 #endif
410 	max_zone_pfns[ZONE_NORMAL] = max_low_pfn;
411 #ifdef CONFIG_HIGHMEM
412 	max_zone_pfns[ZONE_HIGHMEM] = highend_pfn;
413 
414 	if (cpu_has_dc_aliases && max_low_pfn != highend_pfn) {
415 		printk(KERN_WARNING "This processor doesn't support highmem."
416 		       " %ldk highmem ignored\n",
417 		       (highend_pfn - max_low_pfn) << (PAGE_SHIFT - 10));
418 		max_zone_pfns[ZONE_HIGHMEM] = max_low_pfn;
419 	}
420 #endif
421 
422 	free_area_init(max_zone_pfns);
423 }
424 
425 #ifdef CONFIG_64BIT
426 static struct kcore_list kcore_kseg0;
427 #endif
428 
429 static inline void __init mem_init_free_highmem(void)
430 {
431 #ifdef CONFIG_HIGHMEM
432 	unsigned long tmp;
433 
434 	if (cpu_has_dc_aliases)
435 		return;
436 
437 	for (tmp = highstart_pfn; tmp < highend_pfn; tmp++) {
438 		struct page *page = pfn_to_page(tmp);
439 
440 		if (!memblock_is_memory(PFN_PHYS(tmp)))
441 			SetPageReserved(page);
442 		else
443 			free_highmem_page(page);
444 	}
445 #endif
446 }
447 
448 void __init mem_init(void)
449 {
450 	/*
451 	 * When _PFN_SHIFT is greater than PAGE_SHIFT we won't have enough PTE
452 	 * bits to hold a full 32b physical address on MIPS32 systems.
453 	 */
454 	BUILD_BUG_ON(IS_ENABLED(CONFIG_32BIT) && (_PFN_SHIFT > PAGE_SHIFT));
455 
456 #ifdef CONFIG_HIGHMEM
457 #ifdef CONFIG_DISCONTIGMEM
458 #error "CONFIG_HIGHMEM and CONFIG_DISCONTIGMEM dont work together yet"
459 #endif
460 	max_mapnr = highend_pfn ? highend_pfn : max_low_pfn;
461 #else
462 	max_mapnr = max_low_pfn;
463 #endif
464 	high_memory = (void *) __va(max_low_pfn << PAGE_SHIFT);
465 
466 	maar_init();
467 	memblock_free_all();
468 	setup_zero_pages();	/* Setup zeroed pages.  */
469 	mem_init_free_highmem();
470 	mem_init_print_info(NULL);
471 
472 #ifdef CONFIG_64BIT
473 	if ((unsigned long) &_text > (unsigned long) CKSEG0)
474 		/* The -4 is a hack so that user tools don't have to handle
475 		   the overflow.  */
476 		kclist_add(&kcore_kseg0, (void *) CKSEG0,
477 				0x80000000 - 4, KCORE_TEXT);
478 #endif
479 }
480 #endif /* !CONFIG_NEED_MULTIPLE_NODES */
481 
482 void free_init_pages(const char *what, unsigned long begin, unsigned long end)
483 {
484 	unsigned long pfn;
485 
486 	for (pfn = PFN_UP(begin); pfn < PFN_DOWN(end); pfn++) {
487 		struct page *page = pfn_to_page(pfn);
488 		void *addr = phys_to_virt(PFN_PHYS(pfn));
489 
490 		memset(addr, POISON_FREE_INITMEM, PAGE_SIZE);
491 		free_reserved_page(page);
492 	}
493 	printk(KERN_INFO "Freeing %s: %ldk freed\n", what, (end - begin) >> 10);
494 }
495 
496 void (*free_init_pages_eva)(void *begin, void *end) = NULL;
497 
498 void __ref free_initmem(void)
499 {
500 	prom_free_prom_memory();
501 	/*
502 	 * Let the platform define a specific function to free the
503 	 * init section since EVA may have used any possible mapping
504 	 * between virtual and physical addresses.
505 	 */
506 	if (free_init_pages_eva)
507 		free_init_pages_eva((void *)&__init_begin, (void *)&__init_end);
508 	else
509 		free_initmem_default(POISON_FREE_INITMEM);
510 }
511 
512 #ifdef CONFIG_HAVE_SETUP_PER_CPU_AREA
513 unsigned long __per_cpu_offset[NR_CPUS] __read_mostly;
514 EXPORT_SYMBOL(__per_cpu_offset);
515 
516 static int __init pcpu_cpu_distance(unsigned int from, unsigned int to)
517 {
518 	return node_distance(cpu_to_node(from), cpu_to_node(to));
519 }
520 
521 static void * __init pcpu_fc_alloc(unsigned int cpu, size_t size,
522 				       size_t align)
523 {
524 	return memblock_alloc_try_nid(size, align, __pa(MAX_DMA_ADDRESS),
525 				      MEMBLOCK_ALLOC_ACCESSIBLE,
526 				      cpu_to_node(cpu));
527 }
528 
529 static void __init pcpu_fc_free(void *ptr, size_t size)
530 {
531 	memblock_free_early(__pa(ptr), size);
532 }
533 
534 void __init setup_per_cpu_areas(void)
535 {
536 	unsigned long delta;
537 	unsigned int cpu;
538 	int rc;
539 
540 	/*
541 	 * Always reserve area for module percpu variables.  That's
542 	 * what the legacy allocator did.
543 	 */
544 	rc = pcpu_embed_first_chunk(PERCPU_MODULE_RESERVE,
545 				    PERCPU_DYNAMIC_RESERVE, PAGE_SIZE,
546 				    pcpu_cpu_distance,
547 				    pcpu_fc_alloc, pcpu_fc_free);
548 	if (rc < 0)
549 		panic("Failed to initialize percpu areas.");
550 
551 	delta = (unsigned long)pcpu_base_addr - (unsigned long)__per_cpu_start;
552 	for_each_possible_cpu(cpu)
553 		__per_cpu_offset[cpu] = delta + pcpu_unit_offsets[cpu];
554 }
555 #endif
556 
557 #ifndef CONFIG_MIPS_PGD_C0_CONTEXT
558 unsigned long pgd_current[NR_CPUS];
559 #endif
560 
561 /*
562  * Align swapper_pg_dir in to 64K, allows its address to be loaded
563  * with a single LUI instruction in the TLB handlers.  If we used
564  * __aligned(64K), its size would get rounded up to the alignment
565  * size, and waste space.  So we place it in its own section and align
566  * it in the linker script.
567  */
568 pgd_t swapper_pg_dir[PTRS_PER_PGD] __section(".bss..swapper_pg_dir");
569 #ifndef __PAGETABLE_PUD_FOLDED
570 pud_t invalid_pud_table[PTRS_PER_PUD] __page_aligned_bss;
571 #endif
572 #ifndef __PAGETABLE_PMD_FOLDED
573 pmd_t invalid_pmd_table[PTRS_PER_PMD] __page_aligned_bss;
574 EXPORT_SYMBOL_GPL(invalid_pmd_table);
575 #endif
576 pte_t invalid_pte_table[PTRS_PER_PTE] __page_aligned_bss;
577 EXPORT_SYMBOL(invalid_pte_table);
578