xref: /openbmc/linux/arch/powerpc/mm/book3s32/hash_low.S (revision da481c4fe0e485cdab5cf4d2761be8b8fb38d3d1)
12874c5fdSThomas Gleixner/* SPDX-License-Identifier: GPL-2.0-or-later */
217312f25SChristophe Leroy/*
317312f25SChristophe Leroy *  PowerPC version
417312f25SChristophe Leroy *    Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
517312f25SChristophe Leroy *  Rewritten by Cort Dougan (cort@cs.nmt.edu) for PReP
617312f25SChristophe Leroy *    Copyright (C) 1996 Cort Dougan <cort@cs.nmt.edu>
717312f25SChristophe Leroy *  Adapted for Power Macintosh by Paul Mackerras.
817312f25SChristophe Leroy *  Low-level exception handlers and MMU support
917312f25SChristophe Leroy *  rewritten by Paul Mackerras.
1017312f25SChristophe Leroy *    Copyright (C) 1996 Paul Mackerras.
1117312f25SChristophe Leroy *
1217312f25SChristophe Leroy *  This file contains low-level assembler routines for managing
1317312f25SChristophe Leroy *  the PowerPC MMU hash table.  (PPC 8xx processors don't use a
1417312f25SChristophe Leroy *  hash table, so this file is not used on them.)
1517312f25SChristophe Leroy */
1617312f25SChristophe Leroy
1765fddcfcSMike Rapoport#include <linux/pgtable.h>
1869a1593aSChristophe Leroy#include <linux/init.h>
1917312f25SChristophe Leroy#include <asm/reg.h>
2017312f25SChristophe Leroy#include <asm/page.h>
2117312f25SChristophe Leroy#include <asm/cputable.h>
2217312f25SChristophe Leroy#include <asm/ppc_asm.h>
2317312f25SChristophe Leroy#include <asm/thread_info.h>
2417312f25SChristophe Leroy#include <asm/asm-offsets.h>
2517312f25SChristophe Leroy#include <asm/export.h>
2617312f25SChristophe Leroy#include <asm/feature-fixups.h>
2717312f25SChristophe Leroy#include <asm/code-patching-asm.h>
2817312f25SChristophe Leroy
/*
 * Byte offset, within one Linux PTE, of the 32-bit word that the routines
 * in this file read with lwarx/lwz and update with stwcx. (the flags word).
 * When CONFIG_PTE_64BIT is set the PTE address is advanced by this amount
 * before the flags word is accessed, and the other word is then read at
 * -PTE_FLAGS_OFFSET from that address.
 */
29*da481c4fSChristophe Leroy#ifdef CONFIG_PTE_64BIT
30*da481c4fSChristophe Leroy#define PTE_FLAGS_OFFSET	4	/* offset of PTE flags, in bytes */
31*da481c4fSChristophe Leroy#else
32*da481c4fSChristophe Leroy#define PTE_FLAGS_OFFSET	0
33*da481c4fSChristophe Leroy#endif
34*da481c4fSChristophe Leroy
3517312f25SChristophe Leroy/*
3617312f25SChristophe Leroy * Load a PTE into the hash table, if possible.
3717312f25SChristophe Leroy * The address is in r4, and r3 contains an access flag:
3840bb0e90SChristophe Leroy * _PAGE_RW (0x400) if a write.
3917312f25SChristophe Leroy * r9 contains the SRR1 value, from which we use the MSR_PR bit.
4017312f25SChristophe Leroy * SPRG_THREAD contains the physical address of the current task's thread.
4117312f25SChristophe Leroy *
4217312f25SChristophe Leroy * Returns to the caller if the access is illegal or there is no
4317312f25SChristophe Leroy * mapping for the address.  Otherwise it places an appropriate PTE
4417312f25SChristophe Leroy * in the hash table and returns from the exception.
4517312f25SChristophe Leroy * Uses r0, r3 - r6, r8, r10, ctr, lr.
 *
 * When CONFIG_VMAP_STACK is not set, r11 is used as the base of the
 * saved-register frame (_CTR, GPR0 and GPR8 slots are accessed below).
 * On SMP, mmu_hash_lock is taken on entry and released on both exits.
4617312f25SChristophe Leroy */
4717312f25SChristophe Leroy	.text
4817312f25SChristophe Leroy_GLOBAL(hash_page)
4917312f25SChristophe Leroy#ifdef CONFIG_SMP
	/*
	 * Take mmu_hash_lock, addressed as (mmu_hash_lock - PAGE_OFFSET).
	 * 10: tries to claim the lock with lwarx/stwcx., storing 0x0fff0000;
	 * 11: spins with plain loads until the lock word reads as zero and
	 * then falls through to 10: for another attempt.
	 */
50232ca1eeSChristophe Leroy	lis	r8, (mmu_hash_lock - PAGE_OFFSET)@h
51232ca1eeSChristophe Leroy	ori	r8, r8, (mmu_hash_lock - PAGE_OFFSET)@l
5217312f25SChristophe Leroy	lis	r0,0x0fff
5317312f25SChristophe Leroy	b	10f
5417312f25SChristophe Leroy11:	lwz	r6,0(r8)
5517312f25SChristophe Leroy	cmpwi	0,r6,0
5617312f25SChristophe Leroy	bne	11b
5717312f25SChristophe Leroy10:	lwarx	r6,0,r8
5817312f25SChristophe Leroy	cmpwi	0,r6,0
5917312f25SChristophe Leroy	bne-	11b
6017312f25SChristophe Leroy	stwcx.	r0,0,r8
6117312f25SChristophe Leroy	bne-	10b
6217312f25SChristophe Leroy	isync
6317312f25SChristophe Leroy#endif
6417312f25SChristophe Leroy	/* Get PTE (linux-style) and check access */
	/*
	 * r3 accumulates the permission bits the PTE must have.  The
	 * compare against TASK_SIZE is consumed by the blt+ below; the
	 * instructions in between do not modify cr0.
	 */
65f1a1f7a1SChristophe Leroy	lis	r0, TASK_SIZE@h		/* check if kernel address */
6617312f25SChristophe Leroy	cmplw	0,r4,r0
6703d701c2SChristophe Leroy	mfspr	r8,SPRN_SPRG_THREAD	/* current task's THREAD (phys) */
6817312f25SChristophe Leroy	ori	r3,r3,_PAGE_USER|_PAGE_PRESENT /* test low addresses as user */
6903d701c2SChristophe Leroy	lwz	r5,PGDIR(r8)		/* virt page-table root */
7017312f25SChristophe Leroy	blt+	112f			/* assume user more likely */
7103d701c2SChristophe Leroy	lis	r5,swapper_pg_dir@ha	/* if kernel address, use */
7203d701c2SChristophe Leroy	addi	r5,r5,swapper_pg_dir@l	/* kernel page table */
7340bb0e90SChristophe Leroy	rlwimi	r3,r9,32-12,29,29	/* MSR_PR -> _PAGE_USER */
7403d701c2SChristophe Leroy112:	tophys(r5, r5)
	/*
	 * r5 = page-table root after tophys(); index it with the top bits
	 * of the address in r4.  The dotted rlwinm leaves cr0.eq set when
	 * the entry holds no page-table address.
	 */
7517312f25SChristophe Leroy#ifndef CONFIG_PTE_64BIT
7617312f25SChristophe Leroy	rlwimi	r5,r4,12,20,29		/* insert top 10 bits of address */
7717312f25SChristophe Leroy	lwz	r8,0(r5)		/* get pmd entry */
7817312f25SChristophe Leroy	rlwinm.	r8,r8,0,0,19		/* extract address of pte page */
7917312f25SChristophe Leroy#else
8017312f25SChristophe Leroy	rlwinm	r8,r4,13,19,29		/* Compute pgdir/pmd offset */
8117312f25SChristophe Leroy	lwzx	r8,r8,r5		/* Get L1 entry */
8217312f25SChristophe Leroy	rlwinm.	r8,r8,0,0,20		/* extract pt base address */
8317312f25SChristophe Leroy#endif
	/* On SMP the failure return goes through .Lhash_page_out to drop the lock */
8417312f25SChristophe Leroy#ifdef CONFIG_SMP
85f892c21dSChristophe Leroy	beq-	.Lhash_page_out		/* return if no mapping */
8617312f25SChristophe Leroy#else
8717312f25SChristophe Leroy	/* XXX it seems like the 601 will give a machine fault on the
8817312f25SChristophe Leroy	   rfi if its alignment is wrong (bottom 4 bits of address are
8917312f25SChristophe Leroy	   8 or 0xc) and we have had a not-taken conditional branch
9017312f25SChristophe Leroy	   to the address following the rfi. */
9117312f25SChristophe Leroy	beqlr-
9217312f25SChristophe Leroy#endif
	/* r8 = base of the PTE page; insert the PTE index taken from r4 */
9317312f25SChristophe Leroy#ifndef CONFIG_PTE_64BIT
9417312f25SChristophe Leroy	rlwimi	r8,r4,22,20,29		/* insert next 10 bits of address */
9517312f25SChristophe Leroy#else
9617312f25SChristophe Leroy	rlwimi	r8,r4,23,20,28		/* compute pte address */
97*da481c4fSChristophe Leroy	/*
98*da481c4fSChristophe Leroy	 * If PTE_64BIT is set, the low word is the flags word; use that
99*da481c4fSChristophe Leroy	 * word for locking since it contains all the interesting bits.
100*da481c4fSChristophe Leroy	 */
101*da481c4fSChristophe Leroy	addi	r8,r8,PTE_FLAGS_OFFSET
10217312f25SChristophe Leroy#endif
10317312f25SChristophe Leroy
10417312f25SChristophe Leroy	/*
10517312f25SChristophe Leroy	 * Update the linux PTE atomically.  We do the lwarx up-front
10617312f25SChristophe Leroy	 * because almost always, there won't be a permission violation
10717312f25SChristophe Leroy	 * and there won't already be an HPTE, and thus we will have
10817312f25SChristophe Leroy	 * to update the PTE to set _PAGE_HASHPTE.  -- paulus.
10917312f25SChristophe Leroy	 */
110f892c21dSChristophe Leroy.Lretry:
11117312f25SChristophe Leroy	lwarx	r6,0,r8			/* get linux-style pte, flag word */
1121b03e71fSChristophe Leroy#ifdef CONFIG_PPC_KUAP
1131b03e71fSChristophe Leroy	mfsrin	r5,r4
1141b03e71fSChristophe Leroy	rlwinm	r0,r9,28,_PAGE_RW	/* MSR[PR] => _PAGE_RW */
1151b03e71fSChristophe Leroy	rlwinm	r5,r5,12,_PAGE_RW	/* Ks => _PAGE_RW */
1161b03e71fSChristophe Leroy	andc	r5,r5,r0		/* Ks & ~MSR[PR] */
1171b03e71fSChristophe Leroy	andc	r5,r6,r5		/* Clear _PAGE_RW when Ks = 1 && MSR[PR] = 0 */
1181b03e71fSChristophe Leroy	andc.	r5,r3,r5		/* check access & ~permission */
1191b03e71fSChristophe Leroy#else
12017312f25SChristophe Leroy	andc.	r5,r3,r6		/* check access & ~permission */
1211b03e71fSChristophe Leroy#endif
	/*
	 * r0 = bits to OR into the PTE.  Neither instruction below is a
	 * record form, so cr0 still holds the andc. result when the
	 * conditional return that follows tests it.
	 */
1221b03e71fSChristophe Leroy	rlwinm	r0,r3,32-3,24,24	/* _PAGE_RW access -> _PAGE_DIRTY */
1231b03e71fSChristophe Leroy	ori	r0,r0,_PAGE_ACCESSED|_PAGE_HASHPTE
12417312f25SChristophe Leroy#ifdef CONFIG_SMP
125f892c21dSChristophe Leroy	bne-	.Lhash_page_out		/* return if access not permitted */
12617312f25SChristophe Leroy#else
12717312f25SChristophe Leroy	bnelr-
12817312f25SChristophe Leroy#endif
12917312f25SChristophe Leroy	or	r5,r0,r6		/* set accessed/dirty bits */
13017312f25SChristophe Leroy#ifdef CONFIG_PTE_64BIT
	/*
	 * r10 = other (non-flags) PTE word, needed by create_hpte.
	 * SMP: r10 = r8 - r6 - PTE_FLAGS_OFFSET, so r6 + r10 is the address
	 * of the first PTE word while the load depends on the lwarx result.
	 */
13117312f25SChristophe Leroy#ifdef CONFIG_SMP
13217312f25SChristophe Leroy	subf	r10,r6,r8		/* create false data dependency */
13317312f25SChristophe Leroy	subi	r10,r10,PTE_FLAGS_OFFSET
13417312f25SChristophe Leroy	lwzx	r10,r6,r10		/* Get upper PTE word */
13517312f25SChristophe Leroy#else
13617312f25SChristophe Leroy	lwz	r10,-PTE_FLAGS_OFFSET(r8)
13717312f25SChristophe Leroy#endif /* CONFIG_SMP */
13817312f25SChristophe Leroy#endif /* CONFIG_PTE_64BIT */
13917312f25SChristophe Leroy	stwcx.	r5,0,r8			/* attempt to update PTE */
140f892c21dSChristophe Leroy	bne-	.Lretry			/* retry if someone got there first */
14117312f25SChristophe Leroy
	/*
	 * Call create_hpte with r3 = segment register value, r4 = address,
	 * r5 = updated flags word, r6 = flags word as read by the lwarx
	 * (and r10 = other PTE word if CONFIG_PTE_64BIT).
	 */
14217312f25SChristophe Leroy	mfsrin	r3,r4			/* get segment reg for segment */
143232ca1eeSChristophe Leroy#ifndef CONFIG_VMAP_STACK
	/* create_hpte writes ctr; keep the current value in the frame at r11 */
14417312f25SChristophe Leroy	mfctr	r0
14517312f25SChristophe Leroy	stw	r0,_CTR(r11)
146232ca1eeSChristophe Leroy#endif
14717312f25SChristophe Leroy	bl	create_hpte		/* add the hash table entry */
14817312f25SChristophe Leroy
14917312f25SChristophe Leroy#ifdef CONFIG_SMP
	/* Release mmu_hash_lock by storing zero, after an eieio */
15017312f25SChristophe Leroy	eieio
151232ca1eeSChristophe Leroy	lis	r8, (mmu_hash_lock - PAGE_OFFSET)@ha
15217312f25SChristophe Leroy	li	r0,0
153232ca1eeSChristophe Leroy	stw	r0, (mmu_hash_lock - PAGE_OFFSET)@l(r8)
15417312f25SChristophe Leroy#endif
15517312f25SChristophe Leroy
156232ca1eeSChristophe Leroy#ifdef CONFIG_VMAP_STACK
157232ca1eeSChristophe Leroy	b	fast_hash_page_return
158232ca1eeSChristophe Leroy#else
15917312f25SChristophe Leroy	/* Return from the exception */
	/* Reload ctr, r0 and r8 from the frame at r11 before leaving */
16017312f25SChristophe Leroy	lwz	r5,_CTR(r11)
16117312f25SChristophe Leroy	mtctr	r5
16217312f25SChristophe Leroy	lwz	r0,GPR0(r11)
16317312f25SChristophe Leroy	lwz	r8,GPR8(r11)
16417312f25SChristophe Leroy	b	fast_exception_return
165232ca1eeSChristophe Leroy#endif
16617312f25SChristophe Leroy
16717312f25SChristophe Leroy#ifdef CONFIG_SMP
	/*
	 * SMP failure exit (no mapping, or access not permitted):
	 * release mmu_hash_lock and return to the caller.
	 */
168f892c21dSChristophe Leroy.Lhash_page_out:
16917312f25SChristophe Leroy	eieio
170232ca1eeSChristophe Leroy	lis	r8, (mmu_hash_lock - PAGE_OFFSET)@ha
17117312f25SChristophe Leroy	li	r0,0
172232ca1eeSChristophe Leroy	stw	r0, (mmu_hash_lock - PAGE_OFFSET)@l(r8)
17317312f25SChristophe Leroy	blr
17417312f25SChristophe Leroy#endif /* CONFIG_SMP */
175e6209318SChristophe Leroy_ASM_NOKPROBE_SYMBOL(hash_page)
17617312f25SChristophe Leroy
17717312f25SChristophe Leroy/*
17817312f25SChristophe Leroy * Add an entry for a particular page to the hash table.
17917312f25SChristophe Leroy *
18017312f25SChristophe Leroy * add_hash_page(unsigned context, unsigned long va, unsigned long pmdval)
18117312f25SChristophe Leroy *
18217312f25SChristophe Leroy * We assume any necessary modifications to the pte (e.g. setting
18317312f25SChristophe Leroy * the accessed bit) have already been done and that there is actually
18417312f25SChristophe Leroy * a hash table in use (i.e. we're not on a 603).
 *
 * Register use below: r3 = context, r4 = va, r5 = pmdval on entry;
 * r9 keeps the entry MSR value until it is restored at the end; the
 * return address is saved at 4(r1) because create_hpte is called with bl.
18517312f25SChristophe Leroy */
18617312f25SChristophe Leroy_GLOBAL(add_hash_page)
18717312f25SChristophe Leroy	mflr	r0
18817312f25SChristophe Leroy	stw	r0,4(r1)
18917312f25SChristophe Leroy
19017312f25SChristophe Leroy#ifdef CONFIG_SMP
	/* r8 = lock value: the word at TASK_CPU(r2) with 12 OR-ed into the upper half */
19117312f25SChristophe Leroy	lwz	r8,TASK_CPU(r2)		/* to go in mmu_hash_lock */
19217312f25SChristophe Leroy	oris	r8,r8,12
19317312f25SChristophe Leroy#endif /* CONFIG_SMP */
19417312f25SChristophe Leroy
19517312f25SChristophe Leroy	/*
19617312f25SChristophe Leroy	 * We disable interrupts here, even on UP, because we don't
19717312f25SChristophe Leroy	 * want to race with hash_page, and because we want the
19817312f25SChristophe Leroy	 * _PAGE_HASHPTE bit to be a reliable indication of whether
19917312f25SChristophe Leroy	 * the HPTE exists (or at least whether one did once).
20017312f25SChristophe Leroy	 * We also turn off the MMU for data accesses so that we
20117312f25SChristophe Leroy	 * can't take a hash table miss (assuming the code is
20217312f25SChristophe Leroy	 * covered by a BAT).  -- paulus
20317312f25SChristophe Leroy	 */
20417312f25SChristophe Leroy	mfmsr	r9
20517312f25SChristophe Leroy	rlwinm	r0,r9,0,17,15		/* clear bit 16 (MSR_EE) */
20617312f25SChristophe Leroy	rlwinm	r0,r0,0,28,26		/* clear MSR_DR */
20717312f25SChristophe Leroy	mtmsr	r0
20817312f25SChristophe Leroy	isync
20917312f25SChristophe Leroy
21017312f25SChristophe Leroy#ifdef CONFIG_SMP
	/*
	 * Spin until mmu_hash_lock is ours: 10: attempts the lwarx/stwcx.
	 * claim, 11: polls with plain loads while the lock is non-zero,
	 * 12: is reached once the stwcx. succeeded.
	 */
21117312f25SChristophe Leroy	lis	r6, (mmu_hash_lock - PAGE_OFFSET)@ha
21217312f25SChristophe Leroy	addi	r6, r6, (mmu_hash_lock - PAGE_OFFSET)@l
21317312f25SChristophe Leroy10:	lwarx	r0,0,r6			/* take the mmu_hash_lock */
21417312f25SChristophe Leroy	cmpi	0,r0,0
21517312f25SChristophe Leroy	bne-	11f
21617312f25SChristophe Leroy	stwcx.	r8,0,r6
21717312f25SChristophe Leroy	beq+	12f
21817312f25SChristophe Leroy11:	lwz	r0,0(r6)
21917312f25SChristophe Leroy	cmpi	0,r0,0
22017312f25SChristophe Leroy	beq	10b
22117312f25SChristophe Leroy	b	11b
22217312f25SChristophe Leroy12:	isync
22317312f25SChristophe Leroy#endif
22417312f25SChristophe Leroy
22517312f25SChristophe Leroy	/*
22617312f25SChristophe Leroy	 * Fetch the linux pte and test and set _PAGE_HASHPTE atomically.
22717312f25SChristophe Leroy	 * If _PAGE_HASHPTE was already set, we don't replace the existing
22817312f25SChristophe Leroy	 * HPTE, so we just unlock and return.
22917312f25SChristophe Leroy	 */
	/* r8 = pmdval with the PTE index bits of va inserted = address of the PTE flags word */
23017312f25SChristophe Leroy	mr	r8,r5
23117312f25SChristophe Leroy#ifndef CONFIG_PTE_64BIT
23217312f25SChristophe Leroy	rlwimi	r8,r4,22,20,29
23317312f25SChristophe Leroy#else
23417312f25SChristophe Leroy	rlwimi	r8,r4,23,20,28
23517312f25SChristophe Leroy	addi	r8,r8,PTE_FLAGS_OFFSET
23617312f25SChristophe Leroy#endif
23717312f25SChristophe Leroy1:	lwarx	r6,0,r8
23817312f25SChristophe Leroy	andi.	r0,r6,_PAGE_HASHPTE
23917312f25SChristophe Leroy	bne	9f			/* if HASHPTE already set, done */
24017312f25SChristophe Leroy#ifdef CONFIG_PTE_64BIT
	/* r10 = other PTE word for create_hpte; SMP form makes the load depend on r6 */
24117312f25SChristophe Leroy#ifdef CONFIG_SMP
24217312f25SChristophe Leroy	subf	r10,r6,r8		/* create false data dependency */
24317312f25SChristophe Leroy	subi	r10,r10,PTE_FLAGS_OFFSET
24417312f25SChristophe Leroy	lwzx	r10,r6,r10		/* Get upper PTE word */
24517312f25SChristophe Leroy#else
24617312f25SChristophe Leroy	lwz	r10,-PTE_FLAGS_OFFSET(r8)
24717312f25SChristophe Leroy#endif /* CONFIG_SMP */
24817312f25SChristophe Leroy#endif /* CONFIG_PTE_64BIT */
	/* r5 = new flags word (old value in r6 is kept for create_hpte) */
24917312f25SChristophe Leroy	ori	r5,r6,_PAGE_HASHPTE
25017312f25SChristophe Leroy	stwcx.	r5,0,r8
25117312f25SChristophe Leroy	bne-	1b
25217312f25SChristophe Leroy
253fec6166bSChristophe Leroy	/* Convert context and va to VSID */
254fec6166bSChristophe Leroy	mulli	r3,r3,897*16		/* multiply context by context skew */
255fec6166bSChristophe Leroy	rlwinm	r0,r4,4,28,31		/* get ESID (top 4 bits of va) */
256fec6166bSChristophe Leroy	mulli	r0,r0,0x111		/* multiply by ESID skew */
257fec6166bSChristophe Leroy	add	r3,r3,r0		/* note create_hpte trims to 24 bits */
258fec6166bSChristophe Leroy
	/* r3 = VSID, r4 = va, r5 = new PTE, r6 = old PTE (r10 = other word if 64-bit PTE) */
25917312f25SChristophe Leroy	bl	create_hpte
26017312f25SChristophe Leroy
	/* Common exit: also reached directly when _PAGE_HASHPTE was already set */
26117312f25SChristophe Leroy9:
26217312f25SChristophe Leroy#ifdef CONFIG_SMP
26317312f25SChristophe Leroy	lis	r6, (mmu_hash_lock - PAGE_OFFSET)@ha
26417312f25SChristophe Leroy	addi	r6, r6, (mmu_hash_lock - PAGE_OFFSET)@l
26517312f25SChristophe Leroy	eieio
26617312f25SChristophe Leroy	li	r0,0
26717312f25SChristophe Leroy	stw	r0,0(r6)		/* clear mmu_hash_lock */
26817312f25SChristophe Leroy#endif
26917312f25SChristophe Leroy
27017312f25SChristophe Leroy	/* reenable interrupts and DR */
27117312f25SChristophe Leroy	mtmsr	r9
27217312f25SChristophe Leroy	isync
27317312f25SChristophe Leroy
	/* Restore the return address saved on entry */
27417312f25SChristophe Leroy	lwz	r0,4(r1)
27517312f25SChristophe Leroy	mtlr	r0
27617312f25SChristophe Leroy	blr
277e6209318SChristophe Leroy_ASM_NOKPROBE_SYMBOL(add_hash_page)
27817312f25SChristophe Leroy
27917312f25SChristophe Leroy/*
28017312f25SChristophe Leroy * This routine adds a hardware PTE to the hash table.
28117312f25SChristophe Leroy * It is designed to be called with the MMU either on or off.
28217312f25SChristophe Leroy * r3 contains the VSID, r4 contains the virtual address,
28317312f25SChristophe Leroy * r5 contains the linux PTE, r6 contains the old value of the
28417312f25SChristophe Leroy * linux PTE (before setting _PAGE_HASHPTE). r10 contains the
28517312f25SChristophe Leroy * upper half of the PTE if CONFIG_PTE_64BIT.
28617312f25SChristophe Leroy * On SMP, the caller should have the mmu_hash_lock held.
28717312f25SChristophe Leroy * We assume that the caller has (or will) set the _PAGE_HASHPTE
28817312f25SChristophe Leroy * bit in the linux PTE in memory.  The value passed in r6 should
28917312f25SChristophe Leroy * be the old linux PTE value; if it doesn't have _PAGE_HASHPTE set
29017312f25SChristophe Leroy * this routine will skip the search for an existing HPTE.
29117312f25SChristophe Leroy * This procedure modifies r0, r3 - r6, r8, cr0.
 * It also writes ctr (mtctr) before each PTEG search loop.
29217312f25SChristophe Leroy *  -- paulus.
29317312f25SChristophe Leroy *
29417312f25SChristophe Leroy * For speed, 4 of the instructions get patched once the size and
29517312f25SChristophe Leroy * physical address of the hash table are known.  These definitions
29669a1593aSChristophe Leroy * of Hash_base and Hash_bits below are for the early hash table.
 *
 * NOTE(review): create_hpte carries five patch_site markers
 * (patch__hash_page_A0, A1, A2, B and C); confirm whether the count
 * "4" above is still accurate.
29717312f25SChristophe Leroy */
/*
 * Assemble-time defaults used by the instructions at the patch sites:
 * Hash_base is the table base, Hash_bits the number of hash bits, and
 * Hash_msk the byte-offset mask covering all (1 << Hash_bits) groups of
 * 64 bytes.
 */
29869a1593aSChristophe LeroyHash_base = early_hash
29917312f25SChristophe LeroyHash_bits = 12				/* e.g. 256kB hash table */
30017312f25SChristophe LeroyHash_msk = (((1 << Hash_bits) - 1) * 64)
30117312f25SChristophe Leroy
30217312f25SChristophe Leroy/* defines for the PTE format for 32-bit PPCs */
/*
 * HPTE_SIZE / PTEG_SIZE are in bytes (8 entries of 8 bytes per group);
 * LG_PTEG_SIZE is log2(PTEG_SIZE).  LDPTEu/LDPTE/STPTE/CMPPTE name the
 * word-sized load, store and compare used on the first HPTE word.
 * PTE_H is the "secondary hash" bit and PTE_V the valid bit of that word.
 * TST_V leaves cr0.eq set when V is clear; CLR_V ignores its second
 * argument.
 */
30317312f25SChristophe Leroy#define HPTE_SIZE	8
30417312f25SChristophe Leroy#define PTEG_SIZE	64
30517312f25SChristophe Leroy#define LG_PTEG_SIZE	6
30617312f25SChristophe Leroy#define LDPTEu		lwzu
30717312f25SChristophe Leroy#define LDPTE		lwz
30817312f25SChristophe Leroy#define STPTE		stw
30917312f25SChristophe Leroy#define CMPPTE		cmpw
31017312f25SChristophe Leroy#define PTE_H		0x40
31117312f25SChristophe Leroy#define PTE_V		0x80000000
31217312f25SChristophe Leroy#define TST_V(r)	rlwinm. r,r,0,0,0
31317312f25SChristophe Leroy#define SET_V(r)	oris r,r,PTE_V@h
31417312f25SChristophe Leroy#define CLR_V(r,t)	rlwinm r,r,0,1,31
31517312f25SChristophe Leroy
/*
 * Mask begin/end bit numbers for the rlwimi/rlwinm hash instructions:
 * together they select Hash_bits bits located just above the low
 * LG_PTEG_SIZE bits of the result.
 */
31617312f25SChristophe Leroy#define HASH_LEFT	31-(LG_PTEG_SIZE+Hash_bits-1)
31717312f25SChristophe Leroy#define HASH_RIGHT	31-LG_PTEG_SIZE
31817312f25SChristophe Leroy
/*
 * create_hpte: build a hardware PTE from a Linux PTE and store it in the
 * hash table.
 *
 * In:   r3 = VSID, r4 = virtual address, r5 = Linux PTE flags word,
 *       r6 = previous flags word, r10 = other PTE word (only read when
 *       CONFIG_PTE_64BIT is set).
 * Work: r8 = second HPTE word, r5 = first HPTE word, r3 = address of the
 *       primary PTEG, r4 = address of the slot being examined/written,
 *       r0 = 8 (loop count), ctr = loop counter.
 *
 * Slot selection order: existing matching HPTE (only searched for when
 * the old PTE had _PAGE_HASHPTE), then an empty slot in the primary and
 * secondary PTEG, then a rotating victim in the primary PTEG.
 */
31969a1593aSChristophe Leroy__REF
32017312f25SChristophe Leroy_GLOBAL(create_hpte)
32117312f25SChristophe Leroy	/* Convert linux-style PTE (r5) to low word of PPC-style PTE (r8) */
32240bb0e90SChristophe Leroy	rlwinm	r8,r5,32-9,30,30	/* _PAGE_RW -> PP msb */
32317312f25SChristophe Leroy	rlwinm	r0,r5,32-6,30,30	/* _PAGE_DIRTY -> PP msb */
32440bb0e90SChristophe Leroy	and	r8,r8,r0		/* writable if _RW & _DIRTY */
32540bb0e90SChristophe Leroy	rlwimi	r5,r5,32-1,30,30	/* _PAGE_USER -> PP msb */
32640bb0e90SChristophe Leroy	rlwimi	r5,r5,32-2,31,31	/* _PAGE_USER -> PP lsb */
32717312f25SChristophe Leroy	ori	r8,r8,0xe04		/* clear out reserved bits */
32817312f25SChristophe Leroy	andc	r8,r5,r8		/* PP = user? (rw&dirty? 1: 3): 0 */
32917312f25SChristophe LeroyBEGIN_FTR_SECTION
33017312f25SChristophe Leroy	rlwinm	r8,r8,0,~_PAGE_COHERENT	/* clear M (coherence not required) */
33117312f25SChristophe LeroyEND_FTR_SECTION_IFCLR(CPU_FTR_NEED_COHERENT)
33217312f25SChristophe Leroy#ifdef CONFIG_PTE_64BIT
33317312f25SChristophe Leroy	/* Put the XPN bits into the PTE */
33417312f25SChristophe Leroy	rlwimi	r8,r10,8,20,22
33517312f25SChristophe Leroy	rlwimi	r8,r10,2,29,29
33617312f25SChristophe Leroy#endif
33717312f25SChristophe Leroy
33817312f25SChristophe Leroy	/* Construct the high word of the PPC-style PTE (r5) */
33917312f25SChristophe Leroy	rlwinm	r5,r3,7,1,24		/* put VSID in 0x7fffff80 bits */
34017312f25SChristophe Leroy	rlwimi	r5,r4,10,26,31		/* put in API (abbrev page index) */
34117312f25SChristophe Leroy	SET_V(r5)			/* set V (valid) bit */
34217312f25SChristophe Leroy
34317312f25SChristophe Leroy	patch_site	0f, patch__hash_page_A0
34417312f25SChristophe Leroy	patch_site	1f, patch__hash_page_A1
34517312f25SChristophe Leroy	patch_site	2f, patch__hash_page_A2
34617312f25SChristophe Leroy	/* Get the address of the primary PTE group in the hash table (r3) */
347232ca1eeSChristophe Leroy0:	lis	r0, (Hash_base - PAGE_OFFSET)@h	/* base address of hash table */
34817312f25SChristophe Leroy1:	rlwimi	r0,r3,LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT    /* VSID -> hash */
34917312f25SChristophe Leroy2:	rlwinm	r3,r4,20+LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT /* PI -> hash */
35017312f25SChristophe Leroy	xor	r3,r3,r0		/* make primary hash */
35117312f25SChristophe Leroy	li	r0,8			/* PTEs/group */
35217312f25SChristophe Leroy
35317312f25SChristophe Leroy	/*
35417312f25SChristophe Leroy	 * Test the _PAGE_HASHPTE bit in the old linux PTE, and skip the search
35517312f25SChristophe Leroy	 * if it is clear, meaning that the HPTE isn't there already...
35617312f25SChristophe Leroy	 */
35717312f25SChristophe Leroy	andi.	r6,r6,_PAGE_HASHPTE
35817312f25SChristophe Leroy	beq+	10f			/* no PTE: go look for an empty slot */
35917312f25SChristophe Leroy	tlbie	r4
36017312f25SChristophe Leroy
36117312f25SChristophe Leroy	/* Search the primary PTEG for a PTE whose 1st (d)word matches r5 */
	/* r4 starts one entry before the group because LDPTEu pre-increments it */
36217312f25SChristophe Leroy	mtctr	r0
36317312f25SChristophe Leroy	addi	r4,r3,-HPTE_SIZE
36417312f25SChristophe Leroy1:	LDPTEu	r6,HPTE_SIZE(r4)	/* get next PTE */
36517312f25SChristophe Leroy	CMPPTE	0,r6,r5
36617312f25SChristophe Leroy	bdnzf	2,1b			/* loop while ctr != 0 && !cr0.eq */
367f892c21dSChristophe Leroy	beq+	.Lfound_slot
36817312f25SChristophe Leroy
36917312f25SChristophe Leroy	patch_site	0f, patch__hash_page_B
37017312f25SChristophe Leroy	/* Search the secondary PTEG for a matching PTE */
37117312f25SChristophe Leroy	ori	r5,r5,PTE_H		/* set H (secondary hash) bit */
37217312f25SChristophe Leroy0:	xoris	r4,r3,Hash_msk>>16	/* compute secondary hash */
37317312f25SChristophe Leroy	xori	r4,r4,(-PTEG_SIZE & 0xffff)
37417312f25SChristophe Leroy	addi	r4,r4,-HPTE_SIZE
37517312f25SChristophe Leroy	mtctr	r0
37617312f25SChristophe Leroy2:	LDPTEu	r6,HPTE_SIZE(r4)
37717312f25SChristophe Leroy	CMPPTE	0,r6,r5
37817312f25SChristophe Leroy	bdnzf	2,2b
379f892c21dSChristophe Leroy	beq+	.Lfound_slot
38017312f25SChristophe Leroy	xori	r5,r5,PTE_H		/* clear H bit again */
38117312f25SChristophe Leroy
38217312f25SChristophe Leroy	/* Search the primary PTEG for an empty slot */
38317312f25SChristophe Leroy10:	mtctr	r0
38417312f25SChristophe Leroy	addi	r4,r3,-HPTE_SIZE	/* search primary PTEG */
38517312f25SChristophe Leroy1:	LDPTEu	r6,HPTE_SIZE(r4)	/* get next PTE */
38617312f25SChristophe Leroy	TST_V(r6)			/* test valid bit */
38717312f25SChristophe Leroy	bdnzf	2,1b			/* loop while ctr != 0 && !cr0.eq */
388f892c21dSChristophe Leroy	beq+	.Lfound_empty
38917312f25SChristophe Leroy
39017312f25SChristophe Leroy	patch_site	0f, patch__hash_page_C
39117312f25SChristophe Leroy	/* Search the secondary PTEG for an empty slot */
39217312f25SChristophe Leroy	ori	r5,r5,PTE_H		/* set H (secondary hash) bit */
39317312f25SChristophe Leroy0:	xoris	r4,r3,Hash_msk>>16	/* compute secondary hash */
39417312f25SChristophe Leroy	xori	r4,r4,(-PTEG_SIZE & 0xffff)
39517312f25SChristophe Leroy	addi	r4,r4,-HPTE_SIZE
39617312f25SChristophe Leroy	mtctr	r0
39717312f25SChristophe Leroy2:	LDPTEu	r6,HPTE_SIZE(r4)
39817312f25SChristophe Leroy	TST_V(r6)
39917312f25SChristophe Leroy	bdnzf	2,2b
400f892c21dSChristophe Leroy	beq+	.Lfound_empty
40117312f25SChristophe Leroy	xori	r5,r5,PTE_H		/* clear H bit again */
40217312f25SChristophe Leroy
40317312f25SChristophe Leroy	/*
40417312f25SChristophe Leroy	 * Choose an arbitrary slot in the primary PTEG to overwrite.
40517312f25SChristophe Leroy	 * Since both the primary and secondary PTEGs are full, and we
40617312f25SChristophe Leroy	 * have no information that the PTEs in the primary PTEG are
40717312f25SChristophe Leroy	 * more important or useful than those in the secondary PTEG,
40817312f25SChristophe Leroy	 * and we know there is a definite (although small) speed
40917312f25SChristophe Leroy	 * advantage to putting the PTE in the primary PTEG, we always
41017312f25SChristophe Leroy	 * put the PTE in the primary PTEG.
41117312f25SChristophe Leroy	 */
41217312f25SChristophe Leroy
	/*
	 * next_slot is advanced by HPTE_SIZE and wrapped with the
	 * 7*HPTE_SIZE mask, giving a byte offset into the primary PTEG.
	 * NOTE(review): the load uses (next_slot - PAGE_OFFSET)@l while the
	 * store uses next_slot@l; these agree only if the low 16 bits of
	 * PAGE_OFFSET are zero -- confirm.
	 */
41379d1befeSChristophe Leroy	lis	r4, (next_slot - PAGE_OFFSET)@ha	/* get next evict slot */
414232ca1eeSChristophe Leroy	lwz	r6, (next_slot - PAGE_OFFSET)@l(r4)
41517312f25SChristophe Leroy	addi	r6,r6,HPTE_SIZE			/* search for candidate */
41617312f25SChristophe Leroy	andi.	r6,r6,7*HPTE_SIZE
41717312f25SChristophe Leroy	stw	r6,next_slot@l(r4)
41817312f25SChristophe Leroy	add	r4,r3,r6
41917312f25SChristophe Leroy
42017312f25SChristophe Leroy#ifndef CONFIG_SMP
42117312f25SChristophe Leroy	/* Store PTE in PTEG */
	/*
	 * UP: an empty or victim slot gets both words; a slot found by the
	 * match search enters at .Lfound_slot and only has its second word
	 * rewritten.
	 */
422f892c21dSChristophe Leroy.Lfound_empty:
42317312f25SChristophe Leroy	STPTE	r5,0(r4)
424f892c21dSChristophe Leroy.Lfound_slot:
42517312f25SChristophe Leroy	STPTE	r8,HPTE_SIZE/2(r4)
42617312f25SChristophe Leroy
42717312f25SChristophe Leroy#else /* CONFIG_SMP */
42817312f25SChristophe Leroy/*
42917312f25SChristophe Leroy * Between the tlbie above and updating the hash table entry below,
43017312f25SChristophe Leroy * another CPU could read the hash table entry and put it in its TLB.
43117312f25SChristophe Leroy * There are 3 cases:
43217312f25SChristophe Leroy * 1. using an empty slot
43317312f25SChristophe Leroy * 2. updating an earlier entry to change permissions (i.e. enable write)
43417312f25SChristophe Leroy * 3. taking over the PTE for an unrelated address
43517312f25SChristophe Leroy *
43617312f25SChristophe Leroy * In each case it doesn't really matter if the other CPUs have the old
43717312f25SChristophe Leroy * PTE in their TLB.  So we don't need to bother with another tlbie here,
43817312f25SChristophe Leroy * which is convenient as we've overwritten the register that had the
43917312f25SChristophe Leroy * address. :-)  The tlbie above is mainly to make sure that this CPU comes
44017312f25SChristophe Leroy * and gets the new PTE from the hash table.
44117312f25SChristophe Leroy *
44217312f25SChristophe Leroy * We do however have to make sure that the PTE is never in an invalid
44317312f25SChristophe Leroy * state with the V bit set.
44417312f25SChristophe Leroy */
	/*
	 * SMP store order: first word with V clear, then the second word,
	 * then the first word again with V set, separated by sync.
	 */
445f892c21dSChristophe Leroy.Lfound_empty:
446f892c21dSChristophe Leroy.Lfound_slot:
44717312f25SChristophe Leroy	CLR_V(r5,r0)		/* clear V (valid) bit in PTE */
44817312f25SChristophe Leroy	STPTE	r5,0(r4)
44917312f25SChristophe Leroy	sync
45017312f25SChristophe Leroy	TLBSYNC
45117312f25SChristophe Leroy	STPTE	r8,HPTE_SIZE/2(r4) /* put in correct RPN, WIMG, PP bits */
45217312f25SChristophe Leroy	sync
45317312f25SChristophe Leroy	SET_V(r5)
45417312f25SChristophe Leroy	STPTE	r5,0(r4)	/* finally set V bit in PTE */
45517312f25SChristophe Leroy#endif /* CONFIG_SMP */
45617312f25SChristophe Leroy
45717312f25SChristophe Leroy	sync		/* make sure pte updates get to memory */
45817312f25SChristophe Leroy	blr
45969a1593aSChristophe Leroy	.previous
460e6209318SChristophe Leroy_ASM_NOKPROBE_SYMBOL(create_hpte)
46117312f25SChristophe Leroy
/*
 * One word of eviction state for create_hpte.  When both PTEGs are full,
 * create_hpte adds HPTE_SIZE to this value, masks it with 7*HPTE_SIZE,
 * stores it back, and uses the result as the byte offset of the slot to
 * overwrite in the primary PTEG.
 */
46217312f25SChristophe Leroy	.section .bss
46317312f25SChristophe Leroy	.align	2
46417312f25SChristophe Leroynext_slot:
46517312f25SChristophe Leroy	.space	4
46617312f25SChristophe Leroy	.previous
46717312f25SChristophe Leroy
46817312f25SChristophe Leroy/*
46917312f25SChristophe Leroy * Flush the entry for a particular page from the hash table.
47017312f25SChristophe Leroy *
47117312f25SChristophe Leroy * flush_hash_pages(unsigned context, unsigned long va, unsigned long pmdval,
47217312f25SChristophe Leroy *		    int count)
47317312f25SChristophe Leroy *
47417312f25SChristophe Leroy * We assume that there is a hash table in use (Hash != 0).
 *
 * Register use below: r3 = context (turned into the VSID), r4 = va of the
 * page being examined (advanced by 0x1000 per PTE), r5 = address of the
 * current PTE flags word (advanced by PTE_SIZE), r6 = remaining count,
 * r10 = MSR value on entry, r9 = address of mmu_hash_lock (SMP),
 * r11 = first HPTE word to search for, r8 = primary PTEG address,
 * r12 = HPTE slot pointer, cr1 = result of comparing r6 with 1.
47517312f25SChristophe Leroy */
47669a1593aSChristophe Leroy__REF
47717312f25SChristophe Leroy_GLOBAL(flush_hash_pages)
47817312f25SChristophe Leroy	/*
47917312f25SChristophe Leroy	 * We disable interrupts here, even on UP, because we want
48017312f25SChristophe Leroy	 * the _PAGE_HASHPTE bit to be a reliable indication of
48117312f25SChristophe Leroy	 * whether the HPTE exists (or at least whether one did once).
48217312f25SChristophe Leroy	 * We also turn off the MMU for data accesses so that we
48317312f25SChristophe Leroy	 * can't take a hash table miss (assuming the code is
48417312f25SChristophe Leroy	 * covered by a BAT).  -- paulus
48517312f25SChristophe Leroy	 */
48617312f25SChristophe Leroy	mfmsr	r10
48717312f25SChristophe Leroy	rlwinm	r0,r10,0,17,15		/* clear bit 16 (MSR_EE) */
48817312f25SChristophe Leroy	rlwinm	r0,r0,0,28,26		/* clear MSR_DR */
48917312f25SChristophe Leroy	mtmsr	r0
49017312f25SChristophe Leroy	isync
49117312f25SChristophe Leroy
49217312f25SChristophe Leroy	/* First find a PTE in the range that has _PAGE_HASHPTE set */
	/*
	 * This scan runs before the lock is taken.  If the count runs out
	 * without finding one, exit through 19: which skips the unlock.
	 */
49317312f25SChristophe Leroy#ifndef CONFIG_PTE_64BIT
49417312f25SChristophe Leroy	rlwimi	r5,r4,22,20,29
49517312f25SChristophe Leroy#else
49617312f25SChristophe Leroy	rlwimi	r5,r4,23,20,28
497*da481c4fSChristophe Leroy	addi	r5,r5,PTE_FLAGS_OFFSET
49817312f25SChristophe Leroy#endif
499*da481c4fSChristophe Leroy1:	lwz	r0,0(r5)
50017312f25SChristophe Leroy	cmpwi	cr1,r6,1
50117312f25SChristophe Leroy	andi.	r0,r0,_PAGE_HASHPTE
50217312f25SChristophe Leroy	bne	2f
50317312f25SChristophe Leroy	ble	cr1,19f
50417312f25SChristophe Leroy	addi	r4,r4,0x1000
50517312f25SChristophe Leroy	addi	r5,r5,PTE_SIZE
50617312f25SChristophe Leroy	addi	r6,r6,-1
50717312f25SChristophe Leroy	b	1b
50817312f25SChristophe Leroy
50917312f25SChristophe Leroy	/* Convert context and va to VSID */
51017312f25SChristophe Leroy2:	mulli	r3,r3,897*16		/* multiply context by context skew */
51117312f25SChristophe Leroy	rlwinm	r0,r4,4,28,31		/* get ESID (top 4 bits of va) */
51217312f25SChristophe Leroy	mulli	r0,r0,0x111		/* multiply by ESID skew */
51317312f25SChristophe Leroy	add	r3,r3,r0		/* note code below trims to 24 bits */
51417312f25SChristophe Leroy
51517312f25SChristophe Leroy	/* Construct the high word of the PPC-style PTE (r11) */
51617312f25SChristophe Leroy	rlwinm	r11,r3,7,1,24		/* put VSID in 0x7fffff80 bits */
51717312f25SChristophe Leroy	rlwimi	r11,r4,10,26,31		/* put in API (abbrev page index) */
51817312f25SChristophe Leroy	SET_V(r11)			/* set V (valid) bit */
51917312f25SChristophe Leroy
52017312f25SChristophe Leroy#ifdef CONFIG_SMP
	/*
	 * Take mmu_hash_lock.  MSR_DR is clear here, so TASK_CPU is read
	 * through tophys(r2).  The lock value is that word with 9 OR-ed
	 * into the upper half.
	 */
52117312f25SChristophe Leroy	lis	r9, (mmu_hash_lock - PAGE_OFFSET)@ha
52217312f25SChristophe Leroy	addi	r9, r9, (mmu_hash_lock - PAGE_OFFSET)@l
523397d2300SChristophe Leroy	tophys	(r8, r2)
524397d2300SChristophe Leroy	lwz	r8, TASK_CPU(r8)
52517312f25SChristophe Leroy	oris	r8,r8,9
52617312f25SChristophe Leroy10:	lwarx	r0,0,r9
52717312f25SChristophe Leroy	cmpi	0,r0,0
52817312f25SChristophe Leroy	bne-	11f
52917312f25SChristophe Leroy	stwcx.	r8,0,r9
53017312f25SChristophe Leroy	beq+	12f
53117312f25SChristophe Leroy11:	lwz	r0,0(r9)
53217312f25SChristophe Leroy	cmpi	0,r0,0
53317312f25SChristophe Leroy	beq	10b
53417312f25SChristophe Leroy	b	11b
53517312f25SChristophe Leroy12:	isync
53617312f25SChristophe Leroy#endif
53717312f25SChristophe Leroy
53817312f25SChristophe Leroy	/*
53917312f25SChristophe Leroy	 * Check the _PAGE_HASHPTE bit in the linux PTE.  If it is
54017312f25SChristophe Leroy	 * already clear, we're done (for this pte).  If not,
54117312f25SChristophe Leroy	 * clear it (atomically) and proceed.  -- paulus.
54217312f25SChristophe Leroy	 */
54317312f25SChristophe Leroy33:	lwarx	r8,0,r5			/* fetch the pte flags word */
54417312f25SChristophe Leroy	andi.	r0,r8,_PAGE_HASHPTE
54517312f25SChristophe Leroy	beq	8f			/* done if HASHPTE is already clear */
54640bb0e90SChristophe Leroy	rlwinm	r8,r8,0,31,29		/* clear HASHPTE bit */
54717312f25SChristophe Leroy	stwcx.	r8,0,r5			/* update the pte */
54817312f25SChristophe Leroy	bne-	33b
54917312f25SChristophe Leroy
55017312f25SChristophe Leroy	patch_site	0f, patch__flush_hash_A0
55117312f25SChristophe Leroy	patch_site	1f, patch__flush_hash_A1
55217312f25SChristophe Leroy	patch_site	2f, patch__flush_hash_A2
55317312f25SChristophe Leroy	/* Get the address of the primary PTE group in the hash table (r8) */
55417312f25SChristophe Leroy0:	lis	r8, (Hash_base - PAGE_OFFSET)@h	/* base address of hash table */
55517312f25SChristophe Leroy1:	rlwimi	r8,r3,LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT    /* VSID -> hash */
55617312f25SChristophe Leroy2:	rlwinm	r0,r4,20+LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT /* PI -> hash */
55717312f25SChristophe Leroy	xor	r8,r0,r8		/* make primary hash */
55817312f25SChristophe Leroy
55917312f25SChristophe Leroy	/* Search the primary PTEG for a PTE whose 1st (d)word matches r11 */
56017312f25SChristophe Leroy	li	r0,8			/* PTEs/group */
56117312f25SChristophe Leroy	mtctr	r0
56217312f25SChristophe Leroy	addi	r12,r8,-HPTE_SIZE
56317312f25SChristophe Leroy1:	LDPTEu	r0,HPTE_SIZE(r12)	/* get next PTE */
56417312f25SChristophe Leroy	CMPPTE	0,r0,r11
56517312f25SChristophe Leroy	bdnzf	2,1b			/* loop while ctr != 0 && !cr0.eq */
56617312f25SChristophe Leroy	beq+	3f
56717312f25SChristophe Leroy
56817312f25SChristophe Leroy	patch_site	0f, patch__flush_hash_B
56917312f25SChristophe Leroy	/* Search the secondary PTEG for a matching PTE */
57017312f25SChristophe Leroy	ori	r11,r11,PTE_H		/* set H (secondary hash) bit */
57117312f25SChristophe Leroy	li	r0,8			/* PTEs/group */
57217312f25SChristophe Leroy0:	xoris	r12,r8,Hash_msk>>16	/* compute secondary hash */
57317312f25SChristophe Leroy	xori	r12,r12,(-PTEG_SIZE & 0xffff)
57417312f25SChristophe Leroy	addi	r12,r12,-HPTE_SIZE
57517312f25SChristophe Leroy	mtctr	r0
57617312f25SChristophe Leroy2:	LDPTEu	r0,HPTE_SIZE(r12)
57717312f25SChristophe Leroy	CMPPTE	0,r0,r11
57817312f25SChristophe Leroy	bdnzf	2,2b
	/* xori is not a record form, so the bne- below still tests the compare result */
57917312f25SChristophe Leroy	xori	r11,r11,PTE_H		/* clear H again */
58017312f25SChristophe Leroy	bne-	4f			/* should rarely fail to find it */
58117312f25SChristophe Leroy
	/* 3: matching HPTE at r12 -- zero its first word; 4: flush the TLB entry either way */
58217312f25SChristophe Leroy3:	li	r0,0
58317312f25SChristophe Leroy	STPTE	r0,0(r12)		/* invalidate entry */
58417312f25SChristophe Leroy4:	sync
58517312f25SChristophe Leroy	tlbie	r4			/* in hw tlb too */
58617312f25SChristophe Leroy	sync
58717312f25SChristophe Leroy
	/*
	 * Advance to the next PTE.  cr1 holds the compare of r6 with 1 made
	 * when the current PTE was fetched, so "ble cr1" means this was the
	 * last one.  81: skips PTEs without _PAGE_HASHPTE until one is found
	 * (back to 33:) or the count is exhausted.
	 */
58817312f25SChristophe Leroy8:	ble	cr1,9f			/* if all ptes checked */
58917312f25SChristophe Leroy81:	addi	r6,r6,-1
59017312f25SChristophe Leroy	addi	r5,r5,PTE_SIZE
59117312f25SChristophe Leroy	addi	r4,r4,0x1000
59217312f25SChristophe Leroy	lwz	r0,0(r5)		/* check next pte */
59317312f25SChristophe Leroy	cmpwi	cr1,r6,1
59417312f25SChristophe Leroy	andi.	r0,r0,_PAGE_HASHPTE
59517312f25SChristophe Leroy	bne	33b
59617312f25SChristophe Leroy	bgt	cr1,81b
59717312f25SChristophe Leroy
59817312f25SChristophe Leroy9:
59917312f25SChristophe Leroy#ifdef CONFIG_SMP
60017312f25SChristophe Leroy	TLBSYNC
60117312f25SChristophe Leroy	li	r0,0
60217312f25SChristophe Leroy	stw	r0,0(r9)		/* clear mmu_hash_lock */
60317312f25SChristophe Leroy#endif
60417312f25SChristophe Leroy
	/* Restore the MSR saved on entry (re-enables what was cleared above) */
60517312f25SChristophe Leroy19:	mtmsr	r10
60617312f25SChristophe Leroy	isync
60717312f25SChristophe Leroy	blr
60869a1593aSChristophe Leroy	.previous
60917312f25SChristophe LeroyEXPORT_SYMBOL(flush_hash_pages)
610e6209318SChristophe Leroy_ASM_NOKPROBE_SYMBOL(flush_hash_pages)
611