xref: /openbmc/linux/arch/powerpc/mm/book3s32/hash_low.S (revision c900529f3d9161bfde5cca0754f83b4d3c3e0220)
12874c5fdSThomas Gleixner/* SPDX-License-Identifier: GPL-2.0-or-later */
217312f25SChristophe Leroy/*
317312f25SChristophe Leroy *  PowerPC version
417312f25SChristophe Leroy *    Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
517312f25SChristophe Leroy *  Rewritten by Cort Dougan (cort@cs.nmt.edu) for PReP
617312f25SChristophe Leroy *    Copyright (C) 1996 Cort Dougan <cort@cs.nmt.edu>
717312f25SChristophe Leroy *  Adapted for Power Macintosh by Paul Mackerras.
817312f25SChristophe Leroy *  Low-level exception handlers and MMU support
917312f25SChristophe Leroy *  rewritten by Paul Mackerras.
1017312f25SChristophe Leroy *    Copyright (C) 1996 Paul Mackerras.
1117312f25SChristophe Leroy *
1217312f25SChristophe Leroy *  This file contains low-level assembler routines for managing
1317312f25SChristophe Leroy *  the PowerPC MMU hash table.  (PPC 8xx processors don't use a
1417312f25SChristophe Leroy *  hash table, so this file is not used on them.)
1517312f25SChristophe Leroy */
1617312f25SChristophe Leroy
17*39326182SMasahiro Yamada#include <linux/export.h>
1865fddcfcSMike Rapoport#include <linux/pgtable.h>
1969a1593aSChristophe Leroy#include <linux/init.h>
2017312f25SChristophe Leroy#include <asm/reg.h>
2117312f25SChristophe Leroy#include <asm/page.h>
2217312f25SChristophe Leroy#include <asm/cputable.h>
2317312f25SChristophe Leroy#include <asm/ppc_asm.h>
2417312f25SChristophe Leroy#include <asm/thread_info.h>
2517312f25SChristophe Leroy#include <asm/asm-offsets.h>
2617312f25SChristophe Leroy#include <asm/feature-fixups.h>
2717312f25SChristophe Leroy#include <asm/code-patching-asm.h>
2817312f25SChristophe Leroy
29da481c4fSChristophe Leroy#ifdef CONFIG_PTE_64BIT
3091e9ee7eSChristophe Leroy#define PTE_T_SIZE		8
31da481c4fSChristophe Leroy#define PTE_FLAGS_OFFSET	4	/* offset of PTE flags, in bytes */
32da481c4fSChristophe Leroy#else
3391e9ee7eSChristophe Leroy#define PTE_T_SIZE		4
34da481c4fSChristophe Leroy#define PTE_FLAGS_OFFSET	0
35da481c4fSChristophe Leroy#endif
36da481c4fSChristophe Leroy
3717312f25SChristophe Leroy/*
3817312f25SChristophe Leroy * Load a PTE into the hash table, if possible.
3917312f25SChristophe Leroy * The address is in r4, and r3 contains an access flag:
4040bb0e90SChristophe Leroy * _PAGE_RW (0x400) if a write.
4117312f25SChristophe Leroy * r9 contains the SRR1 value, from which we use the MSR_PR bit.
4217312f25SChristophe Leroy * SPRG_THREAD contains the physical address of the current task's thread.
4317312f25SChristophe Leroy *
4417312f25SChristophe Leroy * Returns to the caller if the access is illegal or there is no
4517312f25SChristophe Leroy * mapping for the address.  Otherwise it places an appropriate PTE
4617312f25SChristophe Leroy * in the hash table and returns from the exception.
4717312f25SChristophe Leroy * Uses r0, r3 - r6, r8, r10, ctr, lr.
4817312f25SChristophe Leroy */
4917312f25SChristophe Leroy	.text
5017312f25SChristophe Leroy_GLOBAL(hash_page)
5117312f25SChristophe Leroy#ifdef CONFIG_SMP
52232ca1eeSChristophe Leroy	lis	r8, (mmu_hash_lock - PAGE_OFFSET)@h
53232ca1eeSChristophe Leroy	ori	r8, r8, (mmu_hash_lock - PAGE_OFFSET)@l
5417312f25SChristophe Leroy	lis	r0,0x0fff
5517312f25SChristophe Leroy	b	10f
5617312f25SChristophe Leroy11:	lwz	r6,0(r8)
5717312f25SChristophe Leroy	cmpwi	0,r6,0
5817312f25SChristophe Leroy	bne	11b
5917312f25SChristophe Leroy10:	lwarx	r6,0,r8
6017312f25SChristophe Leroy	cmpwi	0,r6,0
6117312f25SChristophe Leroy	bne-	11b
6217312f25SChristophe Leroy	stwcx.	r0,0,r8
6317312f25SChristophe Leroy	bne-	10b
6417312f25SChristophe Leroy	isync
6517312f25SChristophe Leroy#endif
6617312f25SChristophe Leroy	/* Get PTE (linux-style) and check access */
67f1a1f7a1SChristophe Leroy	lis	r0, TASK_SIZE@h		/* check if kernel address */
6817312f25SChristophe Leroy	cmplw	0,r4,r0
6903d701c2SChristophe Leroy	mfspr	r8,SPRN_SPRG_THREAD	/* current task's THREAD (phys) */
7017312f25SChristophe Leroy	ori	r3,r3,_PAGE_USER|_PAGE_PRESENT /* test low addresses as user */
7103d701c2SChristophe Leroy	lwz	r5,PGDIR(r8)		/* virt page-table root */
7217312f25SChristophe Leroy	blt+	112f			/* assume user more likely */
7303d701c2SChristophe Leroy	lis	r5,swapper_pg_dir@ha	/* if kernel address, use */
7403d701c2SChristophe Leroy	addi	r5,r5,swapper_pg_dir@l	/* kernel page table */
7540bb0e90SChristophe Leroy	rlwimi	r3,r9,32-12,29,29	/* MSR_PR -> _PAGE_USER */
7603d701c2SChristophe Leroy112:	tophys(r5, r5)
7717312f25SChristophe Leroy#ifndef CONFIG_PTE_64BIT
7817312f25SChristophe Leroy	rlwimi	r5,r4,12,20,29		/* insert top 10 bits of address */
7917312f25SChristophe Leroy	lwz	r8,0(r5)		/* get pmd entry */
8017312f25SChristophe Leroy	rlwinm.	r8,r8,0,0,19		/* extract address of pte page */
8117312f25SChristophe Leroy#else
8217312f25SChristophe Leroy	rlwinm	r8,r4,13,19,29		/* Compute pgdir/pmd offset */
8317312f25SChristophe Leroy	lwzx	r8,r8,r5		/* Get L1 entry */
8417312f25SChristophe Leroy	rlwinm.	r8,r8,0,0,20		/* extract pt base address */
8517312f25SChristophe Leroy#endif
8617312f25SChristophe Leroy#ifdef CONFIG_SMP
87f892c21dSChristophe Leroy	beq-	.Lhash_page_out		/* return if no mapping */
8817312f25SChristophe Leroy#else
8917312f25SChristophe Leroy	/* XXX it seems like the 601 will give a machine fault on the
9017312f25SChristophe Leroy	   rfi if its alignment is wrong (bottom 4 bits of address are
9117312f25SChristophe Leroy	   8 or 0xc) and we have had a not-taken conditional branch
9217312f25SChristophe Leroy	   to the address following the rfi. */
9317312f25SChristophe Leroy	beqlr-
9417312f25SChristophe Leroy#endif
9517312f25SChristophe Leroy#ifndef CONFIG_PTE_64BIT
9617312f25SChristophe Leroy	rlwimi	r8,r4,22,20,29		/* insert next 10 bits of address */
9717312f25SChristophe Leroy#else
9817312f25SChristophe Leroy	rlwimi	r8,r4,23,20,28		/* compute pte address */
99da481c4fSChristophe Leroy	/*
100da481c4fSChristophe Leroy	 * If PTE_64BIT is set, the low word is the flags word; use that
101da481c4fSChristophe Leroy	 * word for locking since it contains all the interesting bits.
102da481c4fSChristophe Leroy	 */
103da481c4fSChristophe Leroy	addi	r8,r8,PTE_FLAGS_OFFSET
10417312f25SChristophe Leroy#endif
10517312f25SChristophe Leroy
10617312f25SChristophe Leroy	/*
10717312f25SChristophe Leroy	 * Update the linux PTE atomically.  We do the lwarx up-front
10817312f25SChristophe Leroy	 * because almost always, there won't be a permission violation
10917312f25SChristophe Leroy	 * and there won't already be an HPTE, and thus we will have
11017312f25SChristophe Leroy	 * to update the PTE to set _PAGE_HASHPTE.  -- paulus.
11117312f25SChristophe Leroy	 */
112f892c21dSChristophe Leroy.Lretry:
11317312f25SChristophe Leroy	lwarx	r6,0,r8			/* get linux-style pte, flag word */
1141b03e71fSChristophe Leroy#ifdef CONFIG_PPC_KUAP
1151b03e71fSChristophe Leroy	mfsrin	r5,r4
1161b03e71fSChristophe Leroy	rlwinm	r0,r9,28,_PAGE_RW	/* MSR[PR] => _PAGE_RW */
1171b03e71fSChristophe Leroy	rlwinm	r5,r5,12,_PAGE_RW	/* Ks => _PAGE_RW */
1181b03e71fSChristophe Leroy	andc	r5,r5,r0		/* Ks & ~MSR[PR] */
1191b03e71fSChristophe Leroy	andc	r5,r6,r5		/* Clear _PAGE_RW when Ks = 1 && MSR[PR] = 0 */
1201b03e71fSChristophe Leroy	andc.	r5,r3,r5		/* check access & ~permission */
1211b03e71fSChristophe Leroy#else
12217312f25SChristophe Leroy	andc.	r5,r3,r6		/* check access & ~permission */
1231b03e71fSChristophe Leroy#endif
1241b03e71fSChristophe Leroy	rlwinm	r0,r3,32-3,24,24	/* _PAGE_RW access -> _PAGE_DIRTY */
1251b03e71fSChristophe Leroy	ori	r0,r0,_PAGE_ACCESSED|_PAGE_HASHPTE
12617312f25SChristophe Leroy#ifdef CONFIG_SMP
127f892c21dSChristophe Leroy	bne-	.Lhash_page_out		/* return if access not permitted */
12817312f25SChristophe Leroy#else
12917312f25SChristophe Leroy	bnelr-
13017312f25SChristophe Leroy#endif
13117312f25SChristophe Leroy	or	r5,r0,r6		/* set accessed/dirty bits */
13217312f25SChristophe Leroy#ifdef CONFIG_PTE_64BIT
13317312f25SChristophe Leroy#ifdef CONFIG_SMP
13417312f25SChristophe Leroy	subf	r10,r6,r8		/* create false data dependency */
13517312f25SChristophe Leroy	subi	r10,r10,PTE_FLAGS_OFFSET
13617312f25SChristophe Leroy	lwzx	r10,r6,r10		/* Get upper PTE word */
13717312f25SChristophe Leroy#else
13817312f25SChristophe Leroy	lwz	r10,-PTE_FLAGS_OFFSET(r8)
13917312f25SChristophe Leroy#endif /* CONFIG_SMP */
14017312f25SChristophe Leroy#endif /* CONFIG_PTE_64BIT */
14117312f25SChristophe Leroy	stwcx.	r5,0,r8			/* attempt to update PTE */
142f892c21dSChristophe Leroy	bne-	.Lretry			/* retry if someone got there first */
14317312f25SChristophe Leroy
14417312f25SChristophe Leroy	mfsrin	r3,r4			/* get segment reg for segment */
14517312f25SChristophe Leroy	bl	create_hpte		/* add the hash table entry */
14617312f25SChristophe Leroy
14717312f25SChristophe Leroy#ifdef CONFIG_SMP
14817312f25SChristophe Leroy	eieio
149232ca1eeSChristophe Leroy	lis	r8, (mmu_hash_lock - PAGE_OFFSET)@ha
15017312f25SChristophe Leroy	li	r0,0
151232ca1eeSChristophe Leroy	stw	r0, (mmu_hash_lock - PAGE_OFFSET)@l(r8)
15217312f25SChristophe Leroy#endif
153232ca1eeSChristophe Leroy	b	fast_hash_page_return
15417312f25SChristophe Leroy
15517312f25SChristophe Leroy#ifdef CONFIG_SMP
156f892c21dSChristophe Leroy.Lhash_page_out:
15717312f25SChristophe Leroy	eieio
158232ca1eeSChristophe Leroy	lis	r8, (mmu_hash_lock - PAGE_OFFSET)@ha
15917312f25SChristophe Leroy	li	r0,0
160232ca1eeSChristophe Leroy	stw	r0, (mmu_hash_lock - PAGE_OFFSET)@l(r8)
16117312f25SChristophe Leroy	blr
16217312f25SChristophe Leroy#endif /* CONFIG_SMP */
163e6209318SChristophe Leroy_ASM_NOKPROBE_SYMBOL(hash_page)
16417312f25SChristophe Leroy
16517312f25SChristophe Leroy/*
16617312f25SChristophe Leroy * Add an entry for a particular page to the hash table.
16717312f25SChristophe Leroy *
16817312f25SChristophe Leroy * add_hash_page(unsigned context, unsigned long va, unsigned long pmdval)
16917312f25SChristophe Leroy *
17017312f25SChristophe Leroy * We assume any necessary modifications to the pte (e.g. setting
17117312f25SChristophe Leroy * the accessed bit) have already been done and that there is actually
17217312f25SChristophe Leroy * a hash table in use (i.e. we're not on a 603).
17317312f25SChristophe Leroy */
17417312f25SChristophe Leroy_GLOBAL(add_hash_page)
17517312f25SChristophe Leroy	mflr	r0
17617312f25SChristophe Leroy	stw	r0,4(r1)
17717312f25SChristophe Leroy
17817312f25SChristophe Leroy#ifdef CONFIG_SMP
17917312f25SChristophe Leroy	lwz	r8,TASK_CPU(r2)		/* to go in mmu_hash_lock */
18017312f25SChristophe Leroy	oris	r8,r8,12
18117312f25SChristophe Leroy#endif /* CONFIG_SMP */
18217312f25SChristophe Leroy
18317312f25SChristophe Leroy	/*
18417312f25SChristophe Leroy	 * We disable interrupts here, even on UP, because we don't
18517312f25SChristophe Leroy	 * want to race with hash_page, and because we want the
18617312f25SChristophe Leroy	 * _PAGE_HASHPTE bit to be a reliable indication of whether
18717312f25SChristophe Leroy	 * the HPTE exists (or at least whether one did once).
18817312f25SChristophe Leroy	 * We also turn off the MMU for data accesses so that we
18917312f25SChristophe Leroy	 * we can't take a hash table miss (assuming the code is
19017312f25SChristophe Leroy	 * covered by a BAT).  -- paulus
19117312f25SChristophe Leroy	 */
19217312f25SChristophe Leroy	mfmsr	r9
19317312f25SChristophe Leroy	rlwinm	r0,r9,0,17,15		/* clear bit 16 (MSR_EE) */
19417312f25SChristophe Leroy	rlwinm	r0,r0,0,28,26		/* clear MSR_DR */
19517312f25SChristophe Leroy	mtmsr	r0
19617312f25SChristophe Leroy	isync
19717312f25SChristophe Leroy
19817312f25SChristophe Leroy#ifdef CONFIG_SMP
19917312f25SChristophe Leroy	lis	r6, (mmu_hash_lock - PAGE_OFFSET)@ha
20017312f25SChristophe Leroy	addi	r6, r6, (mmu_hash_lock - PAGE_OFFSET)@l
20117312f25SChristophe Leroy10:	lwarx	r0,0,r6			/* take the mmu_hash_lock */
20231b4f69dSNicholas Piggin	cmpwi	0,r0,0
20317312f25SChristophe Leroy	bne-	11f
20417312f25SChristophe Leroy	stwcx.	r8,0,r6
20517312f25SChristophe Leroy	beq+	12f
20617312f25SChristophe Leroy11:	lwz	r0,0(r6)
20731b4f69dSNicholas Piggin	cmpwi	0,r0,0
20817312f25SChristophe Leroy	beq	10b
20917312f25SChristophe Leroy	b	11b
21017312f25SChristophe Leroy12:	isync
21117312f25SChristophe Leroy#endif
21217312f25SChristophe Leroy
21317312f25SChristophe Leroy	/*
21417312f25SChristophe Leroy	 * Fetch the linux pte and test and set _PAGE_HASHPTE atomically.
21517312f25SChristophe Leroy	 * If _PAGE_HASHPTE was already set, we don't replace the existing
21617312f25SChristophe Leroy	 * HPTE, so we just unlock and return.
21717312f25SChristophe Leroy	 */
21817312f25SChristophe Leroy	mr	r8,r5
21917312f25SChristophe Leroy#ifndef CONFIG_PTE_64BIT
22017312f25SChristophe Leroy	rlwimi	r8,r4,22,20,29
22117312f25SChristophe Leroy#else
22217312f25SChristophe Leroy	rlwimi	r8,r4,23,20,28
22317312f25SChristophe Leroy	addi	r8,r8,PTE_FLAGS_OFFSET
22417312f25SChristophe Leroy#endif
22517312f25SChristophe Leroy1:	lwarx	r6,0,r8
22617312f25SChristophe Leroy	andi.	r0,r6,_PAGE_HASHPTE
22717312f25SChristophe Leroy	bne	9f			/* if HASHPTE already set, done */
22817312f25SChristophe Leroy#ifdef CONFIG_PTE_64BIT
22917312f25SChristophe Leroy#ifdef CONFIG_SMP
23017312f25SChristophe Leroy	subf	r10,r6,r8		/* create false data dependency */
23117312f25SChristophe Leroy	subi	r10,r10,PTE_FLAGS_OFFSET
23217312f25SChristophe Leroy	lwzx	r10,r6,r10		/* Get upper PTE word */
23317312f25SChristophe Leroy#else
23417312f25SChristophe Leroy	lwz	r10,-PTE_FLAGS_OFFSET(r8)
23517312f25SChristophe Leroy#endif /* CONFIG_SMP */
23617312f25SChristophe Leroy#endif /* CONFIG_PTE_64BIT */
23717312f25SChristophe Leroy	ori	r5,r6,_PAGE_HASHPTE
23817312f25SChristophe Leroy	stwcx.	r5,0,r8
23917312f25SChristophe Leroy	bne-	1b
24017312f25SChristophe Leroy
241fec6166bSChristophe Leroy	/* Convert context and va to VSID */
242fec6166bSChristophe Leroy	mulli	r3,r3,897*16		/* multiply context by context skew */
243fec6166bSChristophe Leroy	rlwinm	r0,r4,4,28,31		/* get ESID (top 4 bits of va) */
244fec6166bSChristophe Leroy	mulli	r0,r0,0x111		/* multiply by ESID skew */
245fec6166bSChristophe Leroy	add	r3,r3,r0		/* note create_hpte trims to 24 bits */
246fec6166bSChristophe Leroy
24717312f25SChristophe Leroy	bl	create_hpte
24817312f25SChristophe Leroy
24917312f25SChristophe Leroy9:
25017312f25SChristophe Leroy#ifdef CONFIG_SMP
25117312f25SChristophe Leroy	lis	r6, (mmu_hash_lock - PAGE_OFFSET)@ha
25217312f25SChristophe Leroy	addi	r6, r6, (mmu_hash_lock - PAGE_OFFSET)@l
25317312f25SChristophe Leroy	eieio
25417312f25SChristophe Leroy	li	r0,0
25517312f25SChristophe Leroy	stw	r0,0(r6)		/* clear mmu_hash_lock */
25617312f25SChristophe Leroy#endif
25717312f25SChristophe Leroy
25817312f25SChristophe Leroy	/* reenable interrupts and DR */
25917312f25SChristophe Leroy	mtmsr	r9
26017312f25SChristophe Leroy	isync
26117312f25SChristophe Leroy
26217312f25SChristophe Leroy	lwz	r0,4(r1)
26317312f25SChristophe Leroy	mtlr	r0
26417312f25SChristophe Leroy	blr
265e6209318SChristophe Leroy_ASM_NOKPROBE_SYMBOL(add_hash_page)
26617312f25SChristophe Leroy
26717312f25SChristophe Leroy/*
26817312f25SChristophe Leroy * This routine adds a hardware PTE to the hash table.
26917312f25SChristophe Leroy * It is designed to be called with the MMU either on or off.
27017312f25SChristophe Leroy * r3 contains the VSID, r4 contains the virtual address,
27117312f25SChristophe Leroy * r5 contains the linux PTE, r6 contains the old value of the
27217312f25SChristophe Leroy * linux PTE (before setting _PAGE_HASHPTE). r10 contains the
27317312f25SChristophe Leroy * upper half of the PTE if CONFIG_PTE_64BIT.
27417312f25SChristophe Leroy * On SMP, the caller should have the mmu_hash_lock held.
27517312f25SChristophe Leroy * We assume that the caller has (or will) set the _PAGE_HASHPTE
27617312f25SChristophe Leroy * bit in the linux PTE in memory.  The value passed in r6 should
27717312f25SChristophe Leroy * be the old linux PTE value; if it doesn't have _PAGE_HASHPTE set
27817312f25SChristophe Leroy * this routine will skip the search for an existing HPTE.
27917312f25SChristophe Leroy * This procedure modifies r0, r3 - r6, r8, cr0.
28017312f25SChristophe Leroy *  -- paulus.
28117312f25SChristophe Leroy *
28217312f25SChristophe Leroy * For speed, 4 of the instructions get patched once the size and
28317312f25SChristophe Leroy * physical address of the hash table are known.  These definitions
28469a1593aSChristophe Leroy * of Hash_base and Hash_bits below are for the early hash table.
28517312f25SChristophe Leroy */
28669a1593aSChristophe LeroyHash_base = early_hash
28717312f25SChristophe LeroyHash_bits = 12				/* e.g. 256kB hash table */
28817312f25SChristophe LeroyHash_msk = (((1 << Hash_bits) - 1) * 64)
28917312f25SChristophe Leroy
29017312f25SChristophe Leroy/* defines for the PTE format for 32-bit PPCs */
29117312f25SChristophe Leroy#define HPTE_SIZE	8
29217312f25SChristophe Leroy#define PTEG_SIZE	64
29317312f25SChristophe Leroy#define LG_PTEG_SIZE	6
29417312f25SChristophe Leroy#define LDPTEu		lwzu
29517312f25SChristophe Leroy#define LDPTE		lwz
29617312f25SChristophe Leroy#define STPTE		stw
29717312f25SChristophe Leroy#define CMPPTE		cmpw
29817312f25SChristophe Leroy#define PTE_H		0x40
29917312f25SChristophe Leroy#define PTE_V		0x80000000
30017312f25SChristophe Leroy#define TST_V(r)	rlwinm. r,r,0,0,0
30117312f25SChristophe Leroy#define SET_V(r)	oris r,r,PTE_V@h
30217312f25SChristophe Leroy#define CLR_V(r,t)	rlwinm r,r,0,1,31
30317312f25SChristophe Leroy
30417312f25SChristophe Leroy#define HASH_LEFT	31-(LG_PTEG_SIZE+Hash_bits-1)
30517312f25SChristophe Leroy#define HASH_RIGHT	31-LG_PTEG_SIZE
30617312f25SChristophe Leroy
30769a1593aSChristophe Leroy__REF
30817312f25SChristophe Leroy_GLOBAL(create_hpte)
30917312f25SChristophe Leroy	/* Convert linux-style PTE (r5) to low word of PPC-style PTE (r8) */
31040bb0e90SChristophe Leroy	rlwinm	r8,r5,32-9,30,30	/* _PAGE_RW -> PP msb */
31117312f25SChristophe Leroy	rlwinm	r0,r5,32-6,30,30	/* _PAGE_DIRTY -> PP msb */
31240bb0e90SChristophe Leroy	and	r8,r8,r0		/* writable if _RW & _DIRTY */
31340bb0e90SChristophe Leroy	rlwimi	r5,r5,32-1,30,30	/* _PAGE_USER -> PP msb */
31440bb0e90SChristophe Leroy	rlwimi	r5,r5,32-2,31,31	/* _PAGE_USER -> PP lsb */
31517312f25SChristophe Leroy	ori	r8,r8,0xe04		/* clear out reserved bits */
31617312f25SChristophe Leroy	andc	r8,r5,r8		/* PP = user? (rw&dirty? 1: 3): 0 */
31717312f25SChristophe LeroyBEGIN_FTR_SECTION
31817312f25SChristophe Leroy	rlwinm	r8,r8,0,~_PAGE_COHERENT	/* clear M (coherence not required) */
31917312f25SChristophe LeroyEND_FTR_SECTION_IFCLR(CPU_FTR_NEED_COHERENT)
32017312f25SChristophe Leroy#ifdef CONFIG_PTE_64BIT
32117312f25SChristophe Leroy	/* Put the XPN bits into the PTE */
32217312f25SChristophe Leroy	rlwimi	r8,r10,8,20,22
32317312f25SChristophe Leroy	rlwimi	r8,r10,2,29,29
32417312f25SChristophe Leroy#endif
32517312f25SChristophe Leroy
32617312f25SChristophe Leroy	/* Construct the high word of the PPC-style PTE (r5) */
32717312f25SChristophe Leroy	rlwinm	r5,r3,7,1,24		/* put VSID in 0x7fffff80 bits */
32817312f25SChristophe Leroy	rlwimi	r5,r4,10,26,31		/* put in API (abbrev page index) */
32917312f25SChristophe Leroy	SET_V(r5)			/* set V (valid) bit */
33017312f25SChristophe Leroy
33117312f25SChristophe Leroy	patch_site	0f, patch__hash_page_A0
33217312f25SChristophe Leroy	patch_site	1f, patch__hash_page_A1
33317312f25SChristophe Leroy	patch_site	2f, patch__hash_page_A2
33417312f25SChristophe Leroy	/* Get the address of the primary PTE group in the hash table (r3) */
335232ca1eeSChristophe Leroy0:	lis	r0, (Hash_base - PAGE_OFFSET)@h	/* base address of hash table */
33617312f25SChristophe Leroy1:	rlwimi	r0,r3,LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT    /* VSID -> hash */
33717312f25SChristophe Leroy2:	rlwinm	r3,r4,20+LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT /* PI -> hash */
33817312f25SChristophe Leroy	xor	r3,r3,r0		/* make primary hash */
33917312f25SChristophe Leroy	li	r0,8			/* PTEs/group */
34017312f25SChristophe Leroy
34117312f25SChristophe Leroy	/*
34217312f25SChristophe Leroy	 * Test the _PAGE_HASHPTE bit in the old linux PTE, and skip the search
34317312f25SChristophe Leroy	 * if it is clear, meaning that the HPTE isn't there already...
34417312f25SChristophe Leroy	 */
34517312f25SChristophe Leroy	andi.	r6,r6,_PAGE_HASHPTE
34617312f25SChristophe Leroy	beq+	10f			/* no PTE: go look for an empty slot */
34717312f25SChristophe Leroy	tlbie	r4
34817312f25SChristophe Leroy
34917312f25SChristophe Leroy	/* Search the primary PTEG for a PTE whose 1st (d)word matches r5 */
35017312f25SChristophe Leroy	mtctr	r0
35117312f25SChristophe Leroy	addi	r4,r3,-HPTE_SIZE
35217312f25SChristophe Leroy1:	LDPTEu	r6,HPTE_SIZE(r4)	/* get next PTE */
35317312f25SChristophe Leroy	CMPPTE	0,r6,r5
35417312f25SChristophe Leroy	bdnzf	2,1b			/* loop while ctr != 0 && !cr0.eq */
355f892c21dSChristophe Leroy	beq+	.Lfound_slot
35617312f25SChristophe Leroy
35717312f25SChristophe Leroy	patch_site	0f, patch__hash_page_B
35817312f25SChristophe Leroy	/* Search the secondary PTEG for a matching PTE */
35917312f25SChristophe Leroy	ori	r5,r5,PTE_H		/* set H (secondary hash) bit */
36017312f25SChristophe Leroy0:	xoris	r4,r3,Hash_msk>>16	/* compute secondary hash */
36117312f25SChristophe Leroy	xori	r4,r4,(-PTEG_SIZE & 0xffff)
36217312f25SChristophe Leroy	addi	r4,r4,-HPTE_SIZE
36317312f25SChristophe Leroy	mtctr	r0
36417312f25SChristophe Leroy2:	LDPTEu	r6,HPTE_SIZE(r4)
36517312f25SChristophe Leroy	CMPPTE	0,r6,r5
36617312f25SChristophe Leroy	bdnzf	2,2b
367f892c21dSChristophe Leroy	beq+	.Lfound_slot
36817312f25SChristophe Leroy	xori	r5,r5,PTE_H		/* clear H bit again */
36917312f25SChristophe Leroy
37017312f25SChristophe Leroy	/* Search the primary PTEG for an empty slot */
37117312f25SChristophe Leroy10:	mtctr	r0
37217312f25SChristophe Leroy	addi	r4,r3,-HPTE_SIZE	/* search primary PTEG */
37317312f25SChristophe Leroy1:	LDPTEu	r6,HPTE_SIZE(r4)	/* get next PTE */
37417312f25SChristophe Leroy	TST_V(r6)			/* test valid bit */
37517312f25SChristophe Leroy	bdnzf	2,1b			/* loop while ctr != 0 && !cr0.eq */
376f892c21dSChristophe Leroy	beq+	.Lfound_empty
37717312f25SChristophe Leroy
37817312f25SChristophe Leroy	patch_site	0f, patch__hash_page_C
37917312f25SChristophe Leroy	/* Search the secondary PTEG for an empty slot */
38017312f25SChristophe Leroy	ori	r5,r5,PTE_H		/* set H (secondary hash) bit */
38117312f25SChristophe Leroy0:	xoris	r4,r3,Hash_msk>>16	/* compute secondary hash */
38217312f25SChristophe Leroy	xori	r4,r4,(-PTEG_SIZE & 0xffff)
38317312f25SChristophe Leroy	addi	r4,r4,-HPTE_SIZE
38417312f25SChristophe Leroy	mtctr	r0
38517312f25SChristophe Leroy2:	LDPTEu	r6,HPTE_SIZE(r4)
38617312f25SChristophe Leroy	TST_V(r6)
38717312f25SChristophe Leroy	bdnzf	2,2b
388f892c21dSChristophe Leroy	beq+	.Lfound_empty
38917312f25SChristophe Leroy	xori	r5,r5,PTE_H		/* clear H bit again */
39017312f25SChristophe Leroy
39117312f25SChristophe Leroy	/*
39217312f25SChristophe Leroy	 * Choose an arbitrary slot in the primary PTEG to overwrite.
39317312f25SChristophe Leroy	 * Since both the primary and secondary PTEGs are full, and we
39417312f25SChristophe Leroy	 * have no information that the PTEs in the primary PTEG are
39517312f25SChristophe Leroy	 * more important or useful than those in the secondary PTEG,
39617312f25SChristophe Leroy	 * and we know there is a definite (although small) speed
39717312f25SChristophe Leroy	 * advantage to putting the PTE in the primary PTEG, we always
39817312f25SChristophe Leroy	 * put the PTE in the primary PTEG.
39917312f25SChristophe Leroy	 */
40017312f25SChristophe Leroy
40179d1befeSChristophe Leroy	lis	r4, (next_slot - PAGE_OFFSET)@ha	/* get next evict slot */
402232ca1eeSChristophe Leroy	lwz	r6, (next_slot - PAGE_OFFSET)@l(r4)
40317312f25SChristophe Leroy	addi	r6,r6,HPTE_SIZE			/* search for candidate */
40417312f25SChristophe Leroy	andi.	r6,r6,7*HPTE_SIZE
40517312f25SChristophe Leroy	stw	r6,next_slot@l(r4)
40617312f25SChristophe Leroy	add	r4,r3,r6
40717312f25SChristophe Leroy
40817312f25SChristophe Leroy#ifndef CONFIG_SMP
40917312f25SChristophe Leroy	/* Store PTE in PTEG */
410f892c21dSChristophe Leroy.Lfound_empty:
41117312f25SChristophe Leroy	STPTE	r5,0(r4)
412f892c21dSChristophe Leroy.Lfound_slot:
41317312f25SChristophe Leroy	STPTE	r8,HPTE_SIZE/2(r4)
41417312f25SChristophe Leroy
41517312f25SChristophe Leroy#else /* CONFIG_SMP */
41617312f25SChristophe Leroy/*
41717312f25SChristophe Leroy * Between the tlbie above and updating the hash table entry below,
41817312f25SChristophe Leroy * another CPU could read the hash table entry and put it in its TLB.
41917312f25SChristophe Leroy * There are 3 cases:
42017312f25SChristophe Leroy * 1. using an empty slot
42117312f25SChristophe Leroy * 2. updating an earlier entry to change permissions (i.e. enable write)
42217312f25SChristophe Leroy * 3. taking over the PTE for an unrelated address
42317312f25SChristophe Leroy *
42417312f25SChristophe Leroy * In each case it doesn't really matter if the other CPUs have the old
42517312f25SChristophe Leroy * PTE in their TLB.  So we don't need to bother with another tlbie here,
42617312f25SChristophe Leroy * which is convenient as we've overwritten the register that had the
42717312f25SChristophe Leroy * address. :-)  The tlbie above is mainly to make sure that this CPU comes
42817312f25SChristophe Leroy * and gets the new PTE from the hash table.
42917312f25SChristophe Leroy *
43017312f25SChristophe Leroy * We do however have to make sure that the PTE is never in an invalid
43117312f25SChristophe Leroy * state with the V bit set.
43217312f25SChristophe Leroy */
433f892c21dSChristophe Leroy.Lfound_empty:
434f892c21dSChristophe Leroy.Lfound_slot:
43517312f25SChristophe Leroy	CLR_V(r5,r0)		/* clear V (valid) bit in PTE */
43617312f25SChristophe Leroy	STPTE	r5,0(r4)
43717312f25SChristophe Leroy	sync
43817312f25SChristophe Leroy	TLBSYNC
43917312f25SChristophe Leroy	STPTE	r8,HPTE_SIZE/2(r4) /* put in correct RPN, WIMG, PP bits */
44017312f25SChristophe Leroy	sync
44117312f25SChristophe Leroy	SET_V(r5)
44217312f25SChristophe Leroy	STPTE	r5,0(r4)	/* finally set V bit in PTE */
44317312f25SChristophe Leroy#endif /* CONFIG_SMP */
44417312f25SChristophe Leroy
44517312f25SChristophe Leroy	sync		/* make sure pte updates get to memory */
44617312f25SChristophe Leroy	blr
44769a1593aSChristophe Leroy	.previous
448e6209318SChristophe Leroy_ASM_NOKPROBE_SYMBOL(create_hpte)
44917312f25SChristophe Leroy
45017312f25SChristophe Leroy	.section .bss
45117312f25SChristophe Leroy	.align	2
45217312f25SChristophe Leroynext_slot:
45317312f25SChristophe Leroy	.space	4
45417312f25SChristophe Leroy	.previous
45517312f25SChristophe Leroy
45617312f25SChristophe Leroy/*
45717312f25SChristophe Leroy * Flush the entry for a particular page from the hash table.
45817312f25SChristophe Leroy *
45917312f25SChristophe Leroy * flush_hash_pages(unsigned context, unsigned long va, unsigned long pmdval,
46017312f25SChristophe Leroy *		    int count)
46117312f25SChristophe Leroy *
46217312f25SChristophe Leroy * We assume that there is a hash table in use (Hash != 0).
46317312f25SChristophe Leroy */
46469a1593aSChristophe Leroy__REF
46517312f25SChristophe Leroy_GLOBAL(flush_hash_pages)
46617312f25SChristophe Leroy	/*
46717312f25SChristophe Leroy	 * We disable interrupts here, even on UP, because we want
46817312f25SChristophe Leroy	 * the _PAGE_HASHPTE bit to be a reliable indication of
46917312f25SChristophe Leroy	 * whether the HPTE exists (or at least whether one did once).
47017312f25SChristophe Leroy	 * We also turn off the MMU for data accesses so that we
47117312f25SChristophe Leroy	 * we can't take a hash table miss (assuming the code is
47217312f25SChristophe Leroy	 * covered by a BAT).  -- paulus
47317312f25SChristophe Leroy	 */
47417312f25SChristophe Leroy	mfmsr	r10
47517312f25SChristophe Leroy	rlwinm	r0,r10,0,17,15		/* clear bit 16 (MSR_EE) */
47617312f25SChristophe Leroy	rlwinm	r0,r0,0,28,26		/* clear MSR_DR */
47717312f25SChristophe Leroy	mtmsr	r0
47817312f25SChristophe Leroy	isync
47917312f25SChristophe Leroy
48017312f25SChristophe Leroy	/* First find a PTE in the range that has _PAGE_HASHPTE set */
48117312f25SChristophe Leroy#ifndef CONFIG_PTE_64BIT
48217312f25SChristophe Leroy	rlwimi	r5,r4,22,20,29
48317312f25SChristophe Leroy#else
48417312f25SChristophe Leroy	rlwimi	r5,r4,23,20,28
485da481c4fSChristophe Leroy	addi	r5,r5,PTE_FLAGS_OFFSET
48617312f25SChristophe Leroy#endif
487da481c4fSChristophe Leroy1:	lwz	r0,0(r5)
48817312f25SChristophe Leroy	cmpwi	cr1,r6,1
48917312f25SChristophe Leroy	andi.	r0,r0,_PAGE_HASHPTE
49017312f25SChristophe Leroy	bne	2f
49117312f25SChristophe Leroy	ble	cr1,19f
49217312f25SChristophe Leroy	addi	r4,r4,0x1000
49391e9ee7eSChristophe Leroy	addi	r5,r5,PTE_T_SIZE
49417312f25SChristophe Leroy	addi	r6,r6,-1
49517312f25SChristophe Leroy	b	1b
49617312f25SChristophe Leroy
49717312f25SChristophe Leroy	/* Convert context and va to VSID */
49817312f25SChristophe Leroy2:	mulli	r3,r3,897*16		/* multiply context by context skew */
49917312f25SChristophe Leroy	rlwinm	r0,r4,4,28,31		/* get ESID (top 4 bits of va) */
50017312f25SChristophe Leroy	mulli	r0,r0,0x111		/* multiply by ESID skew */
50117312f25SChristophe Leroy	add	r3,r3,r0		/* note code below trims to 24 bits */
50217312f25SChristophe Leroy
50317312f25SChristophe Leroy	/* Construct the high word of the PPC-style PTE (r11) */
50417312f25SChristophe Leroy	rlwinm	r11,r3,7,1,24		/* put VSID in 0x7fffff80 bits */
50517312f25SChristophe Leroy	rlwimi	r11,r4,10,26,31		/* put in API (abbrev page index) */
50617312f25SChristophe Leroy	SET_V(r11)			/* set V (valid) bit */
50717312f25SChristophe Leroy
50817312f25SChristophe Leroy#ifdef CONFIG_SMP
50917312f25SChristophe Leroy	lis	r9, (mmu_hash_lock - PAGE_OFFSET)@ha
51017312f25SChristophe Leroy	addi	r9, r9, (mmu_hash_lock - PAGE_OFFSET)@l
511397d2300SChristophe Leroy	tophys	(r8, r2)
512397d2300SChristophe Leroy	lwz	r8, TASK_CPU(r8)
51317312f25SChristophe Leroy	oris	r8,r8,9
51417312f25SChristophe Leroy10:	lwarx	r0,0,r9
51531b4f69dSNicholas Piggin	cmpwi	0,r0,0
51617312f25SChristophe Leroy	bne-	11f
51717312f25SChristophe Leroy	stwcx.	r8,0,r9
51817312f25SChristophe Leroy	beq+	12f
51917312f25SChristophe Leroy11:	lwz	r0,0(r9)
52031b4f69dSNicholas Piggin	cmpwi	0,r0,0
52117312f25SChristophe Leroy	beq	10b
52217312f25SChristophe Leroy	b	11b
52317312f25SChristophe Leroy12:	isync
52417312f25SChristophe Leroy#endif
52517312f25SChristophe Leroy
52617312f25SChristophe Leroy	/*
52717312f25SChristophe Leroy	 * Check the _PAGE_HASHPTE bit in the linux PTE.  If it is
52817312f25SChristophe Leroy	 * already clear, we're done (for this pte).  If not,
52917312f25SChristophe Leroy	 * clear it (atomically) and proceed.  -- paulus.
53017312f25SChristophe Leroy	 */
53117312f25SChristophe Leroy33:	lwarx	r8,0,r5			/* fetch the pte flags word */
53217312f25SChristophe Leroy	andi.	r0,r8,_PAGE_HASHPTE
53317312f25SChristophe Leroy	beq	8f			/* done if HASHPTE is already clear */
53440bb0e90SChristophe Leroy	rlwinm	r8,r8,0,31,29		/* clear HASHPTE bit */
53517312f25SChristophe Leroy	stwcx.	r8,0,r5			/* update the pte */
53617312f25SChristophe Leroy	bne-	33b
53717312f25SChristophe Leroy
53817312f25SChristophe Leroy	patch_site	0f, patch__flush_hash_A0
53917312f25SChristophe Leroy	patch_site	1f, patch__flush_hash_A1
54017312f25SChristophe Leroy	patch_site	2f, patch__flush_hash_A2
54117312f25SChristophe Leroy	/* Get the address of the primary PTE group in the hash table (r3) */
54217312f25SChristophe Leroy0:	lis	r8, (Hash_base - PAGE_OFFSET)@h	/* base address of hash table */
54317312f25SChristophe Leroy1:	rlwimi	r8,r3,LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT    /* VSID -> hash */
54417312f25SChristophe Leroy2:	rlwinm	r0,r4,20+LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT /* PI -> hash */
54517312f25SChristophe Leroy	xor	r8,r0,r8		/* make primary hash */
54617312f25SChristophe Leroy
54717312f25SChristophe Leroy	/* Search the primary PTEG for a PTE whose 1st (d)word matches r5 */
54817312f25SChristophe Leroy	li	r0,8			/* PTEs/group */
54917312f25SChristophe Leroy	mtctr	r0
55017312f25SChristophe Leroy	addi	r12,r8,-HPTE_SIZE
55117312f25SChristophe Leroy1:	LDPTEu	r0,HPTE_SIZE(r12)	/* get next PTE */
55217312f25SChristophe Leroy	CMPPTE	0,r0,r11
55317312f25SChristophe Leroy	bdnzf	2,1b			/* loop while ctr != 0 && !cr0.eq */
55417312f25SChristophe Leroy	beq+	3f
55517312f25SChristophe Leroy
55617312f25SChristophe Leroy	patch_site	0f, patch__flush_hash_B
55717312f25SChristophe Leroy	/* Search the secondary PTEG for a matching PTE */
55817312f25SChristophe Leroy	ori	r11,r11,PTE_H		/* set H (secondary hash) bit */
55917312f25SChristophe Leroy	li	r0,8			/* PTEs/group */
56017312f25SChristophe Leroy0:	xoris	r12,r8,Hash_msk>>16	/* compute secondary hash */
56117312f25SChristophe Leroy	xori	r12,r12,(-PTEG_SIZE & 0xffff)
56217312f25SChristophe Leroy	addi	r12,r12,-HPTE_SIZE
56317312f25SChristophe Leroy	mtctr	r0
56417312f25SChristophe Leroy2:	LDPTEu	r0,HPTE_SIZE(r12)
56517312f25SChristophe Leroy	CMPPTE	0,r0,r11
56617312f25SChristophe Leroy	bdnzf	2,2b
56717312f25SChristophe Leroy	xori	r11,r11,PTE_H		/* clear H again */
56817312f25SChristophe Leroy	bne-	4f			/* should rarely fail to find it */
56917312f25SChristophe Leroy
57017312f25SChristophe Leroy3:	li	r0,0
57117312f25SChristophe Leroy	STPTE	r0,0(r12)		/* invalidate entry */
57217312f25SChristophe Leroy4:	sync
57317312f25SChristophe Leroy	tlbie	r4			/* in hw tlb too */
57417312f25SChristophe Leroy	sync
57517312f25SChristophe Leroy
57617312f25SChristophe Leroy8:	ble	cr1,9f			/* if all ptes checked */
57717312f25SChristophe Leroy81:	addi	r6,r6,-1
57891e9ee7eSChristophe Leroy	addi	r5,r5,PTE_T_SIZE
57917312f25SChristophe Leroy	addi	r4,r4,0x1000
58017312f25SChristophe Leroy	lwz	r0,0(r5)		/* check next pte */
58117312f25SChristophe Leroy	cmpwi	cr1,r6,1
58217312f25SChristophe Leroy	andi.	r0,r0,_PAGE_HASHPTE
58317312f25SChristophe Leroy	bne	33b
58417312f25SChristophe Leroy	bgt	cr1,81b
58517312f25SChristophe Leroy
58617312f25SChristophe Leroy9:
58717312f25SChristophe Leroy#ifdef CONFIG_SMP
58817312f25SChristophe Leroy	TLBSYNC
58917312f25SChristophe Leroy	li	r0,0
59017312f25SChristophe Leroy	stw	r0,0(r9)		/* clear mmu_hash_lock */
59117312f25SChristophe Leroy#endif
59217312f25SChristophe Leroy
59317312f25SChristophe Leroy19:	mtmsr	r10
59417312f25SChristophe Leroy	isync
59517312f25SChristophe Leroy	blr
59669a1593aSChristophe Leroy	.previous
59717312f25SChristophe LeroyEXPORT_SYMBOL(flush_hash_pages)
598e6209318SChristophe Leroy_ASM_NOKPROBE_SYMBOL(flush_hash_pages)
599