/* SPDX-License-Identifier: GPL-2.0-or-later */
/*
 *  PowerPC version
 *    Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
 *  Rewritten by Cort Dougan (cort@cs.nmt.edu) for PReP
 *    Copyright (C) 1996 Cort Dougan <cort@cs.nmt.edu>
 *  Adapted for Power Macintosh by Paul Mackerras.
 *  Low-level exception handlers and MMU support
 *  rewritten by Paul Mackerras.
 *    Copyright (C) 1996 Paul Mackerras.
 *
 *  This file contains low-level assembler routines for managing
 *  the PowerPC MMU hash table.  (PPC 8xx processors don't use a
 *  hash table, so this file is not used on them.)
 */

#include <linux/pgtable.h>
#include <linux/init.h>
#include <asm/reg.h>
#include <asm/page.h>
#include <asm/cputable.h>
#include <asm/ppc_asm.h>
#include <asm/thread_info.h>
#include <asm/asm-offsets.h>
#include <asm/export.h>
#include <asm/feature-fixups.h>
#include <asm/code-patching-asm.h>

/*
 * Load a PTE into the hash table, if possible.
 * The address is in r4, and r3 contains an access flag:
 * _PAGE_RW (0x400) if a write.
 * r9 contains the SRR1 value, from which we use the MSR_PR bit.
 * SPRG_THREAD contains the physical address of the current task's thread.
 *
 * Returns to the caller if the access is illegal or there is no
 * mapping for the address.  Otherwise it places an appropriate PTE
 * in the hash table and returns from the exception.
 * Uses r0, r3 - r6, r8, r10, ctr, lr.
 *
 * On SMP, mmu_hash_lock is taken on entry and released on every exit
 * path: at .Lhash_page_out before returning to the caller, or after
 * create_hpte before returning from the exception.
 *
 * Without CONFIG_VMAP_STACK, r11 is used as the base for the _CTR, GPR0
 * and GPR8 slots; presumably it points at the exception frame set up by
 * the caller (NOTE(review): confirm against the exception entry code).
 */
	.text
_GLOBAL(hash_page)
#ifdef CONFIG_SMP
	/* Take mmu_hash_lock through its physical address */
	lis	r8, (mmu_hash_lock - PAGE_OFFSET)@h
	ori	r8, r8, (mmu_hash_lock - PAGE_OFFSET)@l
	lis	r0,0x0fff		/* value written into the lock word */
	b	10f
11:	lwz	r6,0(r8)		/* spin with plain loads while held */
	cmpwi	0,r6,0
	bne	11b
10:	lwarx	r6,0,r8
	cmpwi	0,r6,0
	bne-	11b
	stwcx.	r0,0,r8
	bne-	10b			/* reservation lost: try again */
	isync
#endif
	/* Get PTE (linux-style) and check access */
	lis	r0, TASK_SIZE@h		/* check if kernel address */
	cmplw	0,r4,r0
	mfspr	r8,SPRN_SPRG_THREAD	/* current task's THREAD (phys) */
	ori	r3,r3,_PAGE_USER|_PAGE_PRESENT /* test low addresses as user */
	lwz	r5,PGDIR(r8)		/* virt page-table root */
	blt+	112f			/* assume user more likely */
	lis	r5,swapper_pg_dir@ha	/* if kernel address, use */
	addi	r5,r5,swapper_pg_dir@l	/* kernel page table */
	rlwimi	r3,r9,32-12,29,29	/* MSR_PR -> _PAGE_USER */
112:	tophys(r5, r5)
#ifndef CONFIG_PTE_64BIT
	rlwimi	r5,r4,12,20,29		/* insert top 10 bits of address */
	lwz	r8,0(r5)		/* get pmd entry */
	rlwinm.	r8,r8,0,0,19		/* extract address of pte page */
#else
	rlwinm	r8,r4,13,19,29		/* Compute pgdir/pmd offset */
	lwzx	r8,r8,r5		/* Get L1 entry */
	rlwinm.	r8,r8,0,0,20		/* extract pt base address */
#endif
#ifdef CONFIG_SMP
	beq-	.Lhash_page_out		/* return if no mapping */
#else
	/* XXX it seems like the 601 will give a machine fault on the
	   rfi if its alignment is wrong (bottom 4 bits of address are
	   8 or 0xc) and we have had a not-taken conditional branch
	   to the address following the rfi. */
	beqlr-
#endif
#ifndef CONFIG_PTE_64BIT
	rlwimi	r8,r4,22,20,29		/* insert next 10 bits of address */
#else
	rlwimi	r8,r4,23,20,28		/* compute pte address */
#endif

	/*
	 * Update the linux PTE atomically.  We do the lwarx up-front
	 * because almost always, there won't be a permission violation
	 * and there won't already be an HPTE, and thus we will have
	 * to update the PTE to set _PAGE_HASHPTE.  -- paulus.
	 *
	 * If PTE_64BIT is set, the low word is the flags word; use that
	 * word for locking since it contains all the interesting bits.
	 */
#if (PTE_FLAGS_OFFSET != 0)
	addi	r8,r8,PTE_FLAGS_OFFSET
#endif
.Lretry:
	lwarx	r6,0,r8			/* get linux-style pte, flag word */
#ifdef CONFIG_PPC_KUAP
	mfsrin	r5,r4
	rlwinm	r0,r9,28,_PAGE_RW	/* MSR[PR] => _PAGE_RW */
	rlwinm	r5,r5,12,_PAGE_RW	/* Ks => _PAGE_RW */
	andc	r5,r5,r0		/* Ks & ~MSR[PR] */
	andc	r5,r6,r5		/* Clear _PAGE_RW when Ks = 1 && MSR[PR] = 0 */
	andc.	r5,r3,r5		/* check access & ~permission */
#else
	andc.	r5,r3,r6		/* check access & ~permission */
#endif
	/* Neither of the next two instructions touches cr0 */
	rlwinm	r0,r3,32-3,24,24	/* _PAGE_RW access -> _PAGE_DIRTY */
	ori	r0,r0,_PAGE_ACCESSED|_PAGE_HASHPTE
#ifdef CONFIG_SMP
	bne-	.Lhash_page_out		/* return if access not permitted */
#else
	bnelr-
#endif
	or	r5,r0,r6		/* set accessed/dirty bits */
#ifdef CONFIG_PTE_64BIT
#ifdef CONFIG_SMP
	subf	r10,r6,r8		/* create false data dependency */
	subi	r10,r10,PTE_FLAGS_OFFSET
	lwzx	r10,r6,r10		/* Get upper PTE word */
#else
	lwz	r10,-PTE_FLAGS_OFFSET(r8)
#endif /* CONFIG_SMP */
#endif /* CONFIG_PTE_64BIT */
	stwcx.	r5,0,r8			/* attempt to update PTE */
	bne-	.Lretry			/* retry if someone got there first */

	mfsrin	r3,r4			/* get segment reg for segment */
#ifndef CONFIG_VMAP_STACK
	mfctr	r0			/* create_hpte uses ctr: save it */
	stw	r0,_CTR(r11)
#endif
	bl	create_hpte		/* add the hash table entry */

#ifdef CONFIG_SMP
	/* Release mmu_hash_lock */
	eieio
	lis	r8, (mmu_hash_lock - PAGE_OFFSET)@ha
	li	r0,0
	stw	r0, (mmu_hash_lock - PAGE_OFFSET)@l(r8)
#endif

#ifdef CONFIG_VMAP_STACK
	b	fast_hash_page_return
#else
	/* Return from the exception */
	lwz	r5,_CTR(r11)
	mtctr	r5
	lwz	r0,GPR0(r11)
	lwz	r8,GPR8(r11)
	b	fast_exception_return
#endif

#ifdef CONFIG_SMP
	/* Failure exit: drop mmu_hash_lock and return to the caller */
.Lhash_page_out:
	eieio
	lis	r8, (mmu_hash_lock - PAGE_OFFSET)@ha
	li	r0,0
	stw	r0, (mmu_hash_lock - PAGE_OFFSET)@l(r8)
	blr
#endif /* CONFIG_SMP */
_ASM_NOKPROBE_SYMBOL(hash_page)

/*
 * Add an entry for a particular page to the hash table.
 *
 * add_hash_page(unsigned context, unsigned long va, unsigned long pmdval)
 *
 * In:	r3 = context, r4 = va, r5 = pmdval.  r5 is used as the base of
 *	the PTE page: the PTE index taken from va is inserted into it.
 *
 * We assume any necessary modifications to the pte (e.g. setting
 * the accessed bit) have already been done and that there is actually
 * a hash table in use (i.e. we're not on a 603).
 *
 * LR is saved at 4(r1) around the call to create_hpte.  The MSR value
 * on entry is kept in r9 and restored before returning.  On SMP the
 * mmu_hash_lock is held from before the linux PTE is updated until
 * after create_hpte returns.  If _PAGE_HASHPTE is already set in the
 * linux PTE, create_hpte is not called.
 */
_GLOBAL(add_hash_page)
	mflr	r0
	stw	r0,4(r1)

#ifdef CONFIG_SMP
	/* Fetched while data translation is still on; r2 is not converted */
	lwz	r8,TASK_CPU(r2)		/* to go in mmu_hash_lock */
	oris	r8,r8,12
#endif /* CONFIG_SMP */

	/*
	 * We disable interrupts here, even on UP, because we don't
	 * want to race with hash_page, and because we want the
	 * _PAGE_HASHPTE bit to be a reliable indication of whether
	 * the HPTE exists (or at least whether one did once).
	 * We also turn off the MMU for data accesses so that
	 * we can't take a hash table miss (assuming the code is
	 * covered by a BAT).  -- paulus
	 */
	mfmsr	r9
	rlwinm	r0,r9,0,17,15		/* clear bit 16 (MSR_EE) */
	rlwinm	r0,r0,0,28,26		/* clear MSR_DR */
	mtmsr	r0
	isync

#ifdef CONFIG_SMP
	lis	r6, (mmu_hash_lock - PAGE_OFFSET)@ha
	addi	r6, r6, (mmu_hash_lock - PAGE_OFFSET)@l
10:	lwarx	r0,0,r6			/* take the mmu_hash_lock */
	cmpi	0,r0,0
	bne-	11f
	stwcx.	r8,0,r6
	beq+	12f
11:	lwz	r0,0(r6)		/* spin with plain loads while held */
	cmpi	0,r0,0
	beq	10b
	b	11b
12:	isync
#endif

	/*
	 * Fetch the linux pte and test and set _PAGE_HASHPTE atomically.
	 * If _PAGE_HASHPTE was already set, we don't replace the existing
	 * HPTE, so we just unlock and return.
	 */
	mr	r8,r5
#ifndef CONFIG_PTE_64BIT
	rlwimi	r8,r4,22,20,29
#else
	rlwimi	r8,r4,23,20,28
	addi	r8,r8,PTE_FLAGS_OFFSET
#endif
1:	lwarx	r6,0,r8
	andi.	r0,r6,_PAGE_HASHPTE
	bne	9f			/* if HASHPTE already set, done */
#ifdef CONFIG_PTE_64BIT
#ifdef CONFIG_SMP
	subf	r10,r6,r8		/* create false data dependency */
	subi	r10,r10,PTE_FLAGS_OFFSET
	lwzx	r10,r6,r10		/* Get upper PTE word */
#else
	lwz	r10,-PTE_FLAGS_OFFSET(r8)
#endif /* CONFIG_SMP */
#endif /* CONFIG_PTE_64BIT */
	ori	r5,r6,_PAGE_HASHPTE
	stwcx.	r5,0,r8
	bne-	1b

	/* Convert context and va to VSID */
	mulli	r3,r3,897*16		/* multiply context by context skew */
	rlwinm	r0,r4,4,28,31		/* get ESID (top 4 bits of va) */
	mulli	r0,r0,0x111		/* multiply by ESID skew */
	add	r3,r3,r0		/* note create_hpte trims to 24 bits */

	/* r3 = VSID, r4 = va, r5 = new PTE, r6 = old PTE, r10 = upper word */
	bl	create_hpte

9:
#ifdef CONFIG_SMP
	lis	r6, (mmu_hash_lock - PAGE_OFFSET)@ha
	addi	r6, r6, (mmu_hash_lock - PAGE_OFFSET)@l
	eieio
	li	r0,0
	stw	r0,0(r6)		/* clear mmu_hash_lock */
#endif

	/* reenable interrupts and DR */
	mtmsr	r9
	isync

	lwz	r0,4(r1)
	mtlr	r0
	blr
_ASM_NOKPROBE_SYMBOL(add_hash_page)

/*
 * This routine adds a hardware PTE to the hash table.
 * It is designed to be called with the MMU either on or off.
 * r3 contains the VSID, r4 contains the virtual address,
 * r5 contains the linux PTE, r6 contains the old value of the
 * linux PTE (before setting _PAGE_HASHPTE). r10 contains the
 * upper half of the PTE if CONFIG_PTE_64BIT.
 * On SMP, the caller should have the mmu_hash_lock held.
 * We assume that the caller has (or will) set the _PAGE_HASHPTE
 * bit in the linux PTE in memory.  The value passed in r6 should
 * be the old linux PTE value; if it doesn't have _PAGE_HASHPTE set
 * this routine will skip the search for an existing HPTE.
 * This procedure modifies r0, r3 - r6, r8, ctr, cr0.
 * When both PTEGs are full it also advances next_slot.
 *  -- paulus.
 *
 * For speed, 4 of the instructions get patched once the size and
 * physical address of the hash table are known.  These definitions
 * of Hash_base and Hash_bits below are for the early hash table.
 */
Hash_base = early_hash
Hash_bits = 12				/* e.g. 256kB hash table */
Hash_msk = (((1 << Hash_bits) - 1) * 64)

/* defines for the PTE format for 32-bit PPCs */
#define HPTE_SIZE	8
#define PTEG_SIZE	64
#define LG_PTEG_SIZE	6
#define LDPTEu		lwzu
#define LDPTE		lwz
#define STPTE		stw
#define CMPPTE		cmpw
#define PTE_H		0x40
#define PTE_V		0x80000000
#define TST_V(r)	rlwinm. r,r,0,0,0
#define SET_V(r)	oris r,r,PTE_V@h
/* The second argument of CLR_V is not used by this definition */
#define CLR_V(r,t)	rlwinm r,r,0,1,31

#define HASH_LEFT	31-(LG_PTEG_SIZE+Hash_bits-1)
#define HASH_RIGHT	31-LG_PTEG_SIZE

__REF
_GLOBAL(create_hpte)
	/* Convert linux-style PTE (r5) to low word of PPC-style PTE (r8) */
	rlwinm	r8,r5,32-9,30,30	/* _PAGE_RW -> PP msb */
	rlwinm	r0,r5,32-6,30,30	/* _PAGE_DIRTY -> PP msb */
	and	r8,r8,r0		/* writable if _RW & _DIRTY */
	rlwimi	r5,r5,32-1,30,30	/* _PAGE_USER -> PP msb */
	rlwimi	r5,r5,32-2,31,31	/* _PAGE_USER -> PP lsb */
	ori	r8,r8,0xe04		/* clear out reserved bits */
	andc	r8,r5,r8		/* PP = user? (rw&dirty? 1: 3): 0 */
BEGIN_FTR_SECTION
	rlwinm	r8,r8,0,~_PAGE_COHERENT	/* clear M (coherence not required) */
END_FTR_SECTION_IFCLR(CPU_FTR_NEED_COHERENT)
#ifdef CONFIG_PTE_64BIT
	/* Put the XPN bits into the PTE */
	rlwimi	r8,r10,8,20,22
	rlwimi	r8,r10,2,29,29
#endif

	/* Construct the high word of the PPC-style PTE (r5) */
	rlwinm	r5,r3,7,1,24		/* put VSID in 0x7fffff80 bits */
	rlwimi	r5,r4,10,26,31		/* put in API (abbrev page index) */
	SET_V(r5)			/* set V (valid) bit */

	patch_site	0f, patch__hash_page_A0
	patch_site	1f, patch__hash_page_A1
	patch_site	2f, patch__hash_page_A2
	/* Get the address of the primary PTE group in the hash table (r3) */
0:	lis	r0, (Hash_base - PAGE_OFFSET)@h	/* base address of hash table */
1:	rlwimi	r0,r3,LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT    /* VSID -> hash */
2:	rlwinm	r3,r4,20+LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT /* PI -> hash */
	xor	r3,r3,r0		/* make primary hash */
	li	r0,8			/* PTEs/group */

	/*
	 * Test the _PAGE_HASHPTE bit in the old linux PTE, and skip the search
	 * if it is clear, meaning that the HPTE isn't there already...
	 */
	andi.	r6,r6,_PAGE_HASHPTE
	beq+	10f			/* no PTE: go look for an empty slot */
	tlbie	r4

	/* Search the primary PTEG for a PTE whose 1st (d)word matches r5 */
	mtctr	r0
	addi	r4,r3,-HPTE_SIZE	/* pre-decrement for the update-form load */
1:	LDPTEu	r6,HPTE_SIZE(r4)	/* get next PTE */
	CMPPTE	0,r6,r5
	bdnzf	2,1b			/* loop while ctr != 0 && !cr0.eq */
	beq+	.Lfound_slot

	patch_site	0f, patch__hash_page_B
	/* Search the secondary PTEG for a matching PTE */
	ori	r5,r5,PTE_H		/* set H (secondary hash) bit */
0:	xoris	r4,r3,Hash_msk>>16	/* compute secondary hash */
	xori	r4,r4,(-PTEG_SIZE & 0xffff)
	addi	r4,r4,-HPTE_SIZE
	mtctr	r0
2:	LDPTEu	r6,HPTE_SIZE(r4)
	CMPPTE	0,r6,r5
	bdnzf	2,2b
	beq+	.Lfound_slot
	xori	r5,r5,PTE_H		/* clear H bit again */

	/* Search the primary PTEG for an empty slot */
10:	mtctr	r0
	addi	r4,r3,-HPTE_SIZE	/* search primary PTEG */
1:	LDPTEu	r6,HPTE_SIZE(r4)	/* get next PTE */
	TST_V(r6)			/* test valid bit */
	bdnzf	2,1b			/* loop while ctr != 0 && !cr0.eq */
	beq+	.Lfound_empty

	patch_site	0f, patch__hash_page_C
	/* Search the secondary PTEG for an empty slot */
	ori	r5,r5,PTE_H		/* set H (secondary hash) bit */
0:	xoris	r4,r3,Hash_msk>>16	/* compute secondary hash */
	xori	r4,r4,(-PTEG_SIZE & 0xffff)
	addi	r4,r4,-HPTE_SIZE
	mtctr	r0
2:	LDPTEu	r6,HPTE_SIZE(r4)
	TST_V(r6)
	bdnzf	2,2b
	beq+	.Lfound_empty
	xori	r5,r5,PTE_H		/* clear H bit again */

	/*
	 * Choose an arbitrary slot in the primary PTEG to overwrite.
	 * Since both the primary and secondary PTEGs are full, and we
	 * have no information that the PTEs in the primary PTEG are
	 * more important or useful than those in the secondary PTEG,
	 * and we know there is a definite (although small) speed
	 * advantage to putting the PTE in the primary PTEG, we always
	 * put the PTE in the primary PTEG.
	 */

	lis	r4, (next_slot - PAGE_OFFSET)@ha	/* get next evict slot */
	lwz	r6, (next_slot - PAGE_OFFSET)@l(r4)
	addi	r6,r6,HPTE_SIZE			/* search for candidate */
	andi.	r6,r6,7*HPTE_SIZE		/* wrap within the 8-entry PTEG */
	/*
	 * Store through the same @l expression as the load above so that
	 * the displacement always pairs with the @ha value held in r4.
	 */
	stw	r6, (next_slot - PAGE_OFFSET)@l(r4)
	add	r4,r3,r6

#ifndef CONFIG_SMP
	/* Store PTE in PTEG */
.Lfound_empty:
	STPTE	r5,0(r4)
.Lfound_slot:
	STPTE	r8,HPTE_SIZE/2(r4)

#else /* CONFIG_SMP */
/*
 * Between the tlbie above and updating the hash table entry below,
 * another CPU could read the hash table entry and put it in its TLB.
 * There are 3 cases:
 * 1. using an empty slot
 * 2. updating an earlier entry to change permissions (i.e. enable write)
 * 3. taking over the PTE for an unrelated address
 *
 * In each case it doesn't really matter if the other CPUs have the old
 * PTE in their TLB.  So we don't need to bother with another tlbie here,
 * which is convenient as we've overwritten the register that had the
 * address. :-)  The tlbie above is mainly to make sure that this CPU comes
 * and gets the new PTE from the hash table.
 *
 * We do however have to make sure that the PTE is never in an invalid
 * state with the V bit set.
 */
.Lfound_empty:
.Lfound_slot:
	CLR_V(r5,r0)		/* clear V (valid) bit in PTE */
	STPTE	r5,0(r4)
	sync
	TLBSYNC
	STPTE	r8,HPTE_SIZE/2(r4) /* put in correct RPN, WIMG, PP bits */
	sync
	SET_V(r5)
	STPTE	r5,0(r4)	/* finally set V bit in PTE */
#endif /* CONFIG_SMP */

	sync		/* make sure pte updates get to memory */
	blr
	.previous
_ASM_NOKPROBE_SYMBOL(create_hpte)

45717312f25SChristophe Leroy	.section .bss
45817312f25SChristophe Leroy	.align	2
45917312f25SChristophe Leroynext_slot:
46017312f25SChristophe Leroy	.space	4
46117312f25SChristophe Leroy	.previous
46217312f25SChristophe Leroy
/*
 * Flush the entry for a particular page from the hash table.
 *
 * flush_hash_pages(unsigned context, unsigned long va, unsigned long pmdval,
 *		    int count)
 *
 * In:	r3 = context, r4 = va, r5 = pmdval (base of the PTE page; the
 *	PTE index taken from va is inserted into it), r6 = count of
 *	consecutive pages to examine.
 *
 * We assume that there is a hash table in use (Hash != 0).
 *
 * Register use: r10 = MSR on entry (restored on exit), r9 = address of
 * mmu_hash_lock (SMP only), r11 = high word of the HPTE being searched
 * for, r8 = primary PTEG address, r12 = search cursor, cr1 = result of
 * comparing the remaining count with 1.  r0, r3 - r6, ctr and cr0 are
 * modified as well.
 *
 * The VSID (r3) and the HPTE high word (r11) are computed once, from the
 * first page found with _PAGE_HASHPTE set, and reused for the remaining
 * pages.  NOTE(review): this presumes the range does not cross into a
 * page with a different VSID or API -- confirm against the callers.
 */
__REF
_GLOBAL(flush_hash_pages)
	/*
	 * We disable interrupts here, even on UP, because we want
	 * the _PAGE_HASHPTE bit to be a reliable indication of
	 * whether the HPTE exists (or at least whether one did once).
	 * We also turn off the MMU for data accesses so that
	 * we can't take a hash table miss (assuming the code is
	 * covered by a BAT).  -- paulus
	 */
	mfmsr	r10
	rlwinm	r0,r10,0,17,15		/* clear bit 16 (MSR_EE) */
	rlwinm	r0,r0,0,28,26		/* clear MSR_DR */
	mtmsr	r0
	isync

	/* First find a PTE in the range that has _PAGE_HASHPTE set */
#ifndef CONFIG_PTE_64BIT
	rlwimi	r5,r4,22,20,29
#else
	rlwimi	r5,r4,23,20,28
#endif
1:	lwz	r0,PTE_FLAGS_OFFSET(r5)
	cmpwi	cr1,r6,1
	andi.	r0,r0,_PAGE_HASHPTE
	bne	2f
	ble	cr1,19f			/* nothing hashed: exit, lock not taken */
	addi	r4,r4,0x1000
	addi	r5,r5,PTE_SIZE
	addi	r6,r6,-1
	b	1b

	/* Convert context and va to VSID */
2:	mulli	r3,r3,897*16		/* multiply context by context skew */
	rlwinm	r0,r4,4,28,31		/* get ESID (top 4 bits of va) */
	mulli	r0,r0,0x111		/* multiply by ESID skew */
	add	r3,r3,r0		/* note code below trims to 24 bits */

	/* Construct the high word of the PPC-style PTE (r11) */
	rlwinm	r11,r3,7,1,24		/* put VSID in 0x7fffff80 bits */
	rlwimi	r11,r4,10,26,31		/* put in API (abbrev page index) */
	SET_V(r11)			/* set V (valid) bit */

#ifdef CONFIG_SMP
	lis	r9, (mmu_hash_lock - PAGE_OFFSET)@ha
	addi	r9, r9, (mmu_hash_lock - PAGE_OFFSET)@l
	tophys	(r8, r2)		/* MSR_DR is off: convert r2 first */
	lwz	r8, TASK_CPU(r8)
	oris	r8,r8,9			/* value written into the lock word */
10:	lwarx	r0,0,r9
	cmpi	0,r0,0
	bne-	11f
	stwcx.	r8,0,r9
	beq+	12f
11:	lwz	r0,0(r9)		/* spin with plain loads while held */
	cmpi	0,r0,0
	beq	10b
	b	11b
12:	isync
#endif

	/*
	 * Check the _PAGE_HASHPTE bit in the linux PTE.  If it is
	 * already clear, we're done (for this pte).  If not,
	 * clear it (atomically) and proceed.  -- paulus.
	 */
#if (PTE_FLAGS_OFFSET != 0)
	addi	r5,r5,PTE_FLAGS_OFFSET	/* r5 addresses the flags word from here on */
#endif
33:	lwarx	r8,0,r5			/* fetch the pte flags word */
	andi.	r0,r8,_PAGE_HASHPTE
	beq	8f			/* done if HASHPTE is already clear */
	rlwinm	r8,r8,0,31,29		/* clear HASHPTE bit */
	stwcx.	r8,0,r5			/* update the pte */
	bne-	33b

	patch_site	0f, patch__flush_hash_A0
	patch_site	1f, patch__flush_hash_A1
	patch_site	2f, patch__flush_hash_A2
	/* Get the address of the primary PTE group in the hash table (r8) */
0:	lis	r8, (Hash_base - PAGE_OFFSET)@h	/* base address of hash table */
1:	rlwimi	r8,r3,LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT    /* VSID -> hash */
2:	rlwinm	r0,r4,20+LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT /* PI -> hash */
	xor	r8,r0,r8		/* make primary hash */

	/* Search the primary PTEG for a PTE whose 1st (d)word matches r11 */
	li	r0,8			/* PTEs/group */
	mtctr	r0
	addi	r12,r8,-HPTE_SIZE
1:	LDPTEu	r0,HPTE_SIZE(r12)	/* get next PTE */
	CMPPTE	0,r0,r11
	bdnzf	2,1b			/* loop while ctr != 0 && !cr0.eq */
	beq+	3f

	patch_site	0f, patch__flush_hash_B
	/* Search the secondary PTEG for a matching PTE */
	ori	r11,r11,PTE_H		/* set H (secondary hash) bit */
	li	r0,8			/* PTEs/group */
0:	xoris	r12,r8,Hash_msk>>16	/* compute secondary hash */
	xori	r12,r12,(-PTEG_SIZE & 0xffff)
	addi	r12,r12,-HPTE_SIZE
	mtctr	r0
2:	LDPTEu	r0,HPTE_SIZE(r12)
	CMPPTE	0,r0,r11
	bdnzf	2,2b
	xori	r11,r11,PTE_H		/* clear H again; xori leaves cr0 intact */
	bne-	4f			/* should rarely fail to find it */

3:	li	r0,0
	STPTE	r0,0(r12)		/* invalidate entry */
4:	sync
	tlbie	r4			/* in hw tlb too */
	sync

8:	ble	cr1,9f			/* if all ptes checked */
81:	addi	r6,r6,-1
	addi	r5,r5,PTE_SIZE
	addi	r4,r4,0x1000
	lwz	r0,0(r5)		/* check next pte */
	cmpwi	cr1,r6,1
	andi.	r0,r0,_PAGE_HASHPTE
	bne	33b
	bgt	cr1,81b

9:
#ifdef CONFIG_SMP
	TLBSYNC
	li	r0,0
	stw	r0,0(r9)		/* clear mmu_hash_lock */
#endif

19:	mtmsr	r10			/* restore MSR (EE and DR) */
	isync
	blr
	.previous
EXPORT_SYMBOL(flush_hash_pages)
_ASM_NOKPROBE_SYMBOL(flush_hash_pages)
