147d99948SChristophe Leroy /*
247d99948SChristophe Leroy * Copyright IBM Corporation, 2013
347d99948SChristophe Leroy * Author Aneesh Kumar K.V <aneesh.kumar@linux.ibm.com>
447d99948SChristophe Leroy *
547d99948SChristophe Leroy * This program is free software; you can redistribute it and/or modify it
647d99948SChristophe Leroy * under the terms of version 2.1 of the GNU Lesser General Public License
747d99948SChristophe Leroy * as published by the Free Software Foundation.
847d99948SChristophe Leroy *
947d99948SChristophe Leroy * This program is distributed in the hope that it would be useful, but
1047d99948SChristophe Leroy * WITHOUT ANY WARRANTY; without even the implied warranty of
1147d99948SChristophe Leroy * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
1247d99948SChristophe Leroy *
1347d99948SChristophe Leroy */
1447d99948SChristophe Leroy
1547d99948SChristophe Leroy /*
1647d99948SChristophe Leroy * PPC64 THP Support for hash based MMUs
1747d99948SChristophe Leroy */
1847d99948SChristophe Leroy #include <linux/mm.h>
1947d99948SChristophe Leroy #include <asm/machdep.h>
2047d99948SChristophe Leroy
__hash_page_thp(unsigned long ea,unsigned long access,unsigned long vsid,pmd_t * pmdp,unsigned long trap,unsigned long flags,int ssize,unsigned int psize)2147d99948SChristophe Leroy int __hash_page_thp(unsigned long ea, unsigned long access, unsigned long vsid,
2247d99948SChristophe Leroy pmd_t *pmdp, unsigned long trap, unsigned long flags,
2347d99948SChristophe Leroy int ssize, unsigned int psize)
2447d99948SChristophe Leroy {
2547d99948SChristophe Leroy unsigned int index, valid;
2647d99948SChristophe Leroy unsigned char *hpte_slot_array;
2747d99948SChristophe Leroy unsigned long rflags, pa, hidx;
2847d99948SChristophe Leroy unsigned long old_pmd, new_pmd;
2947d99948SChristophe Leroy int ret, lpsize = MMU_PAGE_16M;
3047d99948SChristophe Leroy unsigned long vpn, hash, shift, slot;
3147d99948SChristophe Leroy
3247d99948SChristophe Leroy /*
3347d99948SChristophe Leroy * atomically mark the linux large page PMD busy and dirty
3447d99948SChristophe Leroy */
3547d99948SChristophe Leroy do {
3647d99948SChristophe Leroy pmd_t pmd = READ_ONCE(*pmdp);
3747d99948SChristophe Leroy
3847d99948SChristophe Leroy old_pmd = pmd_val(pmd);
3947d99948SChristophe Leroy /* If PMD busy, retry the access */
4047d99948SChristophe Leroy if (unlikely(old_pmd & H_PAGE_BUSY))
4147d99948SChristophe Leroy return 0;
4247d99948SChristophe Leroy /* If PMD permissions don't match, take page fault */
4347d99948SChristophe Leroy if (unlikely(!check_pte_access(access, old_pmd)))
4447d99948SChristophe Leroy return 1;
4547d99948SChristophe Leroy /*
4647d99948SChristophe Leroy * Try to lock the PTE, add ACCESSED and DIRTY if it was
4747d99948SChristophe Leroy * a write access
4847d99948SChristophe Leroy */
4947d99948SChristophe Leroy new_pmd = old_pmd | H_PAGE_BUSY | _PAGE_ACCESSED;
5047d99948SChristophe Leroy if (access & _PAGE_WRITE)
5147d99948SChristophe Leroy new_pmd |= _PAGE_DIRTY;
5247d99948SChristophe Leroy } while (!pmd_xchg(pmdp, __pmd(old_pmd), __pmd(new_pmd)));
5347d99948SChristophe Leroy
5447d99948SChristophe Leroy /*
5547d99948SChristophe Leroy * Make sure this is thp or devmap entry
5647d99948SChristophe Leroy */
5747d99948SChristophe Leroy if (!(old_pmd & (H_PAGE_THP_HUGE | _PAGE_DEVMAP)))
5847d99948SChristophe Leroy return 0;
5947d99948SChristophe Leroy
60*d94b827eSAneesh Kumar K.V rflags = htab_convert_pte_flags(new_pmd, flags);
6147d99948SChristophe Leroy
6247d99948SChristophe Leroy #if 0
6347d99948SChristophe Leroy if (!cpu_has_feature(CPU_FTR_COHERENT_ICACHE)) {
6447d99948SChristophe Leroy
6547d99948SChristophe Leroy /*
6647d99948SChristophe Leroy * No CPU has hugepages but lacks no execute, so we
6747d99948SChristophe Leroy * don't need to worry about that case
6847d99948SChristophe Leroy */
6947d99948SChristophe Leroy rflags = hash_page_do_lazy_icache(rflags, __pte(old_pte), trap);
7047d99948SChristophe Leroy }
7147d99948SChristophe Leroy #endif
7247d99948SChristophe Leroy /*
7347d99948SChristophe Leroy * Find the slot index details for this ea, using base page size.
7447d99948SChristophe Leroy */
7547d99948SChristophe Leroy shift = mmu_psize_defs[psize].shift;
7647d99948SChristophe Leroy index = (ea & ~HPAGE_PMD_MASK) >> shift;
7747d99948SChristophe Leroy BUG_ON(index >= PTE_FRAG_SIZE);
7847d99948SChristophe Leroy
7947d99948SChristophe Leroy vpn = hpt_vpn(ea, vsid, ssize);
8047d99948SChristophe Leroy hpte_slot_array = get_hpte_slot_array(pmdp);
8147d99948SChristophe Leroy if (psize == MMU_PAGE_4K) {
8247d99948SChristophe Leroy /*
8347d99948SChristophe Leroy * invalidate the old hpte entry if we have that mapped via 64K
8447d99948SChristophe Leroy * base page size. This is because demote_segment won't flush
8547d99948SChristophe Leroy * hash page table entries.
8647d99948SChristophe Leroy */
8747d99948SChristophe Leroy if ((old_pmd & H_PAGE_HASHPTE) && !(old_pmd & H_PAGE_COMBO)) {
8847d99948SChristophe Leroy flush_hash_hugepage(vsid, ea, pmdp, MMU_PAGE_64K,
8947d99948SChristophe Leroy ssize, flags);
9047d99948SChristophe Leroy /*
9147d99948SChristophe Leroy * With THP, we also clear the slot information with
9247d99948SChristophe Leroy * respect to all the 64K hash pte mapping the 16MB
9347d99948SChristophe Leroy * page. They are all invalid now. This make sure we
9447d99948SChristophe Leroy * don't find the slot valid when we fault with 4k
9547d99948SChristophe Leroy * base page size.
9647d99948SChristophe Leroy *
9747d99948SChristophe Leroy */
9847d99948SChristophe Leroy memset(hpte_slot_array, 0, PTE_FRAG_SIZE);
9947d99948SChristophe Leroy }
10047d99948SChristophe Leroy }
10147d99948SChristophe Leroy
10247d99948SChristophe Leroy valid = hpte_valid(hpte_slot_array, index);
10347d99948SChristophe Leroy if (valid) {
10447d99948SChristophe Leroy /* update the hpte bits */
10547d99948SChristophe Leroy hash = hpt_hash(vpn, shift, ssize);
10647d99948SChristophe Leroy hidx = hpte_hash_index(hpte_slot_array, index);
10747d99948SChristophe Leroy if (hidx & _PTEIDX_SECONDARY)
10847d99948SChristophe Leroy hash = ~hash;
10947d99948SChristophe Leroy slot = (hash & htab_hash_mask) * HPTES_PER_GROUP;
11047d99948SChristophe Leroy slot += hidx & _PTEIDX_GROUP_IX;
11147d99948SChristophe Leroy
11247d99948SChristophe Leroy ret = mmu_hash_ops.hpte_updatepp(slot, rflags, vpn,
11347d99948SChristophe Leroy psize, lpsize, ssize, flags);
11447d99948SChristophe Leroy /*
11547d99948SChristophe Leroy * We failed to update, try to insert a new entry.
11647d99948SChristophe Leroy */
11747d99948SChristophe Leroy if (ret == -1) {
11847d99948SChristophe Leroy /*
11947d99948SChristophe Leroy * large pte is marked busy, so we can be sure
12047d99948SChristophe Leroy * nobody is looking at hpte_slot_array. hence we can
12147d99948SChristophe Leroy * safely update this here.
12247d99948SChristophe Leroy */
12347d99948SChristophe Leroy valid = 0;
12447d99948SChristophe Leroy hpte_slot_array[index] = 0;
12547d99948SChristophe Leroy }
12647d99948SChristophe Leroy }
12747d99948SChristophe Leroy
12847d99948SChristophe Leroy if (!valid) {
12947d99948SChristophe Leroy unsigned long hpte_group;
13047d99948SChristophe Leroy
13147d99948SChristophe Leroy hash = hpt_hash(vpn, shift, ssize);
13247d99948SChristophe Leroy /* insert new entry */
13347d99948SChristophe Leroy pa = pmd_pfn(__pmd(old_pmd)) << PAGE_SHIFT;
13447d99948SChristophe Leroy new_pmd |= H_PAGE_HASHPTE;
13547d99948SChristophe Leroy
13647d99948SChristophe Leroy repeat:
13747d99948SChristophe Leroy hpte_group = (hash & htab_hash_mask) * HPTES_PER_GROUP;
13847d99948SChristophe Leroy
13947d99948SChristophe Leroy /* Insert into the hash table, primary slot */
14047d99948SChristophe Leroy slot = mmu_hash_ops.hpte_insert(hpte_group, vpn, pa, rflags, 0,
14147d99948SChristophe Leroy psize, lpsize, ssize);
14247d99948SChristophe Leroy /*
14347d99948SChristophe Leroy * Primary is full, try the secondary
14447d99948SChristophe Leroy */
14547d99948SChristophe Leroy if (unlikely(slot == -1)) {
14647d99948SChristophe Leroy hpte_group = (~hash & htab_hash_mask) * HPTES_PER_GROUP;
14747d99948SChristophe Leroy slot = mmu_hash_ops.hpte_insert(hpte_group, vpn, pa,
14847d99948SChristophe Leroy rflags,
14947d99948SChristophe Leroy HPTE_V_SECONDARY,
15047d99948SChristophe Leroy psize, lpsize, ssize);
15147d99948SChristophe Leroy if (slot == -1) {
15247d99948SChristophe Leroy if (mftb() & 0x1)
15347d99948SChristophe Leroy hpte_group = (hash & htab_hash_mask) *
15447d99948SChristophe Leroy HPTES_PER_GROUP;
15547d99948SChristophe Leroy
15647d99948SChristophe Leroy mmu_hash_ops.hpte_remove(hpte_group);
15747d99948SChristophe Leroy goto repeat;
15847d99948SChristophe Leroy }
15947d99948SChristophe Leroy }
16047d99948SChristophe Leroy /*
16147d99948SChristophe Leroy * Hypervisor failure. Restore old pmd and return -1
16247d99948SChristophe Leroy * similar to __hash_page_*
16347d99948SChristophe Leroy */
16447d99948SChristophe Leroy if (unlikely(slot == -2)) {
16547d99948SChristophe Leroy *pmdp = __pmd(old_pmd);
16647d99948SChristophe Leroy hash_failure_debug(ea, access, vsid, trap, ssize,
16747d99948SChristophe Leroy psize, lpsize, old_pmd);
16847d99948SChristophe Leroy return -1;
16947d99948SChristophe Leroy }
17047d99948SChristophe Leroy /*
17147d99948SChristophe Leroy * large pte is marked busy, so we can be sure
17247d99948SChristophe Leroy * nobody is looking at hpte_slot_array. hence we can
17347d99948SChristophe Leroy * safely update this here.
17447d99948SChristophe Leroy */
17547d99948SChristophe Leroy mark_hpte_slot_valid(hpte_slot_array, index, slot);
17647d99948SChristophe Leroy }
17747d99948SChristophe Leroy /*
17847d99948SChristophe Leroy * Mark the pte with H_PAGE_COMBO, if we are trying to hash it with
17947d99948SChristophe Leroy * base page size 4k.
18047d99948SChristophe Leroy */
18147d99948SChristophe Leroy if (psize == MMU_PAGE_4K)
18247d99948SChristophe Leroy new_pmd |= H_PAGE_COMBO;
18347d99948SChristophe Leroy /*
18447d99948SChristophe Leroy * The hpte valid is stored in the pgtable whose address is in the
18547d99948SChristophe Leroy * second half of the PMD. Order this against clearing of the busy bit in
18647d99948SChristophe Leroy * huge pmd.
18747d99948SChristophe Leroy */
18847d99948SChristophe Leroy smp_wmb();
18947d99948SChristophe Leroy *pmdp = __pmd(new_pmd & ~H_PAGE_BUSY);
19047d99948SChristophe Leroy return 0;
19147d99948SChristophe Leroy }
192