1ac41aaeeSGreg Kroah-Hartman // SPDX-License-Identifier: GPL-2.0
23610cce8SMartin Schwidefsky /*
3388186bcSChristian Borntraeger * Copyright IBM Corp. 2007, 2011
43610cce8SMartin Schwidefsky * Author(s): Martin Schwidefsky <schwidefsky@de.ibm.com>
53610cce8SMartin Schwidefsky */
63610cce8SMartin Schwidefsky
73610cce8SMartin Schwidefsky #include <linux/sched.h>
83610cce8SMartin Schwidefsky #include <linux/kernel.h>
93610cce8SMartin Schwidefsky #include <linux/errno.h>
105a0e3ad6STejun Heo #include <linux/gfp.h>
113610cce8SMartin Schwidefsky #include <linux/mm.h>
123610cce8SMartin Schwidefsky #include <linux/swap.h>
133610cce8SMartin Schwidefsky #include <linux/smp.h>
143610cce8SMartin Schwidefsky #include <linux/spinlock.h>
1580217147SMartin Schwidefsky #include <linux/rcupdate.h>
16e5992f2eSMartin Schwidefsky #include <linux/slab.h>
17b31288faSKonstantin Weitz #include <linux/swapops.h>
180b46e0a3SMartin Schwidefsky #include <linux/sysctl.h>
193ac8e380SDominik Dingel #include <linux/ksm.h>
203ac8e380SDominik Dingel #include <linux/mman.h>
213610cce8SMartin Schwidefsky
223610cce8SMartin Schwidefsky #include <asm/tlb.h>
233610cce8SMartin Schwidefsky #include <asm/tlbflush.h>
246252d702SMartin Schwidefsky #include <asm/mmu_context.h>
252d42f947SClaudio Imbrenda #include <asm/page-states.h>
263610cce8SMartin Schwidefsky
pgprot_writecombine(pgprot_t prot)27b02002ccSNiklas Schnelle pgprot_t pgprot_writecombine(pgprot_t prot)
28b02002ccSNiklas Schnelle {
29b02002ccSNiklas Schnelle /*
30b02002ccSNiklas Schnelle * mio_wb_bit_mask may be set on a different CPU, but it is only set
31b02002ccSNiklas Schnelle * once at init and only read afterwards.
32b02002ccSNiklas Schnelle */
33b02002ccSNiklas Schnelle return __pgprot(pgprot_val(prot) | mio_wb_bit_mask);
34b02002ccSNiklas Schnelle }
35b02002ccSNiklas Schnelle EXPORT_SYMBOL_GPL(pgprot_writecombine);
36b02002ccSNiklas Schnelle
pgprot_writethrough(pgprot_t prot)37b02002ccSNiklas Schnelle pgprot_t pgprot_writethrough(pgprot_t prot)
38b02002ccSNiklas Schnelle {
39b02002ccSNiklas Schnelle /*
40b02002ccSNiklas Schnelle * mio_wb_bit_mask may be set on a different CPU, but it is only set
41b02002ccSNiklas Schnelle * once at init and only read afterwards.
42b02002ccSNiklas Schnelle */
43b02002ccSNiklas Schnelle return __pgprot(pgprot_val(prot) & ~mio_wb_bit_mask);
44b02002ccSNiklas Schnelle }
45b02002ccSNiklas Schnelle EXPORT_SYMBOL_GPL(pgprot_writethrough);
46b02002ccSNiklas Schnelle
ptep_ipte_local(struct mm_struct * mm,unsigned long addr,pte_t * ptep,int nodat)47118bd31bSMartin Schwidefsky static inline void ptep_ipte_local(struct mm_struct *mm, unsigned long addr,
48cd774b90SMartin Schwidefsky pte_t *ptep, int nodat)
49118bd31bSMartin Schwidefsky {
50118bd31bSMartin Schwidefsky unsigned long opt, asce;
51118bd31bSMartin Schwidefsky
52118bd31bSMartin Schwidefsky if (MACHINE_HAS_TLB_GUEST) {
53118bd31bSMartin Schwidefsky opt = 0;
54118bd31bSMartin Schwidefsky asce = READ_ONCE(mm->context.gmap_asce);
55cd774b90SMartin Schwidefsky if (asce == 0UL || nodat)
56118bd31bSMartin Schwidefsky opt |= IPTE_NODAT;
5728c807e5SMartin Schwidefsky if (asce != -1UL) {
5828c807e5SMartin Schwidefsky asce = asce ? : mm->context.asce;
5928c807e5SMartin Schwidefsky opt |= IPTE_GUEST_ASCE;
6028c807e5SMartin Schwidefsky }
6128c807e5SMartin Schwidefsky __ptep_ipte(addr, ptep, opt, asce, IPTE_LOCAL);
62118bd31bSMartin Schwidefsky } else {
6328c807e5SMartin Schwidefsky __ptep_ipte(addr, ptep, 0, 0, IPTE_LOCAL);
64118bd31bSMartin Schwidefsky }
65118bd31bSMartin Schwidefsky }
66118bd31bSMartin Schwidefsky
ptep_ipte_global(struct mm_struct * mm,unsigned long addr,pte_t * ptep,int nodat)67118bd31bSMartin Schwidefsky static inline void ptep_ipte_global(struct mm_struct *mm, unsigned long addr,
68cd774b90SMartin Schwidefsky pte_t *ptep, int nodat)
69118bd31bSMartin Schwidefsky {
70118bd31bSMartin Schwidefsky unsigned long opt, asce;
71118bd31bSMartin Schwidefsky
72118bd31bSMartin Schwidefsky if (MACHINE_HAS_TLB_GUEST) {
73118bd31bSMartin Schwidefsky opt = 0;
74118bd31bSMartin Schwidefsky asce = READ_ONCE(mm->context.gmap_asce);
75cd774b90SMartin Schwidefsky if (asce == 0UL || nodat)
76118bd31bSMartin Schwidefsky opt |= IPTE_NODAT;
7728c807e5SMartin Schwidefsky if (asce != -1UL) {
7828c807e5SMartin Schwidefsky asce = asce ? : mm->context.asce;
7928c807e5SMartin Schwidefsky opt |= IPTE_GUEST_ASCE;
8028c807e5SMartin Schwidefsky }
8128c807e5SMartin Schwidefsky __ptep_ipte(addr, ptep, opt, asce, IPTE_GLOBAL);
82118bd31bSMartin Schwidefsky } else {
8328c807e5SMartin Schwidefsky __ptep_ipte(addr, ptep, 0, 0, IPTE_GLOBAL);
84118bd31bSMartin Schwidefsky }
85118bd31bSMartin Schwidefsky }
86118bd31bSMartin Schwidefsky
ptep_flush_direct(struct mm_struct * mm,unsigned long addr,pte_t * ptep,int nodat)87ebde765cSMartin Schwidefsky static inline pte_t ptep_flush_direct(struct mm_struct *mm,
88cd774b90SMartin Schwidefsky unsigned long addr, pte_t *ptep,
89cd774b90SMartin Schwidefsky int nodat)
90ebde765cSMartin Schwidefsky {
91ebde765cSMartin Schwidefsky pte_t old;
92ebde765cSMartin Schwidefsky
93ebde765cSMartin Schwidefsky old = *ptep;
94ebde765cSMartin Schwidefsky if (unlikely(pte_val(old) & _PAGE_INVALID))
95ebde765cSMartin Schwidefsky return old;
9664f31d58SMartin Schwidefsky atomic_inc(&mm->context.flush_count);
9764f31d58SMartin Schwidefsky if (MACHINE_HAS_TLB_LC &&
98ebde765cSMartin Schwidefsky cpumask_equal(mm_cpumask(mm), cpumask_of(smp_processor_id())))
99cd774b90SMartin Schwidefsky ptep_ipte_local(mm, addr, ptep, nodat);
100ebde765cSMartin Schwidefsky else
101cd774b90SMartin Schwidefsky ptep_ipte_global(mm, addr, ptep, nodat);
10264f31d58SMartin Schwidefsky atomic_dec(&mm->context.flush_count);
103ebde765cSMartin Schwidefsky return old;
104ebde765cSMartin Schwidefsky }
105ebde765cSMartin Schwidefsky
ptep_flush_lazy(struct mm_struct * mm,unsigned long addr,pte_t * ptep,int nodat)106ebde765cSMartin Schwidefsky static inline pte_t ptep_flush_lazy(struct mm_struct *mm,
107cd774b90SMartin Schwidefsky unsigned long addr, pte_t *ptep,
108cd774b90SMartin Schwidefsky int nodat)
109ebde765cSMartin Schwidefsky {
110ebde765cSMartin Schwidefsky pte_t old;
111ebde765cSMartin Schwidefsky
112ebde765cSMartin Schwidefsky old = *ptep;
113ebde765cSMartin Schwidefsky if (unlikely(pte_val(old) & _PAGE_INVALID))
114ebde765cSMartin Schwidefsky return old;
11564f31d58SMartin Schwidefsky atomic_inc(&mm->context.flush_count);
11664f31d58SMartin Schwidefsky if (cpumask_equal(&mm->context.cpu_attach_mask,
11764f31d58SMartin Schwidefsky cpumask_of(smp_processor_id()))) {
118b8e3b379SHeiko Carstens set_pte(ptep, set_pte_bit(*ptep, __pgprot(_PAGE_INVALID)));
119ebde765cSMartin Schwidefsky mm->context.flush_mm = 1;
120ebde765cSMartin Schwidefsky } else
121cd774b90SMartin Schwidefsky ptep_ipte_global(mm, addr, ptep, nodat);
12264f31d58SMartin Schwidefsky atomic_dec(&mm->context.flush_count);
123ebde765cSMartin Schwidefsky return old;
124ebde765cSMartin Schwidefsky }
125ebde765cSMartin Schwidefsky
pgste_get_lock(pte_t * ptep)1261e133ab2SMartin Schwidefsky static inline pgste_t pgste_get_lock(pte_t *ptep)
1271e133ab2SMartin Schwidefsky {
1281e133ab2SMartin Schwidefsky unsigned long new = 0;
1291e133ab2SMartin Schwidefsky #ifdef CONFIG_PGSTE
1301e133ab2SMartin Schwidefsky unsigned long old;
1311e133ab2SMartin Schwidefsky
1321e133ab2SMartin Schwidefsky asm(
1331e133ab2SMartin Schwidefsky " lg %0,%2\n"
1341e133ab2SMartin Schwidefsky "0: lgr %1,%0\n"
1351e133ab2SMartin Schwidefsky " nihh %0,0xff7f\n" /* clear PCL bit in old */
1361e133ab2SMartin Schwidefsky " oihh %1,0x0080\n" /* set PCL bit in new */
1371e133ab2SMartin Schwidefsky " csg %0,%1,%2\n"
1381e133ab2SMartin Schwidefsky " jl 0b\n"
1391e133ab2SMartin Schwidefsky : "=&d" (old), "=&d" (new), "=Q" (ptep[PTRS_PER_PTE])
1401e133ab2SMartin Schwidefsky : "Q" (ptep[PTRS_PER_PTE]) : "cc", "memory");
1411e133ab2SMartin Schwidefsky #endif
1421e133ab2SMartin Schwidefsky return __pgste(new);
1431e133ab2SMartin Schwidefsky }
1441e133ab2SMartin Schwidefsky
pgste_set_unlock(pte_t * ptep,pgste_t pgste)1451e133ab2SMartin Schwidefsky static inline void pgste_set_unlock(pte_t *ptep, pgste_t pgste)
1461e133ab2SMartin Schwidefsky {
1471e133ab2SMartin Schwidefsky #ifdef CONFIG_PGSTE
1481e133ab2SMartin Schwidefsky asm(
1491e133ab2SMartin Schwidefsky " nihh %1,0xff7f\n" /* clear PCL bit */
1501e133ab2SMartin Schwidefsky " stg %1,%0\n"
1511e133ab2SMartin Schwidefsky : "=Q" (ptep[PTRS_PER_PTE])
1521e133ab2SMartin Schwidefsky : "d" (pgste_val(pgste)), "Q" (ptep[PTRS_PER_PTE])
1531e133ab2SMartin Schwidefsky : "cc", "memory");
1541e133ab2SMartin Schwidefsky #endif
1551e133ab2SMartin Schwidefsky }
1561e133ab2SMartin Schwidefsky
pgste_get(pte_t * ptep)1571e133ab2SMartin Schwidefsky static inline pgste_t pgste_get(pte_t *ptep)
1581e133ab2SMartin Schwidefsky {
1591e133ab2SMartin Schwidefsky unsigned long pgste = 0;
1601e133ab2SMartin Schwidefsky #ifdef CONFIG_PGSTE
1611e133ab2SMartin Schwidefsky pgste = *(unsigned long *)(ptep + PTRS_PER_PTE);
1621e133ab2SMartin Schwidefsky #endif
1631e133ab2SMartin Schwidefsky return __pgste(pgste);
1641e133ab2SMartin Schwidefsky }
1651e133ab2SMartin Schwidefsky
pgste_set(pte_t * ptep,pgste_t pgste)1661e133ab2SMartin Schwidefsky static inline void pgste_set(pte_t *ptep, pgste_t pgste)
1671e133ab2SMartin Schwidefsky {
1681e133ab2SMartin Schwidefsky #ifdef CONFIG_PGSTE
1691e133ab2SMartin Schwidefsky *(pgste_t *)(ptep + PTRS_PER_PTE) = pgste;
1701e133ab2SMartin Schwidefsky #endif
1711e133ab2SMartin Schwidefsky }
1721e133ab2SMartin Schwidefsky
pgste_update_all(pte_t pte,pgste_t pgste,struct mm_struct * mm)173ebde765cSMartin Schwidefsky static inline pgste_t pgste_update_all(pte_t pte, pgste_t pgste,
174ebde765cSMartin Schwidefsky struct mm_struct *mm)
175ebde765cSMartin Schwidefsky {
176ebde765cSMartin Schwidefsky #ifdef CONFIG_PGSTE
177ebde765cSMartin Schwidefsky unsigned long address, bits, skey;
178ebde765cSMartin Schwidefsky
17955531b74SJanosch Frank if (!mm_uses_skeys(mm) || pte_val(pte) & _PAGE_INVALID)
180ebde765cSMartin Schwidefsky return pgste;
181ebde765cSMartin Schwidefsky address = pte_val(pte) & PAGE_MASK;
182ebde765cSMartin Schwidefsky skey = (unsigned long) page_get_storage_key(address);
183ebde765cSMartin Schwidefsky bits = skey & (_PAGE_CHANGED | _PAGE_REFERENCED);
184ebde765cSMartin Schwidefsky /* Transfer page changed & referenced bit to guest bits in pgste */
185ebde765cSMartin Schwidefsky pgste_val(pgste) |= bits << 48; /* GR bit & GC bit */
186ebde765cSMartin Schwidefsky /* Copy page access key and fetch protection bit to pgste */
187ebde765cSMartin Schwidefsky pgste_val(pgste) &= ~(PGSTE_ACC_BITS | PGSTE_FP_BIT);
188ebde765cSMartin Schwidefsky pgste_val(pgste) |= (skey & (_PAGE_ACC_BITS | _PAGE_FP_BIT)) << 56;
189ebde765cSMartin Schwidefsky #endif
190ebde765cSMartin Schwidefsky return pgste;
191ebde765cSMartin Schwidefsky
192ebde765cSMartin Schwidefsky }
193ebde765cSMartin Schwidefsky
pgste_set_key(pte_t * ptep,pgste_t pgste,pte_t entry,struct mm_struct * mm)194ebde765cSMartin Schwidefsky static inline void pgste_set_key(pte_t *ptep, pgste_t pgste, pte_t entry,
195ebde765cSMartin Schwidefsky struct mm_struct *mm)
196ebde765cSMartin Schwidefsky {
197ebde765cSMartin Schwidefsky #ifdef CONFIG_PGSTE
198ebde765cSMartin Schwidefsky unsigned long address;
199ebde765cSMartin Schwidefsky unsigned long nkey;
200ebde765cSMartin Schwidefsky
20155531b74SJanosch Frank if (!mm_uses_skeys(mm) || pte_val(entry) & _PAGE_INVALID)
202ebde765cSMartin Schwidefsky return;
203ebde765cSMartin Schwidefsky VM_BUG_ON(!(pte_val(*ptep) & _PAGE_INVALID));
204ebde765cSMartin Schwidefsky address = pte_val(entry) & PAGE_MASK;
205ebde765cSMartin Schwidefsky /*
206ebde765cSMartin Schwidefsky * Set page access key and fetch protection bit from pgste.
207ebde765cSMartin Schwidefsky * The guest C/R information is still in the PGSTE, set real
208ebde765cSMartin Schwidefsky * key C/R to 0.
209ebde765cSMartin Schwidefsky */
210ebde765cSMartin Schwidefsky nkey = (pgste_val(pgste) & (PGSTE_ACC_BITS | PGSTE_FP_BIT)) >> 56;
211ebde765cSMartin Schwidefsky nkey |= (pgste_val(pgste) & (PGSTE_GR_BIT | PGSTE_GC_BIT)) >> 48;
212ebde765cSMartin Schwidefsky page_set_storage_key(address, nkey, 0);
213ebde765cSMartin Schwidefsky #endif
214ebde765cSMartin Schwidefsky }
215ebde765cSMartin Schwidefsky
pgste_set_pte(pte_t * ptep,pgste_t pgste,pte_t entry)216ebde765cSMartin Schwidefsky static inline pgste_t pgste_set_pte(pte_t *ptep, pgste_t pgste, pte_t entry)
217ebde765cSMartin Schwidefsky {
218ebde765cSMartin Schwidefsky #ifdef CONFIG_PGSTE
219ebde765cSMartin Schwidefsky if ((pte_val(entry) & _PAGE_PRESENT) &&
220ebde765cSMartin Schwidefsky (pte_val(entry) & _PAGE_WRITE) &&
221ebde765cSMartin Schwidefsky !(pte_val(entry) & _PAGE_INVALID)) {
222ebde765cSMartin Schwidefsky if (!MACHINE_HAS_ESOP) {
223ebde765cSMartin Schwidefsky /*
224ebde765cSMartin Schwidefsky * Without enhanced suppression-on-protection force
225ebde765cSMartin Schwidefsky * the dirty bit on for all writable ptes.
226ebde765cSMartin Schwidefsky */
2274a366f51SHeiko Carstens entry = set_pte_bit(entry, __pgprot(_PAGE_DIRTY));
2284a366f51SHeiko Carstens entry = clear_pte_bit(entry, __pgprot(_PAGE_PROTECT));
229ebde765cSMartin Schwidefsky }
230ebde765cSMartin Schwidefsky if (!(pte_val(entry) & _PAGE_PROTECT))
231ebde765cSMartin Schwidefsky /* This pte allows write access, set user-dirty */
232ebde765cSMartin Schwidefsky pgste_val(pgste) |= PGSTE_UC_BIT;
233ebde765cSMartin Schwidefsky }
234ebde765cSMartin Schwidefsky #endif
235b8e3b379SHeiko Carstens set_pte(ptep, entry);
236ebde765cSMartin Schwidefsky return pgste;
237ebde765cSMartin Schwidefsky }
238ebde765cSMartin Schwidefsky
pgste_pte_notify(struct mm_struct * mm,unsigned long addr,pte_t * ptep,pgste_t pgste)239b2d73b2aSMartin Schwidefsky static inline pgste_t pgste_pte_notify(struct mm_struct *mm,
240ebde765cSMartin Schwidefsky unsigned long addr,
241ebde765cSMartin Schwidefsky pte_t *ptep, pgste_t pgste)
242ebde765cSMartin Schwidefsky {
243ebde765cSMartin Schwidefsky #ifdef CONFIG_PGSTE
2444be130a0SMartin Schwidefsky unsigned long bits;
2454be130a0SMartin Schwidefsky
2464be130a0SMartin Schwidefsky bits = pgste_val(pgste) & (PGSTE_IN_BIT | PGSTE_VSIE_BIT);
2474be130a0SMartin Schwidefsky if (bits) {
2484be130a0SMartin Schwidefsky pgste_val(pgste) ^= bits;
2494be130a0SMartin Schwidefsky ptep_notify(mm, addr, ptep, bits);
250ebde765cSMartin Schwidefsky }
251ebde765cSMartin Schwidefsky #endif
252ebde765cSMartin Schwidefsky return pgste;
253ebde765cSMartin Schwidefsky }
254ebde765cSMartin Schwidefsky
ptep_xchg_start(struct mm_struct * mm,unsigned long addr,pte_t * ptep)255ebde765cSMartin Schwidefsky static inline pgste_t ptep_xchg_start(struct mm_struct *mm,
256ebde765cSMartin Schwidefsky unsigned long addr, pte_t *ptep)
257ebde765cSMartin Schwidefsky {
258ebde765cSMartin Schwidefsky pgste_t pgste = __pgste(0);
259ebde765cSMartin Schwidefsky
260ebde765cSMartin Schwidefsky if (mm_has_pgste(mm)) {
261ebde765cSMartin Schwidefsky pgste = pgste_get_lock(ptep);
262b2d73b2aSMartin Schwidefsky pgste = pgste_pte_notify(mm, addr, ptep, pgste);
263ebde765cSMartin Schwidefsky }
264ebde765cSMartin Schwidefsky return pgste;
265ebde765cSMartin Schwidefsky }
266ebde765cSMartin Schwidefsky
ptep_xchg_commit(struct mm_struct * mm,unsigned long addr,pte_t * ptep,pgste_t pgste,pte_t old,pte_t new)2670d6da872SChristian Borntraeger static inline pte_t ptep_xchg_commit(struct mm_struct *mm,
268ebde765cSMartin Schwidefsky unsigned long addr, pte_t *ptep,
269ebde765cSMartin Schwidefsky pgste_t pgste, pte_t old, pte_t new)
270ebde765cSMartin Schwidefsky {
271ebde765cSMartin Schwidefsky if (mm_has_pgste(mm)) {
272ebde765cSMartin Schwidefsky if (pte_val(old) & _PAGE_INVALID)
273ebde765cSMartin Schwidefsky pgste_set_key(ptep, pgste, new, mm);
274ebde765cSMartin Schwidefsky if (pte_val(new) & _PAGE_INVALID) {
275ebde765cSMartin Schwidefsky pgste = pgste_update_all(old, pgste, mm);
276ebde765cSMartin Schwidefsky if ((pgste_val(pgste) & _PGSTE_GPS_USAGE_MASK) ==
277ebde765cSMartin Schwidefsky _PGSTE_GPS_USAGE_UNUSED)
2784a366f51SHeiko Carstens old = set_pte_bit(old, __pgprot(_PAGE_UNUSED));
279ebde765cSMartin Schwidefsky }
280ebde765cSMartin Schwidefsky pgste = pgste_set_pte(ptep, pgste, new);
281ebde765cSMartin Schwidefsky pgste_set_unlock(ptep, pgste);
282ebde765cSMartin Schwidefsky } else {
283b8e3b379SHeiko Carstens set_pte(ptep, new);
284ebde765cSMartin Schwidefsky }
2850d6da872SChristian Borntraeger return old;
286ebde765cSMartin Schwidefsky }
287ebde765cSMartin Schwidefsky
ptep_xchg_direct(struct mm_struct * mm,unsigned long addr,pte_t * ptep,pte_t new)288ebde765cSMartin Schwidefsky pte_t ptep_xchg_direct(struct mm_struct *mm, unsigned long addr,
289ebde765cSMartin Schwidefsky pte_t *ptep, pte_t new)
290ebde765cSMartin Schwidefsky {
291ebde765cSMartin Schwidefsky pgste_t pgste;
292ebde765cSMartin Schwidefsky pte_t old;
293cd774b90SMartin Schwidefsky int nodat;
294ebde765cSMartin Schwidefsky
295a9809407SMartin Schwidefsky preempt_disable();
296ebde765cSMartin Schwidefsky pgste = ptep_xchg_start(mm, addr, ptep);
297cd774b90SMartin Schwidefsky nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
298cd774b90SMartin Schwidefsky old = ptep_flush_direct(mm, addr, ptep, nodat);
2990d6da872SChristian Borntraeger old = ptep_xchg_commit(mm, addr, ptep, pgste, old, new);
300a9809407SMartin Schwidefsky preempt_enable();
301ebde765cSMartin Schwidefsky return old;
302ebde765cSMartin Schwidefsky }
303ebde765cSMartin Schwidefsky EXPORT_SYMBOL(ptep_xchg_direct);
304ebde765cSMartin Schwidefsky
3050807b856SGerald Schaefer /*
3060807b856SGerald Schaefer * Caller must check that new PTE only differs in _PAGE_PROTECT HW bit, so that
3070807b856SGerald Schaefer * RDP can be used instead of IPTE. See also comments at pte_allow_rdp().
3080807b856SGerald Schaefer */
ptep_reset_dat_prot(struct mm_struct * mm,unsigned long addr,pte_t * ptep,pte_t new)3090807b856SGerald Schaefer void ptep_reset_dat_prot(struct mm_struct *mm, unsigned long addr, pte_t *ptep,
3100807b856SGerald Schaefer pte_t new)
3110807b856SGerald Schaefer {
3120807b856SGerald Schaefer preempt_disable();
3130807b856SGerald Schaefer atomic_inc(&mm->context.flush_count);
3140807b856SGerald Schaefer if (cpumask_equal(mm_cpumask(mm), cpumask_of(smp_processor_id())))
3150807b856SGerald Schaefer __ptep_rdp(addr, ptep, 0, 0, 1);
3160807b856SGerald Schaefer else
3170807b856SGerald Schaefer __ptep_rdp(addr, ptep, 0, 0, 0);
3180807b856SGerald Schaefer /*
3190807b856SGerald Schaefer * PTE is not invalidated by RDP, only _PAGE_PROTECT is cleared. That
3200807b856SGerald Schaefer * means it is still valid and active, and must not be changed according
3210807b856SGerald Schaefer * to the architecture. But writing a new value that only differs in SW
3220807b856SGerald Schaefer * bits is allowed.
3230807b856SGerald Schaefer */
3240807b856SGerald Schaefer set_pte(ptep, new);
3250807b856SGerald Schaefer atomic_dec(&mm->context.flush_count);
3260807b856SGerald Schaefer preempt_enable();
3270807b856SGerald Schaefer }
3280807b856SGerald Schaefer EXPORT_SYMBOL(ptep_reset_dat_prot);
3290807b856SGerald Schaefer
ptep_xchg_lazy(struct mm_struct * mm,unsigned long addr,pte_t * ptep,pte_t new)330ebde765cSMartin Schwidefsky pte_t ptep_xchg_lazy(struct mm_struct *mm, unsigned long addr,
331ebde765cSMartin Schwidefsky pte_t *ptep, pte_t new)
332ebde765cSMartin Schwidefsky {
333ebde765cSMartin Schwidefsky pgste_t pgste;
334ebde765cSMartin Schwidefsky pte_t old;
335cd774b90SMartin Schwidefsky int nodat;
336ebde765cSMartin Schwidefsky
337a9809407SMartin Schwidefsky preempt_disable();
338ebde765cSMartin Schwidefsky pgste = ptep_xchg_start(mm, addr, ptep);
339cd774b90SMartin Schwidefsky nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
340cd774b90SMartin Schwidefsky old = ptep_flush_lazy(mm, addr, ptep, nodat);
3410d6da872SChristian Borntraeger old = ptep_xchg_commit(mm, addr, ptep, pgste, old, new);
342a9809407SMartin Schwidefsky preempt_enable();
343ebde765cSMartin Schwidefsky return old;
344ebde765cSMartin Schwidefsky }
345ebde765cSMartin Schwidefsky EXPORT_SYMBOL(ptep_xchg_lazy);
346ebde765cSMartin Schwidefsky
ptep_modify_prot_start(struct vm_area_struct * vma,unsigned long addr,pte_t * ptep)3470cbe3e26SAneesh Kumar K.V pte_t ptep_modify_prot_start(struct vm_area_struct *vma, unsigned long addr,
348ebde765cSMartin Schwidefsky pte_t *ptep)
349ebde765cSMartin Schwidefsky {
350ebde765cSMartin Schwidefsky pgste_t pgste;
351ebde765cSMartin Schwidefsky pte_t old;
352cd774b90SMartin Schwidefsky int nodat;
3530cbe3e26SAneesh Kumar K.V struct mm_struct *mm = vma->vm_mm;
354ebde765cSMartin Schwidefsky
355a9809407SMartin Schwidefsky preempt_disable();
356ebde765cSMartin Schwidefsky pgste = ptep_xchg_start(mm, addr, ptep);
357cd774b90SMartin Schwidefsky nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
358cd774b90SMartin Schwidefsky old = ptep_flush_lazy(mm, addr, ptep, nodat);
359ebde765cSMartin Schwidefsky if (mm_has_pgste(mm)) {
360ebde765cSMartin Schwidefsky pgste = pgste_update_all(old, pgste, mm);
361ebde765cSMartin Schwidefsky pgste_set(ptep, pgste);
362ebde765cSMartin Schwidefsky }
363ebde765cSMartin Schwidefsky return old;
364ebde765cSMartin Schwidefsky }
365ebde765cSMartin Schwidefsky
ptep_modify_prot_commit(struct vm_area_struct * vma,unsigned long addr,pte_t * ptep,pte_t old_pte,pte_t pte)3660cbe3e26SAneesh Kumar K.V void ptep_modify_prot_commit(struct vm_area_struct *vma, unsigned long addr,
36704a86453SAneesh Kumar K.V pte_t *ptep, pte_t old_pte, pte_t pte)
368ebde765cSMartin Schwidefsky {
369ebde765cSMartin Schwidefsky pgste_t pgste;
3700cbe3e26SAneesh Kumar K.V struct mm_struct *mm = vma->vm_mm;
371ebde765cSMartin Schwidefsky
37257d7f939SMartin Schwidefsky if (!MACHINE_HAS_NX)
3734a366f51SHeiko Carstens pte = clear_pte_bit(pte, __pgprot(_PAGE_NOEXEC));
374ebde765cSMartin Schwidefsky if (mm_has_pgste(mm)) {
375ebde765cSMartin Schwidefsky pgste = pgste_get(ptep);
376ebde765cSMartin Schwidefsky pgste_set_key(ptep, pgste, pte, mm);
377ebde765cSMartin Schwidefsky pgste = pgste_set_pte(ptep, pgste, pte);
378ebde765cSMartin Schwidefsky pgste_set_unlock(ptep, pgste);
379ebde765cSMartin Schwidefsky } else {
380b8e3b379SHeiko Carstens set_pte(ptep, pte);
381ebde765cSMartin Schwidefsky }
382a9809407SMartin Schwidefsky preempt_enable();
383ebde765cSMartin Schwidefsky }
384ebde765cSMartin Schwidefsky
pmdp_idte_local(struct mm_struct * mm,unsigned long addr,pmd_t * pmdp)385118bd31bSMartin Schwidefsky static inline void pmdp_idte_local(struct mm_struct *mm,
386118bd31bSMartin Schwidefsky unsigned long addr, pmd_t *pmdp)
387118bd31bSMartin Schwidefsky {
388118bd31bSMartin Schwidefsky if (MACHINE_HAS_TLB_GUEST)
38928c807e5SMartin Schwidefsky __pmdp_idte(addr, pmdp, IDTE_NODAT | IDTE_GUEST_ASCE,
39028c807e5SMartin Schwidefsky mm->context.asce, IDTE_LOCAL);
391118bd31bSMartin Schwidefsky else
39228c807e5SMartin Schwidefsky __pmdp_idte(addr, pmdp, 0, 0, IDTE_LOCAL);
393a9e00d83SJanosch Frank if (mm_has_pgste(mm) && mm->context.allow_gmap_hpage_1m)
3946a376277SJanosch Frank gmap_pmdp_idte_local(mm, addr);
395118bd31bSMartin Schwidefsky }
396118bd31bSMartin Schwidefsky
pmdp_idte_global(struct mm_struct * mm,unsigned long addr,pmd_t * pmdp)397118bd31bSMartin Schwidefsky static inline void pmdp_idte_global(struct mm_struct *mm,
398118bd31bSMartin Schwidefsky unsigned long addr, pmd_t *pmdp)
399118bd31bSMartin Schwidefsky {
4006a376277SJanosch Frank if (MACHINE_HAS_TLB_GUEST) {
40128c807e5SMartin Schwidefsky __pmdp_idte(addr, pmdp, IDTE_NODAT | IDTE_GUEST_ASCE,
40228c807e5SMartin Schwidefsky mm->context.asce, IDTE_GLOBAL);
403a9e00d83SJanosch Frank if (mm_has_pgste(mm) && mm->context.allow_gmap_hpage_1m)
4046a376277SJanosch Frank gmap_pmdp_idte_global(mm, addr);
4056a376277SJanosch Frank } else if (MACHINE_HAS_IDTE) {
40628c807e5SMartin Schwidefsky __pmdp_idte(addr, pmdp, 0, 0, IDTE_GLOBAL);
407a9e00d83SJanosch Frank if (mm_has_pgste(mm) && mm->context.allow_gmap_hpage_1m)
4086a376277SJanosch Frank gmap_pmdp_idte_global(mm, addr);
4096a376277SJanosch Frank } else {
410118bd31bSMartin Schwidefsky __pmdp_csp(pmdp);
411a9e00d83SJanosch Frank if (mm_has_pgste(mm) && mm->context.allow_gmap_hpage_1m)
4126a376277SJanosch Frank gmap_pmdp_csp(mm, addr);
4136a376277SJanosch Frank }
414118bd31bSMartin Schwidefsky }
415118bd31bSMartin Schwidefsky
pmdp_flush_direct(struct mm_struct * mm,unsigned long addr,pmd_t * pmdp)416227be799SMartin Schwidefsky static inline pmd_t pmdp_flush_direct(struct mm_struct *mm,
417227be799SMartin Schwidefsky unsigned long addr, pmd_t *pmdp)
418227be799SMartin Schwidefsky {
419227be799SMartin Schwidefsky pmd_t old;
420227be799SMartin Schwidefsky
421227be799SMartin Schwidefsky old = *pmdp;
422227be799SMartin Schwidefsky if (pmd_val(old) & _SEGMENT_ENTRY_INVALID)
423227be799SMartin Schwidefsky return old;
42464f31d58SMartin Schwidefsky atomic_inc(&mm->context.flush_count);
42564f31d58SMartin Schwidefsky if (MACHINE_HAS_TLB_LC &&
426227be799SMartin Schwidefsky cpumask_equal(mm_cpumask(mm), cpumask_of(smp_processor_id())))
427118bd31bSMartin Schwidefsky pmdp_idte_local(mm, addr, pmdp);
428227be799SMartin Schwidefsky else
429118bd31bSMartin Schwidefsky pmdp_idte_global(mm, addr, pmdp);
43064f31d58SMartin Schwidefsky atomic_dec(&mm->context.flush_count);
431227be799SMartin Schwidefsky return old;
432227be799SMartin Schwidefsky }
433227be799SMartin Schwidefsky
pmdp_flush_lazy(struct mm_struct * mm,unsigned long addr,pmd_t * pmdp)434227be799SMartin Schwidefsky static inline pmd_t pmdp_flush_lazy(struct mm_struct *mm,
435227be799SMartin Schwidefsky unsigned long addr, pmd_t *pmdp)
436227be799SMartin Schwidefsky {
437227be799SMartin Schwidefsky pmd_t old;
438227be799SMartin Schwidefsky
439227be799SMartin Schwidefsky old = *pmdp;
440227be799SMartin Schwidefsky if (pmd_val(old) & _SEGMENT_ENTRY_INVALID)
441227be799SMartin Schwidefsky return old;
44264f31d58SMartin Schwidefsky atomic_inc(&mm->context.flush_count);
44364f31d58SMartin Schwidefsky if (cpumask_equal(&mm->context.cpu_attach_mask,
44464f31d58SMartin Schwidefsky cpumask_of(smp_processor_id()))) {
445b8e3b379SHeiko Carstens set_pmd(pmdp, set_pmd_bit(*pmdp, __pgprot(_SEGMENT_ENTRY_INVALID)));
446227be799SMartin Schwidefsky mm->context.flush_mm = 1;
4476a376277SJanosch Frank if (mm_has_pgste(mm))
4486a376277SJanosch Frank gmap_pmdp_invalidate(mm, addr);
449118bd31bSMartin Schwidefsky } else {
450118bd31bSMartin Schwidefsky pmdp_idte_global(mm, addr, pmdp);
451118bd31bSMartin Schwidefsky }
45264f31d58SMartin Schwidefsky atomic_dec(&mm->context.flush_count);
453227be799SMartin Schwidefsky return old;
454227be799SMartin Schwidefsky }
455227be799SMartin Schwidefsky
45681a8f2beSThomas Huth #ifdef CONFIG_PGSTE
pmd_lookup(struct mm_struct * mm,unsigned long addr,pmd_t ** pmdp)457949f5c12SDavid Hildenbrand static int pmd_lookup(struct mm_struct *mm, unsigned long addr, pmd_t **pmdp)
458637ff9efSJanosch Frank {
459949f5c12SDavid Hildenbrand struct vm_area_struct *vma;
460637ff9efSJanosch Frank pgd_t *pgd;
461637ff9efSJanosch Frank p4d_t *p4d;
462637ff9efSJanosch Frank pud_t *pud;
463949f5c12SDavid Hildenbrand
464949f5c12SDavid Hildenbrand /* We need a valid VMA, otherwise this is clearly a fault. */
465949f5c12SDavid Hildenbrand vma = vma_lookup(mm, addr);
466949f5c12SDavid Hildenbrand if (!vma)
467949f5c12SDavid Hildenbrand return -EFAULT;
468637ff9efSJanosch Frank
469637ff9efSJanosch Frank pgd = pgd_offset(mm, addr);
470949f5c12SDavid Hildenbrand if (!pgd_present(*pgd))
471949f5c12SDavid Hildenbrand return -ENOENT;
472949f5c12SDavid Hildenbrand
473949f5c12SDavid Hildenbrand p4d = p4d_offset(pgd, addr);
474949f5c12SDavid Hildenbrand if (!p4d_present(*p4d))
475949f5c12SDavid Hildenbrand return -ENOENT;
476949f5c12SDavid Hildenbrand
477949f5c12SDavid Hildenbrand pud = pud_offset(p4d, addr);
478949f5c12SDavid Hildenbrand if (!pud_present(*pud))
479949f5c12SDavid Hildenbrand return -ENOENT;
480949f5c12SDavid Hildenbrand
481949f5c12SDavid Hildenbrand /* Large PUDs are not supported yet. */
482*907835e6SPeter Xu if (pud_leaf(*pud))
483949f5c12SDavid Hildenbrand return -EFAULT;
484949f5c12SDavid Hildenbrand
485949f5c12SDavid Hildenbrand *pmdp = pmd_offset(pud, addr);
486949f5c12SDavid Hildenbrand return 0;
487637ff9efSJanosch Frank }
48881a8f2beSThomas Huth #endif
489637ff9efSJanosch Frank
pmdp_xchg_direct(struct mm_struct * mm,unsigned long addr,pmd_t * pmdp,pmd_t new)490227be799SMartin Schwidefsky pmd_t pmdp_xchg_direct(struct mm_struct *mm, unsigned long addr,
491227be799SMartin Schwidefsky pmd_t *pmdp, pmd_t new)
492227be799SMartin Schwidefsky {
493227be799SMartin Schwidefsky pmd_t old;
494227be799SMartin Schwidefsky
495a9809407SMartin Schwidefsky preempt_disable();
496227be799SMartin Schwidefsky old = pmdp_flush_direct(mm, addr, pmdp);
497b8e3b379SHeiko Carstens set_pmd(pmdp, new);
498a9809407SMartin Schwidefsky preempt_enable();
499227be799SMartin Schwidefsky return old;
500227be799SMartin Schwidefsky }
501227be799SMartin Schwidefsky EXPORT_SYMBOL(pmdp_xchg_direct);
502227be799SMartin Schwidefsky
pmdp_xchg_lazy(struct mm_struct * mm,unsigned long addr,pmd_t * pmdp,pmd_t new)503227be799SMartin Schwidefsky pmd_t pmdp_xchg_lazy(struct mm_struct *mm, unsigned long addr,
504227be799SMartin Schwidefsky pmd_t *pmdp, pmd_t new)
505227be799SMartin Schwidefsky {
506227be799SMartin Schwidefsky pmd_t old;
507227be799SMartin Schwidefsky
508a9809407SMartin Schwidefsky preempt_disable();
509227be799SMartin Schwidefsky old = pmdp_flush_lazy(mm, addr, pmdp);
510b8e3b379SHeiko Carstens set_pmd(pmdp, new);
511a9809407SMartin Schwidefsky preempt_enable();
512227be799SMartin Schwidefsky return old;
513227be799SMartin Schwidefsky }
514227be799SMartin Schwidefsky EXPORT_SYMBOL(pmdp_xchg_lazy);
515227be799SMartin Schwidefsky
pudp_idte_local(struct mm_struct * mm,unsigned long addr,pud_t * pudp)516118bd31bSMartin Schwidefsky static inline void pudp_idte_local(struct mm_struct *mm,
517118bd31bSMartin Schwidefsky unsigned long addr, pud_t *pudp)
518118bd31bSMartin Schwidefsky {
519118bd31bSMartin Schwidefsky if (MACHINE_HAS_TLB_GUEST)
52028c807e5SMartin Schwidefsky __pudp_idte(addr, pudp, IDTE_NODAT | IDTE_GUEST_ASCE,
52128c807e5SMartin Schwidefsky mm->context.asce, IDTE_LOCAL);
522118bd31bSMartin Schwidefsky else
52328c807e5SMartin Schwidefsky __pudp_idte(addr, pudp, 0, 0, IDTE_LOCAL);
524118bd31bSMartin Schwidefsky }
525118bd31bSMartin Schwidefsky
pudp_idte_global(struct mm_struct * mm,unsigned long addr,pud_t * pudp)526118bd31bSMartin Schwidefsky static inline void pudp_idte_global(struct mm_struct *mm,
527118bd31bSMartin Schwidefsky unsigned long addr, pud_t *pudp)
528118bd31bSMartin Schwidefsky {
529118bd31bSMartin Schwidefsky if (MACHINE_HAS_TLB_GUEST)
53028c807e5SMartin Schwidefsky __pudp_idte(addr, pudp, IDTE_NODAT | IDTE_GUEST_ASCE,
53128c807e5SMartin Schwidefsky mm->context.asce, IDTE_GLOBAL);
532118bd31bSMartin Schwidefsky else if (MACHINE_HAS_IDTE)
53328c807e5SMartin Schwidefsky __pudp_idte(addr, pudp, 0, 0, IDTE_GLOBAL);
534118bd31bSMartin Schwidefsky else
535118bd31bSMartin Schwidefsky /*
536118bd31bSMartin Schwidefsky * Invalid bit position is the same for pmd and pud, so we can
537118bd31bSMartin Schwidefsky * re-use _pmd_csp() here
538118bd31bSMartin Schwidefsky */
539118bd31bSMartin Schwidefsky __pmdp_csp((pmd_t *) pudp);
540118bd31bSMartin Schwidefsky }
541118bd31bSMartin Schwidefsky
pudp_flush_direct(struct mm_struct * mm,unsigned long addr,pud_t * pudp)542d08de8e2SGerald Schaefer static inline pud_t pudp_flush_direct(struct mm_struct *mm,
543d08de8e2SGerald Schaefer unsigned long addr, pud_t *pudp)
544d08de8e2SGerald Schaefer {
545d08de8e2SGerald Schaefer pud_t old;
546d08de8e2SGerald Schaefer
547d08de8e2SGerald Schaefer old = *pudp;
548d08de8e2SGerald Schaefer if (pud_val(old) & _REGION_ENTRY_INVALID)
549d08de8e2SGerald Schaefer return old;
550d08de8e2SGerald Schaefer atomic_inc(&mm->context.flush_count);
551d08de8e2SGerald Schaefer if (MACHINE_HAS_TLB_LC &&
552d08de8e2SGerald Schaefer cpumask_equal(mm_cpumask(mm), cpumask_of(smp_processor_id())))
553118bd31bSMartin Schwidefsky pudp_idte_local(mm, addr, pudp);
554d08de8e2SGerald Schaefer else
555118bd31bSMartin Schwidefsky pudp_idte_global(mm, addr, pudp);
556d08de8e2SGerald Schaefer atomic_dec(&mm->context.flush_count);
557d08de8e2SGerald Schaefer return old;
558d08de8e2SGerald Schaefer }
559d08de8e2SGerald Schaefer
pudp_xchg_direct(struct mm_struct * mm,unsigned long addr,pud_t * pudp,pud_t new)560d08de8e2SGerald Schaefer pud_t pudp_xchg_direct(struct mm_struct *mm, unsigned long addr,
561d08de8e2SGerald Schaefer pud_t *pudp, pud_t new)
562d08de8e2SGerald Schaefer {
563d08de8e2SGerald Schaefer pud_t old;
564d08de8e2SGerald Schaefer
565d08de8e2SGerald Schaefer preempt_disable();
566d08de8e2SGerald Schaefer old = pudp_flush_direct(mm, addr, pudp);
567b8e3b379SHeiko Carstens set_pud(pudp, new);
568d08de8e2SGerald Schaefer preempt_enable();
569d08de8e2SGerald Schaefer return old;
570d08de8e2SGerald Schaefer }
571d08de8e2SGerald Schaefer EXPORT_SYMBOL(pudp_xchg_direct);
572d08de8e2SGerald Schaefer
57375077afbSGerald Schaefer #ifdef CONFIG_TRANSPARENT_HUGEPAGE
pgtable_trans_huge_deposit(struct mm_struct * mm,pmd_t * pmdp,pgtable_t pgtable)5746b0b50b0SAneesh Kumar K.V void pgtable_trans_huge_deposit(struct mm_struct *mm, pmd_t *pmdp,
5756b0b50b0SAneesh Kumar K.V pgtable_t pgtable)
5769501d09fSGerald Schaefer {
5779501d09fSGerald Schaefer struct list_head *lh = (struct list_head *) pgtable;
5789501d09fSGerald Schaefer
579ec66ad66SMartin Schwidefsky assert_spin_locked(pmd_lockptr(mm, pmdp));
5809501d09fSGerald Schaefer
5819501d09fSGerald Schaefer /* FIFO */
582c389a250SKirill A. Shutemov if (!pmd_huge_pte(mm, pmdp))
5839501d09fSGerald Schaefer INIT_LIST_HEAD(lh);
5849501d09fSGerald Schaefer else
585c389a250SKirill A. Shutemov list_add(lh, (struct list_head *) pmd_huge_pte(mm, pmdp));
586c389a250SKirill A. Shutemov pmd_huge_pte(mm, pmdp) = pgtable;
5879501d09fSGerald Schaefer }
5889501d09fSGerald Schaefer
pgtable_trans_huge_withdraw(struct mm_struct * mm,pmd_t * pmdp)5896b0b50b0SAneesh Kumar K.V pgtable_t pgtable_trans_huge_withdraw(struct mm_struct *mm, pmd_t *pmdp)
5909501d09fSGerald Schaefer {
5919501d09fSGerald Schaefer struct list_head *lh;
5929501d09fSGerald Schaefer pgtable_t pgtable;
5939501d09fSGerald Schaefer pte_t *ptep;
5949501d09fSGerald Schaefer
595ec66ad66SMartin Schwidefsky assert_spin_locked(pmd_lockptr(mm, pmdp));
5969501d09fSGerald Schaefer
5979501d09fSGerald Schaefer /* FIFO */
598c389a250SKirill A. Shutemov pgtable = pmd_huge_pte(mm, pmdp);
5999501d09fSGerald Schaefer lh = (struct list_head *) pgtable;
6009501d09fSGerald Schaefer if (list_empty(lh))
601c389a250SKirill A. Shutemov pmd_huge_pte(mm, pmdp) = NULL;
6029501d09fSGerald Schaefer else {
603c389a250SKirill A. Shutemov pmd_huge_pte(mm, pmdp) = (pgtable_t) lh->next;
6049501d09fSGerald Schaefer list_del(lh);
6059501d09fSGerald Schaefer }
6069501d09fSGerald Schaefer ptep = (pte_t *) pgtable;
607b8e3b379SHeiko Carstens set_pte(ptep, __pte(_PAGE_INVALID));
6089501d09fSGerald Schaefer ptep++;
609b8e3b379SHeiko Carstens set_pte(ptep, __pte(_PAGE_INVALID));
6109501d09fSGerald Schaefer return pgtable;
6119501d09fSGerald Schaefer }
61275077afbSGerald Schaefer #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
6131e133ab2SMartin Schwidefsky
6141e133ab2SMartin Schwidefsky #ifdef CONFIG_PGSTE
ptep_set_pte_at(struct mm_struct * mm,unsigned long addr,pte_t * ptep,pte_t entry)6151e133ab2SMartin Schwidefsky void ptep_set_pte_at(struct mm_struct *mm, unsigned long addr,
6161e133ab2SMartin Schwidefsky pte_t *ptep, pte_t entry)
6171e133ab2SMartin Schwidefsky {
6181e133ab2SMartin Schwidefsky pgste_t pgste;
6191e133ab2SMartin Schwidefsky
6201e133ab2SMartin Schwidefsky /* the mm_has_pgste() check is done in set_pte_at() */
621a9809407SMartin Schwidefsky preempt_disable();
6221e133ab2SMartin Schwidefsky pgste = pgste_get_lock(ptep);
6231e133ab2SMartin Schwidefsky pgste_val(pgste) &= ~_PGSTE_GPS_ZERO;
6241e133ab2SMartin Schwidefsky pgste_set_key(ptep, pgste, entry, mm);
6251e133ab2SMartin Schwidefsky pgste = pgste_set_pte(ptep, pgste, entry);
6261e133ab2SMartin Schwidefsky pgste_set_unlock(ptep, pgste);
627a9809407SMartin Schwidefsky preempt_enable();
6281e133ab2SMartin Schwidefsky }
6291e133ab2SMartin Schwidefsky
ptep_set_notify(struct mm_struct * mm,unsigned long addr,pte_t * ptep)6301e133ab2SMartin Schwidefsky void ptep_set_notify(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
6311e133ab2SMartin Schwidefsky {
6321e133ab2SMartin Schwidefsky pgste_t pgste;
6331e133ab2SMartin Schwidefsky
634a9809407SMartin Schwidefsky preempt_disable();
6351e133ab2SMartin Schwidefsky pgste = pgste_get_lock(ptep);
6361e133ab2SMartin Schwidefsky pgste_val(pgste) |= PGSTE_IN_BIT;
6371e133ab2SMartin Schwidefsky pgste_set_unlock(ptep, pgste);
638a9809407SMartin Schwidefsky preempt_enable();
6391e133ab2SMartin Schwidefsky }
6401e133ab2SMartin Schwidefsky
641b2d73b2aSMartin Schwidefsky /**
642b2d73b2aSMartin Schwidefsky * ptep_force_prot - change access rights of a locked pte
643b2d73b2aSMartin Schwidefsky * @mm: pointer to the process mm_struct
644b2d73b2aSMartin Schwidefsky * @addr: virtual address in the guest address space
645b2d73b2aSMartin Schwidefsky * @ptep: pointer to the page table entry
646b2d73b2aSMartin Schwidefsky * @prot: indicates guest access rights: PROT_NONE, PROT_READ or PROT_WRITE
6474be130a0SMartin Schwidefsky * @bit: pgste bit to set (e.g. for notification)
648b2d73b2aSMartin Schwidefsky *
649b2d73b2aSMartin Schwidefsky * Returns 0 if the access rights were changed and -EAGAIN if the current
650b2d73b2aSMartin Schwidefsky * and requested access rights are incompatible.
651b2d73b2aSMartin Schwidefsky */
ptep_force_prot(struct mm_struct * mm,unsigned long addr,pte_t * ptep,int prot,unsigned long bit)652b2d73b2aSMartin Schwidefsky int ptep_force_prot(struct mm_struct *mm, unsigned long addr,
6534be130a0SMartin Schwidefsky pte_t *ptep, int prot, unsigned long bit)
654b2d73b2aSMartin Schwidefsky {
655b2d73b2aSMartin Schwidefsky pte_t entry;
656b2d73b2aSMartin Schwidefsky pgste_t pgste;
657cd774b90SMartin Schwidefsky int pte_i, pte_p, nodat;
658b2d73b2aSMartin Schwidefsky
659b2d73b2aSMartin Schwidefsky pgste = pgste_get_lock(ptep);
660b2d73b2aSMartin Schwidefsky entry = *ptep;
661b2d73b2aSMartin Schwidefsky /* Check pte entry after all locks have been acquired */
662b2d73b2aSMartin Schwidefsky pte_i = pte_val(entry) & _PAGE_INVALID;
663b2d73b2aSMartin Schwidefsky pte_p = pte_val(entry) & _PAGE_PROTECT;
664b2d73b2aSMartin Schwidefsky if ((pte_i && (prot != PROT_NONE)) ||
665b2d73b2aSMartin Schwidefsky (pte_p && (prot & PROT_WRITE))) {
666b2d73b2aSMartin Schwidefsky pgste_set_unlock(ptep, pgste);
667b2d73b2aSMartin Schwidefsky return -EAGAIN;
668b2d73b2aSMartin Schwidefsky }
6694be130a0SMartin Schwidefsky /* Change access rights and set pgste bit */
670cd774b90SMartin Schwidefsky nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
671b2d73b2aSMartin Schwidefsky if (prot == PROT_NONE && !pte_i) {
672cd774b90SMartin Schwidefsky ptep_flush_direct(mm, addr, ptep, nodat);
673b2d73b2aSMartin Schwidefsky pgste = pgste_update_all(entry, pgste, mm);
6744a366f51SHeiko Carstens entry = set_pte_bit(entry, __pgprot(_PAGE_INVALID));
675b2d73b2aSMartin Schwidefsky }
676b2d73b2aSMartin Schwidefsky if (prot == PROT_READ && !pte_p) {
677cd774b90SMartin Schwidefsky ptep_flush_direct(mm, addr, ptep, nodat);
6784a366f51SHeiko Carstens entry = clear_pte_bit(entry, __pgprot(_PAGE_INVALID));
6794a366f51SHeiko Carstens entry = set_pte_bit(entry, __pgprot(_PAGE_PROTECT));
680b2d73b2aSMartin Schwidefsky }
6814be130a0SMartin Schwidefsky pgste_val(pgste) |= bit;
682b2d73b2aSMartin Schwidefsky pgste = pgste_set_pte(ptep, pgste, entry);
683b2d73b2aSMartin Schwidefsky pgste_set_unlock(ptep, pgste);
684b2d73b2aSMartin Schwidefsky return 0;
685b2d73b2aSMartin Schwidefsky }
686b2d73b2aSMartin Schwidefsky
ptep_shadow_pte(struct mm_struct * mm,unsigned long saddr,pte_t * sptep,pte_t * tptep,pte_t pte)6874be130a0SMartin Schwidefsky int ptep_shadow_pte(struct mm_struct *mm, unsigned long saddr,
688a9d23e71SDavid Hildenbrand pte_t *sptep, pte_t *tptep, pte_t pte)
6894be130a0SMartin Schwidefsky {
6904be130a0SMartin Schwidefsky pgste_t spgste, tpgste;
6914be130a0SMartin Schwidefsky pte_t spte, tpte;
6924be130a0SMartin Schwidefsky int rc = -EAGAIN;
6934be130a0SMartin Schwidefsky
694a9d23e71SDavid Hildenbrand if (!(pte_val(*tptep) & _PAGE_INVALID))
695a9d23e71SDavid Hildenbrand return 0; /* already shadowed */
6964be130a0SMartin Schwidefsky spgste = pgste_get_lock(sptep);
6974be130a0SMartin Schwidefsky spte = *sptep;
6984be130a0SMartin Schwidefsky if (!(pte_val(spte) & _PAGE_INVALID) &&
699a9d23e71SDavid Hildenbrand !((pte_val(spte) & _PAGE_PROTECT) &&
700a9d23e71SDavid Hildenbrand !(pte_val(pte) & _PAGE_PROTECT))) {
7014be130a0SMartin Schwidefsky pgste_val(spgste) |= PGSTE_VSIE_BIT;
7024be130a0SMartin Schwidefsky tpgste = pgste_get_lock(tptep);
7034a366f51SHeiko Carstens tpte = __pte((pte_val(spte) & PAGE_MASK) |
7044a366f51SHeiko Carstens (pte_val(pte) & _PAGE_PROTECT));
7054be130a0SMartin Schwidefsky /* don't touch the storage key - it belongs to parent pgste */
7064be130a0SMartin Schwidefsky tpgste = pgste_set_pte(tptep, tpgste, tpte);
7074be130a0SMartin Schwidefsky pgste_set_unlock(tptep, tpgste);
708a9d23e71SDavid Hildenbrand rc = 1;
7094be130a0SMartin Schwidefsky }
7104be130a0SMartin Schwidefsky pgste_set_unlock(sptep, spgste);
7114be130a0SMartin Schwidefsky return rc;
7124be130a0SMartin Schwidefsky }
7134be130a0SMartin Schwidefsky
ptep_unshadow_pte(struct mm_struct * mm,unsigned long saddr,pte_t * ptep)7144be130a0SMartin Schwidefsky void ptep_unshadow_pte(struct mm_struct *mm, unsigned long saddr, pte_t *ptep)
7154be130a0SMartin Schwidefsky {
7164be130a0SMartin Schwidefsky pgste_t pgste;
717cd774b90SMartin Schwidefsky int nodat;
7184be130a0SMartin Schwidefsky
7194be130a0SMartin Schwidefsky pgste = pgste_get_lock(ptep);
7204be130a0SMartin Schwidefsky /* notifier is called by the caller */
721cd774b90SMartin Schwidefsky nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
722cd774b90SMartin Schwidefsky ptep_flush_direct(mm, saddr, ptep, nodat);
7234be130a0SMartin Schwidefsky /* don't touch the storage key - it belongs to parent pgste */
7244be130a0SMartin Schwidefsky pgste = pgste_set_pte(ptep, pgste, __pte(_PAGE_INVALID));
7254be130a0SMartin Schwidefsky pgste_set_unlock(ptep, pgste);
7264be130a0SMartin Schwidefsky }
7274be130a0SMartin Schwidefsky
ptep_zap_swap_entry(struct mm_struct * mm,swp_entry_t entry)7281e133ab2SMartin Schwidefsky static void ptep_zap_swap_entry(struct mm_struct *mm, swp_entry_t entry)
7291e133ab2SMartin Schwidefsky {
7301e133ab2SMartin Schwidefsky if (!non_swap_entry(entry))
7311e133ab2SMartin Schwidefsky dec_mm_counter(mm, MM_SWAPENTS);
7321e133ab2SMartin Schwidefsky else if (is_migration_entry(entry)) {
733af5cdaf8SAlistair Popple struct page *page = pfn_swap_entry_to_page(entry);
7341e133ab2SMartin Schwidefsky
7351e133ab2SMartin Schwidefsky dec_mm_counter(mm, mm_counter(page));
7361e133ab2SMartin Schwidefsky }
7371e133ab2SMartin Schwidefsky free_swap_and_cache(entry);
7381e133ab2SMartin Schwidefsky }
7391e133ab2SMartin Schwidefsky
ptep_zap_unused(struct mm_struct * mm,unsigned long addr,pte_t * ptep,int reset)7401e133ab2SMartin Schwidefsky void ptep_zap_unused(struct mm_struct *mm, unsigned long addr,
7411e133ab2SMartin Schwidefsky pte_t *ptep, int reset)
7421e133ab2SMartin Schwidefsky {
7431e133ab2SMartin Schwidefsky unsigned long pgstev;
7441e133ab2SMartin Schwidefsky pgste_t pgste;
7451e133ab2SMartin Schwidefsky pte_t pte;
7461e133ab2SMartin Schwidefsky
7471e133ab2SMartin Schwidefsky /* Zap unused and logically-zero pages */
748a9809407SMartin Schwidefsky preempt_disable();
7491e133ab2SMartin Schwidefsky pgste = pgste_get_lock(ptep);
7501e133ab2SMartin Schwidefsky pgstev = pgste_val(pgste);
7511e133ab2SMartin Schwidefsky pte = *ptep;
7521c343f7bSChristian Borntraeger if (!reset && pte_swap(pte) &&
7531e133ab2SMartin Schwidefsky ((pgstev & _PGSTE_GPS_USAGE_MASK) == _PGSTE_GPS_USAGE_UNUSED ||
7541e133ab2SMartin Schwidefsky (pgstev & _PGSTE_GPS_ZERO))) {
7551e133ab2SMartin Schwidefsky ptep_zap_swap_entry(mm, pte_to_swp_entry(pte));
7561e133ab2SMartin Schwidefsky pte_clear(mm, addr, ptep);
7571e133ab2SMartin Schwidefsky }
7581e133ab2SMartin Schwidefsky if (reset)
759bb356cc6SClaudio Imbrenda pgste_val(pgste) &= ~(_PGSTE_GPS_USAGE_MASK | _PGSTE_GPS_NODAT);
7601e133ab2SMartin Schwidefsky pgste_set_unlock(ptep, pgste);
761a9809407SMartin Schwidefsky preempt_enable();
7621e133ab2SMartin Schwidefsky }
7631e133ab2SMartin Schwidefsky
ptep_zap_key(struct mm_struct * mm,unsigned long addr,pte_t * ptep)7641e133ab2SMartin Schwidefsky void ptep_zap_key(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
7651e133ab2SMartin Schwidefsky {
7661e133ab2SMartin Schwidefsky unsigned long ptev;
7671e133ab2SMartin Schwidefsky pgste_t pgste;
7681e133ab2SMartin Schwidefsky
76997ca7bfcSChristian Borntraeger /* Clear storage key ACC and F, but set R/C */
770a9809407SMartin Schwidefsky preempt_disable();
7711e133ab2SMartin Schwidefsky pgste = pgste_get_lock(ptep);
77297ca7bfcSChristian Borntraeger pgste_val(pgste) &= ~(PGSTE_ACC_BITS | PGSTE_FP_BIT);
77397ca7bfcSChristian Borntraeger pgste_val(pgste) |= PGSTE_GR_BIT | PGSTE_GC_BIT;
7741e133ab2SMartin Schwidefsky ptev = pte_val(*ptep);
7751e133ab2SMartin Schwidefsky if (!(ptev & _PAGE_INVALID) && (ptev & _PAGE_WRITE))
7763ae11dbcSChristian Borntraeger page_set_storage_key(ptev & PAGE_MASK, PAGE_DEFAULT_KEY, 0);
7771e133ab2SMartin Schwidefsky pgste_set_unlock(ptep, pgste);
778a9809407SMartin Schwidefsky preempt_enable();
7791e133ab2SMartin Schwidefsky }
7801e133ab2SMartin Schwidefsky
7811e133ab2SMartin Schwidefsky /*
7821e133ab2SMartin Schwidefsky * Test and reset if a guest page is dirty
7831e133ab2SMartin Schwidefsky */
ptep_test_and_clear_uc(struct mm_struct * mm,unsigned long addr,pte_t * ptep)7840959e168SJanosch Frank bool ptep_test_and_clear_uc(struct mm_struct *mm, unsigned long addr,
7850959e168SJanosch Frank pte_t *ptep)
7861e133ab2SMartin Schwidefsky {
7871e133ab2SMartin Schwidefsky pgste_t pgste;
7881e133ab2SMartin Schwidefsky pte_t pte;
7891e133ab2SMartin Schwidefsky bool dirty;
790cd774b90SMartin Schwidefsky int nodat;
7911e133ab2SMartin Schwidefsky
7921e133ab2SMartin Schwidefsky pgste = pgste_get_lock(ptep);
7931e133ab2SMartin Schwidefsky dirty = !!(pgste_val(pgste) & PGSTE_UC_BIT);
7941e133ab2SMartin Schwidefsky pgste_val(pgste) &= ~PGSTE_UC_BIT;
7951e133ab2SMartin Schwidefsky pte = *ptep;
7961e133ab2SMartin Schwidefsky if (dirty && (pte_val(pte) & _PAGE_PRESENT)) {
797b2d73b2aSMartin Schwidefsky pgste = pgste_pte_notify(mm, addr, ptep, pgste);
798cd774b90SMartin Schwidefsky nodat = !!(pgste_val(pgste) & _PGSTE_GPS_NODAT);
799cd774b90SMartin Schwidefsky ptep_ipte_global(mm, addr, ptep, nodat);
8001e133ab2SMartin Schwidefsky if (MACHINE_HAS_ESOP || !(pte_val(pte) & _PAGE_WRITE))
8014a366f51SHeiko Carstens pte = set_pte_bit(pte, __pgprot(_PAGE_PROTECT));
8021e133ab2SMartin Schwidefsky else
8034a366f51SHeiko Carstens pte = set_pte_bit(pte, __pgprot(_PAGE_INVALID));
804b8e3b379SHeiko Carstens set_pte(ptep, pte);
8051e133ab2SMartin Schwidefsky }
8061e133ab2SMartin Schwidefsky pgste_set_unlock(ptep, pgste);
8071e133ab2SMartin Schwidefsky return dirty;
8081e133ab2SMartin Schwidefsky }
8090959e168SJanosch Frank EXPORT_SYMBOL_GPL(ptep_test_and_clear_uc);
8101e133ab2SMartin Schwidefsky
set_guest_storage_key(struct mm_struct * mm,unsigned long addr,unsigned char key,bool nq)8111e133ab2SMartin Schwidefsky int set_guest_storage_key(struct mm_struct *mm, unsigned long addr,
8121e133ab2SMartin Schwidefsky unsigned char key, bool nq)
8131e133ab2SMartin Schwidefsky {
814637ff9efSJanosch Frank unsigned long keyul, paddr;
8151e133ab2SMartin Schwidefsky spinlock_t *ptl;
8161e133ab2SMartin Schwidefsky pgste_t old, new;
817637ff9efSJanosch Frank pmd_t *pmdp;
8181e133ab2SMartin Schwidefsky pte_t *ptep;
8191e133ab2SMartin Schwidefsky
8207cb70266SDavid Hildenbrand /*
8217cb70266SDavid Hildenbrand * If we don't have a PTE table and if there is no huge page mapped,
8227cb70266SDavid Hildenbrand * we can ignore attempts to set the key to 0, because it already is 0.
8237cb70266SDavid Hildenbrand */
8247cb70266SDavid Hildenbrand switch (pmd_lookup(mm, addr, &pmdp)) {
8257cb70266SDavid Hildenbrand case -ENOENT:
8267cb70266SDavid Hildenbrand return key ? -EFAULT : 0;
8277cb70266SDavid Hildenbrand case 0:
8287cb70266SDavid Hildenbrand break;
8297cb70266SDavid Hildenbrand default:
830637ff9efSJanosch Frank return -EFAULT;
8317cb70266SDavid Hildenbrand }
8325c7f3bf0SHugh Dickins again:
833637ff9efSJanosch Frank ptl = pmd_lock(mm, pmdp);
834637ff9efSJanosch Frank if (!pmd_present(*pmdp)) {
835637ff9efSJanosch Frank spin_unlock(ptl);
8367cb70266SDavid Hildenbrand return key ? -EFAULT : 0;
837637ff9efSJanosch Frank }
838637ff9efSJanosch Frank
839637ff9efSJanosch Frank if (pmd_large(*pmdp)) {
840637ff9efSJanosch Frank paddr = pmd_val(*pmdp) & HPAGE_MASK;
841637ff9efSJanosch Frank paddr |= addr & ~HPAGE_MASK;
842637ff9efSJanosch Frank /*
843637ff9efSJanosch Frank * Huge pmds need quiescing operations, they are
844637ff9efSJanosch Frank * always mapped.
845637ff9efSJanosch Frank */
846637ff9efSJanosch Frank page_set_storage_key(paddr, key, 1);
847637ff9efSJanosch Frank spin_unlock(ptl);
848637ff9efSJanosch Frank return 0;
849637ff9efSJanosch Frank }
850637ff9efSJanosch Frank spin_unlock(ptl);
851637ff9efSJanosch Frank
8528318c404SDavid Hildenbrand ptep = pte_offset_map_lock(mm, pmdp, addr, &ptl);
8535c7f3bf0SHugh Dickins if (!ptep)
8545c7f3bf0SHugh Dickins goto again;
8551e133ab2SMartin Schwidefsky new = old = pgste_get_lock(ptep);
8561e133ab2SMartin Schwidefsky pgste_val(new) &= ~(PGSTE_GR_BIT | PGSTE_GC_BIT |
8571e133ab2SMartin Schwidefsky PGSTE_ACC_BITS | PGSTE_FP_BIT);
8581e133ab2SMartin Schwidefsky keyul = (unsigned long) key;
8591e133ab2SMartin Schwidefsky pgste_val(new) |= (keyul & (_PAGE_CHANGED | _PAGE_REFERENCED)) << 48;
8601e133ab2SMartin Schwidefsky pgste_val(new) |= (keyul & (_PAGE_ACC_BITS | _PAGE_FP_BIT)) << 56;
8611e133ab2SMartin Schwidefsky if (!(pte_val(*ptep) & _PAGE_INVALID)) {
862637ff9efSJanosch Frank unsigned long bits, skey;
8631e133ab2SMartin Schwidefsky
864637ff9efSJanosch Frank paddr = pte_val(*ptep) & PAGE_MASK;
865637ff9efSJanosch Frank skey = (unsigned long) page_get_storage_key(paddr);
8661e133ab2SMartin Schwidefsky bits = skey & (_PAGE_CHANGED | _PAGE_REFERENCED);
8671e133ab2SMartin Schwidefsky skey = key & (_PAGE_ACC_BITS | _PAGE_FP_BIT);
8681e133ab2SMartin Schwidefsky /* Set storage key ACC and FP */
869637ff9efSJanosch Frank page_set_storage_key(paddr, skey, !nq);
8701e133ab2SMartin Schwidefsky /* Merge host changed & referenced into pgste */
8711e133ab2SMartin Schwidefsky pgste_val(new) |= bits << 52;
8721e133ab2SMartin Schwidefsky }
8731e133ab2SMartin Schwidefsky /* changing the guest storage key is considered a change of the page */
8741e133ab2SMartin Schwidefsky if ((pgste_val(new) ^ pgste_val(old)) &
8751e133ab2SMartin Schwidefsky (PGSTE_ACC_BITS | PGSTE_FP_BIT | PGSTE_GR_BIT | PGSTE_GC_BIT))
8761e133ab2SMartin Schwidefsky pgste_val(new) |= PGSTE_UC_BIT;
8771e133ab2SMartin Schwidefsky
8781e133ab2SMartin Schwidefsky pgste_set_unlock(ptep, new);
8791e133ab2SMartin Schwidefsky pte_unmap_unlock(ptep, ptl);
8801e133ab2SMartin Schwidefsky return 0;
8811e133ab2SMartin Schwidefsky }
8821e133ab2SMartin Schwidefsky EXPORT_SYMBOL(set_guest_storage_key);
8831e133ab2SMartin Schwidefsky
8842e827528SHeiko Carstens /*
8851824c723SDavid Hildenbrand * Conditionally set a guest storage key (handling csske).
8861824c723SDavid Hildenbrand * oldkey will be updated when either mr or mc is set and a pointer is given.
8871824c723SDavid Hildenbrand *
8881824c723SDavid Hildenbrand * Returns 0 if a guests storage key update wasn't necessary, 1 if the guest
8891824c723SDavid Hildenbrand * storage key was updated and -EFAULT on access errors.
8901824c723SDavid Hildenbrand */
cond_set_guest_storage_key(struct mm_struct * mm,unsigned long addr,unsigned char key,unsigned char * oldkey,bool nq,bool mr,bool mc)8911824c723SDavid Hildenbrand int cond_set_guest_storage_key(struct mm_struct *mm, unsigned long addr,
8921824c723SDavid Hildenbrand unsigned char key, unsigned char *oldkey,
8931824c723SDavid Hildenbrand bool nq, bool mr, bool mc)
8941e133ab2SMartin Schwidefsky {
8951824c723SDavid Hildenbrand unsigned char tmp, mask = _PAGE_ACC_BITS | _PAGE_FP_BIT;
8961824c723SDavid Hildenbrand int rc;
8971824c723SDavid Hildenbrand
8981824c723SDavid Hildenbrand /* we can drop the pgste lock between getting and setting the key */
8991824c723SDavid Hildenbrand if (mr | mc) {
9001824c723SDavid Hildenbrand rc = get_guest_storage_key(current->mm, addr, &tmp);
9011824c723SDavid Hildenbrand if (rc)
9021824c723SDavid Hildenbrand return rc;
9031824c723SDavid Hildenbrand if (oldkey)
9041824c723SDavid Hildenbrand *oldkey = tmp;
9051824c723SDavid Hildenbrand if (!mr)
9061824c723SDavid Hildenbrand mask |= _PAGE_REFERENCED;
9071824c723SDavid Hildenbrand if (!mc)
9081824c723SDavid Hildenbrand mask |= _PAGE_CHANGED;
9091824c723SDavid Hildenbrand if (!((tmp ^ key) & mask))
9101824c723SDavid Hildenbrand return 0;
9111824c723SDavid Hildenbrand }
9121824c723SDavid Hildenbrand rc = set_guest_storage_key(current->mm, addr, key, nq);
9131824c723SDavid Hildenbrand return rc < 0 ? rc : 1;
9141824c723SDavid Hildenbrand }
9151824c723SDavid Hildenbrand EXPORT_SYMBOL(cond_set_guest_storage_key);
9161824c723SDavid Hildenbrand
9172e827528SHeiko Carstens /*
918a7e19ab5SDavid Hildenbrand * Reset a guest reference bit (rrbe), returning the reference and changed bit.
919a7e19ab5SDavid Hildenbrand *
920a7e19ab5SDavid Hildenbrand * Returns < 0 in case of error, otherwise the cc to be reported to the guest.
921a7e19ab5SDavid Hildenbrand */
reset_guest_reference_bit(struct mm_struct * mm,unsigned long addr)922a7e19ab5SDavid Hildenbrand int reset_guest_reference_bit(struct mm_struct *mm, unsigned long addr)
923a7e19ab5SDavid Hildenbrand {
924a7e19ab5SDavid Hildenbrand spinlock_t *ptl;
925637ff9efSJanosch Frank unsigned long paddr;
926a7e19ab5SDavid Hildenbrand pgste_t old, new;
927637ff9efSJanosch Frank pmd_t *pmdp;
928a7e19ab5SDavid Hildenbrand pte_t *ptep;
929a7e19ab5SDavid Hildenbrand int cc = 0;
930a7e19ab5SDavid Hildenbrand
93114ea40e2SDavid Hildenbrand /*
93214ea40e2SDavid Hildenbrand * If we don't have a PTE table and if there is no huge page mapped,
93314ea40e2SDavid Hildenbrand * the storage key is 0 and there is nothing for us to do.
93414ea40e2SDavid Hildenbrand */
93514ea40e2SDavid Hildenbrand switch (pmd_lookup(mm, addr, &pmdp)) {
93614ea40e2SDavid Hildenbrand case -ENOENT:
93714ea40e2SDavid Hildenbrand return 0;
93814ea40e2SDavid Hildenbrand case 0:
93914ea40e2SDavid Hildenbrand break;
94014ea40e2SDavid Hildenbrand default:
941637ff9efSJanosch Frank return -EFAULT;
94214ea40e2SDavid Hildenbrand }
9435c7f3bf0SHugh Dickins again:
944637ff9efSJanosch Frank ptl = pmd_lock(mm, pmdp);
945637ff9efSJanosch Frank if (!pmd_present(*pmdp)) {
946637ff9efSJanosch Frank spin_unlock(ptl);
94714ea40e2SDavid Hildenbrand return 0;
948637ff9efSJanosch Frank }
949637ff9efSJanosch Frank
950637ff9efSJanosch Frank if (pmd_large(*pmdp)) {
951637ff9efSJanosch Frank paddr = pmd_val(*pmdp) & HPAGE_MASK;
952637ff9efSJanosch Frank paddr |= addr & ~HPAGE_MASK;
953637ff9efSJanosch Frank cc = page_reset_referenced(paddr);
954637ff9efSJanosch Frank spin_unlock(ptl);
955637ff9efSJanosch Frank return cc;
956637ff9efSJanosch Frank }
957637ff9efSJanosch Frank spin_unlock(ptl);
958637ff9efSJanosch Frank
9598318c404SDavid Hildenbrand ptep = pte_offset_map_lock(mm, pmdp, addr, &ptl);
9605c7f3bf0SHugh Dickins if (!ptep)
9615c7f3bf0SHugh Dickins goto again;
962a7e19ab5SDavid Hildenbrand new = old = pgste_get_lock(ptep);
963a7e19ab5SDavid Hildenbrand /* Reset guest reference bit only */
964a7e19ab5SDavid Hildenbrand pgste_val(new) &= ~PGSTE_GR_BIT;
965a7e19ab5SDavid Hildenbrand
966a7e19ab5SDavid Hildenbrand if (!(pte_val(*ptep) & _PAGE_INVALID)) {
967637ff9efSJanosch Frank paddr = pte_val(*ptep) & PAGE_MASK;
968637ff9efSJanosch Frank cc = page_reset_referenced(paddr);
969a7e19ab5SDavid Hildenbrand /* Merge real referenced bit into host-set */
970a7e19ab5SDavid Hildenbrand pgste_val(new) |= ((unsigned long) cc << 53) & PGSTE_HR_BIT;
971a7e19ab5SDavid Hildenbrand }
972a7e19ab5SDavid Hildenbrand /* Reflect guest's logical view, not physical */
973a7e19ab5SDavid Hildenbrand cc |= (pgste_val(old) & (PGSTE_GR_BIT | PGSTE_GC_BIT)) >> 49;
974a7e19ab5SDavid Hildenbrand /* Changing the guest storage key is considered a change of the page */
975a7e19ab5SDavid Hildenbrand if ((pgste_val(new) ^ pgste_val(old)) & PGSTE_GR_BIT)
976a7e19ab5SDavid Hildenbrand pgste_val(new) |= PGSTE_UC_BIT;
977a7e19ab5SDavid Hildenbrand
978a7e19ab5SDavid Hildenbrand pgste_set_unlock(ptep, new);
979a7e19ab5SDavid Hildenbrand pte_unmap_unlock(ptep, ptl);
9804bead2a4SJanosch Frank return cc;
981a7e19ab5SDavid Hildenbrand }
982a7e19ab5SDavid Hildenbrand EXPORT_SYMBOL(reset_guest_reference_bit);
983a7e19ab5SDavid Hildenbrand
get_guest_storage_key(struct mm_struct * mm,unsigned long addr,unsigned char * key)984154c8c19SDavid Hildenbrand int get_guest_storage_key(struct mm_struct *mm, unsigned long addr,
985154c8c19SDavid Hildenbrand unsigned char *key)
9861e133ab2SMartin Schwidefsky {
987637ff9efSJanosch Frank unsigned long paddr;
9881e133ab2SMartin Schwidefsky spinlock_t *ptl;
9891e133ab2SMartin Schwidefsky pgste_t pgste;
990637ff9efSJanosch Frank pmd_t *pmdp;
9911e133ab2SMartin Schwidefsky pte_t *ptep;
9921e133ab2SMartin Schwidefsky
993949f5c12SDavid Hildenbrand /*
994949f5c12SDavid Hildenbrand * If we don't have a PTE table and if there is no huge page mapped,
995949f5c12SDavid Hildenbrand * the storage key is 0.
996949f5c12SDavid Hildenbrand */
997949f5c12SDavid Hildenbrand *key = 0;
998949f5c12SDavid Hildenbrand
999949f5c12SDavid Hildenbrand switch (pmd_lookup(mm, addr, &pmdp)) {
1000949f5c12SDavid Hildenbrand case -ENOENT:
1001949f5c12SDavid Hildenbrand return 0;
1002949f5c12SDavid Hildenbrand case 0:
1003949f5c12SDavid Hildenbrand break;
1004949f5c12SDavid Hildenbrand default:
1005637ff9efSJanosch Frank return -EFAULT;
1006949f5c12SDavid Hildenbrand }
10075c7f3bf0SHugh Dickins again:
1008637ff9efSJanosch Frank ptl = pmd_lock(mm, pmdp);
1009637ff9efSJanosch Frank if (!pmd_present(*pmdp)) {
1010637ff9efSJanosch Frank spin_unlock(ptl);
1011637ff9efSJanosch Frank return 0;
1012637ff9efSJanosch Frank }
1013637ff9efSJanosch Frank
1014637ff9efSJanosch Frank if (pmd_large(*pmdp)) {
1015637ff9efSJanosch Frank paddr = pmd_val(*pmdp) & HPAGE_MASK;
1016637ff9efSJanosch Frank paddr |= addr & ~HPAGE_MASK;
1017637ff9efSJanosch Frank *key = page_get_storage_key(paddr);
1018637ff9efSJanosch Frank spin_unlock(ptl);
1019637ff9efSJanosch Frank return 0;
1020637ff9efSJanosch Frank }
1021637ff9efSJanosch Frank spin_unlock(ptl);
1022637ff9efSJanosch Frank
10238318c404SDavid Hildenbrand ptep = pte_offset_map_lock(mm, pmdp, addr, &ptl);
10245c7f3bf0SHugh Dickins if (!ptep)
10255c7f3bf0SHugh Dickins goto again;
10261e133ab2SMartin Schwidefsky pgste = pgste_get_lock(ptep);
1027154c8c19SDavid Hildenbrand *key = (pgste_val(pgste) & (PGSTE_ACC_BITS | PGSTE_FP_BIT)) >> 56;
1028637ff9efSJanosch Frank paddr = pte_val(*ptep) & PAGE_MASK;
10298d6037a7SDavid Hildenbrand if (!(pte_val(*ptep) & _PAGE_INVALID))
1030637ff9efSJanosch Frank *key = page_get_storage_key(paddr);
10311e133ab2SMartin Schwidefsky /* Reflect guest's logical view, not physical */
1032154c8c19SDavid Hildenbrand *key |= (pgste_val(pgste) & (PGSTE_GR_BIT | PGSTE_GC_BIT)) >> 48;
10331e133ab2SMartin Schwidefsky pgste_set_unlock(ptep, pgste);
10341e133ab2SMartin Schwidefsky pte_unmap_unlock(ptep, ptl);
1035154c8c19SDavid Hildenbrand return 0;
10361e133ab2SMartin Schwidefsky }
10371e133ab2SMartin Schwidefsky EXPORT_SYMBOL(get_guest_storage_key);
10382d42f947SClaudio Imbrenda
10392d42f947SClaudio Imbrenda /**
10402d42f947SClaudio Imbrenda * pgste_perform_essa - perform ESSA actions on the PGSTE.
10412d42f947SClaudio Imbrenda * @mm: the memory context. It must have PGSTEs, no check is performed here!
10422d42f947SClaudio Imbrenda * @hva: the host virtual address of the page whose PGSTE is to be processed
10432d42f947SClaudio Imbrenda * @orc: the specific action to perform, see the ESSA_SET_* macros.
10442d42f947SClaudio Imbrenda * @oldpte: the PTE will be saved there if the pointer is not NULL.
10452d42f947SClaudio Imbrenda * @oldpgste: the old PGSTE will be saved there if the pointer is not NULL.
10462d42f947SClaudio Imbrenda *
10472d42f947SClaudio Imbrenda * Return: 1 if the page is to be added to the CBRL, otherwise 0,
10482d42f947SClaudio Imbrenda * or < 0 in case of error. -EINVAL is returned for invalid values
10492d42f947SClaudio Imbrenda * of orc, -EFAULT for invalid addresses.
10502d42f947SClaudio Imbrenda */
pgste_perform_essa(struct mm_struct * mm,unsigned long hva,int orc,unsigned long * oldpte,unsigned long * oldpgste)10512d42f947SClaudio Imbrenda int pgste_perform_essa(struct mm_struct *mm, unsigned long hva, int orc,
10522d42f947SClaudio Imbrenda unsigned long *oldpte, unsigned long *oldpgste)
10532d42f947SClaudio Imbrenda {
1054fe3d1002SDavid Hildenbrand struct vm_area_struct *vma;
10552d42f947SClaudio Imbrenda unsigned long pgstev;
10562d42f947SClaudio Imbrenda spinlock_t *ptl;
10572d42f947SClaudio Imbrenda pgste_t pgste;
10582d42f947SClaudio Imbrenda pte_t *ptep;
10592d42f947SClaudio Imbrenda int res = 0;
10602d42f947SClaudio Imbrenda
10612d42f947SClaudio Imbrenda WARN_ON_ONCE(orc > ESSA_MAX);
10622d42f947SClaudio Imbrenda if (unlikely(orc > ESSA_MAX))
10632d42f947SClaudio Imbrenda return -EINVAL;
1064fe3d1002SDavid Hildenbrand
1065fe3d1002SDavid Hildenbrand vma = vma_lookup(mm, hva);
1066fe3d1002SDavid Hildenbrand if (!vma || is_vm_hugetlb_page(vma))
1067fe3d1002SDavid Hildenbrand return -EFAULT;
10682d42f947SClaudio Imbrenda ptep = get_locked_pte(mm, hva, &ptl);
10692d42f947SClaudio Imbrenda if (unlikely(!ptep))
10702d42f947SClaudio Imbrenda return -EFAULT;
10712d42f947SClaudio Imbrenda pgste = pgste_get_lock(ptep);
10722d42f947SClaudio Imbrenda pgstev = pgste_val(pgste);
10732d42f947SClaudio Imbrenda if (oldpte)
10742d42f947SClaudio Imbrenda *oldpte = pte_val(*ptep);
10752d42f947SClaudio Imbrenda if (oldpgste)
10762d42f947SClaudio Imbrenda *oldpgste = pgstev;
10772d42f947SClaudio Imbrenda
10782d42f947SClaudio Imbrenda switch (orc) {
10792d42f947SClaudio Imbrenda case ESSA_GET_STATE:
10802d42f947SClaudio Imbrenda break;
10812d42f947SClaudio Imbrenda case ESSA_SET_STABLE:
10821bab1c02SClaudio Imbrenda pgstev &= ~(_PGSTE_GPS_USAGE_MASK | _PGSTE_GPS_NODAT);
10832d42f947SClaudio Imbrenda pgstev |= _PGSTE_GPS_USAGE_STABLE;
10842d42f947SClaudio Imbrenda break;
10852d42f947SClaudio Imbrenda case ESSA_SET_UNUSED:
10862d42f947SClaudio Imbrenda pgstev &= ~_PGSTE_GPS_USAGE_MASK;
10872d42f947SClaudio Imbrenda pgstev |= _PGSTE_GPS_USAGE_UNUSED;
10882d42f947SClaudio Imbrenda if (pte_val(*ptep) & _PAGE_INVALID)
10892d42f947SClaudio Imbrenda res = 1;
10902d42f947SClaudio Imbrenda break;
10912d42f947SClaudio Imbrenda case ESSA_SET_VOLATILE:
10922d42f947SClaudio Imbrenda pgstev &= ~_PGSTE_GPS_USAGE_MASK;
10932d42f947SClaudio Imbrenda pgstev |= _PGSTE_GPS_USAGE_VOLATILE;
10942d42f947SClaudio Imbrenda if (pte_val(*ptep) & _PAGE_INVALID)
10952d42f947SClaudio Imbrenda res = 1;
10962d42f947SClaudio Imbrenda break;
10972d42f947SClaudio Imbrenda case ESSA_SET_POT_VOLATILE:
10982d42f947SClaudio Imbrenda pgstev &= ~_PGSTE_GPS_USAGE_MASK;
10992d42f947SClaudio Imbrenda if (!(pte_val(*ptep) & _PAGE_INVALID)) {
11002d42f947SClaudio Imbrenda pgstev |= _PGSTE_GPS_USAGE_POT_VOLATILE;
11012d42f947SClaudio Imbrenda break;
11022d42f947SClaudio Imbrenda }
11032d42f947SClaudio Imbrenda if (pgstev & _PGSTE_GPS_ZERO) {
11042d42f947SClaudio Imbrenda pgstev |= _PGSTE_GPS_USAGE_VOLATILE;
11052d42f947SClaudio Imbrenda break;
11062d42f947SClaudio Imbrenda }
11072d42f947SClaudio Imbrenda if (!(pgstev & PGSTE_GC_BIT)) {
11082d42f947SClaudio Imbrenda pgstev |= _PGSTE_GPS_USAGE_VOLATILE;
11092d42f947SClaudio Imbrenda res = 1;
11102d42f947SClaudio Imbrenda break;
11112d42f947SClaudio Imbrenda }
11122d42f947SClaudio Imbrenda break;
11132d42f947SClaudio Imbrenda case ESSA_SET_STABLE_RESIDENT:
11142d42f947SClaudio Imbrenda pgstev &= ~_PGSTE_GPS_USAGE_MASK;
11152d42f947SClaudio Imbrenda pgstev |= _PGSTE_GPS_USAGE_STABLE;
11162d42f947SClaudio Imbrenda /*
11172d42f947SClaudio Imbrenda * Since the resident state can go away any time after this
11182d42f947SClaudio Imbrenda * call, we will not make this page resident. We can revisit
11192d42f947SClaudio Imbrenda * this decision if a guest will ever start using this.
11202d42f947SClaudio Imbrenda */
11212d42f947SClaudio Imbrenda break;
11222d42f947SClaudio Imbrenda case ESSA_SET_STABLE_IF_RESIDENT:
11232d42f947SClaudio Imbrenda if (!(pte_val(*ptep) & _PAGE_INVALID)) {
11242d42f947SClaudio Imbrenda pgstev &= ~_PGSTE_GPS_USAGE_MASK;
11252d42f947SClaudio Imbrenda pgstev |= _PGSTE_GPS_USAGE_STABLE;
11262d42f947SClaudio Imbrenda }
11272d42f947SClaudio Imbrenda break;
11281bab1c02SClaudio Imbrenda case ESSA_SET_STABLE_NODAT:
11291bab1c02SClaudio Imbrenda pgstev &= ~_PGSTE_GPS_USAGE_MASK;
11301bab1c02SClaudio Imbrenda pgstev |= _PGSTE_GPS_USAGE_STABLE | _PGSTE_GPS_NODAT;
11311bab1c02SClaudio Imbrenda break;
11322d42f947SClaudio Imbrenda default:
11332d42f947SClaudio Imbrenda /* we should never get here! */
11342d42f947SClaudio Imbrenda break;
11352d42f947SClaudio Imbrenda }
11362d42f947SClaudio Imbrenda /* If we are discarding a page, set it to logical zero */
11372d42f947SClaudio Imbrenda if (res)
11382d42f947SClaudio Imbrenda pgstev |= _PGSTE_GPS_ZERO;
11392d42f947SClaudio Imbrenda
11402d42f947SClaudio Imbrenda pgste_val(pgste) = pgstev;
11412d42f947SClaudio Imbrenda pgste_set_unlock(ptep, pgste);
11422d42f947SClaudio Imbrenda pte_unmap_unlock(ptep, ptl);
11432d42f947SClaudio Imbrenda return res;
11442d42f947SClaudio Imbrenda }
11452d42f947SClaudio Imbrenda EXPORT_SYMBOL(pgste_perform_essa);
11462d42f947SClaudio Imbrenda
11472d42f947SClaudio Imbrenda /**
11482d42f947SClaudio Imbrenda * set_pgste_bits - set specific PGSTE bits.
11492d42f947SClaudio Imbrenda * @mm: the memory context. It must have PGSTEs, no check is performed here!
11502d42f947SClaudio Imbrenda * @hva: the host virtual address of the page whose PGSTE is to be processed
11512d42f947SClaudio Imbrenda * @bits: a bitmask representing the bits that will be touched
11522d42f947SClaudio Imbrenda * @value: the values of the bits to be written. Only the bits in the mask
11532d42f947SClaudio Imbrenda * will be written.
11542d42f947SClaudio Imbrenda *
11552d42f947SClaudio Imbrenda * Return: 0 on success, < 0 in case of error.
11562d42f947SClaudio Imbrenda */
set_pgste_bits(struct mm_struct * mm,unsigned long hva,unsigned long bits,unsigned long value)11572d42f947SClaudio Imbrenda int set_pgste_bits(struct mm_struct *mm, unsigned long hva,
11582d42f947SClaudio Imbrenda unsigned long bits, unsigned long value)
11592d42f947SClaudio Imbrenda {
1160fe3d1002SDavid Hildenbrand struct vm_area_struct *vma;
11612d42f947SClaudio Imbrenda spinlock_t *ptl;
11622d42f947SClaudio Imbrenda pgste_t new;
11632d42f947SClaudio Imbrenda pte_t *ptep;
11642d42f947SClaudio Imbrenda
1165fe3d1002SDavid Hildenbrand vma = vma_lookup(mm, hva);
1166fe3d1002SDavid Hildenbrand if (!vma || is_vm_hugetlb_page(vma))
1167fe3d1002SDavid Hildenbrand return -EFAULT;
11682d42f947SClaudio Imbrenda ptep = get_locked_pte(mm, hva, &ptl);
11692d42f947SClaudio Imbrenda if (unlikely(!ptep))
11702d42f947SClaudio Imbrenda return -EFAULT;
11712d42f947SClaudio Imbrenda new = pgste_get_lock(ptep);
11722d42f947SClaudio Imbrenda
11732d42f947SClaudio Imbrenda pgste_val(new) &= ~bits;
11742d42f947SClaudio Imbrenda pgste_val(new) |= value & bits;
11752d42f947SClaudio Imbrenda
11762d42f947SClaudio Imbrenda pgste_set_unlock(ptep, new);
11772d42f947SClaudio Imbrenda pte_unmap_unlock(ptep, ptl);
11782d42f947SClaudio Imbrenda return 0;
11792d42f947SClaudio Imbrenda }
11802d42f947SClaudio Imbrenda EXPORT_SYMBOL(set_pgste_bits);
11812d42f947SClaudio Imbrenda
11822d42f947SClaudio Imbrenda /**
11832d42f947SClaudio Imbrenda * get_pgste - get the current PGSTE for the given address.
11842d42f947SClaudio Imbrenda * @mm: the memory context. It must have PGSTEs, no check is performed here!
11852d42f947SClaudio Imbrenda * @hva: the host virtual address of the page whose PGSTE is to be processed
11862d42f947SClaudio Imbrenda * @pgstep: will be written with the current PGSTE for the given address.
11872d42f947SClaudio Imbrenda *
11882d42f947SClaudio Imbrenda * Return: 0 on success, < 0 in case of error.
11892d42f947SClaudio Imbrenda */
get_pgste(struct mm_struct * mm,unsigned long hva,unsigned long * pgstep)11902d42f947SClaudio Imbrenda int get_pgste(struct mm_struct *mm, unsigned long hva, unsigned long *pgstep)
11912d42f947SClaudio Imbrenda {
1192fe3d1002SDavid Hildenbrand struct vm_area_struct *vma;
11932d42f947SClaudio Imbrenda spinlock_t *ptl;
11942d42f947SClaudio Imbrenda pte_t *ptep;
11952d42f947SClaudio Imbrenda
1196fe3d1002SDavid Hildenbrand vma = vma_lookup(mm, hva);
1197fe3d1002SDavid Hildenbrand if (!vma || is_vm_hugetlb_page(vma))
1198fe3d1002SDavid Hildenbrand return -EFAULT;
11992d42f947SClaudio Imbrenda ptep = get_locked_pte(mm, hva, &ptl);
12002d42f947SClaudio Imbrenda if (unlikely(!ptep))
12012d42f947SClaudio Imbrenda return -EFAULT;
12022d42f947SClaudio Imbrenda *pgstep = pgste_val(pgste_get(ptep));
12032d42f947SClaudio Imbrenda pte_unmap_unlock(ptep, ptl);
12042d42f947SClaudio Imbrenda return 0;
12052d42f947SClaudio Imbrenda }
12062d42f947SClaudio Imbrenda EXPORT_SYMBOL(get_pgste);
12071e133ab2SMartin Schwidefsky #endif
1208