xref: /openbmc/linux/arch/s390/mm/pageattr.c (revision bef7a78d)
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * Copyright IBM Corp. 2011
4  * Author(s): Jan Glauber <jang@linux.vnet.ibm.com>
5  */
6 #include <linux/hugetlb.h>
7 #include <linux/mm.h>
8 #include <asm/cacheflush.h>
9 #include <asm/facility.h>
10 #include <asm/pgalloc.h>
11 #include <asm/page.h>
12 #include <asm/set_memory.h>
13 
14 static inline unsigned long sske_frame(unsigned long addr, unsigned char skey)
15 {
16 	asm volatile(".insn rrf,0xb22b0000,%[skey],%[addr],1,0"
17 		     : [addr] "+a" (addr) : [skey] "d" (skey));
18 	return addr;
19 }
20 
21 void __storage_key_init_range(unsigned long start, unsigned long end)
22 {
23 	unsigned long boundary, size;
24 
25 	while (start < end) {
26 		if (MACHINE_HAS_EDAT1) {
27 			/* set storage keys for a 1MB frame */
28 			size = 1UL << 20;
29 			boundary = (start + size) & ~(size - 1);
30 			if (boundary <= end) {
31 				do {
32 					start = sske_frame(start, PAGE_DEFAULT_KEY);
33 				} while (start < boundary);
34 				continue;
35 			}
36 		}
37 		page_set_storage_key(start, PAGE_DEFAULT_KEY, 1);
38 		start += PAGE_SIZE;
39 	}
40 }
41 
42 #ifdef CONFIG_PROC_FS
43 atomic_long_t direct_pages_count[PG_DIRECT_MAP_MAX];
44 
45 void arch_report_meminfo(struct seq_file *m)
46 {
47 	seq_printf(m, "DirectMap4k:    %8lu kB\n",
48 		   atomic_long_read(&direct_pages_count[PG_DIRECT_MAP_4K]) << 2);
49 	seq_printf(m, "DirectMap1M:    %8lu kB\n",
50 		   atomic_long_read(&direct_pages_count[PG_DIRECT_MAP_1M]) << 10);
51 	seq_printf(m, "DirectMap2G:    %8lu kB\n",
52 		   atomic_long_read(&direct_pages_count[PG_DIRECT_MAP_2G]) << 21);
53 }
54 #endif /* CONFIG_PROC_FS */
55 
56 static void pgt_set(unsigned long *old, unsigned long new, unsigned long addr,
57 		    unsigned long dtt)
58 {
59 	unsigned long table, mask;
60 
61 	mask = 0;
62 	if (MACHINE_HAS_EDAT2) {
63 		switch (dtt) {
64 		case CRDTE_DTT_REGION3:
65 			mask = ~(PTRS_PER_PUD * sizeof(pud_t) - 1);
66 			break;
67 		case CRDTE_DTT_SEGMENT:
68 			mask = ~(PTRS_PER_PMD * sizeof(pmd_t) - 1);
69 			break;
70 		case CRDTE_DTT_PAGE:
71 			mask = ~(PTRS_PER_PTE * sizeof(pte_t) - 1);
72 			break;
73 		}
74 		table = (unsigned long)old & mask;
75 		crdte(*old, new, table, dtt, addr, S390_lowcore.kernel_asce);
76 	} else if (MACHINE_HAS_IDTE) {
77 		cspg(old, *old, new);
78 	} else {
79 		csp((unsigned int *)old + 1, *old, new);
80 	}
81 }
82 
83 static int walk_pte_level(pmd_t *pmdp, unsigned long addr, unsigned long end,
84 			  unsigned long flags)
85 {
86 	pte_t *ptep, new;
87 
88 	ptep = pte_offset_kernel(pmdp, addr);
89 	do {
90 		new = *ptep;
91 		if (pte_none(new))
92 			return -EINVAL;
93 		if (flags & SET_MEMORY_RO)
94 			new = pte_wrprotect(new);
95 		else if (flags & SET_MEMORY_RW)
96 			new = pte_mkwrite(pte_mkdirty(new));
97 		if (flags & SET_MEMORY_NX)
98 			pte_val(new) |= _PAGE_NOEXEC;
99 		else if (flags & SET_MEMORY_X)
100 			pte_val(new) &= ~_PAGE_NOEXEC;
101 		pgt_set((unsigned long *)ptep, pte_val(new), addr, CRDTE_DTT_PAGE);
102 		ptep++;
103 		addr += PAGE_SIZE;
104 		cond_resched();
105 	} while (addr < end);
106 	return 0;
107 }
108 
109 static int split_pmd_page(pmd_t *pmdp, unsigned long addr)
110 {
111 	unsigned long pte_addr, prot;
112 	pte_t *pt_dir, *ptep;
113 	pmd_t new;
114 	int i, ro, nx;
115 
116 	pt_dir = vmem_pte_alloc();
117 	if (!pt_dir)
118 		return -ENOMEM;
119 	pte_addr = pmd_pfn(*pmdp) << PAGE_SHIFT;
120 	ro = !!(pmd_val(*pmdp) & _SEGMENT_ENTRY_PROTECT);
121 	nx = !!(pmd_val(*pmdp) & _SEGMENT_ENTRY_NOEXEC);
122 	prot = pgprot_val(ro ? PAGE_KERNEL_RO : PAGE_KERNEL);
123 	if (!nx)
124 		prot &= ~_PAGE_NOEXEC;
125 	ptep = pt_dir;
126 	for (i = 0; i < PTRS_PER_PTE; i++) {
127 		pte_val(*ptep) = pte_addr | prot;
128 		pte_addr += PAGE_SIZE;
129 		ptep++;
130 	}
131 	pmd_val(new) = __pa(pt_dir) | _SEGMENT_ENTRY;
132 	pgt_set((unsigned long *)pmdp, pmd_val(new), addr, CRDTE_DTT_SEGMENT);
133 	update_page_count(PG_DIRECT_MAP_4K, PTRS_PER_PTE);
134 	update_page_count(PG_DIRECT_MAP_1M, -1);
135 	return 0;
136 }
137 
138 static void modify_pmd_page(pmd_t *pmdp, unsigned long addr,
139 			    unsigned long flags)
140 {
141 	pmd_t new = *pmdp;
142 
143 	if (flags & SET_MEMORY_RO)
144 		new = pmd_wrprotect(new);
145 	else if (flags & SET_MEMORY_RW)
146 		new = pmd_mkwrite(pmd_mkdirty(new));
147 	if (flags & SET_MEMORY_NX)
148 		pmd_val(new) |= _SEGMENT_ENTRY_NOEXEC;
149 	else if (flags & SET_MEMORY_X)
150 		pmd_val(new) &= ~_SEGMENT_ENTRY_NOEXEC;
151 	pgt_set((unsigned long *)pmdp, pmd_val(new), addr, CRDTE_DTT_SEGMENT);
152 }
153 
154 static int walk_pmd_level(pud_t *pudp, unsigned long addr, unsigned long end,
155 			  unsigned long flags)
156 {
157 	unsigned long next;
158 	pmd_t *pmdp;
159 	int rc = 0;
160 
161 	pmdp = pmd_offset(pudp, addr);
162 	do {
163 		if (pmd_none(*pmdp))
164 			return -EINVAL;
165 		next = pmd_addr_end(addr, end);
166 		if (pmd_large(*pmdp)) {
167 			if (addr & ~PMD_MASK || addr + PMD_SIZE > next) {
168 				rc = split_pmd_page(pmdp, addr);
169 				if (rc)
170 					return rc;
171 				continue;
172 			}
173 			modify_pmd_page(pmdp, addr, flags);
174 		} else {
175 			rc = walk_pte_level(pmdp, addr, next, flags);
176 			if (rc)
177 				return rc;
178 		}
179 		pmdp++;
180 		addr = next;
181 		cond_resched();
182 	} while (addr < end);
183 	return rc;
184 }
185 
186 static int split_pud_page(pud_t *pudp, unsigned long addr)
187 {
188 	unsigned long pmd_addr, prot;
189 	pmd_t *pm_dir, *pmdp;
190 	pud_t new;
191 	int i, ro, nx;
192 
193 	pm_dir = vmem_crst_alloc(_SEGMENT_ENTRY_EMPTY);
194 	if (!pm_dir)
195 		return -ENOMEM;
196 	pmd_addr = pud_pfn(*pudp) << PAGE_SHIFT;
197 	ro = !!(pud_val(*pudp) & _REGION_ENTRY_PROTECT);
198 	nx = !!(pud_val(*pudp) & _REGION_ENTRY_NOEXEC);
199 	prot = pgprot_val(ro ? SEGMENT_KERNEL_RO : SEGMENT_KERNEL);
200 	if (!nx)
201 		prot &= ~_SEGMENT_ENTRY_NOEXEC;
202 	pmdp = pm_dir;
203 	for (i = 0; i < PTRS_PER_PMD; i++) {
204 		pmd_val(*pmdp) = pmd_addr | prot;
205 		pmd_addr += PMD_SIZE;
206 		pmdp++;
207 	}
208 	pud_val(new) = __pa(pm_dir) | _REGION3_ENTRY;
209 	pgt_set((unsigned long *)pudp, pud_val(new), addr, CRDTE_DTT_REGION3);
210 	update_page_count(PG_DIRECT_MAP_1M, PTRS_PER_PMD);
211 	update_page_count(PG_DIRECT_MAP_2G, -1);
212 	return 0;
213 }
214 
215 static void modify_pud_page(pud_t *pudp, unsigned long addr,
216 			    unsigned long flags)
217 {
218 	pud_t new = *pudp;
219 
220 	if (flags & SET_MEMORY_RO)
221 		new = pud_wrprotect(new);
222 	else if (flags & SET_MEMORY_RW)
223 		new = pud_mkwrite(pud_mkdirty(new));
224 	if (flags & SET_MEMORY_NX)
225 		pud_val(new) |= _REGION_ENTRY_NOEXEC;
226 	else if (flags & SET_MEMORY_X)
227 		pud_val(new) &= ~_REGION_ENTRY_NOEXEC;
228 	pgt_set((unsigned long *)pudp, pud_val(new), addr, CRDTE_DTT_REGION3);
229 }
230 
231 static int walk_pud_level(p4d_t *p4d, unsigned long addr, unsigned long end,
232 			  unsigned long flags)
233 {
234 	unsigned long next;
235 	pud_t *pudp;
236 	int rc = 0;
237 
238 	pudp = pud_offset(p4d, addr);
239 	do {
240 		if (pud_none(*pudp))
241 			return -EINVAL;
242 		next = pud_addr_end(addr, end);
243 		if (pud_large(*pudp)) {
244 			if (addr & ~PUD_MASK || addr + PUD_SIZE > next) {
245 				rc = split_pud_page(pudp, addr);
246 				if (rc)
247 					break;
248 				continue;
249 			}
250 			modify_pud_page(pudp, addr, flags);
251 		} else {
252 			rc = walk_pmd_level(pudp, addr, next, flags);
253 		}
254 		pudp++;
255 		addr = next;
256 		cond_resched();
257 	} while (addr < end && !rc);
258 	return rc;
259 }
260 
261 static int walk_p4d_level(pgd_t *pgd, unsigned long addr, unsigned long end,
262 			  unsigned long flags)
263 {
264 	unsigned long next;
265 	p4d_t *p4dp;
266 	int rc = 0;
267 
268 	p4dp = p4d_offset(pgd, addr);
269 	do {
270 		if (p4d_none(*p4dp))
271 			return -EINVAL;
272 		next = p4d_addr_end(addr, end);
273 		rc = walk_pud_level(p4dp, addr, next, flags);
274 		p4dp++;
275 		addr = next;
276 		cond_resched();
277 	} while (addr < end && !rc);
278 	return rc;
279 }
280 
281 DEFINE_MUTEX(cpa_mutex);
282 
283 static int change_page_attr(unsigned long addr, unsigned long end,
284 			    unsigned long flags)
285 {
286 	unsigned long next;
287 	int rc = -EINVAL;
288 	pgd_t *pgdp;
289 
290 	if (addr == end)
291 		return 0;
292 	if (end >= MODULES_END)
293 		return -EINVAL;
294 	mutex_lock(&cpa_mutex);
295 	pgdp = pgd_offset_k(addr);
296 	do {
297 		if (pgd_none(*pgdp))
298 			break;
299 		next = pgd_addr_end(addr, end);
300 		rc = walk_p4d_level(pgdp, addr, next, flags);
301 		if (rc)
302 			break;
303 		cond_resched();
304 	} while (pgdp++, addr = next, addr < end && !rc);
305 	mutex_unlock(&cpa_mutex);
306 	return rc;
307 }
308 
309 int __set_memory(unsigned long addr, int numpages, unsigned long flags)
310 {
311 	if (!MACHINE_HAS_NX)
312 		flags &= ~(SET_MEMORY_NX | SET_MEMORY_X);
313 	if (!flags)
314 		return 0;
315 	addr &= PAGE_MASK;
316 	return change_page_attr(addr, addr + numpages * PAGE_SIZE, flags);
317 }
318 
319 #ifdef CONFIG_DEBUG_PAGEALLOC
320 
321 static void ipte_range(pte_t *pte, unsigned long address, int nr)
322 {
323 	int i;
324 
325 	if (test_facility(13)) {
326 		__ptep_ipte_range(address, nr - 1, pte, IPTE_GLOBAL);
327 		return;
328 	}
329 	for (i = 0; i < nr; i++) {
330 		__ptep_ipte(address, pte, 0, 0, IPTE_GLOBAL);
331 		address += PAGE_SIZE;
332 		pte++;
333 	}
334 }
335 
336 void __kernel_map_pages(struct page *page, int numpages, int enable)
337 {
338 	unsigned long address;
339 	int nr, i, j;
340 	pte_t *pte;
341 
342 	for (i = 0; i < numpages;) {
343 		address = page_to_phys(page + i);
344 		pte = virt_to_kpte(address);
345 		nr = (unsigned long)pte >> ilog2(sizeof(long));
346 		nr = PTRS_PER_PTE - (nr & (PTRS_PER_PTE - 1));
347 		nr = min(numpages - i, nr);
348 		if (enable) {
349 			for (j = 0; j < nr; j++) {
350 				pte_val(*pte) &= ~_PAGE_INVALID;
351 				address += PAGE_SIZE;
352 				pte++;
353 			}
354 		} else {
355 			ipte_range(pte, address, nr);
356 		}
357 		i += nr;
358 	}
359 }
360 
361 #endif /* CONFIG_DEBUG_PAGEALLOC */
362