xref: /openbmc/linux/fs/proc/page.c (revision 97a32539b9568bb653683349e5a76d02ff3c3e2c)
1b2441318SGreg Kroah-Hartman // SPDX-License-Identifier: GPL-2.0
257c8a661SMike Rapoport #include <linux/memblock.h>
36d80e53fSAlexey Dobriyan #include <linux/compiler.h>
46d80e53fSAlexey Dobriyan #include <linux/fs.h>
56d80e53fSAlexey Dobriyan #include <linux/init.h>
69a840895SHugh Dickins #include <linux/ksm.h>
76d80e53fSAlexey Dobriyan #include <linux/mm.h>
86d80e53fSAlexey Dobriyan #include <linux/mmzone.h>
956873f43SWang, Yalin #include <linux/huge_mm.h>
106d80e53fSAlexey Dobriyan #include <linux/proc_fs.h>
116d80e53fSAlexey Dobriyan #include <linux/seq_file.h>
1220a0307cSWu Fengguang #include <linux/hugetlb.h>
1380ae2fdcSVladimir Davydov #include <linux/memcontrol.h>
1433c3fc71SVladimir Davydov #include <linux/mmu_notifier.h>
1533c3fc71SVladimir Davydov #include <linux/page_idle.h>
161a9b5b7fSWu Fengguang #include <linux/kernel-page-flags.h>
177c0f6ba6SLinus Torvalds #include <linux/uaccess.h>
186d80e53fSAlexey Dobriyan #include "internal.h"
196d80e53fSAlexey Dobriyan 
/* Size in bytes of one entry in the /proc/kpage* arrays (each entry is a u64). */
#define KPMSIZE sizeof(u64)
/* Bits that must be clear in an offset or length that is a multiple of KPMSIZE. */
#define KPMMASK (KPMSIZE - 1)
/* Width of one entry, in bits. */
#define KPMBITS (BITS_PER_BYTE * KPMSIZE)
23ed7ce0f1SWu Fengguang 
24abec749fSDavid Hildenbrand static inline unsigned long get_max_dump_pfn(void)
25abec749fSDavid Hildenbrand {
26abec749fSDavid Hildenbrand #ifdef CONFIG_SPARSEMEM
27abec749fSDavid Hildenbrand 	/*
28abec749fSDavid Hildenbrand 	 * The memmap of early sections is completely populated and marked
29abec749fSDavid Hildenbrand 	 * online even if max_pfn does not fall on a section boundary -
30abec749fSDavid Hildenbrand 	 * pfn_to_online_page() will succeed on all pages. Allow inspecting
31abec749fSDavid Hildenbrand 	 * these memmaps.
32abec749fSDavid Hildenbrand 	 */
33abec749fSDavid Hildenbrand 	return round_up(max_pfn, PAGES_PER_SECTION);
34abec749fSDavid Hildenbrand #else
35abec749fSDavid Hildenbrand 	return max_pfn;
36abec749fSDavid Hildenbrand #endif
37abec749fSDavid Hildenbrand }
38abec749fSDavid Hildenbrand 
396d80e53fSAlexey Dobriyan /* /proc/kpagecount - an array exposing page counts
406d80e53fSAlexey Dobriyan  *
416d80e53fSAlexey Dobriyan  * Each entry is a u64 representing the corresponding
426d80e53fSAlexey Dobriyan  * physical page count.
436d80e53fSAlexey Dobriyan  */
446d80e53fSAlexey Dobriyan static ssize_t kpagecount_read(struct file *file, char __user *buf,
456d80e53fSAlexey Dobriyan 			     size_t count, loff_t *ppos)
466d80e53fSAlexey Dobriyan {
47abec749fSDavid Hildenbrand 	const unsigned long max_dump_pfn = get_max_dump_pfn();
486d80e53fSAlexey Dobriyan 	u64 __user *out = (u64 __user *)buf;
496d80e53fSAlexey Dobriyan 	struct page *ppage;
506d80e53fSAlexey Dobriyan 	unsigned long src = *ppos;
516d80e53fSAlexey Dobriyan 	unsigned long pfn;
526d80e53fSAlexey Dobriyan 	ssize_t ret = 0;
536d80e53fSAlexey Dobriyan 	u64 pcount;
546d80e53fSAlexey Dobriyan 
556d80e53fSAlexey Dobriyan 	pfn = src / KPMSIZE;
566d80e53fSAlexey Dobriyan 	if (src & KPMMASK || count & KPMMASK)
576d80e53fSAlexey Dobriyan 		return -EINVAL;
58abec749fSDavid Hildenbrand 	if (src >= max_dump_pfn * KPMSIZE)
59abec749fSDavid Hildenbrand 		return 0;
60abec749fSDavid Hildenbrand 	count = min_t(unsigned long, count, (max_dump_pfn * KPMSIZE) - src);
616d80e53fSAlexey Dobriyan 
626d80e53fSAlexey Dobriyan 	while (count > 0) {
63aad5f69bSDavid Hildenbrand 		/*
64aad5f69bSDavid Hildenbrand 		 * TODO: ZONE_DEVICE support requires to identify
65aad5f69bSDavid Hildenbrand 		 * memmaps that were actually initialized.
66aad5f69bSDavid Hildenbrand 		 */
67aad5f69bSDavid Hildenbrand 		ppage = pfn_to_online_page(pfn);
68aad5f69bSDavid Hildenbrand 
69144552ffSAnthony Yznaga 		if (!ppage || PageSlab(ppage) || page_has_type(ppage))
706d80e53fSAlexey Dobriyan 			pcount = 0;
716d80e53fSAlexey Dobriyan 		else
726d80e53fSAlexey Dobriyan 			pcount = page_mapcount(ppage);
736d80e53fSAlexey Dobriyan 
74ed7ce0f1SWu Fengguang 		if (put_user(pcount, out)) {
756d80e53fSAlexey Dobriyan 			ret = -EFAULT;
766d80e53fSAlexey Dobriyan 			break;
776d80e53fSAlexey Dobriyan 		}
786d80e53fSAlexey Dobriyan 
79ed7ce0f1SWu Fengguang 		pfn++;
80ed7ce0f1SWu Fengguang 		out++;
816d80e53fSAlexey Dobriyan 		count -= KPMSIZE;
82d3691d2cSVladimir Davydov 
83d3691d2cSVladimir Davydov 		cond_resched();
846d80e53fSAlexey Dobriyan 	}
856d80e53fSAlexey Dobriyan 
866d80e53fSAlexey Dobriyan 	*ppos += (char __user *)out - buf;
876d80e53fSAlexey Dobriyan 	if (!ret)
886d80e53fSAlexey Dobriyan 		ret = (char __user *)out - buf;
896d80e53fSAlexey Dobriyan 	return ret;
906d80e53fSAlexey Dobriyan }
916d80e53fSAlexey Dobriyan 
92*97a32539SAlexey Dobriyan static const struct proc_ops kpagecount_proc_ops = {
93*97a32539SAlexey Dobriyan 	.proc_lseek	= mem_lseek,
94*97a32539SAlexey Dobriyan 	.proc_read	= kpagecount_read,
956d80e53fSAlexey Dobriyan };
966d80e53fSAlexey Dobriyan 
976d80e53fSAlexey Dobriyan /* /proc/kpageflags - an array exposing page flags
986d80e53fSAlexey Dobriyan  *
996d80e53fSAlexey Dobriyan  * Each entry is a u64 representing the corresponding
1006d80e53fSAlexey Dobriyan  * physical page flags.
1016d80e53fSAlexey Dobriyan  */
1026d80e53fSAlexey Dobriyan 
10317797549SWu Fengguang static inline u64 kpf_copy_bit(u64 kflags, int ubit, int kbit)
10417797549SWu Fengguang {
10517797549SWu Fengguang 	return ((kflags >> kbit) & 1) << ubit;
10617797549SWu Fengguang }
10717797549SWu Fengguang 
1081a9b5b7fSWu Fengguang u64 stable_page_flags(struct page *page)
10917797549SWu Fengguang {
11017797549SWu Fengguang 	u64 k;
11117797549SWu Fengguang 	u64 u;
11217797549SWu Fengguang 
11317797549SWu Fengguang 	/*
11417797549SWu Fengguang 	 * pseudo flag: KPF_NOPAGE
11517797549SWu Fengguang 	 * it differentiates a memory hole from a page with no flags
11617797549SWu Fengguang 	 */
11717797549SWu Fengguang 	if (!page)
11817797549SWu Fengguang 		return 1 << KPF_NOPAGE;
11917797549SWu Fengguang 
12017797549SWu Fengguang 	k = page->flags;
12117797549SWu Fengguang 	u = 0;
12217797549SWu Fengguang 
12317797549SWu Fengguang 	/*
12417797549SWu Fengguang 	 * pseudo flags for the well known (anonymous) memory mapped pages
12517797549SWu Fengguang 	 *
12617797549SWu Fengguang 	 * Note that page->_mapcount is overloaded in SLOB/SLUB/SLQB, so the
127832fc1deSNaoya Horiguchi 	 * simple test in page_mapped() is not enough.
12817797549SWu Fengguang 	 */
129832fc1deSNaoya Horiguchi 	if (!PageSlab(page) && page_mapped(page))
13017797549SWu Fengguang 		u |= 1 << KPF_MMAP;
13117797549SWu Fengguang 	if (PageAnon(page))
13217797549SWu Fengguang 		u |= 1 << KPF_ANON;
1339a840895SHugh Dickins 	if (PageKsm(page))
1349a840895SHugh Dickins 		u |= 1 << KPF_KSM;
13517797549SWu Fengguang 
13617797549SWu Fengguang 	/*
13717797549SWu Fengguang 	 * compound pages: export both head/tail info
13817797549SWu Fengguang 	 * they together define a compound page's start/end pos and order
13917797549SWu Fengguang 	 */
14017797549SWu Fengguang 	if (PageHead(page))
14117797549SWu Fengguang 		u |= 1 << KPF_COMPOUND_HEAD;
14217797549SWu Fengguang 	if (PageTail(page))
14317797549SWu Fengguang 		u |= 1 << KPF_COMPOUND_TAIL;
14417797549SWu Fengguang 	if (PageHuge(page))
14517797549SWu Fengguang 		u |= 1 << KPF_HUGE;
1467a71932dSNaoya Horiguchi 	/*
1477a71932dSNaoya Horiguchi 	 * PageTransCompound can be true for non-huge compound pages (slab
1487a71932dSNaoya Horiguchi 	 * pages or pages allocated by drivers with __GFP_COMP) because it
149e3bba3c3SNaoya Horiguchi 	 * just checks PG_head/PG_tail, so we need to check PageLRU/PageAnon
150e3bba3c3SNaoya Horiguchi 	 * to make sure a given page is a thp, not a non-huge compound page.
1517a71932dSNaoya Horiguchi 	 */
15256873f43SWang, Yalin 	else if (PageTransCompound(page)) {
15356873f43SWang, Yalin 		struct page *head = compound_head(page);
15456873f43SWang, Yalin 
15556873f43SWang, Yalin 		if (PageLRU(head) || PageAnon(head))
156e873c49fSNaoya Horiguchi 			u |= 1 << KPF_THP;
15756873f43SWang, Yalin 		else if (is_huge_zero_page(head)) {
15856873f43SWang, Yalin 			u |= 1 << KPF_ZERO_PAGE;
15956873f43SWang, Yalin 			u |= 1 << KPF_THP;
16056873f43SWang, Yalin 		}
16156873f43SWang, Yalin 	} else if (is_zero_pfn(page_to_pfn(page)))
16256873f43SWang, Yalin 		u |= 1 << KPF_ZERO_PAGE;
16356873f43SWang, Yalin 
16417797549SWu Fengguang 
1655f24ce5fSAndrea Arcangeli 	/*
1660139aa7bSJoonsoo Kim 	 * Caveats on high order pages: page->_refcount will only be set
1675f24ce5fSAndrea Arcangeli 	 * -1 on the head page; SLUB/SLQB do the same for PG_slab;
1685f24ce5fSAndrea Arcangeli 	 * SLOB won't set PG_slab at all on compound pages.
1695f24ce5fSAndrea Arcangeli 	 */
1705f24ce5fSAndrea Arcangeli 	if (PageBuddy(page))
1715f24ce5fSAndrea Arcangeli 		u |= 1 << KPF_BUDDY;
172832fc1deSNaoya Horiguchi 	else if (page_count(page) == 0 && is_free_buddy_page(page))
173832fc1deSNaoya Horiguchi 		u |= 1 << KPF_BUDDY;
1745f24ce5fSAndrea Arcangeli 
175ca215086SDavid Hildenbrand 	if (PageOffline(page))
176ca215086SDavid Hildenbrand 		u |= 1 << KPF_OFFLINE;
1771d40a5eaSMatthew Wilcox 	if (PageTable(page))
1781d40a5eaSMatthew Wilcox 		u |= 1 << KPF_PGTABLE;
17909316c09SKonstantin Khlebnikov 
180f074a8f4SVladimir Davydov 	if (page_is_idle(page))
181f074a8f4SVladimir Davydov 		u |= 1 << KPF_IDLE;
182f074a8f4SVladimir Davydov 
18317797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_LOCKED,	PG_locked);
18417797549SWu Fengguang 
18517797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_SLAB,		PG_slab);
1860a71649cSNaoya Horiguchi 	if (PageTail(page) && PageSlab(compound_head(page)))
1870a71649cSNaoya Horiguchi 		u |= 1 << KPF_SLAB;
18817797549SWu Fengguang 
18917797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_ERROR,		PG_error);
19017797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_DIRTY,		PG_dirty);
19117797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_UPTODATE,	PG_uptodate);
19217797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_WRITEBACK,	PG_writeback);
19317797549SWu Fengguang 
19417797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_LRU,		PG_lru);
19517797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_REFERENCED,	PG_referenced);
19617797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_ACTIVE,	PG_active);
19717797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_RECLAIM,	PG_reclaim);
19817797549SWu Fengguang 
199b6789123SHugh Dickins 	if (PageSwapCache(page))
200b6789123SHugh Dickins 		u |= 1 << KPF_SWAPCACHE;
20117797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_SWAPBACKED,	PG_swapbacked);
20217797549SWu Fengguang 
20317797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_UNEVICTABLE,	PG_unevictable);
20417797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_MLOCKED,	PG_mlocked);
20517797549SWu Fengguang 
206253fb02dSWu Fengguang #ifdef CONFIG_MEMORY_FAILURE
207253fb02dSWu Fengguang 	u |= kpf_copy_bit(k, KPF_HWPOISON,	PG_hwpoison);
208253fb02dSWu Fengguang #endif
209253fb02dSWu Fengguang 
210ed430fecSTakashi Iwai #ifdef CONFIG_ARCH_USES_PG_UNCACHED
21117797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_UNCACHED,	PG_uncached);
21217797549SWu Fengguang #endif
21317797549SWu Fengguang 
21417797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_RESERVED,	PG_reserved);
21517797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_MAPPEDTODISK,	PG_mappedtodisk);
21617797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_PRIVATE,	PG_private);
21717797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_PRIVATE_2,	PG_private_2);
21817797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_OWNER_PRIVATE,	PG_owner_priv_1);
21917797549SWu Fengguang 	u |= kpf_copy_bit(k, KPF_ARCH,		PG_arch_1);
22017797549SWu Fengguang 
22117797549SWu Fengguang 	return u;
22217797549SWu Fengguang };
2236d80e53fSAlexey Dobriyan 
2246d80e53fSAlexey Dobriyan static ssize_t kpageflags_read(struct file *file, char __user *buf,
2256d80e53fSAlexey Dobriyan 			     size_t count, loff_t *ppos)
2266d80e53fSAlexey Dobriyan {
227abec749fSDavid Hildenbrand 	const unsigned long max_dump_pfn = get_max_dump_pfn();
2286d80e53fSAlexey Dobriyan 	u64 __user *out = (u64 __user *)buf;
2296d80e53fSAlexey Dobriyan 	struct page *ppage;
2306d80e53fSAlexey Dobriyan 	unsigned long src = *ppos;
2316d80e53fSAlexey Dobriyan 	unsigned long pfn;
2326d80e53fSAlexey Dobriyan 	ssize_t ret = 0;
2336d80e53fSAlexey Dobriyan 
2346d80e53fSAlexey Dobriyan 	pfn = src / KPMSIZE;
2356d80e53fSAlexey Dobriyan 	if (src & KPMMASK || count & KPMMASK)
2366d80e53fSAlexey Dobriyan 		return -EINVAL;
237abec749fSDavid Hildenbrand 	if (src >= max_dump_pfn * KPMSIZE)
238abec749fSDavid Hildenbrand 		return 0;
239abec749fSDavid Hildenbrand 	count = min_t(unsigned long, count, (max_dump_pfn * KPMSIZE) - src);
2406d80e53fSAlexey Dobriyan 
2416d80e53fSAlexey Dobriyan 	while (count > 0) {
242aad5f69bSDavid Hildenbrand 		/*
243aad5f69bSDavid Hildenbrand 		 * TODO: ZONE_DEVICE support requires to identify
244aad5f69bSDavid Hildenbrand 		 * memmaps that were actually initialized.
245aad5f69bSDavid Hildenbrand 		 */
246aad5f69bSDavid Hildenbrand 		ppage = pfn_to_online_page(pfn);
2476d80e53fSAlexey Dobriyan 
2481a9b5b7fSWu Fengguang 		if (put_user(stable_page_flags(ppage), out)) {
2496d80e53fSAlexey Dobriyan 			ret = -EFAULT;
2506d80e53fSAlexey Dobriyan 			break;
2516d80e53fSAlexey Dobriyan 		}
2526d80e53fSAlexey Dobriyan 
253ed7ce0f1SWu Fengguang 		pfn++;
254ed7ce0f1SWu Fengguang 		out++;
2556d80e53fSAlexey Dobriyan 		count -= KPMSIZE;
256d3691d2cSVladimir Davydov 
257d3691d2cSVladimir Davydov 		cond_resched();
2586d80e53fSAlexey Dobriyan 	}
2596d80e53fSAlexey Dobriyan 
2606d80e53fSAlexey Dobriyan 	*ppos += (char __user *)out - buf;
2616d80e53fSAlexey Dobriyan 	if (!ret)
2626d80e53fSAlexey Dobriyan 		ret = (char __user *)out - buf;
2636d80e53fSAlexey Dobriyan 	return ret;
2646d80e53fSAlexey Dobriyan }
2656d80e53fSAlexey Dobriyan 
266*97a32539SAlexey Dobriyan static const struct proc_ops kpageflags_proc_ops = {
267*97a32539SAlexey Dobriyan 	.proc_lseek	= mem_lseek,
268*97a32539SAlexey Dobriyan 	.proc_read	= kpageflags_read,
2696d80e53fSAlexey Dobriyan };
2706d80e53fSAlexey Dobriyan 
27180ae2fdcSVladimir Davydov #ifdef CONFIG_MEMCG
27280ae2fdcSVladimir Davydov static ssize_t kpagecgroup_read(struct file *file, char __user *buf,
27380ae2fdcSVladimir Davydov 				size_t count, loff_t *ppos)
27480ae2fdcSVladimir Davydov {
275abec749fSDavid Hildenbrand 	const unsigned long max_dump_pfn = get_max_dump_pfn();
27680ae2fdcSVladimir Davydov 	u64 __user *out = (u64 __user *)buf;
27780ae2fdcSVladimir Davydov 	struct page *ppage;
27880ae2fdcSVladimir Davydov 	unsigned long src = *ppos;
27980ae2fdcSVladimir Davydov 	unsigned long pfn;
28080ae2fdcSVladimir Davydov 	ssize_t ret = 0;
28180ae2fdcSVladimir Davydov 	u64 ino;
28280ae2fdcSVladimir Davydov 
28380ae2fdcSVladimir Davydov 	pfn = src / KPMSIZE;
28480ae2fdcSVladimir Davydov 	if (src & KPMMASK || count & KPMMASK)
28580ae2fdcSVladimir Davydov 		return -EINVAL;
286abec749fSDavid Hildenbrand 	if (src >= max_dump_pfn * KPMSIZE)
287abec749fSDavid Hildenbrand 		return 0;
288abec749fSDavid Hildenbrand 	count = min_t(unsigned long, count, (max_dump_pfn * KPMSIZE) - src);
28980ae2fdcSVladimir Davydov 
29080ae2fdcSVladimir Davydov 	while (count > 0) {
291aad5f69bSDavid Hildenbrand 		/*
292aad5f69bSDavid Hildenbrand 		 * TODO: ZONE_DEVICE support requires to identify
293aad5f69bSDavid Hildenbrand 		 * memmaps that were actually initialized.
294aad5f69bSDavid Hildenbrand 		 */
295aad5f69bSDavid Hildenbrand 		ppage = pfn_to_online_page(pfn);
29680ae2fdcSVladimir Davydov 
29780ae2fdcSVladimir Davydov 		if (ppage)
29880ae2fdcSVladimir Davydov 			ino = page_cgroup_ino(ppage);
29980ae2fdcSVladimir Davydov 		else
30080ae2fdcSVladimir Davydov 			ino = 0;
30180ae2fdcSVladimir Davydov 
30280ae2fdcSVladimir Davydov 		if (put_user(ino, out)) {
30380ae2fdcSVladimir Davydov 			ret = -EFAULT;
30480ae2fdcSVladimir Davydov 			break;
30580ae2fdcSVladimir Davydov 		}
30680ae2fdcSVladimir Davydov 
30780ae2fdcSVladimir Davydov 		pfn++;
30880ae2fdcSVladimir Davydov 		out++;
30980ae2fdcSVladimir Davydov 		count -= KPMSIZE;
310d3691d2cSVladimir Davydov 
311d3691d2cSVladimir Davydov 		cond_resched();
31280ae2fdcSVladimir Davydov 	}
31380ae2fdcSVladimir Davydov 
31480ae2fdcSVladimir Davydov 	*ppos += (char __user *)out - buf;
31580ae2fdcSVladimir Davydov 	if (!ret)
31680ae2fdcSVladimir Davydov 		ret = (char __user *)out - buf;
31780ae2fdcSVladimir Davydov 	return ret;
31880ae2fdcSVladimir Davydov }
31980ae2fdcSVladimir Davydov 
320*97a32539SAlexey Dobriyan static const struct proc_ops kpagecgroup_proc_ops = {
321*97a32539SAlexey Dobriyan 	.proc_lseek	= mem_lseek,
322*97a32539SAlexey Dobriyan 	.proc_read	= kpagecgroup_read,
32380ae2fdcSVladimir Davydov };
32480ae2fdcSVladimir Davydov #endif /* CONFIG_MEMCG */
32580ae2fdcSVladimir Davydov 
3266d80e53fSAlexey Dobriyan static int __init proc_page_init(void)
3276d80e53fSAlexey Dobriyan {
328*97a32539SAlexey Dobriyan 	proc_create("kpagecount", S_IRUSR, NULL, &kpagecount_proc_ops);
329*97a32539SAlexey Dobriyan 	proc_create("kpageflags", S_IRUSR, NULL, &kpageflags_proc_ops);
33080ae2fdcSVladimir Davydov #ifdef CONFIG_MEMCG
331*97a32539SAlexey Dobriyan 	proc_create("kpagecgroup", S_IRUSR, NULL, &kpagecgroup_proc_ops);
33280ae2fdcSVladimir Davydov #endif
3336d80e53fSAlexey Dobriyan 	return 0;
3346d80e53fSAlexey Dobriyan }
335abaf3787SPaul Gortmaker fs_initcall(proc_page_init);
336