Mirror of https://github.com/torvalds/linux.git, synced 2025-10-31 00:28:52 +02:00

Commit 91e40668e7
Convert page_table_check_p[mu]d_set(...) to page_table_check_p[mu]ds_set(..., nr)
to allow checking a contiguous set of pmds/puds in a single batch. We retain
page_table_check_p[mu]d_set(...) as macros that call the new batch functions
with nr=1 for compatibility.

arm64 is about to reorganise its pte/pmd/pud helpers to reuse more code and to
allow the implementation for huge_pte to more efficiently set ptes/pmds/puds in
batches. We need these batch-helpers to make the refactoring possible.

Reviewed-by: Anshuman Khandual <anshuman.khandual@arm.com>
Reviewed-by: Pasha Tatashin <pasha.tatashin@soleen.com>
Reviewed-by: Catalin Marinas <catalin.marinas@arm.com>
Signed-off-by: Ryan Roberts <ryan.roberts@arm.com>
Tested-by: Luiz Capitulino <luizcap@redhat.com>
Link: https://lore.kernel.org/r/20250422081822.1836315-4-ryan.roberts@arm.com
Signed-off-by: Will Deacon <will@kernel.org>
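Concretely, the compatibility shims the commit message describes take roughly
this shape (a sketch only; the exact definitions live in
include/linux/page_table_check.h, not in this file):

#define page_table_check_pmd_set(mm, pmdp, pmd)	\
	page_table_check_pmds_set(mm, pmdp, pmd, 1)
#define page_table_check_pud_set(mm, pudp, pud)	\
	page_table_check_puds_set(mm, pudp, pud, 1)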
mm/page_table_check.c · 275 lines · 6.7 KiB · C
// SPDX-License-Identifier: GPL-2.0

/*
 * Copyright (c) 2021, Google LLC.
 * Pasha Tatashin <pasha.tatashin@soleen.com>
 */
#include <linux/kstrtox.h>
#include <linux/mm.h>
#include <linux/page_table_check.h>
#include <linux/swap.h>
#include <linux/swapops.h>

#undef pr_fmt
#define pr_fmt(fmt)	"page_table_check: " fmt

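/*
 * Per-page mapcounts kept in the page_ext area: a page may be mapped as
 * anonymous or as file-backed, never both at once.
 */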
struct page_table_check {
	atomic_t anon_map_count;
	atomic_t file_map_count;
};

static bool __page_table_check_enabled __initdata =
				IS_ENABLED(CONFIG_PAGE_TABLE_CHECK_ENFORCED);

DEFINE_STATIC_KEY_TRUE(page_table_check_disabled);
EXPORT_SYMBOL(page_table_check_disabled);

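/*
 * Parse the "page_table_check" early boot parameter; the result, together
 * with CONFIG_PAGE_TABLE_CHECK_ENFORCED above, decides whether the static
 * branch is flipped at init time to enable checking.
 */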
static int __init early_page_table_check_param(char *buf)
{
	return kstrtobool(buf, &__page_table_check_enabled);
}

early_param("page_table_check", early_page_table_check_param);

static bool __init need_page_table_check(void)
{
	return __page_table_check_enabled;
}

static void __init init_page_table_check(void)
{
	if (!__page_table_check_enabled)
		return;
	static_branch_disable(&page_table_check_disabled);
}

struct page_ext_operations page_table_check_ops = {
	.size = sizeof(struct page_table_check),
	.need = need_page_table_check,
	.init = init_page_table_check,
	.need_shared_flags = false,
};

static struct page_table_check *get_page_table_check(struct page_ext *page_ext)
{
	BUG_ON(!page_ext);
	return page_ext_data(page_ext, &page_table_check_ops);
}

/*
 * An entry is removed from the page table; decrement the counters for that
 * page and verify that it is of the correct type and that the counters do
 * not become negative.
 */
static void page_table_check_clear(unsigned long pfn, unsigned long pgcnt)
{
	struct page_ext_iter iter;
	struct page_ext *page_ext;
	struct page *page;
	bool anon;

	if (!pfn_valid(pfn))
		return;

	page = pfn_to_page(pfn);
	BUG_ON(PageSlab(page));
	anon = PageAnon(page);

	rcu_read_lock();
	for_each_page_ext(page, pgcnt, page_ext, iter) {
		struct page_table_check *ptc = get_page_table_check(page_ext);

		if (anon) {
			BUG_ON(atomic_read(&ptc->file_map_count));
			BUG_ON(atomic_dec_return(&ptc->anon_map_count) < 0);
		} else {
			BUG_ON(atomic_read(&ptc->anon_map_count));
			BUG_ON(atomic_dec_return(&ptc->file_map_count) < 0);
		}
	}
	rcu_read_unlock();
}

/*
 * A new entry is added to the page table; increment the counters for that
 * page and verify that it is of the correct type and is not being mapped
 * with a different type to a different process.
 */
static void page_table_check_set(unsigned long pfn, unsigned long pgcnt,
				 bool rw)
{
	struct page_ext_iter iter;
	struct page_ext *page_ext;
	struct page *page;
	bool anon;

	if (!pfn_valid(pfn))
		return;

	page = pfn_to_page(pfn);
	BUG_ON(PageSlab(page));
	anon = PageAnon(page);

	rcu_read_lock();
	for_each_page_ext(page, pgcnt, page_ext, iter) {
		struct page_table_check *ptc = get_page_table_check(page_ext);

		if (anon) {
			BUG_ON(atomic_read(&ptc->file_map_count));
			BUG_ON(atomic_inc_return(&ptc->anon_map_count) > 1 && rw);
		} else {
			BUG_ON(atomic_read(&ptc->anon_map_count));
			BUG_ON(atomic_inc_return(&ptc->file_map_count) < 0);
		}
	}
	rcu_read_unlock();
}

/*
 * The page is on the free list, or is being allocated; verify that the
 * counters are zero and crash if they are not.
 */
void __page_table_check_zero(struct page *page, unsigned int order)
{
	struct page_ext_iter iter;
	struct page_ext *page_ext;

	BUG_ON(PageSlab(page));

	rcu_read_lock();
	for_each_page_ext(page, 1 << order, page_ext, iter) {
		struct page_table_check *ptc = get_page_table_check(page_ext);

		BUG_ON(atomic_read(&ptc->anon_map_count));
		BUG_ON(atomic_read(&ptc->file_map_count));
	}
	rcu_read_unlock();
}

void __page_table_check_pte_clear(struct mm_struct *mm, pte_t pte)
{
	if (&init_mm == mm)
		return;

	if (pte_user_accessible_page(pte)) {
		page_table_check_clear(pte_pfn(pte), PAGE_SIZE >> PAGE_SHIFT);
	}
}
EXPORT_SYMBOL(__page_table_check_pte_clear);

void __page_table_check_pmd_clear(struct mm_struct *mm, pmd_t pmd)
{
	if (&init_mm == mm)
		return;

	if (pmd_user_accessible_page(pmd)) {
		page_table_check_clear(pmd_pfn(pmd), PMD_SIZE >> PAGE_SHIFT);
	}
}
EXPORT_SYMBOL(__page_table_check_pmd_clear);

void __page_table_check_pud_clear(struct mm_struct *mm, pud_t pud)
{
	if (&init_mm == mm)
		return;

	if (pud_user_accessible_page(pud)) {
		page_table_check_clear(pud_pfn(pud), PUD_SIZE >> PAGE_SHIFT);
	}
}
EXPORT_SYMBOL(__page_table_check_pud_clear);

/* Whether the swap entry cached writable information */
static inline bool swap_cached_writable(swp_entry_t entry)
{
	return is_writable_device_private_entry(entry) ||
	       is_writable_migration_entry(entry);
}

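/*
 * A uffd-wp protected entry must not be writable; for non-present entries
 * the writability is cached in the swap entry itself.
 */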
static inline void page_table_check_pte_flags(pte_t pte)
{
	if (pte_present(pte) && pte_uffd_wp(pte))
		WARN_ON_ONCE(pte_write(pte));
	else if (is_swap_pte(pte) && pte_swp_uffd_wp(pte))
		WARN_ON_ONCE(swap_cached_writable(pte_to_swp_entry(pte)));
}

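/*
 * Account a contiguous batch of nr ptes: drop the accounting for whatever
 * each slot previously mapped, then account the new mapping once per page.
 */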
void __page_table_check_ptes_set(struct mm_struct *mm, pte_t *ptep, pte_t pte,
		unsigned int nr)
{
	unsigned int i;

	if (&init_mm == mm)
		return;

	page_table_check_pte_flags(pte);

	for (i = 0; i < nr; i++)
		__page_table_check_pte_clear(mm, ptep_get(ptep + i));
	if (pte_user_accessible_page(pte))
		page_table_check_set(pte_pfn(pte), nr, pte_write(pte));
}
EXPORT_SYMBOL(__page_table_check_ptes_set);

static inline void page_table_check_pmd_flags(pmd_t pmd)
{
	if (pmd_present(pmd) && pmd_uffd_wp(pmd))
		WARN_ON_ONCE(pmd_write(pmd));
	else if (is_swap_pmd(pmd) && pmd_swp_uffd_wp(pmd))
		WARN_ON_ONCE(swap_cached_writable(pmd_to_swp_entry(pmd)));
}

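/*
 * Like the pte variant, but each pmd covers PMD_SIZE >> PAGE_SHIFT base
 * pages, so the accounting spans stride * nr pages.
 */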
void __page_table_check_pmds_set(struct mm_struct *mm, pmd_t *pmdp, pmd_t pmd,
		unsigned int nr)
{
	unsigned long stride = PMD_SIZE >> PAGE_SHIFT;
	unsigned int i;

	if (&init_mm == mm)
		return;

	page_table_check_pmd_flags(pmd);

	for (i = 0; i < nr; i++)
		__page_table_check_pmd_clear(mm, *(pmdp + i));
	if (pmd_user_accessible_page(pmd))
		page_table_check_set(pmd_pfn(pmd), stride * nr, pmd_write(pmd));
}
EXPORT_SYMBOL(__page_table_check_pmds_set);

void __page_table_check_puds_set(struct mm_struct *mm, pud_t *pudp, pud_t pud,
		unsigned int nr)
{
	unsigned long stride = PUD_SIZE >> PAGE_SHIFT;
	unsigned int i;

	if (&init_mm == mm)
		return;

	for (i = 0; i < nr; i++)
		__page_table_check_pud_clear(mm, *(pudp + i));
	if (pud_user_accessible_page(pud))
		page_table_check_set(pud_pfn(pud), stride * nr, pud_write(pud));
}
EXPORT_SYMBOL(__page_table_check_puds_set);

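/*
 * A pte table mapped by pmd is going away; drop the accounting for all
 * PTRS_PER_PTE entries it contains.
 */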
void __page_table_check_pte_clear_range(struct mm_struct *mm,
					unsigned long addr,
					pmd_t pmd)
{
	if (&init_mm == mm)
		return;

	if (!pmd_bad(pmd) && !pmd_leaf(pmd)) {
		pte_t *ptep = pte_offset_map(&pmd, addr);
		unsigned long i;

		if (WARN_ON(!ptep))
			return;
		for (i = 0; i < PTRS_PER_PTE; i++) {
			__page_table_check_pte_clear(mm, ptep_get(ptep));
			addr += PAGE_SIZE;
			ptep++;
		}
		pte_unmap(ptep - PTRS_PER_PTE);
	}
}
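
For context, here is a minimal sketch of the kind of batch caller these
helpers enable; example_set_ptes() and its body are illustrative, not from
this file, though the generic set_ptes() in <linux/pgtable.h> follows a
similar pattern:

/* Hypothetical batch setter: one batched check, then nr contiguous writes. */
static inline void example_set_ptes(struct mm_struct *mm, unsigned long addr,
				    pte_t *ptep, pte_t pte, unsigned int nr)
{
	page_table_check_ptes_set(mm, ptep, pte, nr);	/* checks all nr entries */
	for (;;) {
		set_pte(ptep, pte);
		if (--nr == 0)
			break;
		ptep++;
		pte = pte_advance_pfn(pte, 1);	/* next pfn in the batch */
	}
}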