mm: add pte_batch_hint() to reduce scanning in folio_pte_batch() (6db18de4) · Commits · EulixOS / Software / Kernel

include/linux/pgtable.h

+21 −0

Original line number	Diff line number	Diff line
		@@ -205,6 +205,27 @@ static inline int pmd_young(pmd_t pmd)
		#define arch_flush_lazy_mmu_mode() do {} while (0)
		#endif

		#ifndef pte_batch_hint
		/**
		 * pte_batch_hint - Count of pages that may join a batch without being scanned.
		 * @ptep: Page table pointer for the entry.
		 * @pte: Page table entry.
		 *
		 * An architecture may know that a run of contiguous ptes maps the same
		 * contiguous memory with identical permissions. When it does, it can report
		 * that through this hint so that core pte-batching code does not have to
		 * inspect every pte individually.
		 *
		 * Constraints on an architecture implementation: it is allowed to disregard
		 * the PTE accessed state, but the dirty state must apply atomically to all
		 * the PTEs that the hint describes.
		 *
		 * An architecture overrides this by defining pte_batch_hint; when it does
		 * not, this generic fallback is used.
		 *
		 * Return: the hint as a number of pages; the generic fallback always
		 * returns 1.
		 */
		static inline unsigned int pte_batch_hint(pte_t *ptep, pte_t pte)
		{
			/* Generic fallback: no architecture hint, so report a single page. */
			return 1;
		}
		#endif

		#ifndef pte_advance_pfn
		static inline pte_t pte_advance_pfn(pte_t pte, unsigned long nr)
		{

+12 −7

Original line number	Diff line number	Diff line
		@@ -993,16 +993,20 @@ static inline int folio_pte_batch(struct folio *folio, unsigned long addr,
		{
		unsigned long folio_end_pfn = folio_pfn(folio) + folio_nr_pages(folio);
		const pte_t *end_ptep = start_ptep + max_nr;
		pte_t expected_pte = __pte_batch_clear_ignored(pte_next_pfn(pte), flags);
		pte_t *ptep = start_ptep + 1;
		pte_t expected_pte, *ptep;
		bool writable;
		int nr;

		if (any_writable)
		*any_writable = false;

		VM_WARN_ON_FOLIO(!pte_present(pte), folio);

		while (ptep != end_ptep) {
		nr = pte_batch_hint(start_ptep, pte);
		expected_pte = __pte_batch_clear_ignored(pte_advance_pfn(pte, nr), flags);
		ptep = start_ptep + nr;

		while (ptep < end_ptep) {
		pte = ptep_get(ptep);
		if (any_writable)
		writable = !!pte_write(pte);
		@@ -1016,17 +1020,18 @@ static inline int folio_pte_batch(struct folio *folio, unsigned long addr,
		* corner cases the next PFN might fall into a different
		* folio.
		*/
		if (pte_pfn(pte) == folio_end_pfn)
		if (pte_pfn(pte) >= folio_end_pfn)
		break;

		if (any_writable)
		*any_writable |= writable;

		expected_pte = pte_next_pfn(expected_pte);
		ptep++;
		nr = pte_batch_hint(ptep, pte);
		expected_pte = pte_advance_pfn(expected_pte, nr);
		ptep += nr;
		}

		return ptep - start_ptep;
		return min(ptep - start_ptep, max_nr);
		}

		/*