!6439 v3 m: convert mm's rss stats to use atomic mode (7e5b7bd6) · Commits · EulixOS / Software / Kernel

include/linux/mm.h

+43 −7

Original line number	Diff line number	Diff line
		@@ -2581,30 +2581,66 @@ static inline bool get_user_page_fast_only(unsigned long addr,
		*/
		static inline unsigned long get_mm_counter(struct mm_struct *mm, int member)
		{
		return percpu_counter_read_positive(&mm->rss_stat[member]);
		struct percpu_counter *fbc = &mm->rss_stat[member];

		if (percpu_counter_initialized(fbc))
		return percpu_counter_read_positive(fbc);

		return percpu_counter_atomic_read(fbc);
		}

		void mm_trace_rss_stat(struct mm_struct *mm, int member);

		static inline void add_mm_counter(struct mm_struct *mm, int member, long value)
		{
		percpu_counter_add(&mm->rss_stat[member], value);
		struct percpu_counter *fbc = &mm->rss_stat[member];

		if (percpu_counter_initialized(fbc))
		percpu_counter_add(fbc, value);
		else
		percpu_counter_atomic_add(fbc, value);

		mm_trace_rss_stat(mm, member);
		}

		static inline void inc_mm_counter(struct mm_struct *mm, int member)
		{
		percpu_counter_inc(&mm->rss_stat[member]);

		mm_trace_rss_stat(mm, member);
		add_mm_counter(mm, member, 1);
		}

		static inline void dec_mm_counter(struct mm_struct *mm, int member)
		{
		percpu_counter_dec(&mm->rss_stat[member]);
		add_mm_counter(mm, member, -1);
		}

		mm_trace_rss_stat(mm, member);
		/*
		 * Return the value of rss counter @member of @mm: percpu_counter_sum()
		 * when percpu_counter_initialized() reports true for the counter,
		 * otherwise the value read via percpu_counter_atomic_read().
		 */
		static inline s64 mm_counter_sum(struct mm_struct *mm, int member)
		{
			struct percpu_counter *counter = &mm->rss_stat[member];

			return percpu_counter_initialized(counter) ?
				percpu_counter_sum(counter) :
				percpu_counter_atomic_read(counter);
		}

		/*
		 * Like mm_counter_sum(), but uses percpu_counter_sum_positive() when
		 * the counter is initialized for percpu use. A counter that is not
		 * initialized is read via percpu_counter_atomic_read() unchanged.
		 */
		static inline s64 mm_counter_sum_positive(struct mm_struct *mm, int member)
		{
			struct percpu_counter *counter = &mm->rss_stat[member];

			/* Atomic mode: no per-CPU deltas to fold in. */
			if (!percpu_counter_initialized(counter))
				return percpu_counter_atomic_read(counter);

			return percpu_counter_sum_positive(counter);
		}

		/*
		 * Switch all NR_MM_COUNTERS rss counters of @mm to percpu mode.
		 * Returns whatever percpu_counter_switch_to_pcpu_many() returns.
		 */
		static inline int mm_counter_switch_to_pcpu(struct mm_struct *mm)
		{
			struct percpu_counter *counters = mm->rss_stat;

			return percpu_counter_switch_to_pcpu_many(counters, NR_MM_COUNTERS);
		}

		/* Destroy all NR_MM_COUNTERS rss counters embedded in @mm. */
		static inline void mm_counter_destroy(struct mm_struct *mm)
		{
			struct percpu_counter *counters = mm->rss_stat;

			percpu_counter_destroy_many(counters, NR_MM_COUNTERS);
		}

		/* Optimized variant when folio is already known not to be anon */

include/linux/percpu_counter.h

+45 −3

Original line number	Diff line number	Diff line
		@@ -21,7 +21,18 @@

		struct percpu_counter {
		raw_spinlock_t lock;
		/*
		* Depending on whether counters is NULL, two modes are supported:
		* atomic mode, which uses count_atomic, and percpu mode, which uses
		* count.
		* Single-threaded processes should use atomic mode to reduce
		* memory consumption and avoid a performance regression.
		* Multi-threaded processes should use percpu mode to reduce the
		* error margin.
		*/
		union {
		s64 count;
		atomic64_t count_atomic;
		};
		#ifdef CONFIG_HOTPLUG_CPU
		struct list_head list; /* All percpu_counters are on a list */
		#endif
		@@ -32,14 +43,14 @@ extern int percpu_counter_batch;

		int __percpu_counter_init_many(struct percpu_counter *fbc, s64 amount,
		gfp_t gfp, u32 nr_counters,
		struct lock_class_key *key);
		struct lock_class_key *key, bool switch_mode);

		#define percpu_counter_init_many(fbc, value, gfp, nr_counters) \
		({ \
		static struct lock_class_key __key; \
		\
		__percpu_counter_init_many(fbc, value, gfp, nr_counters,\
		&__key); \
		&__key, false); \
		})


		@@ -121,6 +132,20 @@ static inline bool percpu_counter_initialized(struct percpu_counter *fbc)
		return (fbc->counters != NULL);
		}

		/* Read the atomic-mode value (count_atomic) of @fbc. */
		static inline s64 percpu_counter_atomic_read(struct percpu_counter *fbc)
		{
			s64 value = atomic64_read(&fbc->count_atomic);

			return value;
		}

		/* Atomically add @amount to the atomic-mode value (count_atomic) of @fbc. */
		static inline void
		percpu_counter_atomic_add(struct percpu_counter *fbc, s64 amount)
		{
			atomic64_t *cnt = &fbc->count_atomic;

			atomic64_add(amount, cnt);
		}

		int percpu_counter_switch_to_pcpu_many(struct percpu_counter *fbc,
		u32 nr_counters);

		#else /* !CONFIG_SMP */

		struct percpu_counter {
		@@ -230,6 +255,23 @@ static inline bool percpu_counter_initialized(struct percpu_counter *fbc)
		static inline void percpu_counter_sync(struct percpu_counter *fbc)
		{
		}

		/* !CONFIG_SMP variant: the counter value is the plain count field. */
		static inline s64 percpu_counter_atomic_read(struct percpu_counter *fbc)
		{
			s64 value = fbc->count;

			return value;
		}

		/*
		 * !CONFIG_SMP variant: there is no separate atomic mode here, so the
		 * add is forwarded to percpu_counter_add().
		 */
		static inline void percpu_counter_atomic_add(struct percpu_counter *fbc,
		s64 amount)
		{
		percpu_counter_add(fbc, amount);
		}

		/*
		 * !CONFIG_SMP stub: performs no mode switch and always reports
		 * success (0). Both arguments are unused.
		 */
		static inline int percpu_counter_switch_to_pcpu_many(struct percpu_counter *fbc,
		u32 nr_counters)
		{
		return 0;
		}
		#endif /* CONFIG_SMP */

		static inline void percpu_counter_inc(struct percpu_counter *fbc)

include/trace/events/kmem.h

+2 −2

Original line number	Diff line number	Diff line
		@@ -361,7 +361,7 @@ TRACE_EVENT(rss_stat,
		__entry->mm_id = mm_ptr_to_hash(mm);
		__entry->curr = !!(current->mm == mm);
		__entry->member = member;
		__entry->size = (percpu_counter_sum_positive(&mm->rss_stat[member])
		__entry->size = (mm_counter_sum_positive(mm, member)
		<< PAGE_SHIFT);
		),

kernel/fork.c

+12 −8

Original line number	Diff line number	Diff line
		@@ -853,7 +853,7 @@ static void check_mm(struct mm_struct *mm)
		"Please make sure 'struct resident_page_types[]' is updated as well");

		for (i = 0; i < NR_MM_COUNTERS; i++) {
		long x = percpu_counter_sum(&mm->rss_stat[i]);
		long x = mm_counter_sum(mm, i);

		if (unlikely(x))
		pr_alert("BUG: Bad rss-counter state mm:%p type:%s val:%ld\n",
		@@ -954,7 +954,7 @@ void __mmdrop(struct mm_struct *mm)
		put_user_ns(mm->user_ns);
		mm_pasid_drop(mm);
		mm_destroy_cid(mm);
		percpu_counter_destroy_many(mm->rss_stat, NR_MM_COUNTERS);
		mm_counter_destroy(mm);

		free_mm(mm);
		}
		@@ -1357,17 +1357,11 @@ static struct mm_struct mm_init(struct mm_struct mm, struct task_struct *p,
		if (mm_alloc_cid(mm))
		goto fail_cid;

		if (percpu_counter_init_many(mm->rss_stat, 0, GFP_KERNEL_ACCOUNT,
		NR_MM_COUNTERS))
		goto fail_pcpu;

		sp_init_mm(mm);
		mm->user_ns = get_user_ns(user_ns);
		lru_gen_init_mm(mm);
		return mm;

		fail_pcpu:
		mm_destroy_cid(mm);
		fail_cid:
		destroy_context(mm);
		fail_nocontext:
		@@ -1783,6 +1777,16 @@ static int copy_mm(unsigned long clone_flags, struct task_struct *tsk)
		if (!oldmm)
		return 0;

		/*
		* For single-thread processes, rss_stat is in atomic mode, which
		* reduces the memory consumption and performance regression caused by
		* using percpu. For multiple-thread processes, rss_stat is switched to
		* the percpu mode to reduce the error margin.
		*/
		if (clone_flags & CLONE_THREAD)
		if (mm_counter_switch_to_pcpu(oldmm))
		return -ENOMEM;

		if (clone_flags & CLONE_VM) {
		mmget(oldmm);
		mm = oldmm;

lib/percpu_counter.c

+33 −2

Original line number	Diff line number	Diff line
		@@ -153,7 +153,7 @@ EXPORT_SYMBOL(__percpu_counter_sum);

		int __percpu_counter_init_many(struct percpu_counter *fbc, s64 amount,
		gfp_t gfp, u32 nr_counters,
		struct lock_class_key *key)
		struct lock_class_key *key, bool switch_mode)
		{
		unsigned long flags __maybe_unused;
		size_t counter_size;
		@@ -174,6 +174,7 @@ int __percpu_counter_init_many(struct percpu_counter *fbc, s64 amount,
		#ifdef CONFIG_HOTPLUG_CPU
		INIT_LIST_HEAD(&fbc[i].list);
		#endif
		if (likely(!switch_mode))
		fbc[i].count = amount;
		fbc[i].counters = (void )counters + (i counter_size);

		@@ -278,6 +279,36 @@ int __percpu_counter_compare(struct percpu_counter *fbc, s64 rhs, s32 batch)
		}
		EXPORT_SYMBOL(__percpu_counter_compare);

		/*
		 * percpu_counter_switch_to_pcpu_many: Converts struct percpu_counters from
		 * atomic mode to percpu mode.
		 *
		 * @fbc: first counter of the array to convert
		 * @nr_counters: number of counters in the array
		 *
		 * Return: 0 if the counters are already in percpu mode or were
		 * successfully switched to percpu mode; otherwise the negative error
		 * code returned by __percpu_counter_init_many() (-ENOMEM if the percpu
		 * memory allocation fails), in which case the counters are still in
		 * atomic mode.
		 */
		int percpu_counter_switch_to_pcpu_many(struct percpu_counter *fbc,
						       u32 nr_counters)
		{
			static struct lock_class_key __key;
			unsigned long flags;
			/* Must be int: a bool would collapse a negative errno to 1. */
			int ret = 0;

			/* Fast path: only the first counter is tested for percpu mode. */
			if (percpu_counter_initialized(fbc))
				return 0;

			preempt_disable();
			local_irq_save(flags);
			/*
			 * Re-check with preemption and IRQs disabled. switch_mode == true
			 * tells the init helper not to overwrite the existing count.
			 */
			if (likely(!percpu_counter_initialized(fbc)))
				ret = __percpu_counter_init_many(fbc, 0,
						GFP_ATOMIC | __GFP_NOWARN | __GFP_ZERO,
						nr_counters, &__key, true);
			local_irq_restore(flags);
			preempt_enable();

			return ret;
		}

		static int __init percpu_counter_startup(void)
		{
		int ret;