[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <20251009195024.GL3289052@noisy.programming.kicks-ass.net>
Date: Thu, 9 Oct 2025 21:50:24 +0200
From: Peter Zijlstra <peterz@...radead.org>
To: Oleg Nesterov <oleg@...hat.com>
Cc: Linus Torvalds <torvalds@...ux-foundation.org>,
Alexander Viro <viro@...iv.linux.org.uk>,
Boqun Feng <boqun.feng@...il.com>,
David Howells <dhowells@...hat.com>, Ingo Molnar <mingo@...hat.com>,
Li RongQing <lirongqing@...du.com>,
Waiman Long <longman@...hat.com>, Will Deacon <will@...nel.org>,
linux-kernel@...r.kernel.org
Subject: Re: [PATCH v2 1/4] seqlock: introduce scoped_seqlock_read() and
scoped_seqlock_read_irqsave()
On Thu, Oct 09, 2025 at 04:37:49PM +0200, Oleg Nesterov wrote:
> Let me think a bit more before I send V3...
How do we feel about something a little like so?
diff --git a/include/linux/seqlock.h b/include/linux/seqlock.h
index 5ce48eab7a2a..9786b8d14164 100644
--- a/include/linux/seqlock.h
+++ b/include/linux/seqlock.h
@@ -1209,4 +1209,85 @@ done_seqretry_irqrestore(seqlock_t *lock, int seq, unsigned long flags)
if (seq & 1)
read_sequnlock_excl_irqrestore(lock, flags);
}
+
+enum ss_state { /* progress of one scoped read loop, stored in struct ss_tmp::state */
+ sss_done = 0, /* terminal: the loop condition in __scoped_seqlock_read() stops here */
+ sss_locked, /* set by __scoped_seqlock_next() right after it took the spinlock */
+ sss_lockless, /* initial state; the pass is validated with read_seqretry() */
+};
+
+enum ss_type { /* what __scoped_seqlock_next() does when read_seqretry() asks for a retry */
+ ss_lockless, /* re-sample the sequence with read_seqbegin() and stay lockless */
+ ss_lock, /* take the seqlock's spinlock with spin_lock() */
+ ss_lock_irqsave, /* take the seqlock's spinlock with spin_lock_irqsave() */
+};
+
+struct ss_tmp { /* loop-local bookkeeping declared by __scoped_seqlock_read() */
+ enum ss_type type; /* retry policy supplied by the macro caller */
+ enum ss_state state; /* the loop keeps running while this is not sss_done */
+ int seq; /* value from read_seqbegin(), later checked by read_seqretry() */
+ unsigned long flags; /* filled by spin_lock_irqsave(), consumed by spin_unlock_irqrestore() */
+ spinlock_t *lock; /* NULL until a lock is taken; cleanup unlocks it when set */
+};
+
+static inline void __scoped_seqlock_cleanup(struct ss_tmp *sst)
+{
+	spinlock_t *held = sst->lock;	/* stays NULL unless __scoped_seqlock_next() locked */
+
+	if (held == NULL)
+		return;
+	/* Release with the variant that matches how the lock was acquired. */
+	if (sst->type == ss_lock_irqsave)
+		spin_unlock_irqrestore(held, sst->flags);
+	else
+		spin_unlock(held);
+}
+
+static inline void	/* loop step of __scoped_seqlock_read(): choose the next state */
+__scoped_seqlock_next(struct ss_tmp *sst, seqlock_t *lock)
+{
+	switch (sst->state) {
+	case sss_lockless:
+		if (!read_seqretry(lock, sst->seq)) {	/* lockless pass needs no retry */
+			sst->state = sss_done;
+			return;
+		}
+		/* Retry required: act according to the type the caller selected. */
+		switch (sst->type) {
+		case ss_lock:
+			sst->lock = &lock->lock;	/* recorded so cleanup can unlock it */
+			spin_lock(sst->lock);
+			sst->state = sss_locked;
+			return;
+
+		case ss_lock_irqsave:
+			sst->lock = &lock->lock;	/* recorded so cleanup can unlock it */
+			spin_lock_irqsave(sst->lock, sst->flags);
+			sst->state = sss_locked;
+			return;
+
+		case ss_lockless:
+			sst->seq = read_seqbegin(lock);	/* stay lockless, re-sample */
+			return;
+		}
+		BUG();	/* unknown ss_type: trap rather than fall into sss_locked */
+	case sss_locked:
+		sst->state = sss_done;	/* the pass made under the lock is the last one */
+		return;
+
+	case sss_done:
+		BUG();	/* the loop condition never steps a finished loop */
+	}
+}
+
+#define __scoped_seqlock_read(_seqlock, _type, _s) /* for-loop head; _s names the hidden struct ss_tmp */ \
+ for (struct ss_tmp _s __cleanup(__scoped_seqlock_cleanup) = { /* __scoped_seqlock_cleanup is the __cleanup handler of _s */ \
+ .type = _type, .state = sss_lockless, /* every loop starts in the lockless state */ \
+ .seq = read_seqbegin(_seqlock), .lock = NULL }; /* no lock held yet */ \
+ _s.state != sss_done; /* body runs until the state machine reports done */ \
+ __scoped_seqlock_next(&_s, _seqlock)) /* advance the state after each pass of the body */
+
+#define scoped_seqlock_read(_seqlock, _type) /* _type is stored in the enum ss_type field of the loop state */ \
+ __scoped_seqlock_read(_seqlock, _type, __UNIQUE_ID(seqlock)) /* state variable is named via __UNIQUE_ID() */
+
#endif /* __LINUX_SEQLOCK_H */
diff --git a/kernel/sched/cputime.c b/kernel/sched/cputime.c
index 7097de2c8cda..d2b3f987c888 100644
--- a/kernel/sched/cputime.c
+++ b/kernel/sched/cputime.c
@@ -313,10 +313,8 @@ static u64 read_sum_exec_runtime(struct task_struct *t)
void thread_group_cputime(struct task_struct *tsk, struct task_cputime *times)
{
struct signal_struct *sig = tsk->signal;
- u64 utime, stime;
struct task_struct *t;
- unsigned int seq, nextseq;
- unsigned long flags;
+ u64 utime, stime;
/*
* Update current task runtime to account pending time since last
@@ -329,27 +327,19 @@ void thread_group_cputime(struct task_struct *tsk, struct task_cputime *times)
if (same_thread_group(current, tsk))
(void) task_sched_runtime(current);
- rcu_read_lock();
- /* Attempt a lockless read on the first round. */
- nextseq = 0;
- do {
- seq = nextseq;
- flags = read_seqbegin_or_lock_irqsave(&sig->stats_lock, &seq);
+ guard(rcu)();
+ scoped_seqlock_read(&sig->stats_lock, ss_lock_irqsave) {
times->utime = sig->utime;
times->stime = sig->stime;
times->sum_exec_runtime = sig->sum_sched_runtime;
- for_each_thread(tsk, t) {
+ __for_each_thread(sig, t) {
task_cputime(t, &utime, &stime);
times->utime += utime;
times->stime += stime;
times->sum_exec_runtime += read_sum_exec_runtime(t);
}
- /* If lockless access failed, take the lock. */
- nextseq = 1;
- } while (need_seqretry(&sig->stats_lock, seq));
- done_seqretry_irqrestore(&sig->stats_lock, seq, flags);
- rcu_read_unlock();
+ }
}
#ifdef CONFIG_IRQ_TIME_ACCOUNTING
Powered by blists - more mailing lists