lists.openwall.net   lists  /  announce  owl-users  owl-dev  john-users  john-dev  passwdqc-users  yescrypt  popa3d-users  /  oss-security  kernel-hardening  musl  sabotage  tlsify  passwords  /  crypt-dev  xvendor  /  Bugtraq  Full-Disclosure  linux-kernel  linux-netdev  linux-ext4  linux-hardening  linux-cve-announce  PHC 
Open Source and information security mailing list archives
 
Hash Suite: Windows password security audit tool. GUI, reports in PDF.
[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <Z5PvNqjv5lopk7ko@slm.duckdns.org>
Date: Fri, 24 Jan 2025 09:51:18 -1000
From: Tejun Heo <tj@...nel.org>
To: Andrea Righi <arighi@...dia.com>
Cc: David Vernet <void@...ifault.com>, Changwoo Min <changwoo@...lia.com>,
	Yury Norov <yury.norov@...il.com>, linux-kernel@...r.kernel.org
Subject: Re: [PATCH sched_ext/for-6.14] sched_ext: Move built-in idle CPU
 selection policy to a separate file

Hello,

On Thu, Jan 23, 2025 at 11:02:02PM +0100, Andrea Righi wrote:
...
> diff --git a/MAINTAINERS b/MAINTAINERS
> index 023df277737d..cd3d5b139a11 100644
> --- a/MAINTAINERS
> +++ b/MAINTAINERS
> @@ -20935,6 +20935,8 @@ T:	git://git.kernel.org/pub/scm/linux/kernel/git/tj/sched_ext.git
>  F:	include/linux/sched/ext.h
>  F:	kernel/sched/ext.h
>  F:	kernel/sched/ext.c
> +F:	kernel/sched/ext_idle.c
> +F:	kernel/sched/ext_idle.h

Maybe kernel/sched/ext*?

> diff --git a/kernel/sched/ext.c b/kernel/sched/ext.c
> index 564f250e7689..a24d48cebfb7 100644
> --- a/kernel/sched/ext.c
> +++ b/kernel/sched/ext.c
...
> @@ -896,6 +893,17 @@ static struct static_key_false scx_has_op[SCX_OPI_END] =
>  static atomic_t scx_exit_kind = ATOMIC_INIT(SCX_EXIT_DONE);
>  static struct scx_exit_info *scx_exit_info;
>  
> +#define scx_ops_error_kind(err, fmt, args...)					\
> +	scx_ops_exit_kind((err), 0, fmt, ##args)
> +
> +#define scx_ops_exit(code, fmt, args...)					\
> +	scx_ops_exit_kind(SCX_EXIT_UNREG_KERN, (code), fmt, ##args)
> +
> +#define scx_ops_error(fmt, args...)						\
> +	scx_ops_error_kind(SCX_EXIT_ERROR, fmt, ##args)
> +
> +#define SCX_HAS_OP(op)	static_branch_likely(&scx_has_op[SCX_OP_IDX(op)])
> +

This chunk is no longer necessary, right?

...
> @@ -7750,12 +7037,6 @@ BTF_ID_FLAGS(func, scx_bpf_nr_cpu_ids)
>  BTF_ID_FLAGS(func, scx_bpf_get_possible_cpumask, KF_ACQUIRE)
>  BTF_ID_FLAGS(func, scx_bpf_get_online_cpumask, KF_ACQUIRE)
>  BTF_ID_FLAGS(func, scx_bpf_put_cpumask, KF_RELEASE)
> -BTF_ID_FLAGS(func, scx_bpf_get_idle_cpumask, KF_ACQUIRE)
> -BTF_ID_FLAGS(func, scx_bpf_get_idle_smtmask, KF_ACQUIRE)
> -BTF_ID_FLAGS(func, scx_bpf_put_idle_cpumask, KF_RELEASE)
> -BTF_ID_FLAGS(func, scx_bpf_test_and_clear_cpu_idle)
> -BTF_ID_FLAGS(func, scx_bpf_pick_idle_cpu, KF_RCU)
> -BTF_ID_FLAGS(func, scx_bpf_pick_any_cpu, KF_RCU)

So, these were in ids_any and could be called from any BPF progs.

> diff --git a/kernel/sched/ext_idle.c b/kernel/sched/ext_idle.c
> new file mode 100644
> index 000000000000..ca99fc58af91
> --- /dev/null
> +++ b/kernel/sched/ext_idle.c
...
> +BTF_KFUNCS_START(scx_kfunc_ids_select_cpu)
> +BTF_ID_FLAGS(func, scx_bpf_select_cpu_dfl, KF_RCU)
> +BTF_ID_FLAGS(func, scx_bpf_get_idle_cpumask, KF_ACQUIRE)
> +BTF_ID_FLAGS(func, scx_bpf_get_idle_smtmask, KF_ACQUIRE)
> +BTF_ID_FLAGS(func, scx_bpf_put_idle_cpumask, KF_RELEASE)
> +BTF_ID_FLAGS(func, scx_bpf_test_and_clear_cpu_idle)
> +BTF_ID_FLAGS(func, scx_bpf_pick_idle_cpu, KF_RCU)
> +BTF_ID_FLAGS(func, scx_bpf_pick_any_cpu, KF_RCU)
> +BTF_KFUNCS_END(scx_kfunc_ids_select_cpu)

But they get moved into ids_select_cpu and can only be called from
struct_ops. Also, we currently don't use kfunc id sets directly to decide
which kfunc may be called from which ops but that may change in the future
too. Just create a separate ids and register directly from an init function?

...
> diff --git a/kernel/sched/ext_idle.h b/kernel/sched/ext_idle.h
> new file mode 100644
> index 000000000000..c1385af1ceeb
> --- /dev/null
> +++ b/kernel/sched/ext_idle.h
...
> +#ifdef CONFIG_SMP
> +static DEFINE_STATIC_KEY_FALSE(scx_selcpu_topo_llc);
> +static DEFINE_STATIC_KEY_FALSE(scx_selcpu_topo_numa);
> +
> +static void update_selcpu_topology(void);
> +static void reset_idle_masks(void);
> +static void init_idle_masks(void);
> +static bool test_and_clear_cpu_idle(int cpu);
> +
> +static s32 scx_pick_idle_cpu(const struct cpumask *cpus_allowed, u64 flags);
> +static s32 scx_select_cpu_dfl(struct task_struct *p,
> +			      s32 prev_cpu, u64 wake_flags, bool *found);

The way scheudler code is built is weird but let's keep it as close to usual
h/c splits - make them extern prototypes and prefix them with scx_. Also,
maybe name them to explicitly show that they deal with bulitin idle
handling?

Thanks.

-- 
tejun

Powered by blists - more mailing lists

Powered by Openwall GNU/*/Linux Powered by OpenVZ