[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-Id: <20240508085217.5094c121f0d8cc1593cb1b75@kernel.org>
Date: Wed, 8 May 2024 08:52:17 +0900
From: Masami Hiramatsu (Google) <mhiramat@...nel.org>
To: Mike Rapoport <rppt@...nel.org>
Cc: linux-kernel@...r.kernel.org, Alexandre Ghiti <alexghiti@...osinc.com>,
Andrew Morton <akpm@...ux-foundation.org>, Björn Töpel
<bjorn@...nel.org>, Catalin Marinas <catalin.marinas@....com>, Christophe
Leroy <christophe.leroy@...roup.eu>, "David S. Miller"
<davem@...emloft.net>, Dinh Nguyen <dinguyen@...nel.org>, Donald Dutile
<ddutile@...hat.com>, Eric Chanudet <echanude@...hat.com>, Heiko Carstens
<hca@...ux.ibm.com>, Helge Deller <deller@....de>, Huacai Chen
<chenhuacai@...nel.org>, Kent Overstreet <kent.overstreet@...ux.dev>, Liviu
Dudau <liviu@...au.co.uk>, Luis Chamberlain <mcgrof@...nel.org>, Mark
Rutland <mark.rutland@....com>, Masami Hiramatsu <mhiramat@...nel.org>,
Michael Ellerman <mpe@...erman.id.au>, Nadav Amit <nadav.amit@...il.com>,
Palmer Dabbelt <palmer@...belt.com>, Peter Zijlstra <peterz@...radead.org>,
Philippe Mathieu-Daudé <philmd@...aro.org>, Rick
Edgecombe <rick.p.edgecombe@...el.com>, Russell King
<linux@...linux.org.uk>, Sam Ravnborg <sam@...nborg.org>, Song Liu
<song@...nel.org>, Steven Rostedt <rostedt@...dmis.org>, Thomas
Bogendoerfer <tsbogend@...ha.franken.de>, Thomas Gleixner
<tglx@...utronix.de>, Will Deacon <will@...nel.org>, bpf@...r.kernel.org,
linux-arch@...r.kernel.org, linux-arm-kernel@...ts.infradead.org,
linux-mips@...r.kernel.org, linux-mm@...ck.org,
linux-modules@...r.kernel.org, linux-parisc@...r.kernel.org,
linux-riscv@...ts.infradead.org, linux-s390@...r.kernel.org,
linux-trace-kernel@...r.kernel.org, linuxppc-dev@...ts.ozlabs.org,
loongarch@...ts.linux.dev, netdev@...r.kernel.org,
sparclinux@...r.kernel.org, x86@...nel.org
Subject: Re: [PATCH RESEND v8 07/16] mm/execmem, arch: convert simple
overrides of module_alloc to execmem
On Sun, 5 May 2024 19:06:19 +0300
Mike Rapoport <rppt@...nel.org> wrote:
> From: "Mike Rapoport (IBM)" <rppt@...nel.org>
>
> Several architectures override module_alloc() only to define address
> range for code allocations different than VMALLOC address space.
>
> Provide a generic implementation in execmem that uses the parameters for
> address space ranges, required alignment and page protections provided
> by architectures.
>
> The architectures must fill execmem_info structure and implement
> execmem_arch_setup() that returns a pointer to that structure. This way the
> execmem initialization won't be called from every architecture, but rather
> from a central place, namely execmem_init() called from mm_core_init().
>
> The execmem provides execmem_alloc() API that wraps __vmalloc_node_range()
> with the parameters defined by the architectures. If an architecture does
> not implement execmem_arch_setup(), execmem_alloc() will fall back to
> module_alloc().
>
Looks good to me.
Reviewed-by: Masami Hiramatsu (Google) <mhiramat@...nel.org>
Thanks,
> Signed-off-by: Mike Rapoport (IBM) <rppt@...nel.org>
> Acked-by: Song Liu <song@...nel.org>
> ---
> arch/loongarch/kernel/module.c | 19 ++++++++--
> arch/mips/kernel/module.c | 20 ++++++++--
> arch/nios2/kernel/module.c | 21 ++++++++---
> arch/parisc/kernel/module.c | 24 ++++++++----
> arch/riscv/kernel/module.c | 24 ++++++++----
> arch/sparc/kernel/module.c | 20 ++++++++--
> include/linux/execmem.h | 47 ++++++++++++++++++++++++
> mm/execmem.c | 67 ++++++++++++++++++++++++++++++++--
> mm/mm_init.c | 2 +
> 9 files changed, 210 insertions(+), 34 deletions(-)
>
> diff --git a/arch/loongarch/kernel/module.c b/arch/loongarch/kernel/module.c
> index c7d0338d12c1..ca6dd7ea1610 100644
> --- a/arch/loongarch/kernel/module.c
> +++ b/arch/loongarch/kernel/module.c
> @@ -18,6 +18,7 @@
> #include <linux/ftrace.h>
> #include <linux/string.h>
> #include <linux/kernel.h>
> +#include <linux/execmem.h>
> #include <asm/alternative.h>
> #include <asm/inst.h>
> #include <asm/unwind.h>
> @@ -490,10 +491,22 @@ int apply_relocate_add(Elf_Shdr *sechdrs, const char *strtab,
> return 0;
> }
>
> -void *module_alloc(unsigned long size)
> +static struct execmem_info execmem_info __ro_after_init;
> +
> +struct execmem_info __init *execmem_arch_setup(void)
> {
> - return __vmalloc_node_range(size, 1, MODULES_VADDR, MODULES_END,
> - GFP_KERNEL, PAGE_KERNEL, 0, NUMA_NO_NODE, __builtin_return_address(0));
> + execmem_info = (struct execmem_info){
> + .ranges = {
> + [EXECMEM_DEFAULT] = {
> + .start = MODULES_VADDR,
> + .end = MODULES_END,
> + .pgprot = PAGE_KERNEL,
> + .alignment = 1,
> + },
> + },
> + };
> +
> + return &execmem_info;
> }
>
> static void module_init_ftrace_plt(const Elf_Ehdr *hdr,
> diff --git a/arch/mips/kernel/module.c b/arch/mips/kernel/module.c
> index 9a6c96014904..59225a3cf918 100644
> --- a/arch/mips/kernel/module.c
> +++ b/arch/mips/kernel/module.c
> @@ -20,6 +20,7 @@
> #include <linux/kernel.h>
> #include <linux/spinlock.h>
> #include <linux/jump_label.h>
> +#include <linux/execmem.h>
> #include <asm/jump_label.h>
>
> struct mips_hi16 {
> @@ -32,11 +33,22 @@ static LIST_HEAD(dbe_list);
> static DEFINE_SPINLOCK(dbe_lock);
>
> #ifdef MODULES_VADDR
> -void *module_alloc(unsigned long size)
> +static struct execmem_info execmem_info __ro_after_init;
> +
> +struct execmem_info __init *execmem_arch_setup(void)
> {
> - return __vmalloc_node_range(size, 1, MODULES_VADDR, MODULES_END,
> - GFP_KERNEL, PAGE_KERNEL, 0, NUMA_NO_NODE,
> - __builtin_return_address(0));
> + execmem_info = (struct execmem_info){
> + .ranges = {
> + [EXECMEM_DEFAULT] = {
> + .start = MODULES_VADDR,
> + .end = MODULES_END,
> + .pgprot = PAGE_KERNEL,
> + .alignment = 1,
> + },
> + },
> + };
> +
> + return &execmem_info;
> }
> #endif
>
> diff --git a/arch/nios2/kernel/module.c b/arch/nios2/kernel/module.c
> index 9c97b7513853..0d1ee86631fc 100644
> --- a/arch/nios2/kernel/module.c
> +++ b/arch/nios2/kernel/module.c
> @@ -18,15 +18,26 @@
> #include <linux/fs.h>
> #include <linux/string.h>
> #include <linux/kernel.h>
> +#include <linux/execmem.h>
>
> #include <asm/cacheflush.h>
>
> -void *module_alloc(unsigned long size)
> +static struct execmem_info execmem_info __ro_after_init;
> +
> +struct execmem_info __init *execmem_arch_setup(void)
> {
> - return __vmalloc_node_range(size, 1, MODULES_VADDR, MODULES_END,
> - GFP_KERNEL, PAGE_KERNEL_EXEC,
> - VM_FLUSH_RESET_PERMS, NUMA_NO_NODE,
> - __builtin_return_address(0));
> + execmem_info = (struct execmem_info){
> + .ranges = {
> + [EXECMEM_DEFAULT] = {
> + .start = MODULES_VADDR,
> + .end = MODULES_END,
> + .pgprot = PAGE_KERNEL_EXEC,
> + .alignment = 1,
> + },
> + },
> + };
> +
> + return &execmem_info;
> }
>
> int apply_relocate_add(Elf32_Shdr *sechdrs, const char *strtab,
> diff --git a/arch/parisc/kernel/module.c b/arch/parisc/kernel/module.c
> index d214bbe3c2af..bdfa85e10c1b 100644
> --- a/arch/parisc/kernel/module.c
> +++ b/arch/parisc/kernel/module.c
> @@ -49,6 +49,7 @@
> #include <linux/bug.h>
> #include <linux/mm.h>
> #include <linux/slab.h>
> +#include <linux/execmem.h>
>
> #include <asm/unwind.h>
> #include <asm/sections.h>
> @@ -173,15 +174,22 @@ static inline int reassemble_22(int as22)
> ((as22 & 0x0003ff) << 3));
> }
>
> -void *module_alloc(unsigned long size)
> +static struct execmem_info execmem_info __ro_after_init;
> +
> +struct execmem_info __init *execmem_arch_setup(void)
> {
> - /* using RWX means less protection for modules, but it's
> - * easier than trying to map the text, data, init_text and
> - * init_data correctly */
> - return __vmalloc_node_range(size, 1, VMALLOC_START, VMALLOC_END,
> - GFP_KERNEL,
> - PAGE_KERNEL_RWX, 0, NUMA_NO_NODE,
> - __builtin_return_address(0));
> + execmem_info = (struct execmem_info){
> + .ranges = {
> + [EXECMEM_DEFAULT] = {
> + .start = VMALLOC_START,
> + .end = VMALLOC_END,
> + .pgprot = PAGE_KERNEL_RWX,
> + .alignment = 1,
> + },
> + },
> + };
> +
> + return &execmem_info;
> }
>
> #ifndef CONFIG_64BIT
> diff --git a/arch/riscv/kernel/module.c b/arch/riscv/kernel/module.c
> index 5e5a82644451..182904127ba0 100644
> --- a/arch/riscv/kernel/module.c
> +++ b/arch/riscv/kernel/module.c
> @@ -14,6 +14,7 @@
> #include <linux/vmalloc.h>
> #include <linux/sizes.h>
> #include <linux/pgtable.h>
> +#include <linux/execmem.h>
> #include <asm/alternative.h>
> #include <asm/sections.h>
>
> @@ -906,13 +907,22 @@ int apply_relocate_add(Elf_Shdr *sechdrs, const char *strtab,
> }
>
> #if defined(CONFIG_MMU) && defined(CONFIG_64BIT)
> -void *module_alloc(unsigned long size)
> -{
> - return __vmalloc_node_range(size, 1, MODULES_VADDR,
> - MODULES_END, GFP_KERNEL,
> - PAGE_KERNEL, VM_FLUSH_RESET_PERMS,
> - NUMA_NO_NODE,
> - __builtin_return_address(0));
> +static struct execmem_info execmem_info __ro_after_init;
> +
> +struct execmem_info __init *execmem_arch_setup(void)
> +{
> + execmem_info = (struct execmem_info){
> + .ranges = {
> + [EXECMEM_DEFAULT] = {
> + .start = MODULES_VADDR,
> + .end = MODULES_END,
> + .pgprot = PAGE_KERNEL,
> + .alignment = 1,
> + },
> + },
> + };
> +
> + return &execmem_info;
> }
> #endif
>
> diff --git a/arch/sparc/kernel/module.c b/arch/sparc/kernel/module.c
> index d37adb2a0b54..8b7ee45defc3 100644
> --- a/arch/sparc/kernel/module.c
> +++ b/arch/sparc/kernel/module.c
> @@ -14,6 +14,7 @@
> #include <linux/string.h>
> #include <linux/ctype.h>
> #include <linux/mm.h>
> +#include <linux/execmem.h>
>
> #include <asm/processor.h>
> #include <asm/spitfire.h>
> @@ -21,11 +22,22 @@
>
> #include "entry.h"
>
> -void *module_alloc(unsigned long size)
> +static struct execmem_info execmem_info __ro_after_init;
> +
> +struct execmem_info __init *execmem_arch_setup(void)
> {
> - return __vmalloc_node_range(size, 1, MODULES_VADDR, MODULES_END,
> - GFP_KERNEL, PAGE_KERNEL, 0, NUMA_NO_NODE,
> - __builtin_return_address(0));
> + execmem_info = (struct execmem_info){
> + .ranges = {
> + [EXECMEM_DEFAULT] = {
> + .start = MODULES_VADDR,
> + .end = MODULES_END,
> + .pgprot = PAGE_KERNEL,
> + .alignment = 1,
> + },
> + },
> + };
> +
> + return &execmem_info;
> }
>
> /* Make generic code ignore STT_REGISTER dummy undefined symbols. */
> diff --git a/include/linux/execmem.h b/include/linux/execmem.h
> index 8eebc8ef66e7..96fc59258467 100644
> --- a/include/linux/execmem.h
> +++ b/include/linux/execmem.h
> @@ -33,6 +33,47 @@ enum execmem_type {
> EXECMEM_TYPE_MAX,
> };
>
> +/**
> + * struct execmem_range - definition of an address space suitable for code and
> + * related data allocations
> + * @start: address space start
> + * @end: address space end (inclusive)
> + * @pgprot: permissions for memory in this address space
> + * @alignment: alignment required for text allocations
> + */
> +struct execmem_range {
> + unsigned long start;
> + unsigned long end;
> + pgprot_t pgprot;
> + unsigned int alignment;
> +};
> +
> +/**
> + * struct execmem_info - architecture parameters for code allocations
> + * @ranges: array of parameter sets defining architecture specific
> + * parameters for executable memory allocations. The ranges that are not
> + * explicitly initialized by an architecture use parameters defined for
> + * @EXECMEM_DEFAULT.
> + */
> +struct execmem_info {
> + struct execmem_range ranges[EXECMEM_TYPE_MAX];
> +};
> +
> +/**
> + * execmem_arch_setup - define parameters for allocations of executable memory
> + *
> + * A hook for architectures to define parameters for allocations of
> + * executable memory. These parameters should be filled into the
> + * @execmem_info structure.
> + *
> + * For architectures that do not implement this method, execmem_alloc()
> + * falls back to module_alloc().
> + *
> + * Return: a structure defining architecture parameters and restrictions
> + * for allocations of executable memory
> + */
> +struct execmem_info *execmem_arch_setup(void);
> +
> /**
> * execmem_alloc - allocate executable memory
> * @type: type of the allocation
> @@ -54,4 +95,10 @@ void *execmem_alloc(enum execmem_type type, size_t size);
> */
> void execmem_free(void *ptr);
>
> +#ifdef CONFIG_EXECMEM
> +void execmem_init(void);
> +#else
> +static inline void execmem_init(void) {}
> +#endif
> +
> #endif /* _LINUX_EXECMEM_ALLOC_H */
> diff --git a/mm/execmem.c b/mm/execmem.c
> index 480adc69b20d..80e61c1e7319 100644
> --- a/mm/execmem.c
> +++ b/mm/execmem.c
> @@ -11,14 +11,30 @@
> #include <linux/execmem.h>
> #include <linux/moduleloader.h>
>
> -static void *__execmem_alloc(size_t size)
> +static struct execmem_info *execmem_info __ro_after_init;
> +
> +static void *__execmem_alloc(struct execmem_range *range, size_t size)
> {
> - return module_alloc(size);
> + unsigned long start = range->start;
> + unsigned long end = range->end;
> + unsigned int align = range->alignment;
> + pgprot_t pgprot = range->pgprot;
> +
> + return __vmalloc_node_range(size, align, start, end,
> + GFP_KERNEL, pgprot, VM_FLUSH_RESET_PERMS,
> + NUMA_NO_NODE, __builtin_return_address(0));
> }
>
> void *execmem_alloc(enum execmem_type type, size_t size)
> {
> - return __execmem_alloc(size);
> + struct execmem_range *range;
> +
> + if (!execmem_info)
> + return module_alloc(size);
> +
> + range = &execmem_info->ranges[type];
> +
> + return __execmem_alloc(range, size);
> }
>
> void execmem_free(void *ptr)
> @@ -30,3 +46,48 @@ void execmem_free(void *ptr)
> WARN_ON(in_interrupt());
> vfree(ptr);
> }
> +
> +static bool execmem_validate(struct execmem_info *info)
> +{
> + struct execmem_range *r = &info->ranges[EXECMEM_DEFAULT];
> +
> + if (!r->alignment || !r->start || !r->end || !pgprot_val(r->pgprot)) {
> + pr_crit("Invalid parameters for execmem allocator, module loading will fail");
> + return false;
> + }
> +
> + return true;
> +}
> +
> +static void execmem_init_missing(struct execmem_info *info)
> +{
> + struct execmem_range *default_range = &info->ranges[EXECMEM_DEFAULT];
> +
> + for (int i = EXECMEM_DEFAULT + 1; i < EXECMEM_TYPE_MAX; i++) {
> + struct execmem_range *r = &info->ranges[i];
> +
> + if (!r->start) {
> + r->pgprot = default_range->pgprot;
> + r->alignment = default_range->alignment;
> + r->start = default_range->start;
> + r->end = default_range->end;
> + }
> + }
> +}
> +
> +struct execmem_info * __weak execmem_arch_setup(void)
> +{
> + return NULL;
> +}
> +
> +void __init execmem_init(void)
> +{
> + struct execmem_info *info = execmem_arch_setup();
> +
> + if (!info || !execmem_validate(info))
> + return;
> +
> + execmem_init_missing(info);
> +
> + execmem_info = info;
> +}
> diff --git a/mm/mm_init.c b/mm/mm_init.c
> index 549e76af8f82..b6a1fcf6e13a 100644
> --- a/mm/mm_init.c
> +++ b/mm/mm_init.c
> @@ -27,6 +27,7 @@
> #include <linux/swap.h>
> #include <linux/cma.h>
> #include <linux/crash_dump.h>
> +#include <linux/execmem.h>
> #include "internal.h"
> #include "slab.h"
> #include "shuffle.h"
> @@ -2793,4 +2794,5 @@ void __init mm_core_init(void)
> pti_init();
> kmsan_init_runtime();
> mm_cache_init();
> + execmem_init();
> }
> --
> 2.43.0
>
--
Masami Hiramatsu (Google) <mhiramat@...nel.org>
Powered by blists - more mailing lists