[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <20250206124631.7fe2ecfb@gandalf.local.home>
Date: Thu, 6 Feb 2025 12:46:31 -0500
From: Steven Rostedt <rostedt@...dmis.org>
To: "Masami Hiramatsu (Google)" <mhiramat@...nel.org>
Cc: linux-kernel@...r.kernel.org, linux-trace-kernel@...r.kernel.org, Mark
Rutland <mark.rutland@....com>, Mathieu Desnoyers
<mathieu.desnoyers@...icios.com>, Andrew Morton <akpm@...ux-foundation.org>
Subject: Re: [PATCH 3/3] tracing: Show last module text symbols in the
stacktrace
On Fri, 7 Feb 2025 01:59:05 +0900
"Masami Hiramatsu (Google)" <mhiramat@...nel.org> wrote:
> From: Masami Hiramatsu (Google) <mhiramat@...nel.org>
>
> Since the previous boot trace buffer can include module text address in
> the stacktrace. As same as the kernel text address, convert the module
> text address using the module address information.
Note, this doesn't look like it depends on the first two patches, which I
don't think we want yet. As that assumes we never disable the buffer once
we start it, and may start it again. But that's a debate we can have later.
>
> Signed-off-by: Masami Hiramatsu (Google) <mhiramat@...nel.org>
> ---
> kernel/trace/trace.c | 76 +++++++++++++++++++++++++++++++++++++++++--
> kernel/trace/trace.h | 4 ++
> kernel/trace/trace_output.c | 3 +-
> 3 files changed, 78 insertions(+), 5 deletions(-)
>
> diff --git a/kernel/trace/trace.c b/kernel/trace/trace.c
> index 5a064e712fd7..9d942b7c2651 100644
> --- a/kernel/trace/trace.c
> +++ b/kernel/trace/trace.c
> @@ -49,6 +49,7 @@
> #include <linux/fsnotify.h>
> #include <linux/irq_work.h>
> #include <linux/workqueue.h>
> +#include <linux/sort.h>
>
> #include <asm/setup.h> /* COMMAND_LINE_SIZE and kaslr_offset() */
>
> @@ -6007,6 +6008,27 @@ struct trace_scratch {
>
> static DEFINE_MUTEX(scratch_mutex);
>
> +unsigned long trace_adjust_address(struct trace_array *tr, unsigned long addr)
> +{
> + struct trace_scratch *tscratch;
> + int i;
> +
> + /* If we don't have last boot delta, return the address */
> + if (!(tr->flags & TRACE_ARRAY_FL_LAST_BOOT))
> + return addr;
> +
> + tscratch = tr->scratch;
> + if (tscratch && tr->module_delta && tscratch->entries[0].mod_addr < addr) {
> + /* Note that entries are sorted */
> + for (i = 0; i < tr->nr_modules; i++)
> + if (addr < tscratch->entries[i].mod_addr)
> + break;
> + return addr + tr->module_delta[i - 1];
> + }
> +
> + return addr + tr->text_delta;
> +}
> +
> static int save_mod(struct module *mod, void *data)
> {
> struct trace_array *tr = data;
> @@ -6068,6 +6090,9 @@ static void update_last_data(struct trace_array *tr)
>
> /* Using current data now */
> tr->text_delta = 0;
> + kfree(tr->module_delta);
> + tr->module_delta = NULL;
> + tr->nr_modules = 0;
>
> if (!tr->scratch)
> return;
The above could probably go after the check for !tr->scratch.
> @@ -9351,10 +9376,37 @@ static struct dentry *trace_instance_dir;
> static void
> init_tracer_tracefs(struct trace_array *tr, struct dentry *d_tracer);
>
> +static int make_mod_delta(struct module *mod, void *data)
> +{
> + struct trace_scratch *tscratch;
> + struct trace_mod_entry *entry;
> + struct trace_array *tr = data;
> + int i;
> +
> + tscratch = tr->scratch;
> + for (i = 0; i < tr->nr_modules; i++) {
> + entry = &tscratch->entries[i];
> + if (!strcmp(mod->name, entry->mod_name)) {
> + tr->module_delta[i] = (unsigned long)mod->mem[MOD_TEXT].base - entry->mod_addr;
> + return 1;
Returning 1 causes the module_loop to stop. That is, this will only process
the first module it finds and then no more after that.
> + }
> + }
Doesn't this assume that we have the same modules loaded?
Note, I do plan on adding another field in the trace_scratch structure that
has the uname, then only allow the ascii trace to use the current kallsyms
if the uname matches.
> + return 0;
> +}
> +
> +static int mod_addr_comp(const void *a, const void *b, const void *data)
> +{
> + const struct trace_mod_entry *e1 = a;
> + const struct trace_mod_entry *e2 = b;
> +
> + return e1->mod_addr - e2->mod_addr;
Hmm, could this possibly cause an overflow issue? If the two addresses are
more than 32 bits apart?
> +}
> +
> static void setup_trace_scratch(struct trace_array *tr, void *scratch, unsigned int size)
> {
> struct trace_scratch *tscratch = scratch;
> struct trace_mod_entry *entry;
> + int i, nr_entries;
>
> if (!scratch)
> return;
> @@ -9371,7 +9423,7 @@ static void setup_trace_scratch(struct trace_array *tr, void *scratch, unsigned
> goto reset;
>
> /* Check if each module name is a valid string */
> - for (int i = 0; i < tscratch->nr_entries; i++) {
> + for (i = 0; i < tscratch->nr_entries; i++) {
> int n;
>
> entry = &tscratch->entries[i];
> @@ -9385,6 +9437,20 @@ static void setup_trace_scratch(struct trace_array *tr, void *scratch, unsigned
> if (n == MODULE_NAME_LEN)
> goto reset;
> }
> + nr_entries = i;
> + /* Allocate module delta array */
> + tr->module_delta = kcalloc(nr_entries, sizeof(long), GFP_KERNEL);
> + if (!tr->module_delta)
I wonder if this should trigger a WARN_ON()?
> + goto reset;
> + tr->nr_modules = nr_entries;
> +
> + /* Sort module table by base address. */
> + sort_r(tscratch->entries, nr_entries, sizeof(struct trace_mod_entry),
> + mod_addr_comp, NULL, NULL);
> +
> + /* Scan modules */
> + module_for_each_mod(make_mod_delta, tr);
> +
> return;
> reset:
> /* Invalid trace modules */
BTW, here's my removal patch:
-- Steve
From 521bc0e5286c93eb4be981d22a6c05043a78b555 Mon Sep 17 00:00:00 2001
From: Steven Rostedt <rostedt@...dmis.org>
Date: Wed, 5 Feb 2025 11:55:51 -0500
Subject: [PATCH] tracing: Update modules to persistent instances when removed
When a module is removed, remove it from the list of saved modules in the
persistent memory to any persistent instance that is currently active.
Signed-off-by: Steven Rostedt (Google) <rostedt@...dmis.org>
---
kernel/trace/trace.c | 69 +++++++++++++++++++++++++++++++++++++++++---
1 file changed, 65 insertions(+), 4 deletions(-)
diff --git a/kernel/trace/trace.c b/kernel/trace/trace.c
index 443f2bc5b856..13eeb8df8b8c 100644
--- a/kernel/trace/trace.c
+++ b/kernel/trace/trace.c
@@ -6001,6 +6001,7 @@ struct trace_mod_entry {
struct trace_scratch {
unsigned long kaslr_addr;
+ unsigned long first_free_slot;
unsigned long nr_entries;
struct trace_mod_entry entries[];
};
@@ -6012,6 +6013,7 @@ static int save_mod(struct module *mod, void *data)
struct trace_array *tr = data;
struct trace_scratch *tscratch;
struct trace_mod_entry *entry;
+ unsigned int idx;
unsigned int size;
guard(mutex)(&scratch_mutex);
@@ -6021,16 +6023,60 @@ static int save_mod(struct module *mod, void *data)
return -1;
size = tr->scratch_size;
- if (struct_size(tscratch, entries, tscratch->nr_entries + 1) > size)
- return -1;
+ idx = tscratch->first_free_slot < tscratch->nr_entries ?
+ tscratch->first_free_slot : tscratch->nr_entries;
- entry = &tscratch->entries[tscratch->nr_entries];
+ if (struct_size(tscratch, entries, idx + 1) > size)
+ return -1;
- tscratch->nr_entries++;
+ entry = &tscratch->entries[idx];
entry->mod_addr = (unsigned long)mod->mem[MOD_TEXT].base;
strscpy(entry->mod_name, mod->name);
+ if (idx == tscratch->nr_entries)
+ tscratch->nr_entries++;
+
+ for (idx++; idx < tscratch->nr_entries; idx++) {
+ entry = &tscratch->entries[idx];
+ if (!entry->mod_addr)
+ break;
+ }
+
+ tscratch->first_free_slot = idx;
+
+ return 0;
+}
+
+static int remove_mod(struct module *mod, void *data)
+{
+ struct trace_array *tr = data;
+ struct trace_scratch *tscratch;
+ struct trace_mod_entry *entry;
+ unsigned int idx;
+ unsigned int size;
+
+ guard(mutex)(&scratch_mutex);
+
+ tscratch = tr->scratch;
+ if (!tscratch)
+ return -1;
+ size = tr->scratch_size;
+
+ for (idx = 0; idx < tscratch->nr_entries; idx++) {
+ entry = &tscratch->entries[idx];
+ if (entry->mod_addr == (unsigned long)mod->mem[MOD_TEXT].base)
+ break;
+ }
+ if (idx == tscratch->nr_entries)
+ return -1;
+
+ if (idx < tscratch->first_free_slot)
+ tscratch->first_free_slot = idx;
+
+ entry->mod_addr = 0;
+ entry->mod_name[0] = '\0';
+
return 0;
}
@@ -10112,6 +10158,20 @@ static void trace_module_record(struct module *mod)
}
}
+static void trace_module_delete(struct module *mod)
+{
+ struct trace_array *tr;
+
+ list_for_each_entry(tr, &ftrace_trace_arrays, list) {
+ /* Update any persistent trace array that has already been started */
+ if ((tr->flags & (TRACE_ARRAY_FL_BOOT | TRACE_ARRAY_FL_LAST_BOOT)) ==
+ TRACE_ARRAY_FL_BOOT) {
+ if (trace_array_active(tr))
+ remove_mod(mod, tr);
+ }
+ }
+}
+
static int trace_module_notify(struct notifier_block *self,
unsigned long val, void *data)
{
@@ -10124,6 +10184,7 @@ static int trace_module_notify(struct notifier_block *self,
break;
case MODULE_STATE_GOING:
trace_module_remove_evals(mod);
+ trace_module_delete(mod);
break;
}
--
2.45.2
Powered by blists - more mailing lists