On Fri,  7 Feb 2025 01:59:05 +0900
"Masami Hiramatsu (Google)" <mhira...@kernel.org> wrote:

> From: Masami Hiramatsu (Google) <mhira...@kernel.org>
> 
> Since the previous boot trace buffer can include module text address in
> the stacktrace. As same as the kernel text address, convert the module
> text address using the module address information.

Note, this doesn't look like it depends on the first two patches, which I
don't think we want yet. As that assumes we never disable the buffer once
we start it, and may start it again. But that's a debate we can have later.

> 
> Signed-off-by: Masami Hiramatsu (Google) <mhira...@kernel.org>
> ---
>  kernel/trace/trace.c        |   76 
> +++++++++++++++++++++++++++++++++++++++++--
>  kernel/trace/trace.h        |    4 ++
>  kernel/trace/trace_output.c |    3 +-
>  3 files changed, 78 insertions(+), 5 deletions(-)
> 
> diff --git a/kernel/trace/trace.c b/kernel/trace/trace.c
> index 5a064e712fd7..9d942b7c2651 100644
> --- a/kernel/trace/trace.c
> +++ b/kernel/trace/trace.c
> @@ -49,6 +49,7 @@
>  #include <linux/fsnotify.h>
>  #include <linux/irq_work.h>
>  #include <linux/workqueue.h>
> +#include <linux/sort.h>
>  
>  #include <asm/setup.h> /* COMMAND_LINE_SIZE and kaslr_offset() */
>  
> @@ -6007,6 +6008,27 @@ struct trace_scratch {
>  
>  static DEFINE_MUTEX(scratch_mutex);
>  
> +unsigned long trace_adjust_address(struct trace_array *tr, unsigned long 
> addr)
> +{
> +     struct trace_scratch *tscratch;
> +     int i;
> +
> +     /* If we don't have last boot delta, return the address */
> +     if (!(tr->flags & TRACE_ARRAY_FL_LAST_BOOT))
> +             return addr;
> +
> +     tscratch = tr->scratch;
> +     if (tscratch && tr->module_delta && tscratch->entries[0].mod_addr < 
> addr) {
> +             /* Note that entries are sorted */
> +             for (i = 0; i < tr->nr_modules; i++)
> +                     if (addr < tscratch->entries[i].mod_addr)
> +                             break;
> +             return addr + tr->module_delta[i - 1];
> +     }
> +
> +     return addr + tr->text_delta;
> +}
> +
>  static int save_mod(struct module *mod, void *data)
>  {
>       struct trace_array *tr = data;
> @@ -6068,6 +6090,9 @@ static void update_last_data(struct trace_array *tr)
>  
>       /* Using current data now */
>       tr->text_delta = 0;
> +     kfree(tr->module_delta);
> +     tr->module_delta = NULL;
> +     tr->nr_modules = 0;
>  
>       if (!tr->scratch)
>               return;

The above could probably go after the check for !tr->scratch.

> @@ -9351,10 +9376,37 @@ static struct dentry *trace_instance_dir;
>  static void
>  init_tracer_tracefs(struct trace_array *tr, struct dentry *d_tracer);
>  
> +static int make_mod_delta(struct module *mod, void *data)
> +{
> +     struct trace_scratch *tscratch;
> +     struct trace_mod_entry *entry;
> +     struct trace_array *tr = data;
> +     int i;
> +
> +     tscratch = tr->scratch;
> +     for (i = 0; i < tr->nr_modules; i++) {
> +             entry = &tscratch->entries[i];
> +             if (!strcmp(mod->name, entry->mod_name)) {
> +                     tr->module_delta[i] = (unsigned 
> long)mod->mem[MOD_TEXT].base - entry->mod_addr;
> +                     return 1;

Returning 1 causes the module_loop to stop. That is, this will only process
the first module it finds and then no more after that.

> +             }
> +     }

Doesn't this assume that we have the same modules loaded?

Note, I do plan on adding another field in the trace_scratch structure that
has the uname, then only allow the ascii trace to use the current kallsyms
if the uname matches.

> +     return 0;
> +}
> +
> +static int mod_addr_comp(const void *a, const void *b, const void *data)
> +{
> +     const struct trace_mod_entry *e1 = a;
> +     const struct trace_mod_entry *e2 = b;
> +
> +     return e1->mod_addr - e2->mod_addr;

Hmm, could this possibly cause an overflow issue? If the two addresses are
more than 32 bits apart?

> +}
> +
>  static void setup_trace_scratch(struct trace_array *tr, void *scratch, 
> unsigned int size)
>  {
>       struct trace_scratch *tscratch = scratch;
>       struct trace_mod_entry *entry;
> +     int i, nr_entries;
>  
>       if (!scratch)
>               return;
> @@ -9371,7 +9423,7 @@ static void setup_trace_scratch(struct trace_array *tr, 
> void *scratch, unsigned
>               goto reset;
>  
>       /* Check if each module name is a valid string */
> -     for (int i = 0; i < tscratch->nr_entries; i++) {
> +     for (i = 0; i < tscratch->nr_entries; i++) {
>               int n;
>  
>               entry = &tscratch->entries[i];
> @@ -9385,6 +9437,20 @@ static void setup_trace_scratch(struct trace_array 
> *tr, void *scratch, unsigned
>               if (n == MODULE_NAME_LEN)
>                       goto reset;
>       }
> +     nr_entries = i;
> +     /* Allocate module delta array */
> +     tr->module_delta = kcalloc(nr_entries, sizeof(long), GFP_KERNEL);
> +     if (!tr->module_delta)

I wonder if this should trigger a WARN_ON()?

> +             goto reset;
> +     tr->nr_modules = nr_entries;
> +
> +     /* Sort module table by base address. */
> +     sort_r(tscratch->entries, nr_entries, sizeof(struct trace_mod_entry),
> +             mod_addr_comp, NULL, NULL);
> +
> +     /* Scan modules */
> +     module_for_each_mod(make_mod_delta, tr);
> +
>       return;
>   reset:
>       /* Invalid trace modules */


BTW, here's my removal patch:

-- Steve


From 521bc0e5286c93eb4be981d22a6c05043a78b555 Mon Sep 17 00:00:00 2001
From: Steven Rostedt <rost...@goodmis.org>
Date: Wed, 5 Feb 2025 11:55:51 -0500
Subject: [PATCH] tracing: Update modules to persistent instances when removed

When a module is removed, remove it from the list of saved modules in the
persistent memory to any persistent instance that is currently active.

Signed-off-by: Steven Rostedt (Google) <rost...@goodmis.org>
---
 kernel/trace/trace.c | 69 +++++++++++++++++++++++++++++++++++++++++---
 1 file changed, 65 insertions(+), 4 deletions(-)

diff --git a/kernel/trace/trace.c b/kernel/trace/trace.c
index 443f2bc5b856..13eeb8df8b8c 100644
--- a/kernel/trace/trace.c
+++ b/kernel/trace/trace.c
@@ -6001,6 +6001,7 @@ struct trace_mod_entry {
 
 struct trace_scratch {
        unsigned long           kaslr_addr;
+       unsigned long           first_free_slot;
        unsigned long           nr_entries;
        struct trace_mod_entry  entries[];
 };
@@ -6012,6 +6013,7 @@ static int save_mod(struct module *mod, void *data)
        struct trace_array *tr = data;
        struct trace_scratch *tscratch;
        struct trace_mod_entry *entry;
+       unsigned int idx;
        unsigned int size;
 
        guard(mutex)(&scratch_mutex);
@@ -6021,16 +6023,60 @@ static int save_mod(struct module *mod, void *data)
                return -1;
        size = tr->scratch_size;
 
-       if (struct_size(tscratch, entries, tscratch->nr_entries + 1) > size)
-               return -1;
+       idx = tscratch->first_free_slot < tscratch->nr_entries ?
+               tscratch->first_free_slot : tscratch->nr_entries;
 
-       entry = &tscratch->entries[tscratch->nr_entries];
+       if (struct_size(tscratch, entries, idx + 1) > size)
+               return -1;
 
-       tscratch->nr_entries++;
+       entry = &tscratch->entries[idx];
 
        entry->mod_addr = (unsigned long)mod->mem[MOD_TEXT].base;
        strscpy(entry->mod_name, mod->name);
 
+       if (idx == tscratch->nr_entries)
+               tscratch->nr_entries++;
+
+       for (idx++; idx < tscratch->nr_entries; idx++) {
+               entry = &tscratch->entries[idx];
+               if (!entry->mod_addr)
+                       break;
+       }
+
+       tscratch->first_free_slot = idx;
+
+       return 0;
+}
+
+static int remove_mod(struct module *mod, void *data)
+{
+       struct trace_array *tr = data;
+       struct trace_scratch *tscratch;
+       struct trace_mod_entry *entry;
+       unsigned int idx;
+       unsigned int size;
+
+       guard(mutex)(&scratch_mutex);
+
+       tscratch = tr->scratch;
+       if (!tscratch)
+               return -1;
+       size = tr->scratch_size;
+
+       for (idx = 0; idx < tscratch->nr_entries; idx++) {
+               entry = &tscratch->entries[idx];
+               if (entry->mod_addr == (unsigned long)mod->mem[MOD_TEXT].base)
+                       break;
+       }
+       if (idx == tscratch->nr_entries)
+               return -1;
+
+       if (idx < tscratch->first_free_slot)
+               tscratch->first_free_slot = idx;
+
+       entry->mod_addr = 0;
+       entry->mod_name[0] = '\0';
+
        return 0;
 }
 
@@ -10112,6 +10158,20 @@ static void trace_module_record(struct module *mod)
        }
 }
 
+static void trace_module_delete(struct module *mod)
+{
+       struct trace_array *tr;
+
+       list_for_each_entry(tr, &ftrace_trace_arrays, list) {
+               /* Update any persistent trace array that has already been 
started */
+               if ((tr->flags & (TRACE_ARRAY_FL_BOOT | 
TRACE_ARRAY_FL_LAST_BOOT)) ==
+                   TRACE_ARRAY_FL_BOOT) {
+                       if (trace_array_active(tr))
+                               remove_mod(mod, tr);
+               }
+       }
+}
+
 static int trace_module_notify(struct notifier_block *self,
                               unsigned long val, void *data)
 {
@@ -10124,6 +10184,7 @@ static int trace_module_notify(struct notifier_block 
*self,
                break;
        case MODULE_STATE_GOING:
                trace_module_remove_evals(mod);
+               trace_module_delete(mod);
                break;
        }
 
-- 
2.45.2


Reply via email to