Hi Mark,
On Tue, Mar 3, 2026 at 7:16 AM Mark Wielaard <[email protected]> wrote:
>
> libdwfl tries to model the loading of modules (executables, shared
> libraries, the linux kernel and/or kernel modules) in
> memory. Depending on the (offline) load address it then also applies
> (simple) relocations for ET_REL (object files or kernel modules). Load
> addresses are normally represented through phdr segments for ET_EXEC
> or ET_DYN, but for ET_REL files (which don't have phdrs) the Elf
> section sh_addr fields are used.
>
> The sh_addr fields of the ET_REL Elf images are updated in two places
> __libdwfl_elf_address_range (through __libdwfl_report_elf) and
> __libdwfl_relocate (through dwfl_module_getelf and
> dwfl_module_getdwarf). Both rely on sh_addr being zero if no load
> address has been set yet, so the address layout for each (SHF_ALLOC)
> section is done only once.
>
> Recent linux kernels use a linker script that does set the sh_addr
> fields to (random, linker assigned) non-zero addresses. See commit
> 1ba9f8979426 ("vmlinux.lds: Unify TEXT_MAIN, DATA_MAIN, and related
> macros").
>
> The sh_addr values seems unnecessary, but because they aren't zero
> anymore our layout/relocation code doesn't know it still has to figure
> out a "real" load value for these sections.
>
> Introduce __libdwfl_reset_sh_addr which resets all sh_addr fields to
> zero for SHF_ALLOC sections in ET_REL files.
>
> We don't call __libdwfl_reset_sh_addr on aux_sym files (from
> .gnu_debugdata) and when constructing an Elf from a core file. In all
> other cases we know (or assume) that the Elf file is being opened
> through libdw_open_elf (called indirectly through __libdw_open_elf,
> __libdwfl_report_offline, dwfl_module_getelf and dwfl_module_getdwarf)
>
> This technically changes the Elf that goes through libdwfl, but we
> would already update the sh_addr fields for ET_REL Elf sections in
> memory anyway to represent the load address as libdwfl would see
> them. So this isn't really a change in behavior (it just might update
> the sh_addr field twice).
>
> * libdwfl/libdwflP.h (__libdwfl_reset_sh_addr): Define new
> internal function.
> * libdwfl/relocate.c (__libdwfl_reset_sh_addr): New internal
> function.
> * libdwfl/open.c (libdw_open_elf): Call __libdwfl_reset_sh_addr.
> * libdwfl/dwfl_module_getdwarf.c (open_elf_file): Add comment.
> (find_aux_sym): Likewise.
> (find_dw): Likewise.
> * libdwfl/dwfl_segment_report_module.c
> (dwfl_segment_report_module): Likewise.
> * libdwfl/dwfl_report_elf.c (__libdwfl_report_elf): Likewise.
>
> Signed-off-by: Mark Wielaard <[email protected]>
LGTM.
Aaron
> ---
> libdwfl/dwfl_module_getdwarf.c | 3 +++
> libdwfl/dwfl_report_elf.c | 3 +++
> libdwfl/dwfl_segment_report_module.c | 2 ++
> libdwfl/libdwflP.h | 4 ++++
> libdwfl/open.c | 2 ++
> libdwfl/relocate.c | 32 ++++++++++++++++++++++++++++
> 6 files changed, 46 insertions(+)
>
> diff --git a/libdwfl/dwfl_module_getdwarf.c b/libdwfl/dwfl_module_getdwarf.c
> index 135132d69178..430c32367d01 100644
> --- a/libdwfl/dwfl_module_getdwarf.c
> +++ b/libdwfl/dwfl_module_getdwarf.c
> @@ -57,6 +57,7 @@ open_elf_file (Elf **elf, int *fd, char **name)
> if (*fd < 0)
> return CBFAIL;
>
> + /* This will call __libdwfl_reset_sh_addr. */
> return __libdw_open_file (fd, elf, true, false);
> }
> else if (unlikely (elf_kind (*elf) != ELF_K_ELF))
> @@ -1004,6 +1005,7 @@ find_aux_sym (Dwfl_Module *mod __attribute__ ((unused)),
> free (buffer);
> else
> {
> + /* We don't call __libdwfl_reset_sh_addr here, should we? */
> mod->aux_sym.elf = elf_memory (buffer, size);
> if (mod->aux_sym.elf == NULL)
> free (buffer);
> @@ -1423,6 +1425,7 @@ find_dw (Dwfl_Module *mod)
> switch (mod->dwerr)
> {
> case DWFL_E_NOERROR:
> + /* main.elf already should have had __libdwfl_reset_sh_addr called. */
> mod->debug.elf = mod->main.elf;
> mod->debug.address_sync = mod->main.address_sync;
>
> diff --git a/libdwfl/dwfl_report_elf.c b/libdwfl/dwfl_report_elf.c
> index a76d36816c6f..7173375127a8 100644
> --- a/libdwfl/dwfl_report_elf.c
> +++ b/libdwfl/dwfl_report_elf.c
> @@ -268,6 +268,9 @@ __libdwfl_report_elf (Dwfl *dwfl, const char *name, const
> char *file_name,
> /* Preinstall the open ELF handle for the module. */
> if (m->main.elf == NULL)
> {
> + /* We assume all calls to __libdwfl_report_elf got their Elf
> + through __libdw_open_file which already called
> + __libdwfl_reset_sh_addr. */
> m->main.elf = elf;
> m->main.vaddr = vaddr;
> m->main.address_sync = address_sync;
> diff --git a/libdwfl/dwfl_segment_report_module.c
> b/libdwfl/dwfl_segment_report_module.c
> index f2f866c2c70f..5ad318c78b09 100644
> --- a/libdwfl/dwfl_segment_report_module.c
> +++ b/libdwfl/dwfl_segment_report_module.c
> @@ -1072,6 +1072,8 @@ dwfl_segment_report_module (Dwfl *dwfl, int ndx, const
> char *name,
> elf->flags |= ELF_F_MALLOCED;
> }
>
> + /* Elf comes through a core file, so cannot be an ET_REL. Don't call
> + __libdwfl_reset_sh_addr. */
> if (elf != NULL && mod->main.elf == NULL)
> {
> /* Install the file in the module. */
> diff --git a/libdwfl/libdwflP.h b/libdwfl/libdwflP.h
> index 6e394c262010..7a181029c529 100644
> --- a/libdwfl/libdwflP.h
> +++ b/libdwfl/libdwflP.h
> @@ -482,6 +482,10 @@ extern void __libdwfl_module_free (Dwfl_Module *mod)
> internal_function;
> /* Find the main ELF file, update MOD->elferr and/or MOD->main.elf. */
> extern void __libdwfl_getelf (Dwfl_Module *mod) internal_function;
>
> +/* Reset all sh_addr fields to zero for SHF_ALLOC sections if the Elf
> + handle is an ET_REL. Called from libdw_open_elf. */
> +extern void __libdwfl_reset_sh_addr (Elf *elf) internal_function;
> +
> /* Process relocations in debugging sections in an ET_REL file.
> FILE must be opened with ELF_C_READ_MMAP_PRIVATE or ELF_C_READ,
> to make it possible to relocate the data in place (or ELF_C_RDWR or
> diff --git a/libdwfl/open.c b/libdwfl/open.c
> index e66595fba097..86a3540f2af3 100644
> --- a/libdwfl/open.c
> +++ b/libdwfl/open.c
> @@ -190,6 +190,8 @@ libdw_open_elf (int *fdp, Elf **elfp, bool close_on_fail,
> bool archive_ok,
> *fdp = -1;
> }
>
> + __libdwfl_reset_sh_addr (elf);
> +
> *elfp = elf;
> return error;
> }
> diff --git a/libdwfl/relocate.c b/libdwfl/relocate.c
> index 0497bd4fe1f3..dc9f45e64f3f 100644
> --- a/libdwfl/relocate.c
> +++ b/libdwfl/relocate.c
> @@ -1,5 +1,6 @@
> /* Relocate debug information.
> Copyright (C) 2005-2011, 2014, 2016, 2018 Red Hat, Inc.
> + Copyright (C) 2026 Mark J. Wielaard <[email protected]>
> This file is part of elfutils.
>
> This file is free software; you can redistribute it and/or modify
> @@ -37,6 +38,37 @@
>
> typedef uint8_t GElf_Byte;
>
> +/* Reset all sh_addr fields to zero for SHF_ALLOC sections if the Elf
> + handle is an ET_REL. Called from libdw_open_elf. */
> +
> +void
> +internal_function
> +__libdwfl_reset_sh_addr (Elf *elf)
> +{
> + if (elf == NULL || elf->kind != ELF_K_ELF)
> + return;
> +
> + GElf_Ehdr ehdr_mem;
> + GElf_Ehdr *ehdr = gelf_getehdr (elf, &ehdr_mem);
> + if (ehdr == NULL || ehdr->e_type != ET_REL)
> + return;
> +
> + Elf_Scn *scn = NULL;
> + while ((scn = elf_nextscn (elf, scn)) != NULL)
> + {
> + GElf_Shdr shdr_mem;
> + GElf_Shdr *shdr = gelf_getshdr (scn, &shdr_mem);
> + if (shdr != NULL)
> + {
> + if ((shdr->sh_flags & SHF_ALLOC) != 0 && shdr->sh_addr != 0)
> + {
> + shdr_mem.sh_addr = 0;
> + gelf_update_shdr (scn, &shdr_mem);
> + }
> + }
> + }
> +}
> +
> /* Adjust *VALUE to add the load address of the SHNDX section.
> We update the section header in place to cache the result. */
>
> --
> 2.53.0
>