From: Mark Wielaard <mark@klomp.org>
To: Di Chen <dichen@redhat.com>
Cc: elfutils-devel@sourceware.org
Subject: Re: [PATCH] readelf: Support --dynamic with --use-dynamic
Date: Fri, 20 May 2022 02:41:38 +0200 [thread overview]
Message-ID: <YobjwpvfqIbd4pkY@wildebeest.org> (raw)
In-Reply-To: <CAN-Pu7QbduAO5M1JO6HZxkiR0_c5Uq0k=Uu0iH4csMKk6p-uMA@mail.gmail.com>
Hi,
On Thu, May 05, 2022 at 09:01:24PM +0800, Di Chen via Elfutils-devel wrote:
> From 3ac23c2584d76114deab0c0af6f4af99068dc7f4 Mon Sep 17 00:00:00 2001
> From: Di Chen <dichen@redhat.com>
> Date: Thu, 28 Apr 2022 19:55:33 +0800
> Subject: [PATCH] readelf: Support --dynamic with --use-dynamic
>
> Currently, eu-readelf is using section headers to dump the dynamic
> segment information (print_dynamic -> handle_dynamic).
>
> This patch adds new options to eu-readelf (-D, --use-dynamic)
> for (-d, --dynamic).
>
> https://sourceware.org/bugzilla/show_bug.cgi?id=28873
This looks pretty good. But there are lots of white-space issues which
make it hard to apply the patch. Could you sent it again preferrably
using git send-email ?
> Signed-off-by: Di Chen <dichen@redhat.com>
> ---
> src/readelf.c | 168 +++++++++++++++++++++++++++++++++++++---
> tests/Makefile.am | 3 +-
> tests/run-readelf-Dd.sh | 65 ++++++++++++++++
> 3 files changed, 223 insertions(+), 13 deletions(-)
> create mode 100755 tests/run-readelf-Dd.sh
>
> diff --git a/src/readelf.c b/src/readelf.c
> index 4b6aab2b..e578456b 100644
> --- a/src/readelf.c
> +++ b/src/readelf.c
> @@ -137,6 +137,8 @@ static const struct argp_option options[] =
> { "string-dump", 'p', NULL, OPTION_ALIAS | OPTION_HIDDEN, NULL, 0 },
> { "archive-index", 'c', NULL, 0,
> N_("Display the symbol index of an archive"), 0 },
> + { "use-dynamic", 'D', NULL, 0,
> + N_("Use the dynamic section info when displaying symbols"), 0 },
This doesn't handle symbols yet. Should it simply say:
"Use the dynamic segment when possible for displaying info"
> { NULL, 0, NULL, 0, N_("Output control:"), 0 },
> { "numeric-addresses", 'N', NULL, 0,
> @@ -195,6 +197,9 @@ static bool print_symbol_table;
> /* True if (only) the dynsym table should be printed. */
> static bool print_dynsym_table;
>
> +/* True if reconstruct dynamic symbol table from the PT_DYNAMIC segment.
> */
> +static bool use_dynamic_segment;
> +
> /* A specific section name, or NULL to print all symbol tables. */
> static char *symbol_table_section;
>
> @@ -268,6 +273,19 @@ static enum section_e
> | section_macro | section_addr | section_types)
> } print_debug_sections, implicit_debug_sections;
>
> +enum dyn_idx
> +{
> + i_strsz,
> + i_verneed,
> + i_verdef,
> + i_versym,
> + i_symtab,
> + i_strtab,
> + i_hash,
> + i_gnu_hash,
> + i_max
> +};
Maybe move this just before it is used in declarations of the
get_dyn... functions?
> /* Select hex dumping of sections. */
> static struct section_argument *dump_data_sections;
> static struct section_argument **dump_data_sections_tail =
> &dump_data_sections;
> @@ -318,6 +336,11 @@ static void dump_strings (Ebl *ebl);
> static void print_strings (Ebl *ebl);
> static void dump_archive_index (Elf *, const char *);
>
> +/* Declarations of local functions for use-dynamic. */
> +static Elf_Data * get_dynscn_strtab(Elf *elf, GElf_Phdr *phdr);
> +static void get_dynscn_addrs(Elf *elf, GElf_Phdr *phdr, GElf_Addr
> addrs[i_max]);
> +static void find_offsets(Elf *elf, GElf_Addr main_bias, size_t n,
> + GElf_Addr addrs[n], GElf_Off offs[n]);
I mean, just before these.
> /* Looked up once with gettext in main. */
> static char *yes_str;
> @@ -429,6 +452,9 @@ parse_opt (int key, char *arg,
> print_dynamic_table = true;
> any_control_option = true;
> break;
> + case 'D':
> + use_dynamic_segment = true;
> + break;
> case 'e':
> print_debug_sections |= section_exception;
> any_control_option = true;
> @@ -1791,7 +1817,7 @@ get_dyn_ents (Elf_Data * dyn_data)
OK, setting flag.
>
> static void
> -handle_dynamic (Ebl *ebl, Elf_Scn *scn, GElf_Shdr *shdr)
> +handle_dynamic (Ebl *ebl, Elf_Scn *scn, GElf_Shdr *shdr, GElf_Phdr *phdr)
> {
> int class = gelf_getclass (ebl->elf);
> GElf_Shdr glink_mem;
> @@ -1802,13 +1828,20 @@ handle_dynamic (Ebl *ebl, Elf_Scn *scn, GElf_Shdr
> *shdr)
> size_t dyn_ents;
>
> /* Get the data of the section. */
> - data = elf_getdata (scn, NULL);
> + if (use_dynamic_segment)
> + data = elf_getdata_rawchunk(
> + ebl->elf, phdr->p_offset, phdr->p_filesz, ELF_T_DYN);
> + else
> + data = elf_getdata (scn, NULL);
> +
> if (data == NULL)
> return;
>
> /* Get the dynamic section entry number */
> dyn_ents = get_dyn_ents (data);
>
> + if (!use_dynamic_segment)
> +{
> /* Get the section header string table index. */
> if (unlikely (elf_getshdrstrndx (ebl->elf, &shstrndx) < 0))
> error_exit (0, _("cannot get section header string table index"));
> @@ -1828,8 +1861,25 @@ handle_dynamic (Ebl *ebl, Elf_Scn *scn, GElf_Shdr
> *shdr)
> shdr->sh_offset,
> (int) shdr->sh_link,
> elf_strptr (ebl->elf, shstrndx, glink->sh_name));
> +} else {
> + printf (ngettext ("\
> +\nDynamic segment contains %lu entry:\n Addr: %#0*" PRIx64 " Offset:
> %#08" PRIx64 "\n",
> + "\
> +\nDynamic segment contains %lu entries:\n Addr: %#0*" PRIx64 " Offset:
> %#08" PRIx64 "\n",
> + dyn_ents),
> + (unsigned long int) dyn_ents,
> + class == ELFCLASS32 ? 10 : 18, phdr->p_paddr,
> + phdr->p_offset);
> +}
> +
> fputs_unlocked (_(" Type Value\n"), stdout);
>
> + /* if --use-dynamic option is enabled,
> + use the string table to get the related library info. */
> + Elf_Data *strtab_data = NULL;
> + if (use_dynamic_segment)
> + strtab_data = get_dynscn_strtab(ebl->elf, phdr);
> +
> for (cnt = 0; cnt < dyn_ents; ++cnt)
> {
> GElf_Dyn dynmem;
> @@ -1841,6 +1891,12 @@ handle_dynamic (Ebl *ebl, Elf_Scn *scn, GElf_Shdr
> *shdr)
> printf (" %-17s ",
> ebl_dynamic_tag_name (ebl, dyn->d_tag, buf, sizeof (buf)));
>
> + char *lib_name = NULL;
> + if (use_dynamic_segment)
> + lib_name = ((char *)strtab_data->d_buf) + dyn->d_un.d_ptr;
I think strtab_data can be NULL here (if get_dynscn_strtab failed) and
dyn->d_un.d_ptr could be beyond the end of data (if the ELF file is
bogus).
> + else
> + lib_name = elf_strptr (ebl->elf, shdr->sh_link, dyn->d_un.d_val);
> +
> switch (dyn->d_tag)
> {
> case DT_NULL:
> @@ -1852,23 +1908,19 @@ handle_dynamic (Ebl *ebl, Elf_Scn *scn, GElf_Shdr
> *shdr)
> break;
>
> case DT_NEEDED:
> - printf (_("Shared library: [%s]\n"),
> - elf_strptr (ebl->elf, shdr->sh_link, dyn->d_un.d_val));
> + printf (_("Shared library: [%s]\n"), lib_name);
> break;
>
> case DT_SONAME:
> - printf (_("Library soname: [%s]\n"),
> - elf_strptr (ebl->elf, shdr->sh_link, dyn->d_un.d_val));
> + printf (_("Library soname: [%s]\n"),lib_name);
> break;
>
> case DT_RPATH:
> - printf (_("Library rpath: [%s]\n"),
> - elf_strptr (ebl->elf, shdr->sh_link, dyn->d_un.d_val));
> + printf (_("Library rpath: [%s]\n"),lib_name);
> break;
>
> case DT_RUNPATH:
> - printf (_("Library runpath: [%s]\n"),
> - elf_strptr (ebl->elf, shdr->sh_link, dyn->d_un.d_val));
> + printf (_("Library runpath: [%s]\n"), lib_name);
> break;
OK.
> case DT_PLTRELSZ:
> @@ -1942,8 +1994,8 @@ print_dynamic (Ebl *ebl)
> Elf_Scn *scn = gelf_offscn (ebl->elf, phdr->p_offset);
> GElf_Shdr shdr_mem;
> GElf_Shdr *shdr = gelf_getshdr (scn, &shdr_mem);
> - if (shdr != NULL && shdr->sh_type == SHT_DYNAMIC)
> - handle_dynamic (ebl, scn, shdr);
> + if (use_dynamic_segment || (shdr != NULL && shdr->sh_type ==
> SHT_DYNAMIC))
> + handle_dynamic (ebl, scn, shdr, phdr);
> break;
Should you check that phdr != NULL here?
> }
> }
> @@ -4801,6 +4853,98 @@ print_ops (Dwfl_Module *dwflmod, Dwarf *dbg, int
> indent, int indentrest,
> }
>
>
> +static void
> +find_offsets(Elf *elf, GElf_Addr main_bias, size_t n,
> + GElf_Addr addrs[n], GElf_Off offs[n])
> +{
> + size_t unsolved = n;
> + for (size_t i = 0; i < phnum; ++i) {
> + GElf_Phdr phdr_mem;
> + GElf_Phdr *phdr = gelf_getphdr(elf, i, &phdr_mem);
> + if (phdr != NULL && phdr->p_type == PT_LOAD && phdr->p_memsz > 0)
> + for (size_t j = 0; j < n; ++j)
> + if (offs[j] == 0 && addrs[j] >= phdr->p_vaddr + main_bias &&
> + addrs[j] - (phdr->p_vaddr + main_bias) < phdr->p_filesz) {
> + offs[j] = addrs[j] - (phdr->p_vaddr + main_bias) +
> phdr->p_offset;
> + if (--unsolved == 0)
> + break;
> + }
> + }
> +}
OK, so this turns the addresses into file offsets using the phdrs. It
is slightly tricky, so I wouldn't mind a comment explaining what is
going on.
> +/* The dynamic segment (type PT_DYNAMIC), contains the .dynamic section.
> + And .dynamic section contains an array of the dynamic structures.
> + We use the array to get:
> + DT_STRTAB: the address of the string table.
> + DT_SYMTAB: the address of the symbol table.
> + DT_STRSZ: the size, in bytes, of the string table.
> + , and etc. */
> +static void
> +get_dynscn_addrs(Elf *elf, GElf_Phdr *phdr, GElf_Addr addrs[i_max])
> +{
> + Elf_Data *data = elf_getdata_rawchunk(
> + elf, phdr->p_offset, phdr->p_filesz, ELF_T_DYN);
> +
> + int dyn_idx = 0;
> + for (;; ++dyn_idx) {
> + GElf_Dyn dyn_mem;
> + GElf_Dyn *dyn = gelf_getdyn(data, dyn_idx, &dyn_mem);
> + /* DT_NULL Marks end of dynamic section. */
> + if (dyn->d_tag == DT_NULL)
> + break;
> +
> + switch (dyn->d_tag) {
> + case DT_SYMTAB:
> + addrs[i_symtab] = dyn->d_un.d_ptr;
> + break;
> +
> + case DT_HASH:
> + addrs[i_hash] = dyn->d_un.d_ptr;
> + break;
> +
> + case DT_GNU_HASH:
> + addrs[i_gnu_hash] = dyn->d_un.d_ptr;
> + break;
> +
> + case DT_STRTAB:
> + addrs[i_strtab] = dyn->d_un.d_ptr;
> + break;
> +
> + case DT_VERSYM:
> + addrs[i_versym] = dyn->d_un.d_ptr;
> + break;
> +
> + case DT_VERDEF:
> + addrs[i_verdef] = dyn->d_un.d_ptr;
> + break;
> +
> + case DT_VERNEED:
> + addrs[i_verneed] = dyn->d_un.d_ptr;
> + break;
> +
> + case DT_STRSZ:
> + addrs[i_strsz] = dyn->d_un.d_val;
> + }
> + }
> + return;
> +}
Note that the return here is redundant and could be left off.
> +/* Use dynamic segment to get data for the string table section. */
> +static Elf_Data *
> +get_dynscn_strtab(Elf *elf, GElf_Phdr *phdr)
> +{
> + Elf_Data *strtab_data;
> + GElf_Addr addrs[i_max] = {0,};
> + GElf_Off offs[i_max] = {0,};
> + get_dynscn_addrs(elf, phdr, addrs);
> + find_offsets(elf, 0, i_max, addrs, offs);
> + strtab_data = elf_getdata_rawchunk(
> + elf, offs[i_strtab], addrs[i_strsz], ELF_T_BYTE);
> + return strtab_data;
> +}
OK.
> +
> struct listptr
> {
> Dwarf_Off offset:(64 - 3);
> diff --git a/tests/Makefile.am b/tests/Makefile.am
> index 84c3950a..b239a461 100644
> --- a/tests/Makefile.am
> +++ b/tests/Makefile.am
> @@ -197,7 +197,8 @@ TESTS = run-arextract.sh run-arsymtest.sh run-ar.sh
> newfile test-nlist \
> msg_tst system-elf-libelf-test \
> $(asm_TESTS) run-disasm-bpf.sh run-low_high_pc-dw-form-indirect.sh \
> run-nvidia-extended-linemap-libdw.sh
> run-nvidia-extended-linemap-readelf.sh \
> - run-readelf-dw-form-indirect.sh run-strip-largealign.sh
> + run-readelf-dw-form-indirect.sh run-strip-largealign.sh \
> + run-readelf-Dd.sh
Don't forget to add run-readelf-Dd.sh to EXTRA_DISTS.
(make distcheck can be used to check for that)
> if !BIARCH
> export ELFUTILS_DISABLE_BIARCH = 1
> diff --git a/tests/run-readelf-Dd.sh b/tests/run-readelf-Dd.sh
> new file mode 100755
> index 00000000..6420a0fe
> --- /dev/null
> +++ b/tests/run-readelf-Dd.sh
> @@ -0,0 +1,65 @@
> +#! /bin/sh
> +# Copyright (C) 2022 Red Hat, Inc.
> +# This file is part of elfutils.
> +#
> +# This file is free software; you can redistribute it and/or modify
> +# it under the terms of the GNU General Public License as published by
> +# the Free Software Foundation; either version 3 of the License, or
> +# (at your option) any later version.
> +#
> +# elfutils is distributed in the hope that it will be useful, but
> +# WITHOUT ANY WARRANTY; without even the implied warranty of
> +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
> +# GNU General Public License for more details.
> +#
> +# You should have received a copy of the GNU General Public License
> +# along with this program. If not, see <http://www.gnu.org/licenses/>.
> +
> +. $srcdir/test-subr.sh
> +
> +# #include <stdio.h>
> +#
> +# __thread int i;
> +#
> +# void print_i ()
> +# {
> +# printf("%d\n", i);
> +# }
> +#
> +# gcc -fPIC -shared -o testlib_dynseg.so testlib_dynseg.c
> +# With ld --version
> +# GNU gold (GNU Binutils 2.22.52.20120402) 1.11
> +
> +testfiles testlib_dynseg.so
Maybe add a comment saying the same testfile is used in run-readelf-d.sh
> +testrun_compare ${abs_top_builddir}/src/readelf -Dd testlib_dynseg.so
> <<\EOF
> +
> +Dynamic segment contains 23 entries:
> + Addr: 0x00000000000017e0 Offset: 0x0007e0
> + Type Value
> + PLTGOT 0x00000000000019c8
> + PLTRELSZ 72 (bytes)
> + JMPREL 0x0000000000000568
> + PLTREL RELA
> + RELA 0x00000000000004d8
> + RELASZ 144 (bytes)
> + RELAENT 24 (bytes)
> + RELACOUNT 1
> + SYMTAB 0x0000000000000228
> + SYMENT 24 (bytes)
> + STRTAB 0x0000000000000360
> + STRSZ 190 (bytes)
> + GNU_HASH 0x0000000000000420
> + NEEDED Shared library: [libc.so.6]
> + NEEDED Shared library: [ld-linux-x86-64.so.2]
> + INIT 0x00000000000005b0
> + FINI 0x0000000000000748
> + VERSYM 0x0000000000000460
> + VERDEF 0x000000000000047c
> + VERDEFNUM 1
> + VERNEED 0x0000000000000498
> + VERNEEDNUM 2
> + NULL
> +EOF
> +
> +exit 0
> --
> 2.35.1
next prev parent reply other threads:[~2022-05-20 0:41 UTC|newest]
Thread overview: 4+ messages / expand[flat|nested] mbox.gz Atom feed top
2022-05-05 13:01 Di Chen
2022-05-20 0:41 ` Mark Wielaard [this message]
2022-05-24 15:53 ` Di Chen
2022-07-31 23:22 ` Mark Wielaard
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=YobjwpvfqIbd4pkY@wildebeest.org \
--to=mark@klomp.org \
--cc=dichen@redhat.com \
--cc=elfutils-devel@sourceware.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for read-only IMAP folder(s) and NNTP newsgroup(s).