From mboxrd@z Thu Jan 1 00:00:00 1970 Return-Path: Received: by sourceware.org (Postfix, from userid 1551) id 4E8263856246; Tue, 10 May 2022 13:18:14 +0000 (GMT) DKIM-Filter: OpenDKIM Filter v2.11.0 sourceware.org 4E8263856246 Content-Type: text/plain; charset="utf-8" MIME-Version: 1.0 Content-Transfer-Encoding: quoted-printable From: Pedro Alves To: gdb-cvs@sourceware.org Subject: [binutils-gdb] Fix "b f(std::string)", always use DMGL_VERBOSE X-Act-Checkin: binutils-gdb X-Git-Author: Pedro Alves X-Git-Refname: refs/heads/master X-Git-Oldrev: 6dc7160b2d598201653f74d65d4c4d34a0284f6c X-Git-Newrev: cb2cd8cba82a0a5480a147d95b16098ad74d33c6 Message-Id: <20220510131814.4E8263856246@sourceware.org> Date: Tue, 10 May 2022 13:18:14 +0000 (GMT) X-BeenThere: gdb-cvs@sourceware.org X-Mailman-Version: 2.1.29 Precedence: list List-Id: Gdb-cvs mailing list List-Unsubscribe: , List-Archive: List-Help: List-Subscribe: , X-List-Received-Date: Tue, 10 May 2022 13:18:14 -0000 https://sourceware.org/git/gitweb.cgi?p=3Dbinutils-gdb.git;h=3Dcb2cd8cba82a= 0a5480a147d95b16098ad74d33c6 commit cb2cd8cba82a0a5480a147d95b16098ad74d33c6 Author: Pedro Alves Date: Fri Apr 29 23:21:18 2022 +0100 Fix "b f(std::string)", always use DMGL_VERBOSE =20 Currently, on any remotely modern GNU/Linux system, gdb.cp/no-dmgl-verbose.exp fails like so: =20 break 'f(std::string)' Function "f(std::string)" not defined. (gdb) FAIL: gdb.cp/no-dmgl-verbose.exp: gdb_breakpoint: set breakpoin= t at 'f(std::string)' break 'f(std::basic_string, std::allocat= or >)' Function "f(std::basic_string, std::allo= cator >)" not defined. (gdb) PASS: gdb.cp/no-dmgl-verbose.exp: DMGL_VERBOSE-demangled f(std:= :string) is not defined =20 This testcase was added back in 2011, here: =20 [patch] Remove DMGL_VERBOSE https://sourceware.org/pipermail/gdb-patches/2011-June/083081.html =20 Back then, the testcase would pass cleanly. It turns out that the reason it fails today is that the testcase is exercising something in GDB that only makes sense if the program is built for the pre-C++11 libstc++ ABI. Back then the C++11 ABI didn't exist yet, but nowadays, you need to compile with -D_GLIBCXX_USE_CXX11_ABI=3D0 to use the old ABI. See "Dual ABI" in the libstdc++ manual, at . =20 If we tweak the gdb.cp/no-dmgl-verbose.exp testcase to force the old ABI with -D_GLIBCXX_USE_CXX11_ABI=3D0, then it passes cleanly. =20 So why is it that setting a breakpoint at "f(std::string)" fails with modern ABI, but passes with old ABI? =20 This is where libiberty demangler's DMGL_VERBOSE option comes in. The Itanium ABI mangling scheme has a shorthand form for std::string (and some other types). See : =20 "In addition, the following catalog of abbreviations of the form "Sx"= are used: =20 ::=3D St # ::std:: ::=3D Sa # ::std::allocator ::=3D Sb # ::std::basic_string ::=3D Ss # ::std::basic_string < char, ::std::char_traits, ::std::allocator > ::=3D Si # ::std::basic_istream > ::=3D So # ::std::basic_ostream > ::=3D Sd # ::std::basic_iostream > " =20 When the libiberty demangler encounters such a abbreviation, by default, it expands it to the user-friendly typedef "std::string", "std::iostream", etc.. If OTOH DMGL_VERBOSE is specified, the abbreviation is expanded to the underlying, non-typedefed fullname "std::basic_string, std::allocator >" etc. as documented in the Itanium ABI, and pasted above. You can see the standard abbreviations/substitutions in libiberty/cp-demangle.c:standard_subs. =20 Back before Jan's patch in 2011, there were parts of GDB that used DMGL_VERBOSE, and others that did not, leading to mismatches. The solution back then was to stop using DMGL_VERBOSE throughout. =20 GDB has code in place to let users set a breakpoint at a function with typedefs in its parameters, like "b f(uint32_t)". Demangled function names as they appear in the symbol tables almost (more on this is in a bit) never have typedefs in them, so when processing "b f(uint32_t)" GDB first replaces "uint32_t" for its underlying type, and then sets a breakpoint on the resulting prototype, in this case "f(unsigned int)". =20 Now, if DMGL_VERBOSE is _not_ used, then the demangler demangles the mangled name of a function such as "void f(std::string)" that was mangled using the standard abbreviations mentioned above really as: =20 "void f(std::string)". =20 For example, the mangled name of "void f(std::string)" if you compile with old pre-C++11 ABI is "_Z1fSs". That uses the abbreviation "Ss", so if you demangle that without DMGL_VERBOSE, you get: =20 $ echo "_Z1fSs" | c++filt --no-verbose f(std::string) =20 while with DMGL_VERBOSE you'd get: =20 $ echo "_Z1fSs" | c++filt f(std::basic_string, std::allocator >) =20 If, when the user sets a breakpoint at "f(std::string)", GDB would replace the std::string typedef for its underlying type using the same mechanism I mentioned for the "f(uint32_t)" example above, then GDB would really try to set a breakpoint at "f(std::basic_string, std::allocator >)", and that would fail, as the function symbol GDB knows about for that function, given no DMGL_VERBOSE, is "f(std::string)". =20 For this reason, the code that expands typedefs in function parameter names has an exception for std::string (and other standard abbreviation types), such that "std::string" is never typedef-expanded. =20 And here lies the problem when you try to do "b f(std::string)" with a program compiled with the C++11 ABI. In that case, std::string expands to a different underlying type, like so: =20 f(std::__cxx11::basic_string, std::alloc= ator >) =20 and this symbol naturally mangles differently, as: =20 _Z1fNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEE =20 and then because this doesn't use the shorthand mangling abbreviation for "std::string" anymore, it always demangles as: =20 f(std::__cxx11::basic_string, std::alloc= ator >) =20 Now, when using the C++11 ABI, and you set a breakpoint at "f(std::string)", GDB's typedefs-in-parameters expansion code hits the exception for "std::string" and doesn't expand it, so the breakpoint fails to be inserted, because the symbol that exists is really the =20 f(std::__cxx11::basic_string, std::alloc= ator >) =20 one, not "f(std::string)". =20 So to fix things for C++11 ABI, clearly we need to remove the "std::string" exception from the typedef-in-parameters expansion logic. If we do just that, then "b f(std::string)" starts working with the C++11 ABI. =20 However, if we do _just_ that, and nothing else, then we break pre-C++11 ABI... =20 The solution is then to in addition switch GDB to always use DMGL_VERBOSE. If we do this, then pre-C++11 ABI symbols works the same as C++11 ABI symbols overall -- the demangler expands the standard abbreviation for "std::string" as "std::basic_string, std::allocator >" and letting GDB expand the "std::string" typedef (etc.) too is no longer a problem. =20 To avoid getting in the situation where some parts of GDB use DMGL_VERBOSE and others not, this patch adds wrappers around the demangler's entry points that GDB uses, and makes those force DMGL_VERBOSE. =20 The point of the gdb.cp/no-dmgl-verbose.exp testcase was to try to ensure that DMGL_VERBOSE doesn't creep back in: =20 gdb_test {break 'f(std::basic_string, std= ::allocator >)'} \ {Function ".*" not defined\.} \ "DMGL_VERBOSE-demangled f(std::string) is not defined" =20 This obviously no longer makes sense to have, since we now depend on DMGL_VERBOSE. So the patch replaces gdb.cp/no-dmgl-verbose.exp with a new gdb.cp/break-f-std-string.exp testcase whose purpose is to make sure that setting a breakpoint at "f(std::string)" works. It exercises both pre-C++11 ABI and C++11 ABI. =20 Change-Id: Ib54fab4cf0fd307bfd55bf1dd5056830096a653b Diff: --- gdb/cp-name-parser.y | 12 +-- gdb/cp-support.c | 45 +++++---- gdb/cp-support.h | 16 ++++ .../{no-dmgl-verbose.cc =3D> break-f-std-string.cc} | 0 gdb/testsuite/gdb.cp/break-f-std-string.exp | 105 +++++++++++++++++= ++++ gdb/testsuite/gdb.cp/no-dmgl-verbose.exp | 35 ------- 6 files changed, 154 insertions(+), 59 deletions(-) diff --git a/gdb/cp-name-parser.y b/gdb/cp-name-parser.y index 6410363c87f..34c691ddabb 100644 --- a/gdb/cp-name-parser.y +++ b/gdb/cp-name-parser.y @@ -1948,19 +1948,15 @@ allocate_info (void) return info; } =20 -/* Convert RESULT to a string. The return value is allocated - using xmalloc. ESTIMATED_LEN is used only as a guide to the - length of the result. This functions handles a few cases that - cplus_demangle_print does not, specifically the global destructor - and constructor labels. */ +/* See cp-support.h. */ =20 gdb::unique_xmalloc_ptr cp_comp_to_string (struct demangle_component *result, int estimated_len) { size_t err; =20 - char *res =3D cplus_demangle_print (DMGL_PARAMS | DMGL_ANSI, - result, estimated_len, &err); + char *res =3D gdb_cplus_demangle_print (DMGL_PARAMS | DMGL_ANSI, + result, estimated_len, &err); return gdb::unique_xmalloc_ptr (res); } =20 @@ -2060,7 +2056,7 @@ cp_print (struct demangle_component *result) char *str; size_t err =3D 0; =20 - str =3D cplus_demangle_print (DMGL_PARAMS | DMGL_ANSI, result, 64, &err); + str =3D gdb_cplus_demangle_print (DMGL_PARAMS | DMGL_ANSI, result, 64, &= err); if (str =3D=3D NULL) return; =20 diff --git a/gdb/cp-support.c b/gdb/cp-support.c index f52055893d2..71c14635e38 100644 --- a/gdb/cp-support.c +++ b/gdb/cp-support.c @@ -70,18 +70,16 @@ static void add_symbol_overload_list_qualified =20 struct cmd_list_element *maint_cplus_cmd_list =3D NULL; =20 -/* A list of typedefs which should not be substituted by replace_typedefs.= */ -static const char * const ignore_typedefs[] =3D - { - "std::istream", "std::iostream", "std::ostream", "std::string" - }; - static void replace_typedefs (struct demangle_parse_info *info, struct demangle_component *ret_comp, canonicalization_ftype *finder, void *data); =20 +static struct demangle_component * + gdb_cplus_demangle_v3_components (const char *mangled, + int options, void **mem); + /* A convenience function to copy STRING into OBSTACK, returning a pointer to the newly allocated string and saving the number of bytes saved in L= EN. =20 @@ -146,13 +144,6 @@ inspect_type (struct demangle_parse_info *info, memcpy (name, ret_comp->u.s_name.s, ret_comp->u.s_name.len); name[ret_comp->u.s_name.len] =3D '\0'; =20 - /* Ignore any typedefs that should not be substituted. */ - for (const char *ignorable : ignore_typedefs) - { - if (strcmp (name, ignorable) =3D=3D 0) - return 0; - } - sym =3D NULL; =20 try @@ -670,8 +661,8 @@ mangled_name_to_comp (const char *mangled_name, int opt= ions, { struct demangle_component *ret; =20 - ret =3D cplus_demangle_v3_components (mangled_name, - options, memory); + ret =3D gdb_cplus_demangle_v3_components (mangled_name, + options, memory); if (ret) { std::unique_ptr info (new demangle_parse_info); @@ -1635,7 +1626,7 @@ gdb_demangle (const char *name, int options) #endif =20 if (crash_signal =3D=3D 0) - result.reset (bfd_demangle (NULL, name, options)); + result.reset (bfd_demangle (NULL, name, options | DMGL_VERBOSE)); =20 #ifdef HAVE_WORKING_FORK if (catch_demangler_crashes) @@ -1670,6 +1661,28 @@ gdb_demangle (const char *name, int options) =20 /* See cp-support.h. */ =20 +char * +gdb_cplus_demangle_print (int options, + struct demangle_component *tree, + int estimated_length, + size_t *p_allocated_size) +{ + return cplus_demangle_print (options | DMGL_VERBOSE, tree, + estimated_length, p_allocated_size); +} + +/* A wrapper for cplus_demangle_v3_components that forces + DMGL_VERBOSE. */ + +static struct demangle_component * +gdb_cplus_demangle_v3_components (const char *mangled, + int options, void **mem) +{ + return cplus_demangle_v3_components (mangled, options | DMGL_VERBOSE, me= m); +} + +/* See cp-support.h. */ + unsigned int cp_search_name_hash (const char *search_name) { diff --git a/gdb/cp-support.h b/gdb/cp-support.h index 4fbd53c8923..2e0ad50d2b9 100644 --- a/gdb/cp-support.h +++ b/gdb/cp-support.h @@ -175,6 +175,9 @@ struct type *cp_find_type_baseclass_by_name (struct typ= e *parent_type, extern std::unique_ptr cp_demangled_name_to_comp (const char *demangled_name, std::string *errmsg); =20 +/* Convert RESULT to a string. ESTIMATED_LEN is used only as a guide + to the length of the result. */ + extern gdb::unique_xmalloc_ptr cp_comp_to_string (struct demangle_component *result, int estimated_len); =20 @@ -186,10 +189,23 @@ extern void cp_merge_demangle_parse_infos (struct dem= angle_parse_info *, =20 extern struct cmd_list_element *maint_cplus_cmd_list; =20 +/* Wrappers for bfd and libiberty demangling entry points. Note they + all force DMGL_VERBOSE so that callers don't need to. This is so + that GDB consistently uses DMGL_VERBOSE throughout -- we want + libiberty's demangler to expand standard substitutions to their + full template name. */ + /* A wrapper for bfd_demangle. */ =20 gdb::unique_xmalloc_ptr gdb_demangle (const char *name, int options); =20 +/* A wrapper for cplus_demangle_print. */ + +extern char *gdb_cplus_demangle_print (int options, + struct demangle_component *tree, + int estimated_length, + size_t *p_allocated_size); + /* Find an instance of the character C in the string S that is outside of all parenthesis pairs, single-quoted strings, and double-quoted strings. Also, ignore the char within a template name, like a ',' diff --git a/gdb/testsuite/gdb.cp/no-dmgl-verbose.cc b/gdb/testsuite/gdb.cp= /break-f-std-string.cc similarity index 100% rename from gdb/testsuite/gdb.cp/no-dmgl-verbose.cc rename to gdb/testsuite/gdb.cp/break-f-std-string.cc diff --git a/gdb/testsuite/gdb.cp/break-f-std-string.exp b/gdb/testsuite/gd= b.cp/break-f-std-string.exp new file mode 100644 index 00000000000..0869912bb29 --- /dev/null +++ b/gdb/testsuite/gdb.cp/break-f-std-string.exp @@ -0,0 +1,105 @@ +# Copyright 2022 Free Software Foundation, Inc. + +# This program is free software; you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation; either version 3 of the License, or +# (at your option) any later version. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with this program. If not, see . */ + +# Test setting a breakpoint at "f(std::string)". +# +# GDB should be able to expand the std::string typedef, and then set +# the breakpoint using the resulting name. In the Itanium ABI's +# mangling scheme, "std::string", "std::istream", "std::iostream", +# "std::ostream" are special, though, they have corresponding standard +# abbreviations. The libiberty demangler only expands these standard +# abbreviations to their full non-typedef underlying type if the +# DMGL_VERBOSE option is requested. By default it expands them to the +# user-friendly "std::string", etc. typedefs. GDB didn't use to use +# that option, and would instead prevent expansion of the +# "std::string" (etc.) standard-abbreviation typedefs at +# breakpoint-set type, such that the function name used for function +# lookup would match the "std::string" present in the function's +# non-DMGL_VERBOSE demangled name. +# +# For example (DMGL_VERBOSE): +# +# $ echo "_Z1fSs" | c++filt +# f(std::basic_string, std::allocator = >) +# +# vs (no DMGL_VERBOSE): +# +# $ echo "_Z1fSs" | c++filt --no-verbose +# f(std::string) +# +# This design broke setting a breakpoint at "f(std::string)" when the +# libstdc++ C++11 ABI was introduced, as the "f(std::string)" +# function's mangled name no longer uses a standard substitution for +# std::string... +# +# I.e., with the libstdc++ C++11 ABI, we now have (and DMGL_VERBOSE +# makes no difference): +# +# $ echo _Z1fNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEE | c++fi= lt +# f(std::__cxx11::basic_string, std::allocat= or >) +# +# So nowadays, GDB always uses DMGL_VERBOSE and no longer prevents +# std::string (etc.) typedef expansion. This test exercises both +# pre-C++11 and C++11 ABIs for this reason. On non-libstdc++ systems +# where _GLIBCXX_USE_CXX11_ABI has no effect, we just end up running +# the test twice with whatever ABI is used. + +standard_testfile .cc + +if { [skip_cplus_tests] } { continue } + +# CXX11_ABI specifies the value to define _GLIBCXX_USE_CXX11_ABI as. + +proc test {cxx11_abi} { + global srcdir subdir srcfile binfile testfile + + set options \ + [list c++ debug additional_flags=3D-D_GLIBCXX_USE_CXX11_ABI=3D$cxx11_abi] + if { [gdb_compile \ + "${srcdir}/${subdir}/${srcfile}" "${binfile}-${cxx11_abi}.o" \ + object $options] !=3D "" } { + untested "failed to compile" + return -1 + } + + clean_restart ${testfile}-${cxx11_abi}.o + + # Since we're debugging an .o file, GDB doesn't figure out we're + # debugging C++ code and the current language when auto, is + # guessed as C. + gdb_test_no_output "set language c++" + + # Get the type std::string is a typedef for. We'll try to set a + # breakpoint using the expanded type too. + set realtype "" + set type "std::string" + gdb_test_multiple "whatis /r $type" "" { + -re -wrap "type =3D (\[^\r\n\]+)" { + set realtype $expect_out(1,string) + gdb_assert {![string eq "$realtype" "$type"]} \ + $gdb_test_name + } + } + + gdb_test "break f($type)" "$srcfile, line $::decimal\\." + + if { $realtype !=3D "" } { + gdb_test "break f($realtype)" "$srcfile, line $::decimal\\." + } +} + +foreach_with_prefix _GLIBCXX_USE_CXX11_ABI {0 1} { + test $_GLIBCXX_USE_CXX11_ABI +} diff --git a/gdb/testsuite/gdb.cp/no-dmgl-verbose.exp b/gdb/testsuite/gdb.c= p/no-dmgl-verbose.exp deleted file mode 100644 index 14f11ddcf04..00000000000 --- a/gdb/testsuite/gdb.cp/no-dmgl-verbose.exp +++ /dev/null @@ -1,35 +0,0 @@ -# Copyright 2011-2022 Free Software Foundation, Inc. - -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation; either version 3 of the License, or -# (at your option) any later version. -# -# This program is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with this program. If not, see . */ - -# Test loading symbols from unrelocated C++ object files. - -standard_testfile .cc - -if { [skip_cplus_tests] } { continue } - -if { [gdb_compile "${srcdir}/${subdir}/${srcfile}" "${binfile}.o" object {= c++ debug}] !=3D "" } { - untested "failed to compile" - return -1 -} - -clean_restart ${testfile}.o - -gdb_test_no_output "set breakpoint pending off" - -gdb_breakpoint {'f(std::string)'} - -gdb_test {break 'f(std::basic_string, std::al= locator >)'} \ - {Function ".*" not defined\.} \ - "DMGL_VERBOSE-demangled f(std::string) is not defined"