On Tue, 7 Jan 2025, Jakub Jelinek wrote:

> Hi!
> 
> The DWARF committee voted in https://dwarfstd.org/issues/241209.1.html yesterday,
> which is basically just a guarantee that the DWARF 6 draft
> DW_AT_language_{name,version} attribute codes and content of
> https://dwarfstd.org/languages-v6.html can be used as an extension
> in DWARF 5 and won't be changed.
> 
> So, this patch is an alternative to the
> https://gcc.gnu.org/pipermail/gcc-patches/2024-November/669671.html
> patch, which had the major problem that it required changing all the
> DWARF consumers to be able to debug C17 or later or C++17 or later
> sources.
> This patch still uses DWARF 5 DW_LANG_C11 or DW_LANG_C_plus_plus_14,
> the latest code in DWARF 5 proper, so all DWARF 5 capable consumers
> should be able to deal with that, but additionally emits the
> DWARF 6 attributes so that newer DWARF consumers can see it isn't
> just C++14 but say C++23 or C11 but C23.  Consumers which don't know
> those DWARF 6 attributes would just ignore them.  This is like any other
> -gno-strict-dwarf extension, except that normally we emit say DWARF 5
> codes where possible only after DWARF 5 is released, while in this case
> there is a guarantee it can be used before DWARF 6 is released.
> 
> Bootstrapped/regtested on x86_64-linux and i686-linux, ok for trunk?

Ok with me.

Thanks,
Richard.

> 2025-01-07  Jakub Jelinek  <ja...@redhat.com>
> 
> include/
>       * dwarf2.h (enum dwarf_source_language): Fix comment pasto.
>       (enum dwarf_source_language_name): New type.
>       * dwarf2.def (DW_AT_language_name, DW_AT_language_version): New
>       DWARF 6 codes.
> gcc/
>       * dwarf2out.cc (break_out_comdat_types): Copy over
>       DW_AT_language_{name,version} if present.
>       (output_skeleton_debug_sections): Remove also
>       DW_AT_language_{name,version}.
>       (gen_compile_unit_die): For C17, C23, C2Y, C++17, C++20, C++23
>       and C++26 emit for -gdwarf-5 -gno-strict-dwarf also
>       DW_AT_language_{name,version} attributes.
> gcc/testsuite/
>       * g++.dg/debug/dwarf2/lang-cpp17.C: Add -gno-strict-dwarf to
>       dg-options.  Check also for DW_AT_language_{name,version} values.
>       * g++.dg/debug/dwarf2/lang-cpp20.C: Likewise.
>       * g++.dg/debug/dwarf2/lang-cpp23.C: New test.
> 
> --- include/dwarf2.h.jj       2025-01-02 11:47:47.431981968 +0100
> +++ include/dwarf2.h  2025-01-06 18:55:59.802378204 +0100
> @@ -411,7 +411,7 @@ enum dwarf_source_language
>      DW_LANG_Hylo = 0x0042,
>  
>      DW_LANG_lo_user = 0x8000,        /* Implementation-defined range start.  */
> -    DW_LANG_hi_user = 0xffff,        /* Implementation-defined range start.  */
> +    DW_LANG_hi_user = 0xffff,        /* Implementation-defined range end.  */
>  
>      /* MIPS.  */
>      DW_LANG_Mips_Assembler = 0x8001,
> @@ -428,6 +428,59 @@ enum dwarf_source_language
>      DW_LANG_Rust_old = 0x9000
>    };
>  
> +/* DWARF 6 source language names and codes.  */
> +enum dwarf_source_language_name
> +  {
> +    /* https://dwarfstd.org/languages-v6.html */
> +    DW_LNAME_Ada = 0x0001,
> +    DW_LNAME_BLISS = 0x0002,
> +    DW_LNAME_C = 0x0003,
> +    DW_LNAME_C_plus_plus = 0x0004,
> +    DW_LNAME_Cobol = 0x0005,
> +    DW_LNAME_Crystal = 0x0006,
> +    DW_LNAME_D = 0x0007,
> +    DW_LNAME_Dylan = 0x0008,
> +    DW_LNAME_Fortran = 0x0009,
> +    DW_LNAME_Go = 0x000a,
> +    DW_LNAME_Haskell = 0x000b,
> +    DW_LNAME_Java = 0x000c,
> +    DW_LNAME_Julia = 0x000d,
> +    DW_LNAME_Kotlin = 0x000e,
> +    DW_LNAME_Modula2 = 0x000f,
> +    DW_LNAME_Modula3 = 0x0010,
> +    DW_LNAME_ObjC = 0x0011,
> +    DW_LNAME_ObjC_plus_plus = 0x0012,
> +    DW_LNAME_OCaml = 0x0013,
> +    DW_LNAME_OpenCL_C = 0x0014,
> +    DW_LNAME_Pascal = 0x0015,
> +    DW_LNAME_PLI = 0x0016,
> +    DW_LNAME_Python = 0x0017,
> +    DW_LNAME_RenderScript = 0x0018,
> +    DW_LNAME_Rust = 0x0019,
> +    DW_LNAME_Swift = 0x001a,
> +    DW_LNAME_UPC = 0x001b,
> +    DW_LNAME_Zig = 0x001c,
> +    DW_LNAME_Assembly = 0x001d,
> +    DW_LNAME_C_sharp = 0x001e,
> +    DW_LNAME_Mojo = 0x001f,
> +    DW_LNAME_GLSL = 0x0020,
> +    DW_LNAME_GLSL_ES = 0x0021,
> +    DW_LNAME_HLSL = 0x0022,
> +    DW_LNAME_OpenCL_CPP = 0x0023,
> +    DW_LNAME_CPP_for_OpenCL = 0x0024,
> +    DW_LNAME_SYCL = 0x0025,
> +    DW_LNAME_Ruby = 0x0026,
> +    DW_LNAME_Move = 0x0027,
> +    DW_LNAME_Hylo = 0x0028,
> +    DW_LNAME_HIP = 0x0029,
> +    DW_LNAME_Odin = 0x002a,
> +    DW_LNAME_P4 = 0x002b,
> +    DW_LNAME_Metal = 0x002c,
> +
> +    DW_LNAME_lo_user = 0x8000,       /* Implementation-defined range start.  */
> +    DW_LNAME_hi_user = 0xffff        /* Implementation-defined range end.  */
> +  };
> +
>  /* Names and codes for macro information.  */
>  enum dwarf_macinfo_record_type
>    {
> --- include/dwarf2.def.jj     2025-01-02 11:47:47.191985318 +0100
> +++ include/dwarf2.def        2025-01-06 18:39:02.642383150 +0100
> @@ -364,6 +364,9 @@ DW_AT (DW_AT_export_symbols, 0x89)
>  DW_AT (DW_AT_deleted, 0x8a)
>  DW_AT (DW_AT_defaulted, 0x8b)
>  DW_AT (DW_AT_loclists_base, 0x8c)
> +/* DWARF 6.  */
> +DW_AT (DW_AT_language_name, 0x90)
> +DW_AT (DW_AT_language_version, 0x91)
>  
>  DW_AT_DUP (DW_AT_lo_user, 0x2000) /* Implementation-defined range start.  */
>  DW_AT_DUP (DW_AT_hi_user, 0x3fff) /* Implementation-defined range end.  */
> --- gcc/dwarf2out.cc.jj       2025-01-02 11:23:35.541251268 +0100
> +++ gcc/dwarf2out.cc  2025-01-07 10:09:16.866866563 +0100
> @@ -8755,6 +8755,14 @@ break_out_comdat_types (dw_die_ref die)
>          unit = new_die (DW_TAG_type_unit, NULL, NULL);
>          add_AT_unsigned (unit, DW_AT_language,
>                           get_AT_unsigned (comp_unit_die (), DW_AT_language));
> +     if (unsigned lname = get_AT_unsigned (comp_unit_die (),
> +                                           DW_AT_language_name))
> +       {
> +         add_AT_unsigned (unit, DW_AT_language_name, lname);
> +         add_AT_unsigned (unit, DW_AT_language_version,
> +                          get_AT_unsigned (comp_unit_die (),
> +                                           DW_AT_language_version));
> +       }
>  
>       /* Add the new unit's type DIE into the comdat type list.  */
>          type_node = ggc_cleared_alloc<comdat_type_node> ();
> @@ -11404,6 +11412,8 @@ output_skeleton_debug_sections (dw_die_r
>    /* These attributes will be found in the full debug_info section.  */
>    remove_AT (comp_unit, DW_AT_producer);
>    remove_AT (comp_unit, DW_AT_language);
> +  remove_AT (comp_unit, DW_AT_language_name);
> +  remove_AT (comp_unit, DW_AT_language_version);
>  
>    switch_to_section (debug_skeleton_info_section);
>    ASM_OUTPUT_LABEL (asm_out_file, debug_skeleton_info_section_label);
> @@ -25318,7 +25328,7 @@ gen_compile_unit_die (const char *filena
>  {
>    dw_die_ref die;
>    const char *language_string = lang_hooks.name;
> -  int language;
> +  int language, lname, lversion;
>  
>    die = new_die (DW_TAG_compile_unit, NULL, NULL);
>  
> @@ -25366,6 +25376,8 @@ gen_compile_unit_die (const char *filena
>      }
>  
>    language = DW_LANG_C;
> +  lname = 0;
> +  lversion = 0;
>    if (startswith (language_string, "GNU C")
>        && ISDIGIT (language_string[5]))
>      {
> @@ -25376,11 +25388,28 @@ gen_compile_unit_die (const char *filena
>           language = DW_LANG_C99;
>  
>         if (dwarf_version >= 5 /* || !dwarf_strict */)
> -         if (strcmp (language_string, "GNU C11") == 0
> -             || strcmp (language_string, "GNU C17") == 0
> -             || strcmp (language_string, "GNU C23") == 0
> -             || strcmp (language_string, "GNU C2Y") == 0)
> -           language = DW_LANG_C11;
> +         {
> +           if (strcmp (language_string, "GNU C11") == 0)
> +             language = DW_LANG_C11;
> +           else if (strcmp (language_string, "GNU C17") == 0)
> +             {
> +               language = DW_LANG_C11;
> +               lname = DW_LNAME_C;
> +               lversion = 201710;
> +             }
> +           else if (strcmp (language_string, "GNU C23") == 0)
> +             {
> +               language = DW_LANG_C11;
> +               lname = DW_LNAME_C;
> +               lversion = 202311;
> +             }
> +           else if (strcmp (language_string, "GNU C2Y") == 0)
> +             {
> +               language = DW_LANG_C11;
> +               lname = DW_LNAME_C;
> +               lversion = 202500;
> +             }
> +         }
>       }
>      }
>    else if (startswith (language_string, "GNU C++"))
> @@ -25392,12 +25421,30 @@ gen_compile_unit_die (const char *filena
>           language = DW_LANG_C_plus_plus_11;
>         else if (strcmp (language_string, "GNU C++14") == 0)
>           language = DW_LANG_C_plus_plus_14;
> -       else if (strcmp (language_string, "GNU C++17") == 0
> -                || strcmp (language_string, "GNU C++20") == 0
> -                || strcmp (language_string, "GNU C++23") == 0
> -                || strcmp (language_string, "GNU C++26") == 0)
> -         /* For now.  */
> -         language = DW_LANG_C_plus_plus_14;
> +       else if (strcmp (language_string, "GNU C++17") == 0)
> +         {
> +           language = DW_LANG_C_plus_plus_14;
> +           lname = DW_LNAME_C_plus_plus;
> +           lversion = 201703;
> +         }
> +       else if (strcmp (language_string, "GNU C++20") == 0)
> +         {
> +           language = DW_LANG_C_plus_plus_14;
> +           lname = DW_LNAME_C_plus_plus;
> +           lversion = 202002;
> +         }
> +       else if (strcmp (language_string, "GNU C++23") == 0)
> +         {
> +           language = DW_LANG_C_plus_plus_14;
> +           lname = DW_LNAME_C_plus_plus;
> +           lversion = 202302;
> +         }
> +       else if (strcmp (language_string, "GNU C++26") == 0)
> +         {
> +           language = DW_LANG_C_plus_plus_14;
> +           lname = DW_LNAME_C_plus_plus;
> +           lversion = 202400;
> +         }
>       }
>      }
>    else if (strcmp (language_string, "GNU F77") == 0)
> @@ -25441,6 +25488,11 @@ gen_compile_unit_die (const char *filena
>      language = DW_LANG_Ada83;
>  
>    add_AT_unsigned (die, DW_AT_language, language);
> +  if (lname && dwarf_version >= 5 && !dwarf_strict)
> +    {
> +      add_AT_unsigned (die, DW_AT_language_name, lname);
> +      add_AT_unsigned (die, DW_AT_language_version, lversion);
> +    }
>  
>    switch (language)
>      {
> --- gcc/testsuite/g++.dg/debug/dwarf2/lang-cpp17.C.jj 2021-01-18 07:18:14.929659650 +0100
> +++ gcc/testsuite/g++.dg/debug/dwarf2/lang-cpp17.C    2025-01-07 10:07:46.473125326 +0100
> @@ -1,8 +1,10 @@
>  // { dg-do compile }
> -// { dg-options "-O -std=c++17 -gdwarf-5 -dA" }
> +// { dg-options "-O -std=c++17 -gdwarf-5 -dA -gno-strict-dwarf" }
>  // { dg-skip-if "AIX DWARF5" { powerpc-ibm-aix* } }
> -// For -gdwarf-6 hopefully DW_LANG_C_plus_plus_17
>  // DW_LANG_C_plus_plus_14 = 0x0021
> +// DW_LNAME_C_plus_plus = 0x0004 201703
>  // { dg-final { scan-assembler "0x21\[^\n\r]* DW_AT_language" } } */
> +// { dg-final { scan-assembler "0x4\[^\n\r]* DW_AT_language_name" } } */
> +// { dg-final { scan-assembler "0x313e7\[^\n\r]* DW_AT_language_version" } } */
>  
>  int version;
> --- gcc/testsuite/g++.dg/debug/dwarf2/lang-cpp20.C.jj 2021-01-18 14:52:42.946040137 +0100
> +++ gcc/testsuite/g++.dg/debug/dwarf2/lang-cpp20.C    2025-01-07 10:08:28.982533366 +0100
> @@ -1,8 +1,10 @@
>  // { dg-do compile }
> -// { dg-options "-O -std=c++20 -gdwarf-5 -dA" }
> +// { dg-options "-O -std=c++20 -gdwarf-5 -dA -gno-strict-dwarf" }
>  // { dg-skip-if "AIX DWARF5" { powerpc-ibm-aix* } }
> -// For -gdwarf-6 hopefully DW_LANG_C_plus_plus_20
>  // DW_LANG_C_plus_plus_14 = 0x0021
> +// DW_LNAME_C_plus_plus = 0x0004 202002
>  // { dg-final { scan-assembler "0x21\[^\n\r]* DW_AT_language" } } */
> +// { dg-final { scan-assembler "0x4\[^\n\r]* DW_AT_language_name" } } */
> +// { dg-final { scan-assembler "0x31512\[^\n\r]* DW_AT_language_version" } } */
>  
>  int version;
> --- gcc/testsuite/g++.dg/debug/dwarf2/lang-cpp23.C.jj 2025-01-07 10:07:54.926007612 +0100
> +++ gcc/testsuite/g++.dg/debug/dwarf2/lang-cpp23.C    2025-01-07 10:08:19.206669497 +0100
> @@ -0,0 +1,10 @@
> +// { dg-do compile }
> +// { dg-options "-O -std=c++23 -gdwarf-5 -dA -gno-strict-dwarf" }
> +// { dg-skip-if "AIX DWARF5" { powerpc-ibm-aix* } }
> +// DW_LANG_C_plus_plus_14 = 0x0021
> +// DW_LNAME_C_plus_plus = 0x0004 202302
> +// { dg-final { scan-assembler "0x21\[^\n\r]* DW_AT_language" } } */
> +// { dg-final { scan-assembler "0x4\[^\n\r]* DW_AT_language_name" } } */
> +// { dg-final { scan-assembler "0x3163e\[^\n\r]* DW_AT_language_version" } } */
> +
> +int version;
> 
>       Jakub
> 
> 

-- 
Richard Biener <rguent...@suse.de>
SUSE Software Solutions Germany GmbH,
Frankenstrasse 146, 90461 Nuernberg, Germany;
GF: Ivo Totev, Andrew McDonald, Werner Knoblich; (HRB 36809, AG Nuernberg)

Reply via email to