This is Andi's backport for unused types pruning. I (matz) have only added the option to disable it again. From: Andi Kleen Subject: More compact dwarf2 information for gcc (with patch) Date: Sun, 2 Mar 2003 07:43:14 +0100 I ported Scott Snyder's dwarf2 compression patch that was recently posted on the gcc mailing list to the SuSE gcc. What it does is to not dump types to the debugging information that are not referenced to dwarf2. The main change compared to the patch (which was against 3.4 mainline) was to not use varrays which do not seem to exist in that tree. I just cloned the file_table dynamic array instead. I enabled it by default. In theory it makes a difference when you try to reference a type that is not used in the program from gdb, but referencing just types seems to be somewhat pointless to me (especially when such a obscure feature eats >100MB of disk space in the build), so I just enabled it by default. gcc also seems to have an -feliminate-dwarf2-dups option which may further help (but is off by default for some reason). Perhaps it can be considered for turning on too? Or is there some problem with it I am missing? Just applying the patch makes a nice difference (without -feliminate-dwarf2-dups) e.g. this is a simple x86-64 kernel compilation with -g. The tree is stripped down with only minimal drivers enabled. before: build tree size 528M -rwxr-xr-x 1 ak users 44M 2003-03-02 02:25 vmlinux random object file: 1356440 276 -rw-r--r-- 2 ak users 276312 Mar 2 01:45 ./kernel/sys after: ld tree size 411M -rwxr-xr-x 1 ak users 30M 2003-03-02 07:26 vmlinux -rw-r--r-- 2 ak users 206096 2003-03-02 07:22 kernel/sys.o Both the final executable and the object files shrink nicely. Also the compilation is faster because gcc has to do much less IO (compilation with -g seems to be mostly IO bound) Can we please consider this patch for inclusion into the 3.3 SuSE gcc ? -Andi Index: gcc/flags.h =================================================================== RCS file: /cvs/gcc/gcc/gcc/flags.h,v retrieving revision 1.93.2.13 diff -u -p -r1.93.2.13 flags.h --- gcc/flags.h 2 Feb 2004 16:25:40 -0000 1.93.2.13 +++ gcc/flags.h 21 May 2004 12:58:25 -0000 @@ -677,6 +677,10 @@ extern int flag_speculative_prefetching; extern int flag_eliminate_dwarf2_dups; +/* Nonzero means we should do unused type elimination. */ + +extern int flag_eliminate_unused_debug_types; + /* Nonzero means to collect statistics which might be expensive and to print them when we are done. */ extern int flag_detailed_statistics; Index: gcc/toplev.c =================================================================== RCS file: /cvs/gcc/gcc/gcc/toplev.c,v retrieving revision 1.688.2.50 diff -u -p -r1.688.2.50 toplev.c --- gcc/toplev.c 21 Apr 2004 15:17:24 -0000 1.688.2.50 +++ gcc/toplev.c 21 May 2004 12:58:26 -0000 @@ -383,6 +383,10 @@ tree current_function_func_begin_label; int flag_eliminate_dwarf2_dups = 0; +/* Nonzero if doing unused type elimination. */ + +int flag_eliminate_unused_debug_types = 1; + /* Nonzero if generating code to do profiling. */ int profile_flag = 0; @@ -1054,6 +1058,8 @@ static const lang_independent_options f_ { {"eliminate-dwarf2-dups", &flag_eliminate_dwarf2_dups, 1, N_("Perform DWARF2 duplicate elimination") }, + {"eliminate-unused-debug-types", &flag_eliminate_unused_debug_types, 1, + N_("Eliminate debug info of unused types") }, {"float-store", &flag_float_store, 1, N_("Do not store floats in registers") }, {"volatile", &flag_volatile, 1, Index: gcc/dwarf2out.c =================================================================== RCS file: /cvs/gcc/gcc/gcc/dwarf2out.c,v retrieving revision 1.389.2.20 diff -u -p -r1.389.2.20 dwarf2out.c --- gcc/dwarf2out.c 29 Apr 2004 15:20:33 -0000 1.389.2.20 +++ gcc/dwarf2out.c 21 May 2004 12:58:26 -0000 @@ -3397,6 +3397,7 @@ struct file_table /* Filenames referenced by this compilation unit. */ static struct file_table file_table; +static struct file_table file_table_emitted; /* Local pointer to the name of the main input file. Initialized in dwarf2out_init. */ @@ -3796,6 +3797,14 @@ static void output_loc_list PARAMS ((dw static char *gen_internal_sym PARAMS ((const char *)); static void mark_limbo_die_list PARAMS ((void *)); +static void prune_unmark_dies PARAMS ((dw_die_ref)); +static void prune_unused_types_mark PARAMS ((dw_die_ref, int)); +static void prune_unused_types_walk PARAMS ((dw_die_ref)); +static void prune_unused_types_walk_attribs PARAMS ((dw_die_ref)); +static void prune_unused_types_prune PARAMS ((dw_die_ref)); +static void prune_unused_types PARAMS ((void)); +static unsigned long maybe_emit_file PARAMS ((int)); + /* Section names used to hold DWARF debugging information. */ #ifndef DEBUG_INFO_SECTION #define DEBUG_INFO_SECTION ".debug_info" @@ -5172,6 +5181,7 @@ splice_child_die (parent, child) break; } + child->die_parent = parent; child->die_sib = parent->die_child; parent->die_child = child; } @@ -12746,13 +12756,21 @@ lookup_filename (file_name) file_table.in_use = i + 1; file_table.last_lookup_index = i; - if (DWARF2_ASM_LINE_DEBUG_INFO) + /* Prepare to add a new table entry by making sure there is enough space in + the table to do so. If not, expand the current table. */ + if (i >= file_table_emitted.allocated) { - fprintf (asm_out_file, "\t.file %u ", i); - output_quoted_string (asm_out_file, file_name); - fputc ('\n', asm_out_file); + file_table_emitted.allocated = i + FILE_TABLE_INCREMENT; + file_table_emitted.table = (char **) + xrealloc (file_table_emitted.table, + file_table_emitted.allocated * sizeof (char *)); } + /* Add the new entry to the end of the filename table. */ + file_table_emitted.table[i] = NULL; + file_table_emitted.in_use = i + 1; + file_table_emitted.last_lookup_index = i; + return i; } @@ -12763,9 +12781,38 @@ init_file_table () file_table.table = (char **) xcalloc (FILE_TABLE_INCREMENT, sizeof (char *)); file_table.allocated = FILE_TABLE_INCREMENT; + file_table_emitted.table = (char **) xcalloc (FILE_TABLE_INCREMENT, sizeof (char *)); + file_table_emitted.allocated = FILE_TABLE_INCREMENT; + /* Skip the first entry - file numbers begin at 1. */ file_table.in_use = 1; file_table.last_lookup_index = 0; + + file_table_emitted.in_use = 1; + file_table_emitted.last_lookup_index = 0; +} + +static unsigned long +maybe_emit_file (fileno) + int fileno; +{ + static int emitcount = 0; + if (DWARF2_ASM_LINE_DEBUG_INFO && fileno > 0) + { + if (!file_table_emitted.table[fileno]) + { + file_table_emitted.table[fileno] = (char *)++emitcount; + fprintf (asm_out_file, "\t.file %lu ", + (unsigned long) + file_table_emitted.table[fileno]); + output_quoted_string (asm_out_file, + file_table.table[fileno]); + fputc ('\n', asm_out_file); + } + return (unsigned long)file_table_emitted.table[fileno]; + } + else + return fileno; } /* Called by the final INSN scan whenever we see a var location. We @@ -12847,6 +12894,8 @@ dwarf2out_source_line (line, filename) { unsigned file_num = lookup_filename (filename); + file_num = maybe_emit_file (file_num); + /* Emit the .loc directive understood by GNU as. */ fprintf (asm_out_file, "\t.loc %d %d 0\n", file_num, line); @@ -12932,6 +12981,7 @@ dwarf2out_start_source_file (lineno, fil dw2_asm_output_data (1, DW_MACINFO_start_file, "Start new file"); dw2_asm_output_data_uleb128 (lineno, "Included from line number %d", lineno); + maybe_emit_file (lookup_filename (filename)); dw2_asm_output_data_uleb128 (lookup_filename (filename), "Filename we just started"); } @@ -13122,6 +13172,213 @@ output_indirect_string (pfile, h, v) return 1; } + +/* Clear the marks for a die and its children. + Be cool if the mark isn't set. */ + +static void +prune_unmark_dies (die) + dw_die_ref die; +{ + dw_die_ref c; + die->die_mark = 0; + for (c = die->die_child; c; c = c->die_sib) + prune_unmark_dies (c); +} + + +/* Given DIE that we're marking as used, find any other dies + it references as attributes and mark them as used. */ + +static void +prune_unused_types_walk_attribs (die) + dw_die_ref die; +{ + dw_attr_ref a; + + for (a = die->die_attr; a != NULL; a = a->dw_attr_next) + { + if (a->dw_attr_val.val_class == dw_val_class_die_ref) + { + /* A reference to another DIE. + Make sure that it will get emitted. */ + prune_unused_types_mark (a->dw_attr_val.v.val_die_ref.die, 1); + } + else if (a->dw_attr == DW_AT_decl_file) + { + /* A reference to a file. Make sure the file name is emitted. */ + a->dw_attr_val.v.val_unsigned = + maybe_emit_file (a->dw_attr_val.v.val_unsigned); + } + } +} + + +/* Mark DIE as being used. If DOKIDS is true, then walk down + to DIE's children. */ + +static void +prune_unused_types_mark (die, dokids) + dw_die_ref die; + int dokids; +{ + dw_die_ref c; + + if (die->die_mark == 0) { + /* We haven't done this node yet. Mark it as used. */ + die->die_mark = 1; + + /* We also have to mark its parents as used. + (But we don't want to mark our parents' kids due to this.) */ + if (die->die_parent) + prune_unused_types_mark (die->die_parent, 0); + + /* Mark any referenced nodes. */ + prune_unused_types_walk_attribs (die); + } + + if (dokids && die->die_mark != 2) + { + /* We need to walk the children, but haven't done so yet. + Remember that we've walked the kids. */ + die->die_mark = 2; + + /* Walk them. */ + for (c = die->die_child; c; c = c->die_sib) + { + /* If this is an array type, we need to make sure our + kids get marked, even if they're types. */ + if (die->die_tag == DW_TAG_array_type) + prune_unused_types_mark (c, 1); + else + prune_unused_types_walk (c); + } + } +} + + +/* Walk the tree DIE and mark types that we actually use. */ + +static void +prune_unused_types_walk (die) + dw_die_ref die; +{ + dw_die_ref c; + + /* Don't do anything if this node is already marked. */ + if (die->die_mark) + return; + + switch (die->die_tag) { + case DW_TAG_const_type: + case DW_TAG_packed_type: + case DW_TAG_pointer_type: + case DW_TAG_reference_type: + case DW_TAG_volatile_type: + case DW_TAG_typedef: + case DW_TAG_array_type: + case DW_TAG_structure_type: + case DW_TAG_union_type: + case DW_TAG_class_type: + case DW_TAG_friend: + case DW_TAG_variant_part: + case DW_TAG_enumeration_type: + case DW_TAG_subroutine_type: + case DW_TAG_string_type: + case DW_TAG_set_type: + case DW_TAG_subrange_type: + case DW_TAG_ptr_to_member_type: + case DW_TAG_file_type: + /* It's a type node --- don't mark it. */ + return; + + default: + /* Mark everything else. */ + break; + } + + die->die_mark = 1; + + /* Now, mark any dies referenced from here. */ + prune_unused_types_walk_attribs (die); + + /* Mark children. */ + for (c = die->die_child; c; c = c->die_sib) + prune_unused_types_walk (c); +} + + +/* Remove from the tree DIE any dies that aren't marked. */ + +static void +prune_unused_types_prune (die) + dw_die_ref die; +{ + dw_die_ref c, p, n; + if (!die->die_mark) + abort(); + + p = NULL; + for (c = die->die_child; c; c = n) + { + n = c->die_sib; + if (c->die_mark) + { + prune_unused_types_prune (c); + p = c; + } + else + { + if (p) + p->die_sib = n; + else + die->die_child = n; + free_die (c); + } + } +} + + +/* Remove dies representing declarations that we never use. */ + +static void +prune_unused_types () +{ + unsigned int i; + limbo_die_node *node; + + /* Clear all the marks. */ + prune_unmark_dies (comp_unit_die); + for (node = limbo_die_list; node; node = node->next) + prune_unmark_dies (node->die); + + /* Set the mark on nodes that are actually used. */ + prune_unused_types_walk (comp_unit_die); + for (node = limbo_die_list; node; node = node->next) + prune_unused_types_walk (node->die); + + /* Also set the mark on nodes referenced from the + pubname_table or arange_table. */ + for (i=0; i < pubname_table_in_use; i++) + { + prune_unused_types_mark (pubname_table[i].die, 1); + } + for (i=0; i < arange_table_in_use; i++) + { + prune_unused_types_mark (arange_table[i], 1); + } + + /* Get rid of nodes that aren't marked. */ + prune_unused_types_prune (comp_unit_die); + for (node = limbo_die_list; node; node = node->next) + prune_unused_types_prune (node->die); + + /* Leave the marks clear. */ + prune_unmark_dies (comp_unit_die); + for (node = limbo_die_list; node; node = node->next) + prune_unmark_dies (node->die); +} + /* Output stuff that dwarf requires at the end of every file, and generate the DWARF-2 debugging info. */ @@ -13196,6 +13453,9 @@ dwarf2out_finish (input_filename) /* We need to reverse all the dies before break_out_includes, or we'll see the end of an include file before the beginning. */ reverse_all_dies (comp_unit_die); + + if (flag_eliminate_unused_debug_types) + prune_unused_types (); /* Generate separate CUs for each of the include files we've seen. They will go into limbo_die_list. */