diff options
author | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-05-04 17:55:52 +0000 |
---|---|---|
committer | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-05-04 17:55:52 +0000 |
commit | f7a951d79bc895eb2171c2570add9f4899794a10 (patch) | |
tree | cc0c7147f472fecbc93add134f5c0e5c1bb72529 /dwz.c | |
parent | Initial commit. (diff) | |
download | dwz-f7a951d79bc895eb2171c2570add9f4899794a10.tar.xz dwz-f7a951d79bc895eb2171c2570add9f4899794a10.zip |
Adding upstream version 0.15.upstream/0.15upstream
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to '')
-rw-r--r-- | dwz.c | 16872 |
1 files changed, 16872 insertions, 0 deletions
@@ -0,0 +1,16872 @@ +/* Copyright (C) 2001-2021 Red Hat, Inc. + Copyright (C) 2003 Free Software Foundation, Inc. + Copyright (C) 2019-2021 SUSE LLC. + Written by Jakub Jelinek <jakub@redhat.com>, 2012. + + This program is free software; you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 2, or (at your option) + any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with this program; see the file COPYING. If not, write to + the Free Software Foundation, 51 Franklin Street - Fifth Floor, + Boston, MA 02110-1301, USA. */ + +#include <assert.h> +#include <errno.h> +#include <error.h> +#include <fcntl.h> +#include <setjmp.h> +#include <string.h> +#include <stdbool.h> +#include <stddef.h> +#include <stdint.h> +#include <inttypes.h> +#include <stdlib.h> +#include <unistd.h> +#include <sys/mman.h> +#include <sys/stat.h> +#include <sys/types.h> +#include <sys/times.h> +#include <sys/wait.h> + +#include <obstack.h> + +#include <gelf.h> +#include <xxhash.h> + +#include "dwarf2.h" +#include "hashtab.h" +#include "sha1.h" +#include "args.h" +#include "util.h" +#include "pool.h" + +#ifndef SHF_COMPRESSED + /* Glibc elf.h contains SHF_COMPRESSED starting v2.22. Libelf libelf.h has + a fallback definition starting v0.166. Define a fallback definition here + for the case of both pre-v2.22 glibc and pre-v0.166 libelf. */ +# define SHF_COMPRESSED (1 << 11) /* Section with compressed data. */ +#endif + +/* Theory of operation: + The DWZ tool can either optimize debug sections of a single + executable or shared library at a time, or, when -m option + is used, optimize debug sections even in between different + executables or shared libraries by constructing a new ET_REL + ELF object containing debug sections to which the individual + debug sections in the various executables or shared libraries + can refer. As debug info can be pretty large, the multifile + optimization is done in several phases in order to decrease + memory usage of the tool, which can still be quite high. + + The dwz () function optimizes a single file, and at the end, + after processing that single file, it frees all allocated memory. + Without -m, the dwz () function is called once on each argument. + + When -m has been passed, the dwz () function is first called on + each argument, and during it in addition to performing the same + optimizations as dwz tool does without -m it also may append + data to several temporary files (one for each .debug_* section + that is needed for the multifile optimization). During + preparation of the additions to the temporary files (write_multifile + function), wr_multifile flag is true. + + Next phase (optimize_multifile) is that all these temporary files + are mmapped, it is determined what DIEs, strings, .debug_macro + sequences etc. might be beneficial to have in the common debug + sections and finally a new ET_REL ELF object is written. During + this phase the op_multifile flag is true. This is often very + memory consuming phase, so extra hacks are used to decrease + the memory usage during it. + + Next phase (read_multifile) is where the previously written ET_REL + ELF object is parsed again and needed hash tables and other data + structures filled in. The rd_multifile flag is set during this + phase. The reason why this phase is separate from the previous one, + as opposed to just populating the hash tables right away in + optimize_multifile, is that the memory consumption during that phase + can be very big and keeping malloced data around would mean the address + space would be unnecessarily fragmented. read_multifile usually needs + to allocate only small fragment of the memory optimize_multifile + needs, on the other side that memory needs to be kept around until + the end of the last phase. + + During the last phase, the dwz () function is called second + time on each argument, with fi_multifile flag set. During this + phase duplicates in the common debug sections are referenced + from the local debug sections where possible. + + If some executable or shared library has too large debug information + (number of DIEs in .debug_info section) that there would be + risk of too high memory consumption, that file isn't multifile + optimized, instead it is processed by dwz () in a low-memory mode + with low_mem flag set. This can decrease memory consumption to + half in some very large cases. */ + +#ifndef NT_GNU_BUILD_ID +# define NT_GNU_BUILD_ID 3 +#endif + +/* xxHash state object. Init in main. */ +static XXH64_state_t *state; + +/* Clear xxHash state to zero. */ +#define hash_init_state() XXH64_reset(state, 0) + +/* Update hash STATE with VALUE. */ +#define hash_update_state_object(value) XXH64_update(state, &value, sizeof value) + +/* Update hash STATE with OBJECT that has a provided SIZE. */ +#define hash_update_state(object, size) XXH64_update(state, object, size) + +/* Get digest once we are done with a state. */ +#define hash_digest() XXH64_digest(state) + +/* Shorthand for hashing something with an intrinsic size. */ +#define hash(IN,LEN) XXH64(IN, LEN, 0) +#define iterative_hash(IN,LEN,INIT) XXH64(IN, LEN, INIT) +#define iterative_hash_object(OB,INIT) iterative_hash (&OB, sizeof (OB), INIT) + +/* Print memory amount M (in kb) in both exact and human readable, like so: + 1382508 (1.3G). */ +static void +print_mem (long m) +{ + float h = m; + int level = 0; + const char *unit[] = { "K", "M", "G"}; + while (h > 1024 && level <= 2) + { + h = h / 1024; + level++; + } + fprintf (stderr, "%ld (%.1f%s)\n", m, h, unit[level]); +} + +static void +report_progress (void) +{ + static struct tms current; + static struct tms prev; + static bool first = true; + static long ticks_per_second = 0; + + if (!first) + prev = current; + + times (¤t); + + if (first) + { + ticks_per_second = sysconf (_SC_CLK_TCK); + first = false; + return; + } + + clock_t user = current.tms_utime - prev.tms_utime; + clock_t sys = current.tms_stime - prev.tms_stime; + fprintf (stderr, "user: %.2f\n", (float)user / (float)ticks_per_second); + fprintf (stderr, "sys : %.2f\n", (float)sys / (float)ticks_per_second); + + if (progress_mem_p) + { + FILE *s = fopen ("/proc/self/status", "r"); + char *p; + bool print_next = false; + for (p = NULL; fscanf (s, "%ms", &p) && p != NULL; free (p)) + { + if (print_next) + { + long mem = strtol (p, NULL, 10); + print_mem (mem); + print_next = false; + continue; + } + + if (!(p[0] == 'V' && p[1] == 'm')) + continue; + + if (strcmp (&p[2], "Peak:") == 0) + fprintf (stderr, "VM Peak: "); + else if (strcmp (&p[2], "Size:") == 0) + fprintf (stderr, "VM Current: "); + else if (strcmp (&p[2], "HWM:") == 0) + fprintf (stderr, "RSS Peak: "); + else if (strcmp (&p[2], "RSS:") == 0) + fprintf (stderr, "RSS Current: "); + else + continue; + + print_next = true; + } + fclose (s); + } +} + +#define obstack_chunk_alloc malloc +#define obstack_chunk_free free + +/* Where to longjmp on OOM. */ +static jmp_buf oom_buf; + +/* Handle OOM situation. If handling more than one file, we might + just fail to handle some large file due to OOM, but could very well + handle other smaller files after it. */ +void +dwz_oom (void) +{ + longjmp (oom_buf, 1); +} + +/* General obstack for struct dw_cu, dw_die, also used for temporary + vectors. */ +static struct obstack ob; +/* Short lived obstack, global only to free it on allocation failures. */ +static struct obstack ob2; + +/* After read_multifile ob and ob2 are moved over to these variables + and restored during final cleanup. */ +static struct obstack alt_ob, alt_ob2; + +static bool odr_active_p = false; + +/* Struct to gather statistics. */ +struct stats +{ + const char *file; + unsigned int root_cnt; + unsigned int namespace_cnt; + unsigned int lower_toplevel; + unsigned int die_count; + unsigned int lower_toplevel_with_checksum; + unsigned int dup_cnt; + unsigned int dup_chain_cnt; + unsigned int dup_chain_max_length; + unsigned int part_cnt; + unsigned int pu_ph1_cnt; + unsigned int pu_ph2_cnt; + unsigned int pu_toplevel_die_cnt; +}; +static struct stats *stats; + +/* Initialize stats struct. */ +static void +init_stats (const char *file) +{ + if (stats == NULL) + stats = (struct stats *)malloc (sizeof (*stats)); + memset (stats, 0, sizeof (*stats)); + stats->file = file; +} + +/* Print stats struct, parsing statistics. */ +static void +print_parse_stats (void) +{ + if (stats == NULL || stats->file == NULL) + return; + + fprintf (stderr, "Parse statistics for %s\n", stats->file); + + fprintf (stderr, "root_count : %10u\n", + stats->root_cnt); + fprintf (stderr, "namespace_count : %10u\n", + stats->namespace_cnt); + unsigned int upper_toplevel = stats->root_cnt + stats->namespace_cnt; + fprintf (stderr, "upper_toplevel : %10u\n", + upper_toplevel); + unsigned lower_toplevel + = stats->lower_toplevel + stats->lower_toplevel_with_checksum; + fprintf (stderr, "lower_toplevel : %10u\n", + lower_toplevel); + unsigned int toplevel = upper_toplevel + lower_toplevel; + fprintf (stderr, "toplevel : %10u\n", + toplevel); + unsigned non_toplevel = stats->die_count - toplevel; + fprintf (stderr, "non_toplevel : %10u\n", + non_toplevel); + fprintf (stderr, "die_count : %10u\n", + stats->die_count); +} + +/* Print stats struct, dups statistics. */ +static void +print_dups_stats (void) +{ + if (stats == NULL || stats->file == NULL) + return; + + fprintf (stderr, "Duplicate statistics for %s\n", stats->file); + + fprintf (stderr, "lower_toplevel with checksum : %10u\n", + stats->lower_toplevel_with_checksum); + fprintf (stderr, "dup_cnt : %10u\n", + stats->dup_cnt); + fprintf (stderr, "dup_chain_cnt : %10u\n", + stats->dup_chain_cnt); + fprintf (stderr, "average dup_chain length : %10.2f\n", + (double)stats->dup_cnt / (double)stats->dup_chain_cnt); + fprintf (stderr, "max dup_chain length : %10u\n", + stats->dup_chain_max_length); +} + +static void +print_part_stats (void) +{ + if (stats == NULL || stats->file == NULL) + return; + + fprintf (stderr, "Partition statistics for %s\n", stats->file); + + fprintf (stderr, "part_cnt : %10u\n", stats->part_cnt); + fprintf (stderr, "pu_ph1_cnt : %10u\n", + stats->pu_ph1_cnt); + fprintf (stderr, "pu_ph2_cnt : %10u\n", + stats->pu_ph2_cnt); + fprintf (stderr, "pu_cnt : %10u\n", + stats->pu_ph1_cnt + stats->pu_ph2_cnt); + fprintf (stderr, "pu_toplevel_die_cnt : %10u\n", + stats->pu_toplevel_die_cnt); +} + +typedef struct +{ + Elf *elf; + GElf_Ehdr ehdr; + Elf_Scn **scn; + const char *filename; + int lastscn; + GElf_Shdr shdr[0]; +} DSO; + +/* Macro to parse an uleb128 number, return it and + update ptr to the end of the uleb128 at the same time. */ +#define read_uleb128(ptr) ({ \ + uint64_t ret = 0; \ + uint64_t c; \ + int shift = 0; \ + do \ + { \ + c = *ptr++; \ + ret |= (c & 0x7f) << shift; \ + shift += 7; \ + } while (c & 0x80); \ + \ + if (shift >= 70) \ + ret = ~(uint64_t) 0; \ + ret; \ +}) + +/* Macro to parse a sleb128 number, return it and + update ptr to the end of the sleb128 at the same time. */ +#define read_sleb128(ptr) ({ \ + uint64_t ret = 0; \ + uint64_t c; \ + int shift = 0; \ + do \ + { \ + c = *ptr++; \ + ret |= (c & 0x7f) << shift; \ + shift += 7; \ + } while (c & 0x80); \ + \ + if (shift >= 70) \ + ret = ~(uint64_t) 0; \ + else if (c & 0x40) \ + ret |= (-(uint64_t) 1) << shift; \ + ret; \ +}) + +/* Macro to store an uleb128 number to ptr and update + ptr to point after it. */ +#define write_uleb128(ptr, val) \ + do \ + { \ + uint64_t valv = (val); \ + do \ + { \ + unsigned char c = valv & 0x7f;\ + valv >>= 7; \ + if (valv) \ + c |= 0x80; \ + *ptr++ = c; \ + } \ + while (valv); \ + } \ + while (0) + +#define write_sleb128(ptr, val) \ + do \ + { \ + int64_t valv = (val); \ + bool more; \ + do \ + { \ + unsigned char c = valv & 0x7f; \ + valv >>= 7; \ + more = ((valv != 0 || (c & 0x40) != 0) \ + && (valv != -1 || (c & 0x40) == 0)); \ + if (more) \ + c |= 0x80; \ + *ptr++ = c; \ + } \ + while (more); \ + } \ + while (0) + +/* Macro to skip a uleb128 or sleb128 number and update ptr to the end of the + number. */ +#define skip_leb128(ptr) \ + do {} while ((*ptr++) & 0x80) + +/* Macro to parse a uint16_t value represented using form, return it and + update ptr to the end of the value at the same time. If the value doesn't + fit, assign true to error_p. */ +#define read_u16(ptr, form, error_p) \ + ({ \ + uint16_t ret = 0; \ + switch (form) \ + { \ + case DW_FORM_data1: \ + ret = read_8 (ptr); \ + break; \ + case DW_FORM_data2: \ + ret = read_16 (ptr); \ + break; \ + case DW_FORM_data4: \ + { \ + uint32_t res = read_32 (ptr); \ + ret = (uint16_t)res; \ + if ((uint32_t)ret != res) \ + error_p = true; \ + break; \ + } \ + case DW_FORM_data8: \ + { \ + uint64_t res = read_64 (ptr); \ + ret = (uint16_t)res; \ + if ((uint64_t)ret != res) \ + error_p = true; \ + break; \ + } \ + case DW_FORM_udata: \ + { \ + uint64_t res = read_uleb128 (ptr); \ + ret = (uint16_t)res; \ + if ((uint64_t)ret != res) \ + error_p = true; \ + break; \ + } \ + case DW_FORM_sdata: \ + { \ + union { \ + uint64_t u; \ + int64_t i; \ + } res; \ + res.u = read_sleb128 (ptr); \ + ret = (uint16_t)res.u; \ + if (res.i < 0 || (uint64_t)ret != res.u) \ + error_p = true; \ + break; \ + } \ + default: \ + error_p = true; \ + break; \ + } \ + ret; \ + }) + +/* Pointer size in the debug info, in bytes. Only debug info + with a single pointer size are handled. */ +static int ptr_size; + +/* Lowest debug_line version we have seen. When writing out the multi + file .debug_line we'll only use a DWARF5 version when there is no + lower line table seen (since the debug_line dir and file table is + shared between all CUs). */ +static unsigned int lowest_line_version = 5; + +/* Utility functions and macros for reading/writing values in + given ELF endianity, which might be different from host endianity. + No specific alignment is expected. */ +static uint16_t (*do_read_16) (unsigned char *ptr); +static uint32_t (*do_read_32) (unsigned char *ptr); +static uint64_t (*do_read_64) (unsigned char *ptr); +static void (*do_write_16) (unsigned char *ptr, unsigned short val); +static void (*do_write_32) (unsigned char *ptr, unsigned int val); +static void (*do_write_64) (unsigned char *ptr, uint64_t val); + +static inline uint16_t +buf_read_ule16 (unsigned char *data) +{ + return data[0] | (data[1] << 8); +} + +static inline uint16_t +buf_read_ube16 (unsigned char *data) +{ + return data[1] | (data[0] << 8); +} + +static inline uint32_t +buf_read_ule32 (unsigned char *data) +{ + return (data[0] | (data[1] << 8) | (data[2] << 16) + | ((unsigned int)data[3] << 24)); +} + +static inline uint32_t +buf_read_ube32 (unsigned char *data) +{ + return (data[3] | (data[2] << 8) | (data[1] << 16) + | ((unsigned int)data[0] << 24)); +} + +static inline uint64_t +buf_read_ule64 (unsigned char *data) +{ + return buf_read_ule32 (data) + | (((uint64_t) buf_read_ule32 (data + 4)) << 32); +} + +static inline uint64_t +buf_read_ube64 (unsigned char *data) +{ + return (((uint64_t) buf_read_ube32 (data)) << 32) + | buf_read_ube32 (data + 4); +} + +#define read_8(ptr) *ptr++ + +#define read_16(ptr) ({ \ + uint16_t ret = do_read_16 (ptr); \ + ptr += 2; \ + ret; \ +}) + +#define read_32(ptr) ({ \ + uint32_t ret = do_read_32 (ptr); \ + ptr += 4; \ + ret; \ +}) + +#define read_64(ptr) ({ \ + uint64_t ret = do_read_64 (ptr); \ + ptr += 8; \ + ret; \ +}) + +#define write_8(ptr, val) \ + do \ + *ptr++ = (val); \ + while (0) + +#define write_16(ptr, val) \ + do \ + { \ + do_write_16 (ptr, val); \ + ptr += 2; \ + } \ + while (0) + +#define write_32(ptr, val) \ + do \ + { \ + do_write_32 (ptr, val); \ + ptr += 4; \ + } \ + while (0) + +#define write_64(ptr, val) \ + do \ + { \ + do_write_64 (ptr, val); \ + ptr += 8; \ + } \ + while (0) + +static uint64_t +read_size (unsigned char *p, int size) +{ + switch (size) + { + case 1: return read_8 (p); + case 2: return read_16 (p); + case 4: return read_32 (p); + case 8: return read_64 (p); + default: abort (); + } +} + +static void +write_size (unsigned char *p, int size, uint64_t val) +{ + switch (size) + { + case 1: write_8 (p, val); break; + case 2: write_16 (p, val); break; + case 4: write_32 (p, val); break; + case 8: write_64 (p, val); break; + default: abort (); + } +} + +static void +buf_write_le16 (unsigned char *p, unsigned short v) +{ + p[0] = v; + p[1] = v >> 8; +} + +static void +buf_write_be16 (unsigned char *p, unsigned short v) +{ + p[1] = v; + p[0] = v >> 8; +} + +static void +buf_write_le32 (unsigned char *p, unsigned int v) +{ + p[0] = v; + p[1] = v >> 8; + p[2] = v >> 16; + p[3] = v >> 24; +} + +static void +buf_write_be32 (unsigned char *p, unsigned int v) +{ + p[3] = v; + p[2] = v >> 8; + p[1] = v >> 16; + p[0] = v >> 24; +} + +static void +buf_write_le64 (unsigned char *data, uint64_t v) +{ + buf_write_le32 (data, v); + buf_write_le32 (data + 4, v >> 32); +} + +static void +buf_write_be64 (unsigned char *data, uint64_t v) +{ + buf_write_be32 (data, v >> 32); + buf_write_be32 (data + 4, v); +} + +/* Return a DW_FORM_* name. */ +static const char * +get_DW_FORM_str (unsigned int form) +{ + const char *name = get_DW_FORM_name (form); + static char buf[9 + 3 * sizeof (int)]; + if (name) + return name; + sprintf (buf, "DW_FORM_%u", form); + return buf; +} + +/* Return a DW_OP_* name. */ +static const char * +get_DW_OP_str (unsigned int op) +{ + const char *name = get_DW_OP_name (op); + static char buf[7 + 3 * sizeof (int)]; + if (name) + return name; + sprintf (buf, "DW_OP_%u", op); + return buf; +} + +/* Return a DW_AT_* name. */ +static const char * +get_DW_AT_str (unsigned int at) +{ + const char *name = get_DW_AT_name (at); + static char buf[7 + 3 * sizeof (int)]; + if (name) + return name; + sprintf (buf, "DW_AT_%u", at); + return buf; +} + +/* Return a DW_UT_* name. */ +static const char * +get_DW_UT_str (unsigned int ut) +{ + const char *name = get_DW_UT_name (ut); + static char buf[7 + 3 * sizeof (int)]; + if (name) + return name; + sprintf (buf, "DW_UT_%u", ut); + return buf; +} + +/* Retrun a DW_LNCT_* name. */ +static const char * +get_DW_LNCT_str (unsigned int lnct) +{ + const char *name; + static char buf[9 + 3 * sizeof (int)]; + switch (lnct) + { + case DW_LNCT_path: name = "DW_LNCT_path"; break; + case DW_LNCT_directory_index: name = "DW_LNCT_directory_index"; break; + case DW_LNCT_timestamp: name = "DW_LNCT_timestamp"; break; + case DW_LNCT_size: name = "DW_LNCT_size"; break; + case DW_LNCT_MD5: name = "DW_LNCT_MD5"; break; + + default: name = 0; break; + } + if (name) + return name; + sprintf (buf, "DW_LNCT_%u", lnct); + return buf; +} + +/* This must match the debug_sections array content + below. */ +enum debug_section_kind +{ + DEBUG_INFO, + DEBUG_ABBREV, + DEBUG_LINE, + DEBUG_STR, + DEBUG_MACRO, + DEBUG_TYPES, + DEBUG_ARANGES, + DEBUG_PUBNAMES, + DEBUG_PUBTYPES, + DEBUG_GNU_PUBNAMES, + DEBUG_GNU_PUBTYPES, + DEBUG_MACINFO, + DEBUG_LOC, + DEBUG_LOCLISTS, + DEBUG_FRAME, + DEBUG_RANGES, + DEBUG_RNGLISTS, + DEBUG_LINE_STR, + DEBUG_SUP, + DEBUG_GDB_SCRIPTS, + GDB_INDEX, + GNU_DEBUGALTLINK, + SECTION_COUNT, + SAVED_SECTIONS = DEBUG_TYPES + 1 +}; + +/* Details about standard DWARF sections. */ +static struct +{ + const char *name; + unsigned char *data; + unsigned char *new_data; + size_t size; + size_t new_size; + int sec; +} debug_sections[] = + { + { ".debug_info", NULL, NULL, 0, 0, 0 }, + { ".debug_abbrev", NULL, NULL, 0, 0, 0 }, + { ".debug_line", NULL, NULL, 0, 0, 0 }, + { ".debug_str", NULL, NULL, 0, 0, 0 }, + { ".debug_macro", NULL, NULL, 0, 0, 0 }, + { ".debug_types", NULL, NULL, 0, 0, 0 }, + { ".debug_aranges", NULL, NULL, 0, 0, 0 }, + { ".debug_pubnames", NULL, NULL, 0, 0, 0 }, + { ".debug_pubtypes", NULL, NULL, 0, 0, 0 }, + { ".debug_gnu_pubnames", NULL, NULL, 0, 0, 0 }, + { ".debug_gnu_pubtypes", NULL, NULL, 0, 0, 0 }, + { ".debug_macinfo", NULL, NULL, 0, 0, 0 }, + { ".debug_loc", NULL, NULL, 0, 0, 0 }, + { ".debug_loclists", NULL, NULL, 0, 0, 0 }, + { ".debug_frame", NULL, NULL, 0, 0, 0 }, + { ".debug_ranges", NULL, NULL, 0, 0, 0 }, + { ".debug_rnglists", NULL, NULL, 0, 0, 0 }, + { ".debug_line_str", NULL, NULL, 0, 0, 0 }, + { ".debug_sup", NULL, NULL, 0, 0, 0 }, + { ".debug_gdb_scripts", NULL, NULL, 0, 0, 0 }, + { ".gdb_index", NULL, NULL, 0, 0, 0 }, + { ".gnu_debugaltlink", NULL, NULL, 0, 0, 0 }, + { NULL, NULL, NULL, 0, 0, 0 } + }; + +/* Copies of .new_data fields during write_multifile. */ +static unsigned char *saved_new_data[SAVED_SECTIONS]; +/* Copies of .new_size fields during write_multifile. */ +static size_t saved_new_size[SAVED_SECTIONS]; + +/* Copies of .data fields after read_multifile. */ +static unsigned char *alt_data[SAVED_SECTIONS]; +/* Copies of .size fields after read_multifile. */ +static size_t alt_size[SAVED_SECTIONS]; + +/* How many bytes of each of /tmp/dwz.debug_*.XXXXXX have we written + already. */ +static unsigned int multi_info_off, multi_abbrev_off; +static unsigned int multi_line_off, multi_str_off; +static unsigned int multi_macro_off; +/* And corresponding file descriptors. */ +static int multi_info_fd = -1, multi_abbrev_fd = -1; +static int multi_line_fd = -1, multi_str_fd = -1; +static int multi_macro_fd = -1; + +/* Copy of one of the input file's ehdr. */ +static GElf_Ehdr multi_ehdr; + +/* Pointer size of all debug info sources accumulated during + write_multifile. */ +static int multi_ptr_size; +/* And their endianity. */ +static int multi_endian; +/* Highest .gdb_index version seen. */ +static unsigned int multi_gdb_index_ver; + +enum multifile_mode_kind +{ + MULTIFILE_MODE_WR = 1, + MULTIFILE_MODE_OP = 2, + MULTIFILE_MODE_RD = 4, + MULTIFILE_MODE_FI = 8, + MULTIFILE_MODE_LOW_MEM = 16 +}; + +/* True while in write_multifile. */ +#define wr_multifile (multifile_mode & MULTIFILE_MODE_WR) + +/* True while in optimize_multifile. */ +#define op_multifile (multifile_mode & MULTIFILE_MODE_OP) + +/* True while in read_multifile. */ +#define rd_multifile (multifile_mode & MULTIFILE_MODE_RD) + +/* True while in finalize_multifile. */ +#define fi_multifile (multifile_mode & MULTIFILE_MODE_FI) + +/* True if running in low_mem mode. */ +#define low_mem (multifile_mode & MULTIFILE_MODE_LOW_MEM) + +/* SHA1 checksum (build-id) of the common file. */ +static unsigned char multifile_sha1[0x14]; + +/* A single attribute in abbreviations. */ +struct abbrev_attr +{ + /* DW_AT_* attribute code. */ + unsigned int attr; + /* DW_FORM_* form code. */ + unsigned int form; +}; + +/* Internal structure for .debug_abbrev entries. */ +struct abbrev_tag +{ + /* Abbreviation number. */ + unsigned int entry; + /* Hash value, in first abbrev hash tables it is + the same as entry, in cu->cu_new_abbrev hash tables + iterative hash of all the relevant values. */ + hashval_t hash; + /* DW_TAG_* code. */ + unsigned int tag; + /* Number of attributes. */ + unsigned int nattr; + /* How many DIEs refer to this abbreviation (unused + in first abbrev hash tables). */ + unsigned int nusers; + /* True if DIEs with this abbreviation have children. */ + bool children; + /* True if any typed DWARF opcodes refer to this. */ + bool op_type_referenced; + /* The values of DW_FORM_implicit_const attribute forms. */ + int64_t *values; + /* Attribute/form pairs. */ + struct abbrev_attr attr[0]; +}; + +typedef struct dw_die *dw_die_ref; +typedef struct dw_cu *dw_cu_ref; +struct import_cu; + +/* An entry from .debug_line file table. */ +struct dw_file +{ + char *dir; + char *file; + uint64_t time, size; + unsigned int file_angle_brackets_encapsulated_no_slash : 1; +}; + +/* Internal representation of a compilation (or partial) + unit. */ +struct dw_cu +{ + /* Cached entries from .debug_line file table. */ + struct dw_file *cu_files; + unsigned int cu_nfiles; + /* Kind of CU, normal (present in .debug_info), newly created + partial unit, .debug_types unit or .debug_info partial unit + from the common file. */ + enum { CU_NORMAL, CU_PU, CU_TYPES, CU_ALT } cu_kind; + /* CUs linked from first_cu through this chain. */ + dw_cu_ref cu_next; + /* Offset in original .debug_info if CU_NORMAL or .debug_types + if CU_TYPES, otherwise a unique index of the newly created + partial CU. */ + unsigned int cu_offset; + /* DWARF version of the CU. */ + unsigned int cu_version; + /* Cached DW_AT_comp_dir value from DW_TAG_*_unit cu_die, + or NULL if that attribute is not present. */ + char *cu_comp_dir; + /* Pointer to the DW_TAG_*_unit inside of the .debug_info + chunk. */ + dw_die_ref cu_die; + /* The original abbreviation hash table. */ + htab_t cu_abbrev; + /* New abbreviation hash table. */ + htab_t cu_new_abbrev; + union dw_cu_u1 + { + /* Pointer to another struct dw_cu that owns + cu_new_abbrev for this CU. */ + dw_cu_ref cu_new_abbrev_owner; + /* Pointer used during create_import_tree. */ + struct import_cu *cu_icu; + } u1; + union dw_cu_u2 + { + /* Offset into the new .debug_abbrev section. */ + unsigned int cu_new_abbrev_offset; + /* Highest ->entry value in the new abbrev table + For abbrevs computed by this tool it is always + equal to the number of abbreviations, but if + abbrevs are read for .debug_types section which + is not rewritten, there might be holes. */ + unsigned int cu_largest_entry; + } u2; + /* Offset into the new .debug_info section. */ + unsigned int cu_new_offset; + /* When op_multifile, record which object this came from here, + otherwise it is the index of the CU. */ + unsigned int cu_chunk; + /* Form chosen for intra-cu references. */ + enum dwarf_form cu_intracu_form; + /* Intracusize argument to init_new_die_offsets. Set in compute_abbrevs, + used in recompute_abbrevs. */ + unsigned int initial_intracusize; + enum dwarf_source_language lang; +}; + +/* Internal representation of a debugging information entry (DIE). + This structure should be kept as small as possible, + there are .debug_info sections with tens of millions of DIEs + in them and this structure is allocated for each of them. */ +struct dw_die +{ + /* Offset in old .debug_info from the start of the .debug_info section, + -1U for newly created DIEs. */ + unsigned int die_offset; + /* Cached copy of die_abbrev->tag. */ + enum dwarf_tag die_tag : 16; + /* State of checksum computation. Not computed yet, computed and + suitable for moving into partial units, currently being computed + and finally determined unsuitable for moving into partial units. */ + enum { CK_UNKNOWN, CK_KNOWN, CK_BEING_COMPUTED, CK_BAD } die_ck_state : 2; + /* Set if any DW_OP_call2 opcode refers to this DIE. */ + unsigned int die_op_call2_referenced : 1; + /* Set if any DW_OP_GNU_{{regval,deref,const}_type,convert,reinterpret} + opcode refers to this DIE. Only DW_TAG_base_type DIEs should be + referenced. As those opcodes refer to them using uleb128, we need to try + hard to have those DIEs with low enough offsets that the uleb128 will + fit. */ + unsigned int die_op_type_referenced : 1; + /* Set in DW_TAG_namespace or DW_TAG_module with DW_AT_name that is + either a child of DW_TAG_*_unit, or a child of another + die_named_namespace DIE. */ + unsigned int die_named_namespace : 1; + /* Set if u.p1.die_ref_hash is valid. */ + unsigned int die_ref_hash_computed : 1; + /* Set if die_dup and die_nextdup fields are after this structure. + True for DW_TAG_*_unit DIEs, die_named_namespace DIEs and their + immediate children. */ + unsigned int die_toplevel : 1; + /* Set if we want to remove this DIE from its containing CU. */ + unsigned int die_remove : 1; + /* Set if DIE is unsuitable for moving into alternate .debug_info. */ + unsigned int die_no_multifile : 1; + /* Set if DIE is referenced using DW_FORM_ref*. So far only used during + optimize_multifile and low_mem. */ + unsigned int die_referenced : 1; + /* Set if DIE is referenced using DW_FORM_ref_addr. So far used only + during low_mem. */ + unsigned int die_intercu_referenced : 1; + /* Set if DIE has its children collapsed. Only used during + optimize_multifile. */ + unsigned int die_collapsed_children : 1; + /* Set on collapsed child DIE that is referenced. In that case, die_tag + is reused for die_enter difference from parent and no fields after + die_parent are allocated. */ + unsigned int die_collapsed_child : 1; + /* Set if die_parent field is reused for struct dw_cu pointer. */ + unsigned int die_root : 1; + /* State for ODR optimization. */ + enum { ODR_UNKNOWN, ODR_NONE, ODR_DEF, ODR_DECL } die_odr_state : 2; + /* Tree pointer to parent. */ + dw_die_ref die_parent; + + /* The remaining fields are present only if die_collapsed_child is + 0. */ + + /* Tree pointers, to first child and pointer to next sibling. */ + dw_die_ref die_child, die_sib; + /* Pointer to the old .debug_abbrev entry's internal representation. */ + struct abbrev_tag *die_abbrev; + /* Size of the DIE (abbrev number + attributes), not including children. + In later phases this holds the new size as opposed to the old one. */ + unsigned int die_size; + /* Index into the dw_die_ref vector used in checksum_ref_die function. + While this is only phase 1 field, we get better packing by having it + here instead of u.p1. */ + unsigned int die_ref_seen; + union dw_die_phase + { + /* Fields used in the first phase (read_debug_info and partition_dups + and functions they call). */ + struct dw_die_p1 + { + /* Iterative hash value of the tag, attributes other than + references or DW_FORM_ref_addr references or references + within the subtree of ultimate parent's die_toplevel DIE's + children. Computed by checksum_die function. */ + hashval_t die_hash; + /* Iterative hash of other references. Computed by + checksum_ref_die function. */ + hashval_t die_ref_hash; + /* For ODR phase 1, we change die_hash for ODR_DEF and ODR_DECL DIEs + to only hash in the tag and the name, to be able to construct + maximal duplicate chains. But during ODR phase 2, we want to + compare ODR_DEF DIEs in the normal way, for which we need the + unchanged die_hash, which we store here in die_hash2. */ + hashval_t die_hash2; + /* Tick count of entering and leaving a DIE during depth first + traversal of the CU, used to quickly find if a subtree is + referenced. */ + unsigned int die_enter, die_exit; + } p1; + /* Fields used only after the first phase (from compute_abbrevs + till the end). */ + struct dw_die_p2 + { + /* Pointer to internal representation of new .debug_abbrev + entry for this DIE. */ + struct abbrev_tag *die_new_abbrev; + /* Offset within the new .debug_info CU. Unlike die_offset + this one is CU relative, so die_cu (die)->cu_new_offset needs + to be added to it to get .debug_info offset. */ + unsigned int die_new_offset; + /* Used during compute_abbrevs DW_FORM_ref_udata optimization. */ + unsigned int die_intracu_udata_size; + } p2; + } u; + + /* The remaining fields are present only if die_toplevel is + 1. */ + + /* Pointer to a duplicate DIE. */ + dw_die_ref die_dup; + /* Chain of duplicate DIEs. If die_dup is NULL, but die_nextdup + is non-NULL, this is the reference DIE of the duplicates. + All DIEs in the die->nextdup linked list have die_dup pointing + to this node. The reference DIE is initially just a DIE in the + lowest CU that has the matching DIE, later on it is a DIE in + the newly created partial unit CU. */ + dw_die_ref die_nextdup; +}; + +#include "iterators.h" + +/* Return CU structure pointer for a DIE. In order to save memory, + individual DIEs don't have a dw_cu_ref field, and the pointer can + be only found by overriding the die_parent pointer in a + DW_TAG_{compile,partial}_unit descriptor, which has no parent. */ +static inline dw_cu_ref +die_cu (dw_die_ref die) +{ + while (!die->die_root) + die = die->die_parent; + return (dw_cu_ref) die->die_parent; +} + +/* Given a toplevel die DIE, return the first (that is, the reference die) in + the duplicate chain. */ +#define first_dup(die) \ + (die->die_dup \ + ? die->die_dup \ + : (die->die_nextdup \ + ? die \ + : NULL)) + +/* Safe variant that check die_toplevel. Can't be used on LHS. */ +#define die_safe_dup(die) \ + ((die)->die_toplevel ? (die)->die_dup : (dw_die_ref) NULL) +#define die_safe_nextdup(die) \ + ((die)->die_toplevel ? (die)->die_nextdup : (dw_die_ref) NULL) + +ALIGN_STRUCT (abbrev_tag) +ALIGN_STRUCT (dw_file) +ALIGN_STRUCT (dw_cu) +ALIGN_STRUCT (dw_die) + + +/* After read_multifile, pool variable is moved over to this variable + as the pool from read_multifile needs to be around for subsequent dwz + calls. Freed only during the final cleanup at the very end. */ +static unsigned char *alt_pool; + +static struct abbrev_tag * +pool_clone_abbrev (struct abbrev_tag *t) +{ + struct abbrev_tag *newt; + size_t newt_size; + unsigned nvalue = 0; + if (t->values != NULL) + { + unsigned i; + for (i = 0; i < t->nattr; i++) + if (t->attr[i].form == DW_FORM_implicit_const) + nvalue = i + 1; + } + newt_size = (sizeof (*newt) + + t->nattr * sizeof (struct abbrev_attr) + + nvalue * sizeof (int64_t)); + newt = pool_alloc (abbrev_tag, newt_size); + memcpy (newt, t, newt_size - (nvalue * sizeof (int64_t))); + if (nvalue == 0) + newt->values = NULL; + else + { + newt->values = (int64_t *) &newt->attr[newt->nattr]; + memcpy (newt->values, t->values, nvalue * sizeof (int64_t)); + } + return newt; +} + +/* Hash function in first abbrev hash table as well as cu->cu_new_abbrev + htab. */ +static hashval_t +abbrev_hash (const void *p) +{ + struct abbrev_tag *t = (struct abbrev_tag *)p; + + return t->hash; +} + +/* Equality function in first abbrev htab. */ +static int +abbrev_eq (const void *p, const void *q) +{ + struct abbrev_tag *t1 = (struct abbrev_tag *)p; + struct abbrev_tag *t2 = (struct abbrev_tag *)q; + + return t1->entry == t2->entry; +} + +/* Equality function in cu->cu_new_abbrev htab. */ +static int +abbrev_eq2 (const void *p, const void *q) +{ + struct abbrev_tag *t1 = (struct abbrev_tag *)p; + struct abbrev_tag *t2 = (struct abbrev_tag *)q; + unsigned int i; + + if (t1->hash != t2->hash + || t1->tag != t2->tag + || t1->nattr != t2->nattr + || t1->children != t2->children) + return 0; + for (i = 0; i < t1->nattr; i++) + if (t1->attr[i].attr != t2->attr[i].attr + || t1->attr[i].form != t2->attr[i].form + || (t1->attr[i].form == DW_FORM_implicit_const + && t1->values[i] != t2->values[i])) + return 0; + return 1; +} + +/* Helper function to compute abbrev entry iterative hash value. */ +static void +compute_abbrev_hash (struct abbrev_tag *t) +{ + unsigned int i; + + hash_init_state (); + hash_update_state_object (t->tag); + hash_update_state_object (t->nattr); + hash_update_state_object (t->children); + for (i = 0; i < t->nattr; i++) + { + hash_update_state_object (t->attr[i].attr); + hash_update_state_object (t->attr[i].form); + if (t->attr[i].form == DW_FORM_implicit_const) + hash_update_state_object (t->values[i]); + } + t->hash = hash_digest (); +} + +/* Maximum number of attributes in a DIE. */ +static unsigned int max_nattr; + +/* Parse a .debug_abbrev entry at PTR. */ +static htab_t +read_abbrev (DSO *dso, unsigned char *ptr) +{ + htab_t h; + unsigned int attr, form; + struct abbrev_tag *t; + void **slot; + + h = htab_try_create (50, abbrev_hash, abbrev_eq, NULL); + if (h == NULL) + dwz_oom (); + + while ((attr = read_uleb128 (ptr)) != 0) + { + int highest_implicit_value_ndx = -1; + unsigned int nattr = 0; + unsigned char *p = ptr; + + skip_leb128 (p); + p++; + while (read_uleb128 (p) != 0) + { + nattr++; + form = read_uleb128 (p); + if (form == DW_FORM_implicit_const) + { + skip_leb128 (p); + highest_implicit_value_ndx = nattr - 1; + } + else if (form == 2 + || (form > DW_FORM_flag_present + && !(form == DW_FORM_ref_sig8 + || form == DW_FORM_data16 + || form == DW_FORM_line_strp))) + { + error (0, 0, "%s: Unknown DWARF %s at .debug_abbrev [%zd]", + dso->filename, get_DW_FORM_str (form), + p - debug_sections[DEBUG_ABBREV].data); + htab_delete (h); + return NULL; + } + } + if (read_uleb128 (p) != 0) + { + error (0, 0, "%s: DWARF abbreviation does not end with 2 zeros", + dso->filename); + htab_delete (h); + return NULL; + } + + t = pool_alloc (abbrev_tag, + sizeof (*t) + nattr * sizeof (struct abbrev_attr) + + sizeof (int64_t) * (highest_implicit_value_ndx + 1)); + t->entry = attr; + t->hash = attr; + t->nattr = nattr; + t->nusers = 0; + t->tag = read_uleb128 (ptr); + t->children = *ptr++ == DW_CHILDREN_yes; + t->op_type_referenced = false; + t->values = (highest_implicit_value_ndx >= 0 + ? (int64_t *) &t->attr[nattr] : NULL); + nattr = 0; + while ((attr = read_uleb128 (ptr)) != 0) + { + form = read_uleb128 (ptr); + if (form == DW_FORM_implicit_const) + t->values[nattr] = read_sleb128 (ptr); + t->attr[nattr].attr = attr; + t->attr[nattr++].form = form; + } + skip_leb128 (ptr); + if (t->nattr > max_nattr) + max_nattr = t->nattr; + slot = htab_find_slot_with_hash (h, t, t->hash, INSERT); + if (slot == NULL) + { + htab_delete (h); + dwz_oom (); + } + if (*slot != NULL) + { + error (0, 0, "%s: Duplicate DWARF abbreviation %d", dso->filename, + t->entry); + htab_delete (h); + return NULL; + } + *slot = t; + } + + return h; +} + +/* For a die attribute with form FORM starting at PTR, with the die in CU, + return the pointer after the attribute, assuming FORM is not + dw_form_indirect. */ +static inline unsigned char * FORCE_INLINE +skip_attr_no_dw_form_indirect (unsigned int cu_version, uint32_t form, + unsigned char *ptr) +{ + size_t len = 0; + + switch (form) + { + case DW_FORM_ref_addr: + ptr += cu_version == 2 ? ptr_size : 4; + break; + case DW_FORM_addr: + ptr += ptr_size; + break; + case DW_FORM_flag_present: + case DW_FORM_implicit_const: + break; + case DW_FORM_ref1: + case DW_FORM_flag: + case DW_FORM_data1: + ++ptr; + break; + case DW_FORM_ref2: + case DW_FORM_data2: + ptr += 2; + break; + case DW_FORM_ref4: + case DW_FORM_data4: + case DW_FORM_sec_offset: + case DW_FORM_strp: + case DW_FORM_line_strp: + ptr += 4; + break; + case DW_FORM_ref8: + case DW_FORM_data8: + case DW_FORM_ref_sig8: + ptr += 8; + break; + case DW_FORM_data16: + ptr += 16; + break; + case DW_FORM_sdata: + case DW_FORM_ref_udata: + case DW_FORM_udata: + skip_leb128 (ptr); + break; + case DW_FORM_string: + ptr = (unsigned char *) strchr ((char *)ptr, '\0') + 1; + break; + case DW_FORM_indirect: + abort (); + case DW_FORM_block1: + len = *ptr++; + break; + case DW_FORM_block2: + len = read_16 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block4: + len = read_32 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block: + case DW_FORM_exprloc: + len = read_uleb128 (ptr); + form = DW_FORM_block1; + break; + default: + abort (); + } + + if (form == DW_FORM_block1) + ptr += len; + + return ptr; +} + +/* Read the directory and file table from .debug_line offset OFF, + record it in CU. */ +static int +read_debug_line (DSO *dso, dw_cu_ref cu, uint32_t off) +{ + unsigned char *ptr = debug_sections[DEBUG_LINE].data, *dir, *file; + unsigned char **dirt; + unsigned char *endsec = ptr + debug_sections[DEBUG_LINE].size; + unsigned char *endcu, *endprol; + unsigned char opcode_base; + unsigned int culen; + uint32_t value, version, ndirs, nfiles, dirt_cnt, file_cnt; + /* DWARF5 has a dynamic table of elements in possible different + forms. But we are only interested in the known elements (path, + dir index, time, size and possibly later md5). */ + unsigned char n, nelems = 0; + int path_ndx = -1; + int dir_ndx = -1; + int time_ndx = -1; + int size_ndx = -1; + uint16_t elems[256]; + + if (off >= debug_sections[DEBUG_LINE].size - 4) + { + error (0, 0, "%s: .debug_line reference above end of section", + dso->filename); + return 1; + } + + ptr += off; + + endcu = ptr + 4; + culen = read_32 (ptr); + if (culen >= 0xfffffff0) + { + error (0, 0, "%s: 64-bit DWARF not supported", dso->filename); + return 1; + } + endcu += culen; + + if (endcu > endsec) + { + error (0, 0, "%s: .debug_line CU does not fit into section", + dso->filename); + return 1; + } + + value = read_16 (ptr); + if (value < 2 || value > 5) + { + error (0, 0, "%s: DWARF version %d in .debug_line unhandled", + dso->filename, value); + return 1; + } + version = value; + + if (version < lowest_line_version) + lowest_line_version = version; + + if (version >= 5) + { + int addr_size, seg_size; + if (ptr + 2 > endcu) + { + error (0, 0, "%s: .debug_line header too short", dso->filename); + return 1; + } + addr_size = *ptr++; + seg_size = *ptr++; + if (addr_size != ptr_size) + { + error (0, 0, "%s: .debug_line address size differs from CU ptr size", + dso->filename); + return 1; + } + if (seg_size != 0) + { + error (0, 0, "%s: .debug_line non-zero segment selector size", + dso->filename); + return 1; + } + } + + endprol = ptr + 4; + endprol += read_32 (ptr); + if (endprol > endcu) + { + error (0, 0, "%s: .debug_line CU prologue does not fit into CU", + dso->filename); + return 1; + } + + opcode_base = ptr[4 + (version >= 4)]; + ptr = dir = ptr + 4 + (version >= 4) + opcode_base; + + /* dir table: */ + if (version < 5) + { + value = 1; + while (*ptr != 0) + { + ptr = (unsigned char *) strchr ((char *)ptr, 0) + 1; + ++value; + } + ndirs = value; + } + else + { + nelems = *ptr++; + for (n = 0; n < nelems; n++) + { + uint16_t lnct = read_uleb128 (ptr); + uint16_t form = read_uleb128 (ptr); + if (lnct == DW_LNCT_path) + { + if (path_ndx != -1) + { + error (0, 0, "%s: .debug_line duplicate dir path elements", + dso->filename); + return 1; + } + path_ndx = n; + } + else + { + error (0, 0, "%s: .debug_line unhandled dir element %s", + dso->filename, get_DW_LNCT_str (lnct)); + return 1; + } + + if (form != DW_FORM_string + && form != DW_FORM_strp + && form != DW_FORM_line_strp) + { + error (0, 0, "%s: .debug_line unhandled form %s for dir path", + dso->filename, get_DW_FORM_str (form)); + return 1; + } + + elems[n] = form; + } + + ndirs = read_uleb128 (ptr); + } + + dirt = (unsigned char **) alloca (ndirs * sizeof (unsigned char *)); + if (version < 5) + { + dirt[0] = NULL; + dirt_cnt = 1; + ptr = dir; + while (*ptr != 0) + { + dirt[dirt_cnt++] = ptr; + ptr = (unsigned char *) strchr ((char *)ptr, 0) + 1; + } + ptr++; + } + else + { + for (dirt_cnt = 0; dirt_cnt < ndirs; dirt_cnt++) + { + for (n = 0; n < nelems; n++) + { + uint32_t form = elems[n]; + if (n == path_ndx) + { + unsigned char *d; + switch (form) + { + case DW_FORM_string: + d = (unsigned char *) ptr; + break; + case DW_FORM_strp: + { + unsigned int strp = do_read_32 (ptr); + if (strp >= debug_sections[DEBUG_STR].size) + d = NULL; + else + d = ((unsigned char *) + debug_sections[DEBUG_STR].data + + strp); + } + break; + case DW_FORM_line_strp: + { + unsigned int line_strp = do_read_32 (ptr); + if (line_strp >= debug_sections[DEBUG_LINE_STR].size) + d = NULL; + else + d = ((unsigned char *) + debug_sections[DEBUG_LINE_STR].data + + line_strp); + } + break; + default: + d = NULL; + break; + } + + if (d == NULL) + { + error (0, 0, "%s: .debug_line bad dir path", + dso->filename); + return 1; + } + + /* Note we do this even for the zero entry, which is + marked as NULL for pre-DWARF5 line tables. This + is important for when we merge file entries + together for a multifile because the zero dir + entry could differ. It is should be equivalent + to the CU DIE comp_dir attribute, but we don't + track that all CUs referring to the (same) line + table share identical an DW_AT_comp_dir value. */ + dirt[dirt_cnt] = d; + } + ptr = skip_attr_no_dw_form_indirect (cu->cu_version, form, ptr); + } + } + } + + /* file table: */ + file = ptr; + if (version < 5) + { + file_cnt = 0; + while (*ptr != 0) + { + ptr = (unsigned char *) strchr ((char *)ptr, 0) + 1; + value = read_uleb128 (ptr); + + if (value >= dirt_cnt) + { + error (0, 0, "%s: Wrong directory table index %u", + dso->filename, value); + return 1; + } + + skip_leb128 (ptr); + skip_leb128 (ptr); + file_cnt++; + } + nfiles = file_cnt; + } + else + { + nelems = *ptr++; + path_ndx = -1; + for (n = 0; n < nelems; n++) + { + uint16_t lnct = read_uleb128 (ptr); + uint16_t form = read_uleb128 (ptr); + switch (lnct) + { + case DW_LNCT_path: + if (path_ndx != -1) + { + error (0, 0, + "%s: .debug_line duplicate file path elements", + dso->filename); + return 1; + } + path_ndx = n; + + /* Currently we only handle two string form which always + stay... */ + if (form != DW_FORM_string && form != DW_FORM_line_strp) + { + error (0, 0, + "%s: .debug_line unhandled form %s for file path", + dso->filename, get_DW_FORM_str (form)); + return 1; + } + break; + + case DW_LNCT_directory_index: + if (dir_ndx != -1) + { + error (0, 0, + "%s: .debug_line duplicate file dir elements", + dso->filename); + return 1; + } + dir_ndx = n; + + if (form != DW_FORM_data1 + && form != DW_FORM_data2 + && form != DW_FORM_udata) + { + error (0, 0, + "%s: .debug_line unhandled form %s for dir index", + dso->filename, get_DW_FORM_str (form)); + return 1; + } + break; + + case DW_LNCT_timestamp: + if (time_ndx != -1) + { + error (0, 0, + "%s: .debug_line duplicate file time elements", + dso->filename); + return 1; + } + time_ndx = n; + + if (form != DW_FORM_udata + && form != DW_FORM_data4 + && form != DW_FORM_data8) + { + error (0, 0, + "%s: .debug_line unhandled form %s for file time", + dso->filename, get_DW_FORM_str (form)); + return 1; + } + break; + + case DW_LNCT_size: + if (size_ndx != -1) + { + error (0, 0, + "%s: .debug_line duplicate file size elements", + dso->filename); + return 1; + } + size_ndx = n; + + if (form != DW_FORM_udata + && form != DW_FORM_data1 + && form != DW_FORM_data2 + && form != DW_FORM_data4 + && form != DW_FORM_data8) + { + error (0, 0, + "%s: .debug_line unhandled form %s for file size", + dso->filename, get_DW_FORM_str (form)); + return 1; + } + break; + + default: + error (0, 0, "%s: .debug_line unhandled file element %s", + dso->filename, get_DW_LNCT_str (lnct)); + return 1; + } + elems[n] = form; + } + + nfiles = read_uleb128 (ptr); + if (nfiles > 0) + nfiles--; /* We will skip the first (zero) entry. */ + } + + cu->cu_nfiles = nfiles; + cu->cu_files = pool_alloc (dw_file, nfiles * sizeof (struct dw_file)); + memset (cu->cu_files, 0, nfiles * sizeof (struct dw_file)); + + if (version < 5) + ptr = file; + + for (file_cnt = 0; file_cnt < nfiles; file_cnt++) + { + char *f = NULL; + char *end = NULL; + uint32_t d = 0; + uint64_t time = 0; + uint64_t size = 0; + if (version < 5) + { + f = (char *) ptr; + ptr = (unsigned char *) strchr ((char *)ptr, 0) + 1; + end = (char *) ptr; + d = read_uleb128 (ptr); + time = read_uleb128 (ptr); + size = read_uleb128 (ptr); + } + else + { + /* Skip zero entry. */ + if (file_cnt == 0) + for (n = 0; n < nelems; n++) + ptr = skip_attr_no_dw_form_indirect (cu->cu_version, + elems[n], ptr); + + for (n = 0; n < nelems; n++) + { + uint32_t form = elems[n]; + if (n == path_ndx) + { + switch (form) + { + case DW_FORM_string: + f = (char *) ptr; + end = strchr ((char *)ptr, 0) + 1; + break; + case DW_FORM_strp: + { + unsigned int strp = do_read_32 (ptr); + if (strp >= debug_sections[DEBUG_STR].size) + f = NULL; + else + { + f = ((char *) debug_sections[DEBUG_STR].data + + strp); + end = f + strlen (f) + 1; + } + } + break; + case DW_FORM_line_strp: + { + unsigned int line_strp = do_read_32 (ptr); + if (line_strp >= debug_sections[DEBUG_LINE_STR].size) + f = NULL; + else + { + f = ((char *) debug_sections[DEBUG_LINE_STR].data + + line_strp); + end = f + strlen (f) + 1; + } + } + break; + default: + f = NULL; + break; + } + + if (f == NULL) + { + error (0, 0, "%s: .debug_line bad file path", + dso->filename); + return 1; + } + } + else if (n == dir_ndx) + { + switch (form) + { + case DW_FORM_data1: + d = *ptr; + break; + case DW_FORM_data2: + d = do_read_16 (ptr); + break; + case DW_FORM_udata: + { + unsigned char *p = ptr; + d = read_uleb128 (p); + } + break; + } + } + ptr = skip_attr_no_dw_form_indirect (cu->cu_version, form, ptr); + } + } + + cu->cu_files[file_cnt].file = f; + if (d >= dirt_cnt) + { + error (0, 0, "%s: Wrong directory table index %u", + dso->filename, value); + return 1; + } + + cu->cu_files[file_cnt].dir = (char *) dirt[d]; + cu->cu_files[file_cnt].time = time; + cu->cu_files[file_cnt].size = size; + size_t file_len = (char *) end - f; + size_t strlen_file = file_len - 1; + bool file_has_slash = false; + if (cu->cu_files[file_cnt].file[0] != '/' + && cu->cu_files[file_cnt].dir != NULL) + { + size_t dir_len = strlen (cu->cu_files[file_cnt].dir); + if (dir_len) + { + obstack_grow (&ob, cu->cu_files[file_cnt].dir, + dir_len); + strlen_file += dir_len; + if (cu->cu_files[file_cnt].dir[dir_len - 1] != '/') + { + obstack_1grow (&ob, '/'); + strlen_file++; + } + file_has_slash = true; + obstack_grow (&ob, cu->cu_files[file_cnt].file, + file_len); + cu->cu_files[file_cnt].file + = (char *) obstack_finish (&ob); + cu->cu_files[file_cnt].dir = NULL; + } + } + cu->cu_files[file_cnt].file_angle_brackets_encapsulated_no_slash + = (!file_has_slash + && cu->cu_files[file_cnt].file[0] == '<' + && cu->cu_files[file_cnt].file[strlen_file - 1] == '>' + && strchr (cu->cu_files[file_cnt].file, '/') == NULL); + } + + return 0; +} + +/* Estimate the amount of DIEs in the .debug_info section, based on the size + of that section. */ +static unsigned int +estimate_nr_dies (void) +{ + unsigned int average_die_size = 11; + unsigned int nr_dies = debug_sections[DEBUG_INFO].size / average_die_size; + return nr_dies; +} + +static size_t +emulate_htab (size_t initial, size_t final_nr_elements) +{ + size_t size = initial; + + /* Emulate creation. */ + size = higher_prime_number (size); + + /* Emulate growing till htab contains find_nr_elements. */ + while (1) + { + /* Emulate expansion trigger. */ + size_t nr_elements = size * 3 / 4; + while (!(size * 3 <= nr_elements * 4)) + nr_elements++; + + if (nr_elements > final_nr_elements) + { + nr_elements = final_nr_elements; + break; + } + + /* Emulate expansion. */ + size = size * 2; + size = higher_prime_number (size); + } + + return size; +} + +/* Print hash table statistics for hash table HTAB with message string MSG. */ +static void +htab_report (htab_t htab, const char *msg) +{ + double collisions = htab_collisions (htab); + unsigned int searches = htab->searches; + size_t elements = htab->n_elements; + size_t deleted = htab->n_deleted; + size_t adjusted_elements = elements - deleted; + size_t size = htab->size; + double occupancy = (double)elements / (double)size; + double adjusted_occupancy = (double)adjusted_elements / (double)size; + /* Indent unconditional fprintfs similar to conditional fprintfs to + left-align literal strings. */ + if (1) + fprintf (stderr, "htab: %s\n", msg); + if (1) + fprintf (stderr, " size: %zu\n", size); + if (elements > 0 && deleted == 0) + fprintf (stderr, " elements: %zu, occupancy: %f\n", elements, + occupancy); + if (deleted > 0) + fprintf (stderr, " elements (incl. deleted): %zu, occupancy: %f\n", + elements, occupancy); + if (deleted > 0) + fprintf (stderr, " elements (excl. deleted): %zu, occupancy: %f\n", + adjusted_elements, adjusted_occupancy); + if (elements > 0) + fprintf (stderr, " searches: %u, collisions: %f\n", searches, + collisions); +} + +/* Hash function for off_htab hash table. */ +static hashval_t +off_hash (const void *p) +{ + dw_die_ref die = (dw_die_ref) p; + + return die->die_offset / 6; +} + +/* Equality function for off_htab hash table. */ +static int +off_eq (const void *p, const void *q) +{ + return ((dw_die_ref) p)->die_offset == ((dw_die_ref) q)->die_offset; +} + +/* Hash table to map die_offset values to struct dw_die pointers. */ +static htab_t off_htab; + +/* After read_multifile off_htab is copied over to this variable. + Offsets in the alternate .debug_info are found using this hash table. */ +static htab_t alt_off_htab; + +/* Offset hash table for .debug_types section. */ +static htab_t types_off_htab; + +/* Function to add DIE into the hash table (and create the hash table + when not already created). */ +static void +off_htab_add_die (dw_cu_ref cu, dw_die_ref die, unsigned int *die_count) +{ + void **slot; + + if (unlikely (cu->cu_kind == CU_TYPES)) + { + if (types_off_htab == NULL) + { + types_off_htab = htab_try_create (100000, off_hash, off_eq, NULL); + if (types_off_htab == NULL) + dwz_oom (); + } + + slot = htab_find_slot (types_off_htab, die, INSERT); + if (slot == NULL) + dwz_oom (); + assert (*slot == NULL); + *slot = die; + return; + } + + if (off_htab == NULL) + { + unsigned int estimated_nr_dies = estimate_nr_dies (); + size_t default_initial_size = 100000; + size_t initial_size; + if (low_mem + || op_multifile + || (multifile_mode == 0 + && die_count_method == estimate + && (estimated_nr_dies >= low_mem_die_limit + || estimated_nr_dies >= max_die_limit))) + initial_size = default_initial_size; + else + { + size_t nr_dies; + if (die_count && *die_count != 0) + { + nr_dies = *die_count; + if (tracing) + fprintf (stderr, "Using die count %zu for off_htab" + " allocation\n", nr_dies); + } + else if (die_count_method == none) + nr_dies = 0; + else if (die_count_method == estimate) + { + nr_dies = estimated_nr_dies; + if (tracing) + fprintf (stderr, "Using die count estimate %zu for off_htab" + " allocation\n", nr_dies); + } + else + assert (false); + + if (nr_dies != 0) + { + size_t final_hashtab_size + = emulate_htab (default_initial_size, nr_dies); + initial_size = final_hashtab_size; + } + else + initial_size = default_initial_size; + } + off_htab = htab_try_create (initial_size, off_hash, off_eq, NULL); + if (tracing) + htab_report (off_htab, "off_htab allocation"); + if (off_htab == NULL) + dwz_oom (); + if (rd_multifile) + alt_off_htab = off_htab; + } + + slot = htab_find_slot_with_hash (off_htab, die, off_hash (die), INSERT); + if (slot == NULL) + dwz_oom (); + assert (*slot == NULL); + *slot = die; +} + +/* For DIE_OFFSET return dw_die_ref whose die_offset field is equal + to that value. Return NULL if no DIE is at that position (buggy + DWARF input?). */ +static dw_die_ref +off_htab_lookup (dw_cu_ref cu, unsigned int die_offset) +{ + struct dw_die die; + die.die_offset = die_offset; + if (cu == NULL) + return (dw_die_ref) htab_find_with_hash (off_htab, &die, off_hash (&die)); + if (unlikely (cu->cu_kind == CU_ALT)) + return (dw_die_ref) htab_find_with_hash (alt_off_htab, &die, + off_hash (&die)); + if (unlikely (cu->cu_kind == CU_TYPES)) + return (dw_die_ref) htab_find_with_hash (types_off_htab, &die, + off_hash (&die)); + return (dw_die_ref) htab_find_with_hash (off_htab, &die, off_hash (&die)); +} + +/* For a die attribute ATTR starting at PTR, with the die in CU, return the + pointer after the attribute. */ +static inline unsigned char * FORCE_INLINE +skip_attr (unsigned int cu_version, struct abbrev_attr *attr, + unsigned char *ptr) +{ + uint32_t form = attr->form; + + while (form == DW_FORM_indirect) + form = read_uleb128 (ptr); + return skip_attr_no_dw_form_indirect (cu_version, form, ptr); +} + +/* Return a pointer at which DIE's attribute AT is encoded, and fill in + its form into *FORMP. Return NULL if the attribute is not present. */ +static unsigned char * +get_AT (dw_die_ref die, enum dwarf_attribute at, enum dwarf_form *formp) +{ + struct abbrev_tag *t = die->die_abbrev; + unsigned int i; + unsigned char *ptr; + dw_cu_ref cu = die_cu (die); + if (unlikely (fi_multifile) && cu->cu_kind == CU_ALT) + ptr = alt_data[DEBUG_INFO]; + else if (cu->cu_kind == CU_TYPES) + ptr = debug_sections[DEBUG_TYPES].data; + else + ptr = debug_sections[DEBUG_INFO].data; + ptr += die->die_offset; + skip_leb128 (ptr); + for (i = 0; i < t->nattr; ++i) + { + uint32_t form = t->attr[i].form; + + while (form == DW_FORM_indirect) + form = read_uleb128 (ptr); + if (t->attr[i].attr == at) + { + *formp = form; + if (form == DW_FORM_implicit_const) + return (unsigned char *) &t->values[i]; + return ptr; + } + + ptr = skip_attr_no_dw_form_indirect (cu->cu_version, form, ptr); + } + return NULL; +} + +/* Return an integer attribute AT of DIE. Set *PRESENT to true + if found. */ +static uint64_t +get_AT_int (dw_die_ref die, enum dwarf_attribute at, bool *present, + enum dwarf_form *formp) +{ + unsigned char *ptr; + ptr = get_AT (die, at, formp); + *present = false; + if (ptr == NULL) + return 0; + *present = true; + switch (*formp) + { + case DW_FORM_ref_addr: + return read_size (ptr, die_cu (die)->cu_version == 2 ? ptr_size : 4); + case DW_FORM_addr: + return read_size (ptr, ptr_size); + case DW_FORM_flag_present: + return 1; + case DW_FORM_ref1: + case DW_FORM_flag: + case DW_FORM_data1: + return read_8 (ptr); + case DW_FORM_ref2: + case DW_FORM_data2: + return read_16 (ptr); + case DW_FORM_ref4: + case DW_FORM_data4: + case DW_FORM_sec_offset: + return read_32 (ptr); + case DW_FORM_ref8: + case DW_FORM_data8: + case DW_FORM_ref_sig8: + return read_64 (ptr); + case DW_FORM_sdata: + return read_sleb128 (ptr); + case DW_FORM_ref_udata: + case DW_FORM_udata: + return read_uleb128 (ptr); + case DW_FORM_implicit_const: + return *(uint64_t *)ptr; /* See get_AT. */ + default: + *present = false; + return 0; + } +} + +/* Return a pointer to string attribute AT in DIE, or NULL + if the attribute is not present. */ +static char * +get_AT_string (dw_die_ref die, enum dwarf_attribute at) +{ + enum dwarf_form form; + unsigned char *ptr; + ptr = get_AT (die, at, &form); + if (ptr == NULL) + return NULL; + switch (form) + { + case DW_FORM_string: + return (char *) ptr; + case DW_FORM_strp: + { + unsigned int strp = read_32 (ptr); + if (unlikely (fi_multifile) && die_cu (die)->cu_kind == CU_ALT) + { + if (strp >= alt_size[DEBUG_STR]) + return NULL; + return (char *) alt_data[DEBUG_STR] + strp; + } + if (strp >= debug_sections[DEBUG_STR].size) + return NULL; + return (char *) debug_sections[DEBUG_STR].data + strp; + } + case DW_FORM_line_strp: + { + unsigned int line_strp = read_32 (ptr); + if (line_strp >= debug_sections[DEBUG_LINE_STR].size) + return NULL; + else + return (char *) debug_sections[DEBUG_LINE_STR].data + line_strp; + } + default: + return NULL; + } +} + +/* Parse DWARF expression referenced or stored in DIE, starting at + PTR with LEN bytes. Return non-zero on error. If NEED_ADJUST + is non-NULL, set *NEED_ADJUST to true if it contains DIE references + that will need adjusting. Some opcodes cause DIE or referenced + DIEs as unsuitable for moving into partial units, or limit their + location. */ +static int +read_exprloc (DSO *dso, dw_die_ref die, unsigned char *ptr, size_t len, + bool *need_adjust) +{ + unsigned char *end = ptr + len; + unsigned char op; + GElf_Addr addr; + dw_die_ref ref; + dw_cu_ref cu; + + while (ptr < end) + { + op = *ptr++; + switch (op) + { + case DW_OP_addr: + die->die_no_multifile = 1; + ptr += ptr_size; + break; + case DW_OP_deref: + case DW_OP_dup: + case DW_OP_drop: + case DW_OP_over: + case DW_OP_swap: + case DW_OP_rot: + case DW_OP_xderef: + case DW_OP_abs: + case DW_OP_and: + case DW_OP_div: + case DW_OP_minus: + case DW_OP_mod: + case DW_OP_mul: + case DW_OP_neg: + case DW_OP_not: + case DW_OP_or: + case DW_OP_plus: + case DW_OP_shl: + case DW_OP_shr: + case DW_OP_shra: + case DW_OP_xor: + case DW_OP_eq: + case DW_OP_ge: + case DW_OP_gt: + case DW_OP_le: + case DW_OP_lt: + case DW_OP_ne: + case DW_OP_lit0 ... DW_OP_lit31: + case DW_OP_reg0 ... DW_OP_reg31: + case DW_OP_nop: + case DW_OP_push_object_address: + case DW_OP_form_tls_address: + case DW_OP_call_frame_cfa: + case DW_OP_stack_value: + case DW_OP_GNU_push_tls_address: + case DW_OP_GNU_uninit: + break; + case DW_OP_const1u: + case DW_OP_pick: + case DW_OP_deref_size: + case DW_OP_xderef_size: + case DW_OP_const1s: + ++ptr; + break; + case DW_OP_const2u: + case DW_OP_const2s: + case DW_OP_skip: + case DW_OP_bra: + ptr += 2; + break; + case DW_OP_call2: + case DW_OP_call4: + case DW_OP_GNU_parameter_ref: + if (op == DW_OP_call2) + addr = read_16 (ptr); + else + addr = read_32 (ptr); + cu = die_cu (die); + ref = off_htab_lookup (cu, cu->cu_offset + addr); + if (ref == NULL) + { + error (0, 0, "%s: Couldn't find DIE at [%" PRIx64 "] " + "referenced by %s from DIE at [%x]", + dso->filename, cu->cu_offset + addr, + get_DW_OP_str (op), die->die_offset); + return 1; + } + if (op == DW_OP_call2) + ref->die_op_call2_referenced = 1; + if (ref->die_ck_state == CK_KNOWN) + { + dw_die_ref d; + ref->die_ck_state = CK_BAD; + + d = ref; + while (!d->die_root + && d->die_parent->die_ck_state == CK_KNOWN) + { + d = d->die_parent; + d->die_ck_state = CK_BAD; + } + } + else + ref->die_ck_state = CK_BAD; + if (unlikely (low_mem)) + { + ref->die_referenced = 1; + /* As .debug_loc adjustment is done after + write_info finishes, we need to keep the referenced + DIEs around uncollapsed. */ + if (need_adjust) + ref->die_intercu_referenced = 1; + } + die->die_ck_state = CK_BAD; + if (need_adjust) + *need_adjust = true; + break; + case DW_OP_const4u: + case DW_OP_const4s: + ptr += 4; + break; + case DW_OP_call_ref: + case DW_OP_GNU_implicit_pointer: + case DW_OP_implicit_pointer: + case DW_OP_GNU_variable_value: + cu = die_cu (die); + addr = read_size (ptr, cu->cu_version == 2 ? ptr_size : 4); + if (cu->cu_version == 2) + ptr += ptr_size; + else + ptr += 4; + ref = off_htab_lookup (NULL, addr); + if (ref == NULL || (unlikely (low_mem) && ref->die_tag == 0)) + { + error (0, 0, "%s: Couldn't find DIE at [%" PRIx64 "] " + "referenced by %s from DIE at [%x]", + dso->filename, addr, get_DW_OP_str (op), die->die_offset); + return 1; + } + ref->die_no_multifile = 1; + if (unlikely (low_mem)) + { + ref->die_referenced = 1; + /* As .debug_loc adjustment is done after + write_info finishes, we need to keep the referenced + DIEs around uncollapsed. */ + if (die_cu (ref) != cu || need_adjust) + ref->die_intercu_referenced = 1; + } + die->die_ck_state = CK_BAD; + if (need_adjust) + *need_adjust = true; + if (op == DW_OP_GNU_implicit_pointer || op == DW_OP_implicit_pointer) + skip_leb128 (ptr); + break; + case DW_OP_const8u: + case DW_OP_const8s: + ptr += 8; + break; + case DW_OP_constu: + case DW_OP_plus_uconst: + case DW_OP_regx: + case DW_OP_piece: + case DW_OP_consts: + case DW_OP_breg0 ... DW_OP_breg31: + case DW_OP_fbreg: + skip_leb128 (ptr); + break; + case DW_OP_bregx: + case DW_OP_bit_piece: + skip_leb128 (ptr); + skip_leb128 (ptr); + break; + case DW_OP_implicit_value: + { + uint32_t leni = read_uleb128 (ptr); + ptr += leni; + } + break; + case DW_OP_GNU_entry_value: + case DW_OP_entry_value: + { + uint32_t leni = read_uleb128 (ptr); + if ((uint64_t) (end - ptr) < leni) + { + error (0, 0, "%s: %s with too large length", + get_DW_OP_str (op), dso->filename); + return 1; + } + if (read_exprloc (dso, die, ptr, leni, need_adjust)) + return 1; + ptr += leni; + } + break; + case DW_OP_GNU_convert: + case DW_OP_convert: + case DW_OP_GNU_reinterpret: + case DW_OP_reinterpret: + addr = read_uleb128 (ptr); + if (addr == 0) + break; + goto typed_dwarf; + case DW_OP_GNU_regval_type: + case DW_OP_regval_type: + skip_leb128 (ptr); + addr = read_uleb128 (ptr); + goto typed_dwarf; + case DW_OP_GNU_const_type: + case DW_OP_const_type: + addr = read_uleb128 (ptr); + ptr += *ptr + 1; + goto typed_dwarf; + case DW_OP_GNU_deref_type: + case DW_OP_deref_type: + ++ptr; + addr = read_uleb128 (ptr); + typed_dwarf: + cu = die_cu (die); + ref = off_htab_lookup (cu, cu->cu_offset + addr); + if (ref == NULL) + { + error (0, 0, "%s: Couldn't find DIE at [%" PRIx64 "] " + "referenced by %s from DIE at [%x]", + dso->filename, cu->cu_offset + addr, + get_DW_OP_str (op), die->die_offset); + return 1; + } + if (unlikely (low_mem)) + { + ref->die_referenced = 1; + /* As .debug_loc adjustment is done after + write_info finishes, we need to keep the referenced + DIEs around uncollapsed. */ + if (need_adjust) + ref->die_intercu_referenced = 1; + } + ref->die_op_type_referenced = 1; + die->die_ck_state = CK_BAD; + if (need_adjust) + *need_adjust = true; + break; + default: + error (0, 0, "%s: Unknown DWARF %s " + "referenced from DIE at [%x]", + dso->filename, get_DW_OP_str (op), + die->die_offset); + return 1; + } + } + if (die->die_ck_state != CK_BAD) + die->u.p1.die_hash = iterative_hash (end - len, len, die->u.p1.die_hash); + return 0; +} + +/* Add dummy die in CU at OFFSET. */ +static inline void FORCE_INLINE +add_dummy_die (dw_cu_ref cu, unsigned int offset) +{ + dw_die_ref ref; + struct dw_die ref_buf; + void **slot; + + memset (&ref_buf, '\0', offsetof (struct dw_die, die_child)); + ref_buf.die_offset = offset; + ref_buf.die_collapsed_child = 1; + ref_buf.die_referenced = 1; + ref_buf.die_intercu_referenced = 1; + if (off_htab == NULL) + { + ref = pool_alloc (dw_die, offsetof (struct dw_die, die_child)); + memcpy (ref, &ref_buf, offsetof (struct dw_die, die_child)); + off_htab_add_die (cu, ref, NULL); + return; + } + + slot + = htab_find_slot_with_hash (off_htab, &ref_buf, off_hash (&ref_buf), + INSERT); + if (slot == NULL) + dwz_oom (); + if (*slot != NULL) + return; + + ref = pool_alloc (dw_die, offsetof (struct dw_die, die_child)); + memcpy (ref, &ref_buf, offsetof (struct dw_die, die_child)); + *slot = (void *) ref; +} + +/* Add dummy DIEs for expr_loc at PTR. */ +static int +read_exprloc_low_mem_phase1 (DSO *dso, dw_die_ref die, unsigned char *ptr, + size_t len) +{ + unsigned char *end = ptr + len; + unsigned char op; + GElf_Addr addr; + dw_cu_ref cu; + + while (ptr < end) + { + op = *ptr++; + switch (op) + { + case DW_OP_addr: + ptr += ptr_size; + break; + case DW_OP_deref: + case DW_OP_dup: + case DW_OP_drop: + case DW_OP_over: + case DW_OP_swap: + case DW_OP_rot: + case DW_OP_xderef: + case DW_OP_abs: + case DW_OP_and: + case DW_OP_div: + case DW_OP_minus: + case DW_OP_mod: + case DW_OP_mul: + case DW_OP_neg: + case DW_OP_not: + case DW_OP_or: + case DW_OP_plus: + case DW_OP_shl: + case DW_OP_shr: + case DW_OP_shra: + case DW_OP_xor: + case DW_OP_eq: + case DW_OP_ge: + case DW_OP_gt: + case DW_OP_le: + case DW_OP_lt: + case DW_OP_ne: + case DW_OP_lit0 ... DW_OP_lit31: + case DW_OP_reg0 ... DW_OP_reg31: + case DW_OP_nop: + case DW_OP_push_object_address: + case DW_OP_form_tls_address: + case DW_OP_call_frame_cfa: + case DW_OP_stack_value: + case DW_OP_GNU_push_tls_address: + case DW_OP_GNU_uninit: + break; + case DW_OP_const1u: + case DW_OP_pick: + case DW_OP_deref_size: + case DW_OP_xderef_size: + case DW_OP_const1s: + ++ptr; + break; + case DW_OP_const2u: + case DW_OP_const2s: + case DW_OP_skip: + case DW_OP_bra: + ptr += 2; + break; + case DW_OP_call2: + case DW_OP_call4: + case DW_OP_GNU_parameter_ref: + if (op == DW_OP_call2) + read_16 (ptr); + else + read_32 (ptr); + break; + case DW_OP_const4u: + case DW_OP_const4s: + ptr += 4; + break; + case DW_OP_call_ref: + case DW_OP_GNU_implicit_pointer: + case DW_OP_implicit_pointer: + case DW_OP_GNU_variable_value: + cu = die_cu (die); + addr = read_size (ptr, cu->cu_version == 2 ? ptr_size : 4); + if (cu->cu_version == 2) + ptr += ptr_size; + else + ptr += 4; + /* Adding a dummy DIE ref to mark an intercu reference is only + necessary if die_cu (ref) != cu, but we don't track cu's during + low-mem phase1. */ + add_dummy_die (cu, addr); + if (op == DW_OP_GNU_implicit_pointer || op == DW_OP_implicit_pointer) + skip_leb128 (ptr); + break; + case DW_OP_const8u: + case DW_OP_const8s: + ptr += 8; + break; + case DW_OP_constu: + case DW_OP_plus_uconst: + case DW_OP_regx: + case DW_OP_piece: + case DW_OP_consts: + case DW_OP_breg0 ... DW_OP_breg31: + case DW_OP_fbreg: + skip_leb128 (ptr); + break; + case DW_OP_bregx: + case DW_OP_bit_piece: + skip_leb128 (ptr); + skip_leb128 (ptr); + break; + case DW_OP_implicit_value: + { + uint32_t leni = read_uleb128 (ptr); + ptr += leni; + } + break; + case DW_OP_GNU_entry_value: + case DW_OP_entry_value: + { + uint32_t leni = read_uleb128 (ptr); + if ((uint64_t) (end - ptr) < leni) + { + error (0, 0, "%s: %s with too large length", + get_DW_OP_str (op), dso->filename); + return 1; + } + if (read_exprloc_low_mem_phase1 (dso, die, ptr, leni)) + return 1; + ptr += leni; + } + break; + case DW_OP_GNU_convert: + case DW_OP_convert: + case DW_OP_GNU_reinterpret: + case DW_OP_reinterpret: + skip_leb128 (ptr); + break; + case DW_OP_GNU_regval_type: + case DW_OP_regval_type: + skip_leb128 (ptr); + skip_leb128 (ptr); + break; + case DW_OP_GNU_const_type: + case DW_OP_const_type: + read_uleb128 (ptr); + ptr += *ptr + 1; + break; + case DW_OP_GNU_deref_type: + case DW_OP_deref_type: + ++ptr; + skip_leb128 (ptr); + break; + default: + error (0, 0, "%s: Unknown DWARF %s " + "referenced from DIE at [%x]", + dso->filename, get_DW_OP_str (op), + die->die_offset); + return 1; + } + } + + return 0; +} + +/* Add dummy DIEs for loclist at OFFSET. */ +static int +read_loclist_low_mem_phase1 (DSO *dso, dw_cu_ref cu, dw_die_ref die, + GElf_Addr offset) +{ + unsigned char *ptr, *endsec; + GElf_Addr low, high; + size_t len = 0; + int sec; + + sec = cu->cu_version < 5 ? DEBUG_LOC : DEBUG_LOCLISTS; + ptr = debug_sections[sec].data; + if (ptr == NULL) + { + error (0, 0, "%s: loclistptr attribute, yet no %s section", + dso->filename, debug_sections[sec].name); + return 1; + } + if (offset >= debug_sections[sec].size) + { + error (0, 0, + "%s: loclistptr offset %Ld outside of %s section", + dso->filename, (long long) offset, debug_sections[sec].name); + return 1; + } + endsec = ptr + debug_sections[sec].size; + ptr += offset; +again: + while (ptr < endsec) + { + if (sec == DEBUG_LOC) + { + low = read_size (ptr, ptr_size); + high = read_size (ptr + ptr_size, ptr_size); + ptr += 2 * ptr_size; + if (low == 0 && high == 0) + break; + + if (low == ~ (GElf_Addr) 0 || (ptr_size == 4 && low == 0xffffffff)) + continue; + + len = read_16 (ptr); + } + else + { + uint8_t lle = *ptr++; + switch (lle) + { + case DW_LLE_end_of_list: + goto done; + + case DW_LLE_base_addressx: + skip_leb128 (ptr); + goto again; + + case DW_LLE_startx_endx: + skip_leb128 (ptr); + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_startx_length: + skip_leb128 (ptr); + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_offset_pair: + skip_leb128 (ptr); + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_default_location: + len = read_uleb128 (ptr); + break; + + case DW_LLE_base_address: + ptr += ptr_size; + goto again; + + case DW_LLE_start_end: + ptr += 2 * ptr_size; + len = read_uleb128 (ptr); + break; + + case DW_LLE_start_length: + ptr += ptr_size; + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_GNU_view_pair: + if (cu->cu_version != 5) + error (0, 0, + "%s: DW_LLE_GNU_view_pair used with DWARF version %u", + dso->filename, cu->cu_version); + skip_leb128 (ptr); + skip_leb128 (ptr); + goto again; + + default: + error (0, 0, + "%s: unhandled location list entry 0x%x in %s section", + dso->filename, lle, debug_sections[sec].name); + return 1; + } + } + + if (unlikely (!(ptr + len <= endsec))) + { + error (0, 0, + "%s: locexpr length 0x%Lx exceeds %s section", + dso->filename, (long long) len, debug_sections[sec].name); + return 1; + } + + if (len > 0) + if (read_exprloc_low_mem_phase1 (dso, die, ptr, len)) + return 1; + + ptr += len; + } + +done: + return 0; +} + +/* Add dummy dies for loc_exprs and loc_lists referenced from DIE. */ +static int +add_locexpr_dummy_dies (DSO *dso, dw_cu_ref cu, dw_die_ref die, + unsigned char *ptr, uint32_t form, unsigned int attr, + size_t len) +{ + if (form == DW_FORM_block1 && cu->cu_version < 4) + { + /* Old DWARF uses blocks instead of exprlocs. */ + switch (attr) + { + case DW_AT_frame_base: + case DW_AT_location: + case DW_AT_data_member_location: + case DW_AT_vtable_elem_location: + case DW_AT_byte_size: + case DW_AT_bit_offset: + case DW_AT_bit_size: + case DW_AT_string_length: + case DW_AT_lower_bound: + case DW_AT_return_addr: + case DW_AT_bit_stride: + case DW_AT_upper_bound: + case DW_AT_count: + case DW_AT_segment: + case DW_AT_static_link: + case DW_AT_use_location: + case DW_AT_allocated: + case DW_AT_associated: + case DW_AT_data_location: + case DW_AT_byte_stride: + case DW_AT_rank: + case DW_AT_call_value: + case DW_AT_call_target: + case DW_AT_call_target_clobbered: + case DW_AT_call_data_location: + case DW_AT_call_data_value: + case DW_AT_GNU_call_site_value: + case DW_AT_GNU_call_site_data_value: + case DW_AT_GNU_call_site_target: + case DW_AT_GNU_call_site_target_clobbered: + if (read_exprloc_low_mem_phase1 (dso, die, ptr, len)) + return 1; + default: + break; + } + + return 0; + } + + if (form == DW_FORM_exprloc) + return read_exprloc_low_mem_phase1 (dso, die, ptr, len); + + switch (attr) + { + case DW_AT_location: + case DW_AT_string_length: + case DW_AT_return_addr: + case DW_AT_data_member_location: + case DW_AT_frame_base: + case DW_AT_segment: + case DW_AT_static_link: + case DW_AT_use_location: + case DW_AT_vtable_elem_location: + if ((cu->cu_version < 4 && form == DW_FORM_data4) + || form == DW_FORM_sec_offset) + { + if (read_loclist_low_mem_phase1 (dso, cu, die, do_read_32 (ptr))) + return 1; + break; + } + else if (cu->cu_version < 4 && form == DW_FORM_data8) + { + if (read_loclist_low_mem_phase1 (dso, cu, die, do_read_64 (ptr))) + return 1; + break; + } + break; + default: + break; + } + + return 0; +} + +/* Structure recording a portion of .debug_loc section that will need + adjusting. */ +struct debug_loc_adjust +{ + /* Starting offset in .debug_loc that needs adjusting. */ + unsigned int start_offset; + /* End offset. This is used for hashing, as in theory some DIE + might be referencing a middle of a .debug_loc sequence (the address + part of it) referenced by a different DIE. */ + unsigned int end_offset; + /* Owning CU. We give up if the same .debug_loc part that needs adjusting + is owned by more than one CU. */ + dw_cu_ref cu; +}; +ALIGN_STRUCT (debug_loc_adjust) + +/* Hash table and obstack for recording .debug_loc and .debug_loclists + adjustment ranges. */ +static htab_t loc_htab; +static htab_t loclists_htab; + +/* Hash function for loc[lists]_htab. */ +static hashval_t +loc_hash (const void *p) +{ + struct debug_loc_adjust *a = (struct debug_loc_adjust *)p; + + return a->end_offset; +} + +/* Equality function for loc[lists]_htab. */ +static int +loc_eq (const void *p, const void *q) +{ + struct debug_loc_adjust *t1 = (struct debug_loc_adjust *)p; + struct debug_loc_adjust *t2 = (struct debug_loc_adjust *)q; + + return t1->end_offset == t2->end_offset; +} + +/* Parse .debug_loc portion starting at OFFSET, referenced by + DIE. Call read_exprloc on each of the DWARF expressions + contained in it. */ +static int +read_loclist (DSO *dso, dw_cu_ref cu, dw_die_ref die, GElf_Addr offset) +{ + unsigned char *ptr, *endsec; + GElf_Addr low, high; + size_t len; + int sec; + bool need_adjust = false; + + die->die_ck_state = CK_BAD; + sec = cu->cu_version < 5 ? DEBUG_LOC : DEBUG_LOCLISTS; + ptr = debug_sections[sec].data; + if (ptr == NULL) + { + error (0, 0, "%s: loclistptr attribute, yet no %s section", + dso->filename, debug_sections[sec].name); + return 1; + } + if (offset >= debug_sections[sec].size) + { + error (0, 0, + "%s: loclistptr offset %Ld outside of %s section", + dso->filename, (long long) offset, debug_sections[sec].name); + return 1; + } + endsec = ptr + debug_sections[sec].size; + ptr += offset; +again: + while (ptr < endsec) + { + if (cu->cu_version < 5) + { + low = read_size (ptr, ptr_size); + high = read_size (ptr + ptr_size, ptr_size); + ptr += 2 * ptr_size; + if (low == 0 && high == 0) + break; + + if (low == ~ (GElf_Addr) 0 || (ptr_size == 4 && low == 0xffffffff)) + continue; + + len = read_16 (ptr); + } + else + { + uint8_t lle = *ptr++; + switch (lle) + { + case DW_LLE_end_of_list: + goto done; + + case DW_LLE_base_addressx: + skip_leb128 (ptr); + goto again; + + case DW_LLE_startx_endx: + skip_leb128 (ptr); + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_startx_length: + skip_leb128 (ptr); + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_offset_pair: + skip_leb128 (ptr); + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_default_location: + len = read_uleb128 (ptr); + break; + + case DW_LLE_base_address: + ptr += ptr_size; + goto again; + + case DW_LLE_start_end: + ptr += 2 * ptr_size; + len = read_uleb128 (ptr); + break; + + case DW_LLE_start_length: + ptr += ptr_size; + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_GNU_view_pair: + if (cu->cu_version != 5) + error (0, 0, + "%s: DW_LLE_GNU_view_pair used with DWARF version %u", + dso->filename, cu->cu_version); + skip_leb128 (ptr); + skip_leb128 (ptr); + goto again; + + default: + error (0, 0, + "%s: unhandled location list entry 0x%x in %s section", + dso->filename, lle, debug_sections[sec].name); + return 1; + } + } + + if (unlikely (!(ptr + len <= endsec))) + { + error (0, 0, + "%s: locexpr length 0x%Lx exceeds %s section", + dso->filename, (long long) len, debug_sections[sec].name); + return 1; + } + + if (read_exprloc (dso, die, ptr, len, &need_adjust)) + return 1; + + ptr += len; + } + +done: + if (need_adjust) + { + struct debug_loc_adjust adj, *a; + void **slot; + + adj.start_offset = offset; + adj.end_offset = ptr - debug_sections[sec].data; + adj.cu = cu; + if (sec == DEBUG_LOC) + { + if (loc_htab == NULL) + { + loc_htab = htab_try_create (50, loc_hash, loc_eq, NULL); + if (loc_htab == NULL) + dwz_oom (); + } + slot = htab_find_slot_with_hash (loc_htab, &adj, adj.end_offset, + INSERT); + } + else + { + if (loclists_htab == NULL) + { + loclists_htab = htab_try_create (50, loc_hash, loc_eq, NULL); + if (loclists_htab == NULL) + dwz_oom (); + } + slot = htab_find_slot_with_hash (loclists_htab, &adj, adj.end_offset, + INSERT); + } + if (slot == NULL) + dwz_oom (); + if (*slot == NULL) + { + a = pool_alloc (debug_loc_adjust, sizeof (*a)); + *a = adj; + *slot = (void *) a; + } + else if (((struct debug_loc_adjust *)*slot)->cu != adj.cu) + { + error (0, 0, "%s: can't adjust %s section because multiple " + "CUs refer to it", dso->filename, debug_sections[sec].name); + return 1; + } + else if (((struct debug_loc_adjust *)*slot)->start_offset > offset) + ((struct debug_loc_adjust *)*slot)->start_offset = offset; + } + + return 0; +} + +/* Initialize die_odr_state field for DIE with CU. */ +static void +set_die_odr_state (dw_cu_ref cu, dw_die_ref die) +{ + unsigned char *ptr; + struct abbrev_tag *t; + unsigned int i; + bool decl_p; + bool name_p; + bool other_p; + + assert (die->die_odr_state == ODR_UNKNOWN); + die->die_odr_state = ODR_NONE; + + if (low_mem) + /* Todo: allow low-mem mode. */ + return; + + if (multifile_mode == 0) + /* We're in regular mode, enable the ODR optimization. */ + ; + else + /* One definition rule does not hold across executables and shared + libraries, so disable. */ + return; + + if (!die->die_toplevel) + /* A nested struct is not uniquely identified by its name. There may be a + different type with the same name nested in a different struct. */ + return; + + switch (cu->lang) + { + case DW_LANG_C_plus_plus: + case DW_LANG_C_plus_plus_03: + case DW_LANG_C_plus_plus_11: + case DW_LANG_C_plus_plus_14: + /* c++ defines one-definition-rule. */ + if (die->die_tag == DW_TAG_structure_type + || die->die_tag == DW_TAG_class_type + || die->die_tag == DW_TAG_union_type) + /* ODR holds for all types, but we limit the optimization to these + tags, which are the ones likely to profit from it. */ + ; + else + return; + break; + default: + return; + } + + ptr = debug_sections[DEBUG_INFO].data + die->die_offset; + skip_leb128 (ptr); + + t = die->die_abbrev; + + decl_p = false; + name_p = false; + other_p = false; + for (i = 0; i < t->nattr; ++i) + { + if (t->attr[i].attr == DW_AT_name) + { + name_p = true; + continue; + } + + if (t->attr[i].attr == DW_AT_declaration) + { + decl_p = true; + continue; + } + + other_p = true; + } + + if (!name_p) + /* Ignore anonymous types. */ + return; + + odr_active_p = true; + + if (decl_p && !other_p && die->die_child == NULL) + { + /* Detected a declaration with no attributes other than DW_AT_name and + DW_AT_declaration, and no children. */ + die->die_odr_state = ODR_DECL; + return; + } + + die->die_odr_state = ODR_DEF; +} + +/* Return the initialized die_odr_state field for DIE with CU. */ +static unsigned int +die_odr_state (dw_die_ref die) +{ + assert (die->die_odr_state != ODR_UNKNOWN); + return die->die_odr_state; +} + +/* This function computes u.p1.die_hash and die_ck_state of DIE. + The field u.p1.die_hash is an iterative hash of: + - the die_tag, + - for all attributes except DW_AT_sibling: the attribute code, + - for non-reference class attributes: the value of the attribute (magic + for DW_AT_*_file), + - for DW_FORM_ref_addr attributes: the value of the attribute, + - for reference class attributes that point into the subtree of TOP_DIE + (note, other references are intentionally ignored here): + ref->u.p1.die_enter - top_die->u.p1.die_enter, + - for all children: their hashes. + The field die_ck_state is set to CK_BAD if the die is unsuitable for + moving into a partial unit (contains code references or other reasons). + TOP_DIE is initially NULL when DW_TAG_*_unit or die_named_namespace dies + are walked. */ +static int +checksum_die (DSO *dso, dw_cu_ref cu, dw_die_ref top_die, dw_die_ref die) +{ + unsigned short s; + struct abbrev_tag *t; + unsigned int i; + unsigned char *ptr; + dw_die_ref child; + bool only_hash_name_p; + hashval_t die_hash2; + + switch (die->die_ck_state) + { + case CK_UNKNOWN: + break; + case CK_KNOWN: + case CK_BAD: + return 0; + case CK_BEING_COMPUTED: + die->die_ck_state = CK_BAD; + return 0; + } + die->die_ck_state = CK_BEING_COMPUTED; + die->u.p1.die_hash = 0; + if (die->die_tag == DW_TAG_compile_unit + || die->die_tag == DW_TAG_partial_unit + || die->die_tag == DW_TAG_namespace + || die->die_tag == DW_TAG_module + || die->die_tag == DW_TAG_imported_unit) + die->die_ck_state = CK_BAD; + t = die->die_abbrev; + ptr = debug_sections[DEBUG_INFO].data + die->die_offset; + skip_leb128 (ptr); + s = die->die_tag; + die->u.p1.die_hash = iterative_hash_object (s, die->u.p1.die_hash); + if (dump_checksum_p) + fprintf (stderr, "DIE %x, hash: %x, tag\n", die->die_offset, + die->u.p1.die_hash); + if (uni_lang_p && die == top_die) + { + die->u.p1.die_hash + = iterative_hash_object (cu->lang, die->u.p1.die_hash); + if (dump_checksum_p) + fprintf (stderr, "DIE %x, hash: %x, lang\n", die->die_offset, + die->u.p1.die_hash); + } + + if (odr && die->die_odr_state == ODR_UNKNOWN) + set_die_odr_state (die_cu (die), die); + only_hash_name_p = odr && die_odr_state (die) != ODR_NONE; + die_hash2 = 0; + if (only_hash_name_p) + die_hash2 = die->u.p1.die_hash; + for (i = 0; i < t->nattr; ++i) + { + uint32_t form = t->attr[i].form; + size_t len = 0; + unsigned char *old_ptr; + bool handled = false; + int64_t svalue; + uint64_t value; + + while (form == DW_FORM_indirect) + form = read_uleb128 (ptr); + old_ptr = ptr; + + switch (t->attr[i].attr) + { + /* Ignore DW_AT_sibling attribute. */ + case DW_AT_sibling: + handled = true; + break; + /* These attributes reference code, prevent moving + DIEs with them. */ + case DW_AT_low_pc: + case DW_AT_high_pc: + case DW_AT_entry_pc: + case DW_AT_ranges: + case DW_AT_call_return_pc: + case DW_AT_call_pc: + die->die_ck_state = CK_BAD; + break; + case DW_AT_start_scope: + if (form == DW_FORM_sec_offset) + die->die_ck_state = CK_BAD; + break; + /* These attributes reference other sections, they + can't be moved to other files easily. */ + case DW_AT_stmt_list: + case DW_AT_macro_info: + case DW_AT_macros: + case DW_AT_GNU_macros: + if (!die->die_root) + die->die_no_multifile = 1; + break; + /* loclistptr attributes. */ + case DW_AT_location: + case DW_AT_string_length: + case DW_AT_return_addr: + case DW_AT_data_member_location: + case DW_AT_frame_base: + case DW_AT_segment: + case DW_AT_static_link: + case DW_AT_use_location: + case DW_AT_vtable_elem_location: + if ((cu->cu_version < 4 && form == DW_FORM_data4) + || form == DW_FORM_sec_offset) + { + if (read_loclist (dso, cu, die, read_32 (ptr))) + return 1; + ptr = old_ptr; + break; + } + else if (cu->cu_version < 4 && form == DW_FORM_data8) + { + if (read_loclist (dso, cu, die, read_64 (ptr))) + return 1; + ptr = old_ptr; + break; + } + break; + case DW_AT_decl_file: + case DW_AT_call_file: + switch (form) + { + case DW_FORM_data1: value = read_8 (ptr); handled = true; break; + case DW_FORM_data2: value = read_16 (ptr); handled = true; break; + case DW_FORM_data4: value = read_32 (ptr); handled = true; break; + case DW_FORM_data8: value = read_64 (ptr); handled = true; break; + case DW_FORM_udata: + value = read_uleb128 (ptr); handled = true; break; + case DW_FORM_sdata: + { + svalue = read_sleb128 (ptr); + if (svalue >= 0) + { + value = svalue; + handled = true; + break; + } + else + { + negative: + error (0, 0, "%s: negative value %" PRId64 " for %s", + dso->filename, svalue, + get_DW_AT_str (t->attr[i].attr)); + return 1; + } + } + case DW_FORM_implicit_const: + { + svalue = t->values[i]; + if (svalue >= 0) + { + value = svalue; + handled = true; + break; + } + else + goto negative; + } + default: + error (0, 0, "%s: Unhandled %s for %s", + dso->filename, get_DW_FORM_str (form), + get_DW_AT_str (t->attr[i].attr)); + return 1; + } + if (handled) + { + unsigned char *new_ptr = ptr; + ptr = old_ptr; + if (value > cu->cu_nfiles) + { + error (0, 0, "%s: Invalid %s file number %d", + dso->filename, get_DW_AT_str (t->attr[i].attr), + (int) value); + return 1; + } + if (value == 0) + handled = false; + else if (!ignore_locus && die->die_ck_state != CK_BAD) + { + struct dw_file *cu_file = &cu->cu_files[value - 1]; + size_t file_len = strlen (cu_file->file); + s = t->attr[i].attr; + hash_init_state (); + hash_update_state_object (die->u.p1.die_hash); + hash_update_state_object (s); + hash_update_state_object (cu_file->time); + hash_update_state_object (cu_file->size); + hash_update_state (cu_file->file, file_len + 1); + if (cu_file->dir) + { + hash_update_state (cu_file->dir, + strlen (cu_file->dir) + 1); + } + /* Ignore DW_AT_comp_dir for DW_AT_*_file <built-in> + etc. if immediately followed by DW_AT_*_line 0. */ + else if (cu_file->file_angle_brackets_encapsulated_no_slash + && i + 1 < t->nattr + && t->attr[i + 1].attr + == (t->attr[i].attr == DW_AT_decl_file + ? DW_AT_decl_line : DW_AT_call_line) + && t->attr[i + 1].form == DW_FORM_data1 + && *new_ptr == 0) + { + die->u.p1.die_hash = hash_digest (); + break; + } + + die->u.p1.die_hash = hash_digest (); + + if (cu->cu_comp_dir + && (cu_file->dir ? cu_file->dir[0] + : cu_file->file[0]) != '/') + die->u.p1.die_hash + = iterative_hash (cu->cu_comp_dir, + strlen (cu->cu_comp_dir) + 1, + die->u.p1.die_hash); + } + } + break; + case DW_AT_decl_line: + case DW_AT_decl_column: + case DW_AT_call_line: + case DW_AT_call_column: + if (ignore_locus) + { + handled = true; + break; + } + switch (form) + { + case DW_FORM_data1: value = read_8 (ptr); handled = true; break; + case DW_FORM_data2: value = read_16 (ptr); handled = true; break; + case DW_FORM_data4: value = read_32 (ptr); handled = true; break; + case DW_FORM_data8: value = read_64 (ptr); handled = true; break; + case DW_FORM_udata: + value = read_uleb128 (ptr); handled = true; break; + case DW_FORM_sdata: + { + svalue = read_sleb128 (ptr); + if (svalue >= 0) + { + value = svalue; + handled = true; + break; + } + else + goto negative; + } + case DW_FORM_implicit_const: + svalue = t->values[i]; + if (svalue >= 0) + { + value = svalue; + handled = true; + break; + } + else + goto negative; + default: + error (0, 0, "%s: Unhandled %s for %s", + dso->filename, get_DW_FORM_str (form), + get_DW_AT_str (t->attr[i].attr)); + return 1; + } + if (handled) + { + ptr = old_ptr; + s = t->attr[i].attr; + die->u.p1.die_hash + = iterative_hash_object (s, die->u.p1.die_hash); + die->u.p1.die_hash + = iterative_hash_object (value, die->u.p1.die_hash); + } + break; + default: + break; + } + + switch (form) + { + case DW_FORM_ref_addr: + if (unlikely (op_multifile || rd_multifile || fi_multifile)) + { + dw_die_ref ref; + + value = read_size (ptr, cu->cu_version == 2 + ? ptr_size : 4); + ptr += cu->cu_version == 2 ? ptr_size : 4; + if (die->die_ck_state != CK_BAD) + { + s = t->attr[i].attr; + die->u.p1.die_hash + = iterative_hash_object (s, die->u.p1.die_hash); + } + ref = off_htab_lookup (cu, value); + if (ref == NULL) + { + error (0, 0, "%s: Couldn't find DIE at [%" PRIx64 "] " + "referenced by %s from DIE at [%x]", + dso->filename, value, + get_DW_AT_str (t->attr[i].attr), die->die_offset); + return 1; + } + if (unlikely (op_multifile) && ref->die_collapsed_child) + ref = ref->die_parent; + if (cu == die_cu (ref)) + { + /* The reference was encoded using a section-relative + encoding, while if it could have been encoded using + CU-relative encoding. Typically, the latter is used, + because: + - it's potentially smaller, and + - it doesn't require a link-time relocation. */ + + /* Assert that the multifile only contains section-relative + encoding when necessary. */ + assert (!op_multifile && !rd_multifile); + + if (fi_multifile) + { + /* It's possible that the input DWARF contains this + sub-optimal reference. We currently don't optimize + this during single-file optimization, so it will still + be there during finalize_multifile. Bail out to handle + this conservatively. */ + die->die_ck_state = CK_BAD; + return 0; + } + } + /* Assert that during op_multifile, die belongs to the same object + as ref. */ + assert (!op_multifile || cu->cu_chunk == die_cu (ref)->cu_chunk); + handled = true; + break; + } + die->die_no_multifile = 1; + ptr += cu->cu_version == 2 ? ptr_size : 4; + break; + case DW_FORM_addr: + die->die_no_multifile = 1; + ptr += ptr_size; + break; + case DW_FORM_flag_present: + break; + case DW_FORM_implicit_const: + if (!handled && die->die_ck_state != CK_BAD) + { + handled = true; + s = t->attr[i].attr; + die->u.p1.die_hash + = iterative_hash_object (s, die->u.p1.die_hash); + die->u.p1.die_hash + = iterative_hash_object (t->values[i], die->u.p1.die_hash); + } + break; + case DW_FORM_flag: + case DW_FORM_data1: + ++ptr; + break; + case DW_FORM_data2: + ptr += 2; + break; + case DW_FORM_data4: + case DW_FORM_sec_offset: + ptr += 4; + break; + case DW_FORM_data8: + ptr += 8; + break; + case DW_FORM_data16: + ptr += 16; + break; + case DW_FORM_ref_sig8: + die->die_no_multifile = 1; + ptr += 8; + break; + case DW_FORM_sdata: + case DW_FORM_udata: + skip_leb128 (ptr); + break; + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + switch (form) + { + case DW_FORM_ref_udata: value = read_uleb128 (ptr); break; + case DW_FORM_ref1: value = read_8 (ptr); break; + case DW_FORM_ref2: value = read_16 (ptr); break; + case DW_FORM_ref4: value = read_32 (ptr); break; + case DW_FORM_ref8: value = read_64 (ptr); break; + default: abort (); + } + if (!handled) + { + dw_die_ref ref + = off_htab_lookup (cu, cu->cu_offset + value); + if (ref == NULL) + { + error (0, 0, "%s: Couldn't find DIE at [%" PRIx64 "] " + "referenced by %s from DIE at [%x]", + dso->filename, cu->cu_offset + value, + get_DW_AT_str (t->attr[i].attr), die->die_offset); + return 1; + } + if (die->die_ck_state != CK_BAD) + { + s = t->attr[i].attr; + die->u.p1.die_hash + = iterative_hash_object (s, die->u.p1.die_hash); + } + if (top_die + && !ref->die_collapsed_child + && ref->u.p1.die_enter >= top_die->u.p1.die_enter + && ref->u.p1.die_exit <= top_die->u.p1.die_exit) + { + if (die->die_ck_state != CK_BAD) + { + unsigned int val + = ref->u.p1.die_enter - top_die->u.p1.die_enter; + die->u.p1.die_hash + = iterative_hash_object (val, die->u.p1.die_hash); + } + } + handled = true; + } + break; + case DW_FORM_strp: + if (unlikely (op_multifile || rd_multifile || fi_multifile) + && die->die_ck_state != CK_BAD) + { + value = read_32 (ptr); + if (value >= debug_sections[DEBUG_STR].size) + die->die_ck_state = CK_BAD; + else + { + unsigned char *p = debug_sections[DEBUG_STR].data + value; + unsigned int l = strlen ((char *) p) + 1; + s = t->attr[i].attr; + die->u.p1.die_hash + = iterative_hash_object (s, die->u.p1.die_hash); + die->u.p1.die_hash + = iterative_hash (p, l, die->u.p1.die_hash); + handled = true; + } + } + else + { + ptr += 4; + if (only_hash_name_p && t->attr[i].attr == DW_AT_name) + { + s = t->attr[i].attr; + die_hash2 = iterative_hash_object (s, die_hash2); + die_hash2 + = iterative_hash (old_ptr, ptr - old_ptr, die_hash2); + } + } + break; + case DW_FORM_line_strp: + /* There is no .debug_line_str in the alt file, so we cannot + move this DIE unless we change the string reference. + This is not that bad because DW_FORM_line_strp is often + only used in the CU DIE for file name and comp_dir and we + don't move the CU DIE anyway. */ + die->die_ck_state = CK_BAD; + break; + case DW_FORM_string: + ptr = (unsigned char *) strchr ((char *)ptr, '\0') + 1; + if (only_hash_name_p && t->attr[i].attr == DW_AT_name) + { + s = t->attr[i].attr; + die_hash2 = iterative_hash_object (s, die_hash2); + die_hash2 + = iterative_hash (old_ptr, ptr - old_ptr, die_hash2); + } + break; + case DW_FORM_indirect: + abort (); + case DW_FORM_block1: + len = *ptr++; + break; + case DW_FORM_block2: + len = read_16 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block4: + len = read_32 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block: + len = read_uleb128 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_exprloc: + len = read_uleb128 (ptr); + break; + default: + abort (); + } + + if (form == DW_FORM_block1 && cu->cu_version < 4) + { + /* Old DWARF uses blocks instead of exprlocs. */ + switch (t->attr[i].attr) + { + case DW_AT_frame_base: + case DW_AT_location: + case DW_AT_data_member_location: + case DW_AT_vtable_elem_location: + case DW_AT_byte_size: + case DW_AT_bit_offset: + case DW_AT_bit_size: + case DW_AT_string_length: + case DW_AT_lower_bound: + case DW_AT_return_addr: + case DW_AT_bit_stride: + case DW_AT_upper_bound: + case DW_AT_count: + case DW_AT_segment: + case DW_AT_static_link: + case DW_AT_use_location: + case DW_AT_allocated: + case DW_AT_associated: + case DW_AT_data_location: + case DW_AT_byte_stride: + case DW_AT_rank: + case DW_AT_call_value: + case DW_AT_call_target: + case DW_AT_call_target_clobbered: + case DW_AT_call_data_location: + case DW_AT_call_data_value: + case DW_AT_GNU_call_site_value: + case DW_AT_GNU_call_site_data_value: + case DW_AT_GNU_call_site_target: + case DW_AT_GNU_call_site_target_clobbered: + if (die->die_ck_state != CK_BAD) + { + s = t->attr[i].attr; + die->u.p1.die_hash + = iterative_hash_object (s, die->u.p1.die_hash); + } + if (read_exprloc (dso, die, ptr, len, NULL)) + return 1; + handled = true; + default: + break; + } + } + else if (form == DW_FORM_exprloc) + { + if (die->die_ck_state != CK_BAD) + { + s = t->attr[i].attr; + die->u.p1.die_hash + = iterative_hash_object (s, die->u.p1.die_hash); + } + if (read_exprloc (dso, die, ptr, len, NULL)) + return 1; + handled = true; + } + ptr += len; /* Skip expr/blocks. */ + if (!handled && die->die_ck_state != CK_BAD) + { + s = t->attr[i].attr; + die->u.p1.die_hash = iterative_hash_object (s, die->u.p1.die_hash); + die->u.p1.die_hash + = iterative_hash (old_ptr, ptr - old_ptr, die->u.p1.die_hash); + } + + if (dump_checksum_p) + fprintf (stderr, "DIE %x, hash: %x, attr (%d)\n", die->die_offset, + die->u.p1.die_hash, i); + } + + for (child = die->die_child, i = 0; child; child = child->die_sib, ++i) + if (checksum_die (dso, cu, + top_die ? top_die + : child->die_named_namespace + ? NULL : child, child)) + return 1; + else if (die->die_ck_state != CK_BAD) + { + if (child->die_ck_state == CK_KNOWN) + { + die->u.p1.die_hash + = iterative_hash_object (child->u.p1.die_hash, + die->u.p1.die_hash); + if (dump_checksum_p) + fprintf (stderr, "DIE %x, hash: %x, child (%i)\n", + die->die_offset, die->u.p1.die_hash, i); + die->die_no_multifile + |= child->die_no_multifile; + } + else + die->die_ck_state = CK_BAD; + } + if (die->die_ck_state == CK_BEING_COMPUTED) + die->die_ck_state = CK_KNOWN; + + if (dump_checksum_p) + fprintf (stderr, "DIE %x, hash: %x, final\n", die->die_offset, + die->u.p1.die_hash); + + if (only_hash_name_p) + { + unsigned int tmp = die->u.p1.die_hash; + die->u.p1.die_hash = die_hash2; + die->u.p1.die_hash2 = tmp; + } + + return 0; +} + +/* Helper function for checksum_ref_die to sort DIE pointers + by increasing u.p1.die_hash. */ +static int +checksum_ref_die_cmp (const void *p, const void *q) +{ + dw_die_ref die1 = *(dw_die_ref *)p; + dw_die_ref die2 = *(dw_die_ref *)q; + if (die1->u.p1.die_hash < die2->u.p1.die_hash) + return -1; + if (die1->u.p1.die_hash > die2->u.p1.die_hash) + return 1; + /* The rest is just to keep the sort stable. If there is more than + one DIE with the same hash, we don't consider any of them as suitable + starting point for the walk. */ + if (die1->die_offset < die2->die_offset) + return -1; + if (die1->die_offset > die2->die_offset) + return 1; + return 0; +} + +/* This function is the second phase of hash computation, which computes + u.p1.die_ref_hash after u.p1.die_hash has been computed. + u.p1.die_ref_hash is an iterative hash of the references (other than + those checksummed already into u.p1.die_hash by checksum_die). + u.p1.die_ref_hash is only computed for the toplevel DIEs, i.e. children + of DW_TAG_*_unit or die_named_namespace DIEs. So, in the graph + containing DIEs as nodes and parent<->child and referrer<->referree edges + we virtually coalesce all children of toplevel DIEs into the + corresponding toplevel DIE ultimate parent node. The function has 4 + modes of operation: + + The first one is when TOP_DIE, SECOND_IDX and SECOND_HASH are all NULL, + this is when we walk through DW_TAG_*_unit and die_named_namespace DIEs + to reach their children. + + The second mode of operation is with TOP_DIE != NULL and both SECOND_IDX + and SECOND_HASH NULL. In this mode we optimistically assume there are no + cycles in the graph, first hash into TOP_DIE's u.p1.die_ref_hash its + u.p1.die_hash, push the TOP_DIE into a vector (in OB obstack), for each + reference if the referree isn't already toplevel DIE find its + (grand)*parent that is a toplevel DIE, recurse on that and if it computed + the referree toplevel DIE's u.p1.die_ref_hash (i.e. no cycle), + iteratively hash in the referree toplevel DIE's u.p1.die_ref_hash (and, + if referree isn't toplevel, before that also its relative position in the + subtree). When existing, remove the TOP_DIE from the vector and set + die_ref_hash_computed to note that it is computed and doesn't have to be + computed again. If there are no cycles, the return value of the function + is 0. If a cycle is found, things are more complicated. We can't just + not walk into DIEs we've already seen and compute u.p1.die_ref_hash for + toplevel DIEs on the cycle(s), because in different CUs matching cycles + might be starting computation of the hash from different nodes on the + cycle (the order of children of DW_TAG_*_unit or DW_TAG_namespace is + usually not significant in DWARF). So, if a cycle is found, the return + value is a minimum of the die_ref_seen indexes (positions in the + vector); at that point it makes no sense to further compute + u.p1.die_ref_hash of the toplevel DIEs on the cycle, but for references + to acyclic subgraphs we still continue computing their u.p1.die_ref_hash. + For DIEs on the cycle(s) pointers to them aren't immediately removed from + the vector and everything is handled only after reaching the TOP_DIE with + die_ref_seen equal to the minimum vector index (i.e. the first of + the DIEs on the cycle(s) we've seen). At this point in the vector + starting with that index should be a list of DIEs on the cycle, and all + references to (toplevel) DIEs not on that list from those DIEs should + have die_ref_hash_computed already set. If the cycle has matches in + different CUs, we should have the same set of u.p1.die_hash values in the + list in between all those CUs, but the order might be different. At this + point we try to find a DIE from which to start walk using third mode of + operation of this function. We can't base that decision on e.g. + die_offset, as it may be not just different between the CUs, but the + matching DIEs might be in different relative orders. So we look if there + is just a single DIE with lowest u.p1.die_hash value and use that in that + case, (and if not, look if there is just a single DIE with second lowest + u.p1.die_hash and so on up to 20th). If none is found, the more + expensive 4th mode of operation is used instead. + + The third mode of operation is when TOP_DIE, SECOND_IDX and SECOND_HASH + are all non-NULL. This mode is used when the initial TOP_DIE is + a uniquely chosen DIE on the cycle (same in each CU that has + matching cycle). In this mode into each TOP_DIE's u.p1.die_ref_hash + we hash in *SECOND_IDX (counter when in that walk the DIE has been + seen first) and relative referree positions in subtree, and hash in + referree toplevel u.p1.die_ref_hash into *SECOND_HASH, and finally + when the walk finishes, the caller will compute the final + u.p1.die_ref_hash for DIEs on the cycle(s) from their intermediate + u.p1.die_ref_hash and *SECOND_HASH. + + The last mode of operation is when TOP_DIE and SECOND_HASH + are non-NULL, but SECOND_IDX is NULL. This mode is used when no + suitable DIE from which to start walking the cycle has been discovered. + In that case we for each DIE on the cycle walk everything that hasn't + die_ref_hash_computed yet, for DIEs seen that have die_ref_hash_computed + hash in their u.p1.die_ref_hash, otherwise (DIEs on the current cycle(s)) + hash in their u.p1.die_hash. */ +static unsigned int +checksum_ref_die (dw_cu_ref cu, dw_die_ref top_die, dw_die_ref die, + unsigned int *second_idx, hashval_t *second_hash) +{ + struct abbrev_tag *t; + unsigned int i, ret = 0; + unsigned char *ptr; + dw_die_ref child; + + if (top_die == die) + { + if (die->die_ref_hash_computed) + return 0; + if (die->die_ck_state != CK_KNOWN) + return 0; + if (die->die_ref_seen) + return second_hash != NULL ? 0 : die->die_ref_seen; + if (second_hash != NULL) + { + die->die_ref_seen = 1; + if (second_idx != NULL) + { + die->u.p1.die_ref_hash + = iterative_hash_object (*second_idx, die->u.p1.die_hash); + (*second_idx)++; + } + } + else + { + die->die_ref_seen + = obstack_object_size (&ob) / sizeof (void *) + 1; + obstack_ptr_grow (&ob, die); + die->u.p1.die_ref_hash = die->u.p1.die_hash; + } + } + else + assert (top_die == NULL || die->die_ck_state == CK_KNOWN); + t = die->die_abbrev; + for (i = 0; i < t->nattr; ++i) + if (t->attr[i].attr != DW_AT_sibling) + switch (t->attr[i].form) + { + case DW_FORM_ref_addr: + if (unlikely (op_multifile || rd_multifile || fi_multifile)) + i = -2U; + break; + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + case DW_FORM_indirect: + i = -2U; + break; + } + if (i == -1U) + { + ptr = debug_sections[DEBUG_INFO].data + die->die_offset; + skip_leb128 (ptr); + for (i = 0; i < t->nattr; ++i) + { + uint32_t form = t->attr[i].form; + size_t len = 0; + uint64_t value; + dw_die_ref ref, reft; + + while (form == DW_FORM_indirect) + form = read_uleb128 (ptr); + + switch (form) + { + case DW_FORM_ref_addr: + if (unlikely (op_multifile || rd_multifile || fi_multifile)) + { + value = read_size (ptr, cu->cu_version == 2 ? ptr_size : 4); + ptr += cu->cu_version == 2 ? ptr_size : 4; + assert (t->attr[i].attr != DW_AT_sibling); + if (top_die == NULL) + break; + ref = off_htab_lookup (cu, value); + goto finish_ref; + } + ptr += cu->cu_version == 2 ? ptr_size : 4; + break; + case DW_FORM_addr: + ptr += ptr_size; + break; + case DW_FORM_flag_present: + case DW_FORM_implicit_const: + break; + case DW_FORM_flag: + case DW_FORM_data1: + ++ptr; + break; + case DW_FORM_data2: + ptr += 2; + break; + case DW_FORM_data4: + case DW_FORM_sec_offset: + case DW_FORM_strp: + case DW_FORM_line_strp: + ptr += 4; + break; + case DW_FORM_data8: + case DW_FORM_ref_sig8: + ptr += 8; + break; + case DW_FORM_data16: + ptr += 16; + break; + case DW_FORM_sdata: + case DW_FORM_udata: + skip_leb128 (ptr); + break; + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + switch (form) + { + case DW_FORM_ref_udata: value = read_uleb128 (ptr); break; + case DW_FORM_ref1: value = read_8 (ptr); break; + case DW_FORM_ref2: value = read_16 (ptr); break; + case DW_FORM_ref4: value = read_32 (ptr); break; + case DW_FORM_ref8: value = read_64 (ptr); break; + default: abort (); + } + if (t->attr[i].attr == DW_AT_sibling || top_die == NULL) + break; + ref = off_htab_lookup (cu, cu->cu_offset + value); + if (ref->u.p1.die_enter >= top_die->u.p1.die_enter + && ref->u.p1.die_exit <= top_die->u.p1.die_exit) + break; + finish_ref: + reft = ref; + while (!reft->die_root + && reft->die_parent->die_tag != DW_TAG_compile_unit + && reft->die_parent->die_tag != DW_TAG_partial_unit + && !reft->die_parent->die_named_namespace) + reft = reft->die_parent; + if (reft->die_ck_state != CK_KNOWN || reft->die_root) + top_die->die_ck_state = CK_BAD; + else + { + unsigned int r = checksum_ref_die (die_cu (reft), reft, reft, + second_idx, second_hash); + if (ret == 0 || (r && r < ret)) + ret = r; + if (reft->die_ck_state != CK_KNOWN) + top_die->die_ck_state = CK_BAD; + else + top_die->die_no_multifile |= reft->die_no_multifile; + } + if (top_die->die_ck_state == CK_BAD) + { + if (top_die != die) + return ret; + i = t->nattr - 1; + break; + } + if (ret) + break; + if (reft != ref) + { + unsigned int val + = ref->u.p1.die_enter - reft->u.p1.die_enter; + if (second_hash != NULL && second_idx == NULL) + *second_hash + = iterative_hash_object (val, *second_hash); + else + top_die->u.p1.die_ref_hash + = iterative_hash_object (val, + top_die->u.p1.die_ref_hash); + } + if (second_hash) + { + if (second_idx == NULL && !reft->die_ref_hash_computed) + *second_hash + = iterative_hash_object (reft->u.p1.die_hash, + *second_hash); + else + *second_hash + = iterative_hash_object (reft->u.p1.die_ref_hash, + *second_hash); + } + else + top_die->u.p1.die_ref_hash + = iterative_hash_object (reft->u.p1.die_ref_hash, + top_die->u.p1.die_ref_hash); + break; + case DW_FORM_string: + ptr = (unsigned char *) strchr ((char *)ptr, '\0') + 1; + break; + case DW_FORM_indirect: + abort (); + case DW_FORM_block1: + len = *ptr++; + break; + case DW_FORM_block2: + len = read_16 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block4: + len = read_32 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block: + case DW_FORM_exprloc: + len = read_uleb128 (ptr); + form = DW_FORM_block1; + break; + default: + abort (); + } + + if (form == DW_FORM_block1) + ptr += len; + } + } + + if (top_die == NULL || top_die->die_ck_state != CK_BAD) + { + for (child = die->die_child; child; child = child->die_sib) + { + unsigned int r + = checksum_ref_die (cu, + top_die ? top_die + : child->die_named_namespace + ? NULL : child, child, + second_idx, second_hash); + if (top_die == NULL) + assert (r == 0 && obstack_object_size (&ob) == 0); + + if (ret == 0 || (r && r < ret)) + ret = r; + if (top_die && top_die->die_ck_state == CK_BAD) + break; + } + } + + if (top_die == die) + { + if (ret == 0) + { + if (second_hash != NULL) + return 0; + die->die_ref_seen = 0; + die->die_ref_hash_computed = 1; + obstack_blank_fast (&ob, -(int) sizeof (void *)); + return 0; + } + assert (ret <= die->die_ref_seen); + if (ret == die->die_ref_seen) + { + unsigned int first = die->die_ref_seen - 1; + dw_die_ref *arr; + unsigned int count + = obstack_object_size (&ob) / sizeof (void *) - first; + unsigned int idx, minidx; + hashval_t ref_hash = 0; + bool bad = false; + bool no_multifile = false; + + arr = (dw_die_ref *) obstack_base (&ob) + first; + for (i = 0; i < count; i++) + { + arr[i]->die_ref_seen = 0; + if (arr[i]->die_ck_state == CK_BAD) + bad = true; + else if (arr[i]->die_no_multifile) + no_multifile = true; + } + if (bad) + { + for (i = 0; i < count; i++) + arr[i]->die_ck_state = CK_BAD; + obstack_blank_fast (&ob, -(int) (count * sizeof (void *))); + return 0; + } + /* Find the DIE in the array with the smallest u.p1.die_hash. */ + for (i = 0, minidx = -1U, bad = true; i < count; i++) + { + if (no_multifile) + arr[i]->die_no_multifile = 1; + if (minidx == -1U + || arr[i]->u.p1.die_hash < arr[minidx]->u.p1.die_hash) + { + minidx = i; + bad = false; + } + else if (arr[i]->u.p1.die_hash == arr[minidx]->u.p1.die_hash) + bad = true; + } + if (bad) + { + unsigned int iter, limv; + /* If there is more than one smallest u.p1.die_hash, + look for second (up to 6th) smallest u.p1.die_hash + if there is just one of that value. */ + for (iter = 0; iter < 5; iter++) + { + limv = arr[minidx]->u.p1.die_hash; + for (i = 0, minidx = -1U, bad = true; i < count; i++) + if (arr[i]->u.p1.die_hash <= limv) + continue; + else if (minidx == -1U + || arr[i]->u.p1.die_hash + < arr[minidx]->u.p1.die_hash) + { + minidx = i; + bad = false; + } + else if (arr[i]->u.p1.die_hash + == arr[minidx]->u.p1.die_hash) + bad = true; + if (minidx == -1U || !bad) + break; + } + /* If all of 1st to 6th smallest u.p1.die_hash has more than + one DIE with that u.p1.die_hash, sort the array and find + the smallest u.p1.die_hash that only a single DIE has. */ + if (minidx != -1U && iter == 5) + { + unsigned int j; + qsort (arr, count, sizeof (void *), checksum_ref_die_cmp); + for (i = 0, minidx = -1U; i < count; i = j) + { + if (i + 1 == count + || arr[i + 1]->u.p1.die_hash + != arr[i]->u.p1.die_hash) + { + minidx = i; + break; + } + for (j = i + 1; j < count; j++) + if (arr[j]->u.p1.die_hash != arr[i]->u.p1.die_hash) + break; + } + } + } + if (checksum_cycle_opt && minidx != -1U) + { + idx = 0; + checksum_ref_die (die_cu (arr[minidx]), arr[minidx], + arr[minidx], &idx, &ref_hash); + assert (arr == (dw_die_ref *) obstack_base (&ob) + first); + for (i = 0; i < count; i++) + { + arr[i]->u.p1.die_ref_hash + = iterative_hash_object (arr[i]->u.p1.die_ref_hash, + ref_hash); + arr[i]->die_ref_hash_computed = 1; + arr[i]->die_ref_seen = 0; + } + } + else + { + /* If we get here, all u.p1.die_hash values in the arr array + are used by more than one DIE. Do the more expensive + computation as fallback. */ + for (i = 0; i < count; i++) + { + unsigned int j; + arr[i]->u.p1.die_ref_hash = arr[i]->u.p1.die_hash; + checksum_ref_die (die_cu (arr[i]), arr[i], arr[i], NULL, + &arr[i]->u.p1.die_ref_hash); + assert (arr == (dw_die_ref *) obstack_base (&ob) + first); + for (j = 0; j < count; j++) + arr[j]->die_ref_seen = 0; + } + for (i = 0; i < count; i++) + arr[i]->die_ref_hash_computed = 1; + } + obstack_blank_fast (&ob, -(int) (count * sizeof (void *))); + return 0; + } + } + return ret; +} + +/* Hash function for dup_htab. u.p1.die_ref_hash should have u.p1.die_hash + iteratively hashed into it already. */ +static hashval_t +die_hash (const void *p) +{ + dw_die_ref die = (dw_die_ref) p; + + return die->u.p1.die_ref_hash; +} + +/* Freelist of !die->die_toplevel DIEs, chained through die_sib fields. */ +static dw_die_ref die_nontoplevel_freelist; +/* Freelist of die->die_collapsed_child DIEs, chained through die_parent + fields. */ +static dw_die_ref die_collapsed_child_freelist; + +/* Return pointer after the attributes of a DIE from a cu with CU_VERSION + which uses abbrevs T and starts at PTR. */ +static unsigned char * +skip_attrs_1 (unsigned int cu_version, struct abbrev_tag *t, unsigned char *ptr) +{ + unsigned int i; + for (i = 0; i < t->nattr; ++i) + ptr = skip_attr (cu_version, &t->attr[i], ptr); + + return ptr; +} + +/* Return pointer after the attributes of a DIE from CU which uses abbrevs + T and starts at PTR. */ +static unsigned char * +skip_attrs (dw_cu_ref cu, struct abbrev_tag *t, unsigned char *ptr) +{ + return skip_attrs_1 (cu->cu_version, t, ptr); +} + +/* Expand children of TOP_DIE that have been collapsed by + collapse_child. CHECKSUM is true if checksum should be + computed - expansion is performed during read_debug_info + when duplicates are looked for - or false, if the expansion + is performed late (e.g. during compute_abbrevs or write_{info,types}. */ +static void +expand_child (dw_die_ref top_die, bool checksum) +{ + dw_cu_ref cu = die_cu (top_die); + dw_die_ref *diep = &top_die->die_child; + dw_die_ref parent = top_die, child; + unsigned char *ptr, *base; + struct abbrev_tag tag, *t; + dw_die_ref die; + unsigned int tick = checksum ? top_die->u.p1.die_enter + 1 : 0; + + if (unlikely (cu->cu_kind == CU_TYPES)) + base = debug_sections[DEBUG_TYPES].data; + else + base = debug_sections[DEBUG_INFO].data; + ptr = base + top_die->die_offset; + if (likely (checksum)) + ptr += top_die->die_size; + else + { + t = top_die->die_abbrev; + skip_leb128 (ptr); + ptr = skip_attrs (cu, t, ptr); + } + + while (1) + { + unsigned int die_offset = ptr - base; + void **slot; + struct dw_die diebuf; + dw_die_ref collapsed; + + tag.entry = read_uleb128 (ptr); + if (tag.entry == 0) + { + if (parent == top_die) + break; + diep = &parent->die_sib; + if (checksum) + parent->u.p1.die_exit = tick++; + parent = parent->die_parent; + continue; + } + + diebuf.die_offset = die_offset; + slot = htab_find_slot_with_hash (cu->cu_kind == CU_TYPES + ? types_off_htab : off_htab, + &diebuf, off_hash (&diebuf), NO_INSERT); + if (slot == NULL) + die = NULL; + else + die = (dw_die_ref) *slot; + if (die != NULL && !die->die_collapsed_child) + { + *diep = die; + die->die_parent = parent; + die->die_ck_state = CK_UNKNOWN; + die->die_ref_seen = 0; + assert (!checksum || die->u.p1.die_enter == tick); + if (die->die_abbrev->children) + { + diep = &die->die_child; + parent = die; + } + else + { + diep = &die->die_sib; + assert (!checksum || die->u.p1.die_exit == tick); + } + tick++; + if (checksum) + ptr = base + die_offset + die->die_size; + else + ptr = skip_attrs (cu, die->die_abbrev, ptr); + continue; + } + + collapsed = die; + t = htab_find_with_hash (cu->cu_abbrev, &tag, tag.entry); + if (die_nontoplevel_freelist) + { + die = die_nontoplevel_freelist; + die_nontoplevel_freelist = die->die_sib; + } + else + die = pool_alloc (dw_die, offsetof (struct dw_die, die_dup)); + memset (die, '\0', offsetof (struct dw_die, die_dup)); + *diep = die; + die->die_tag = t->tag; + die->die_abbrev = t; + die->die_offset = die_offset; + die->die_parent = parent; + if (checksum) + { + die->u.p1.die_enter = tick; + die->u.p1.die_exit = tick++; + } + if (t->children) + { + diep = &die->die_child; + parent = die; + } + else + diep = &die->die_sib; + + ptr = skip_attrs (cu, t, ptr); + die->die_size = (ptr - base) - die_offset; + if (collapsed != NULL) + { + die->die_referenced = collapsed->die_referenced; + *slot = (void *) die; + memset (collapsed, '\0', offsetof (struct dw_die, die_child)); + collapsed->die_parent = die_collapsed_child_freelist; + die_collapsed_child_freelist = collapsed; + } + } + assert (!checksum || top_die->u.p1.die_exit == tick); + top_die->die_collapsed_children = 0; + if (checksum && likely (cu->cu_kind != CU_TYPES)) + for (child = top_die->die_child; child; child = child->die_sib) + checksum_die (NULL, cu, top_die, child); +} + +/* Call expand_child on all collapsed toplevel children DIEs. */ +static bool +expand_children (dw_die_ref die) +{ + dw_die_ref child; + bool ret = false; + for (child = die->die_child; child; child = child->die_sib) + if (child->die_named_namespace) + ret |= expand_children (child); + else if (child->die_collapsed_children) + { + expand_child (child, false); + ret = true; + } + return ret; +} + +static unsigned odr_phase; + +/* Return 1 if DIE1 and DIE2 match. TOP_DIE1 and TOP_DIE2 + is the corresponding ultimate parent with die_toplevel + set. u.p1.die_hash and u.p1.die_ref_hash hashes should + hopefully ensure that in most cases this function actually + just verifies matching. */ +static int +die_eq_1 (dw_cu_ref cu1, dw_cu_ref cu2, + dw_die_ref top_die1, dw_die_ref top_die2, + dw_die_ref die1, dw_die_ref die2) +{ + struct abbrev_tag *t1, *t2; + unsigned int i, j; + unsigned char *ptr1, *ptr2; + dw_die_ref ref1, ref2; + dw_die_ref child1, child2; + bool only_compare_name_p; + +#define FAIL goto fail + if (die1 == die2 || die_safe_dup (die2) == die1) + return 1; + if (die1->u.p1.die_hash != die2->u.p1.die_hash + || die1->u.p1.die_ref_hash != die2->u.p1.die_ref_hash + || die1->die_tag != die2->die_tag + || (!odr && (die1->u.p1.die_exit - die1->u.p1.die_enter + != die2->u.p1.die_exit - die2->u.p1.die_enter)) + || die_safe_dup (die2) != NULL + || die1->die_ck_state != CK_KNOWN + || die2->die_ck_state != CK_KNOWN + || die1->die_toplevel != die2->die_toplevel) + return 0; + assert (!die1->die_root && !die2->die_root); + + if (uni_lang_p && die1 == top_die1 && die2 == top_die2 + && cu1->lang != cu2->lang) + return 0; + + only_compare_name_p + = odr && die1->die_odr_state != ODR_NONE && die2->die_odr_state != ODR_NONE; + + if (only_compare_name_p && odr_phase == 1) + { + const char *name1 = get_AT_string (die1, DW_AT_name); + const char *name2 = get_AT_string (die2, DW_AT_name); + // TODO: Handle DW_AT_linkage_name? + if (name1 == NULL || name2 == NULL) + return 0; + if (strcmp (name1, name2) != 0) + return 0; + } + else if (die1->u.p1.die_exit - die1->u.p1.die_enter + != die2->u.p1.die_exit - die2->u.p1.die_enter) + return 0; + + if (only_compare_name_p && odr_phase == 2 + && die1->die_odr_state == ODR_DEF && die2->die_odr_state == ODR_DEF) + { + if (die1->u.p1.die_hash2 != die2->u.p1.die_hash2) + return 0; + } + + t1 = die1->die_abbrev; + t2 = die2->die_abbrev; + if (likely (!fi_multifile)) + { + ptr1 = debug_sections[DEBUG_INFO].data + die1->die_offset; + ptr2 = debug_sections[DEBUG_INFO].data + die2->die_offset; + } + else + { + if (cu1->cu_kind == CU_ALT) + ptr1 = alt_data[DEBUG_INFO]; + else + ptr1 = debug_sections[DEBUG_INFO].data; + ptr1 += die1->die_offset; + if (cu2->cu_kind == CU_ALT) + ptr2 = alt_data[DEBUG_INFO]; + else + ptr2 = debug_sections[DEBUG_INFO].data; + ptr2 += die2->die_offset; + } + skip_leb128 (ptr1); + skip_leb128 (ptr2); + i = 0; + j = 0; + if (die1->die_toplevel) + { + for (ref1 = die1->die_parent, ref2 = die2->die_parent; ref1 && ref2; ) + { + const char *name1, *name2; + if ((ref1->die_tag == DW_TAG_compile_unit + || ref1->die_tag == DW_TAG_partial_unit) + && (ref2->die_tag == DW_TAG_compile_unit + || ref2->die_tag == DW_TAG_partial_unit)) + break; + if (ref1->die_tag != ref2->die_tag) + return 0; + if (!ref1->die_named_namespace || !ref2->die_named_namespace) + return 0; + name1 = get_AT_string (ref1, DW_AT_name); + name2 = get_AT_string (ref2, DW_AT_name); + if (strcmp (name1, name2)) + return 0; + ref1 = ref1->die_root ? NULL : ref1->die_parent; + ref2 = ref2->die_root ? NULL : ref2->die_parent; + } + if (ref1 == NULL || ref2 == NULL) + return 0; + /* For each toplevel die seen, record optimistically + that we expect them to match, to avoid recursing + on it again. If non-match is determined later, + die_eq wrapper undoes this (which is why the DIE + pointer is added to the vector). */ + if (!die2->die_op_type_referenced) + die2->die_remove = 1; + obstack_ptr_grow (&ob, die2); + if (likely (die2->die_nextdup == NULL)) + { + die2->die_dup = die1; + die2->die_nextdup = die1->die_nextdup; + obstack_ptr_grow (&ob, NULL); + } + else + { + dw_die_ref next; + for (next = die2; next->die_nextdup; next = next->die_nextdup) + next->die_dup = die1; + next->die_dup = die1; + next->die_nextdup = die1->die_nextdup; + obstack_ptr_grow (&ob, next); + } + die1->die_nextdup = die2; + } + + if (only_compare_name_p && odr_phase == 1) + return 1; + + while (1) + { + uint32_t form1, form2; + size_t len = 0; + unsigned char *old_ptr1; + unsigned char *old_ptr2; + uint64_t value1, value2; + + while (i < t1->nattr && t1->attr[i].attr == DW_AT_sibling) + { + form1 = t1->attr[i].form; + while (form1 == DW_FORM_indirect) + form1 = read_uleb128 (ptr1); + switch (form1) + { + case DW_FORM_ref_udata: skip_leb128 (ptr1); break; + case DW_FORM_ref1: ptr1++; break; + case DW_FORM_ref2: read_16 (ptr1); break; + case DW_FORM_ref4: read_32 (ptr1); break; + case DW_FORM_ref8: read_64 (ptr1); break; + default: FAIL; + } + i++; + } + while (j < t2->nattr && t2->attr[j].attr == DW_AT_sibling) + { + form2 = t2->attr[j].form; + while (form2 == DW_FORM_indirect) + form2 = read_uleb128 (ptr2); + switch (form2) + { + case DW_FORM_ref_udata: skip_leb128 (ptr2); break; + case DW_FORM_ref1: ptr2++; break; + case DW_FORM_ref2: read_16 (ptr2); break; + case DW_FORM_ref4: read_32 (ptr2); break; + case DW_FORM_ref8: read_64 (ptr2); break; + default: FAIL; + } + j++; + } + if (i == t1->nattr) + { + if (j != t2->nattr) + FAIL; + break; + } + if (j == t2->nattr) + FAIL; + + if (t1->attr[i].attr != t2->attr[j].attr) + FAIL; + + form1 = t1->attr[i].form; + while (form1 == DW_FORM_indirect) + form1 = read_uleb128 (ptr1); + form2 = t2->attr[j].form; + while (form2 == DW_FORM_indirect) + form2 = read_uleb128 (ptr2); + old_ptr1 = ptr1; + old_ptr2 = ptr2; + + switch (t1->attr[i].attr) + { + case DW_AT_sibling: + case DW_AT_low_pc: + case DW_AT_high_pc: + case DW_AT_entry_pc: + case DW_AT_ranges: + case DW_AT_call_return_pc: + case DW_AT_call_pc: + /* We shouldn't be hitting DIEs with attributes referencing + addresses and we should have removed DW_AT_subling. */ + abort (); + case DW_AT_decl_file: + case DW_AT_call_file: + switch (form1) + { + case DW_FORM_data1: value1 = read_8 (ptr1); break; + case DW_FORM_data2: value1 = read_16 (ptr1); break; + case DW_FORM_data4: value1 = read_32 (ptr1); break; + case DW_FORM_data8: value1 = read_64 (ptr1); break; + case DW_FORM_udata: value1 = read_uleb128 (ptr1); break; + case DW_FORM_sdata: value1 = read_sleb128 (ptr1); break; + case DW_FORM_implicit_const: value1 = t1->values[i]; break; + default: abort (); + } + switch (form2) + { + case DW_FORM_data1: value2 = read_8 (ptr2); break; + case DW_FORM_data2: value2 = read_16 (ptr2); break; + case DW_FORM_data4: value2 = read_32 (ptr2); break; + case DW_FORM_data8: value2 = read_64 (ptr2); break; + case DW_FORM_udata: value2 = read_uleb128 (ptr2); break; + case DW_FORM_sdata: value2 = read_sleb128 (ptr2); break; + case DW_FORM_implicit_const: value2 = t2->values[j]; break; + default: abort (); + } + if (ignore_locus) + { + i++; + j++; + continue; + } + if ((value1 == 0) ^ (value2 == 0)) + FAIL; + if (value1 != 0) + { + struct dw_file *cu_file1 + = &cu1->cu_files[value1 - 1]; + struct dw_file *cu_file2 + = &cu2->cu_files[value2 - 1]; + + if (cu_file1->time != cu_file2->time + || cu_file1->size != cu_file2->size + || strcmp (cu_file1->file, cu_file2->file)) + FAIL; + + if (cu_file1->dir != NULL) + { + if (cu_file2->dir == NULL + || strcmp (cu_file1->dir, cu_file2->dir)) + FAIL; + } + else if (cu_file2->dir != NULL) + FAIL; + /* Ignore DW_AT_comp_dir for DW_AT_*_file <built-in> + etc. if immediately followed by DW_AT_*_line 0. */ + else if (cu_file1->file_angle_brackets_encapsulated_no_slash + && i + 1 < t1->nattr + && j + 1 < t2->nattr + && t1->attr[i + 1].attr + == (t1->attr[i].attr == DW_AT_decl_file + ? DW_AT_decl_line : DW_AT_call_line) + && t1->attr[i + 1].form == DW_FORM_data1 + && t1->attr[i + 1].attr == t2->attr[j + 1].attr + && t2->attr[j + 1].form == DW_FORM_data1 + && *ptr1 == 0 + && *ptr2 == 0) + { + i++; + j++; + continue; + } + + if ((cu_file1->dir ? cu_file1->dir[0] : cu_file1->file[0]) + != '/') + { + if (cu1->cu_comp_dir != NULL) + { + if (cu2->cu_comp_dir == NULL + || strcmp (cu1->cu_comp_dir, cu2->cu_comp_dir)) + FAIL; + } + else if (cu2->cu_comp_dir != NULL) + FAIL; + } + } + i++; + j++; + continue; + case DW_AT_decl_line: + case DW_AT_decl_column: + case DW_AT_call_line: + case DW_AT_call_column: + if (ignore_locus) + { + old_ptr1 = NULL; + break; + } + switch (form1) + { + case DW_FORM_data1: value1 = read_8 (ptr1); break; + case DW_FORM_data2: value1 = read_16 (ptr1); break; + case DW_FORM_data4: value1 = read_32 (ptr1); break; + case DW_FORM_data8: value1 = read_64 (ptr1); break; + case DW_FORM_udata: value1 = read_uleb128 (ptr1); break; + case DW_FORM_sdata: value1 = read_sleb128 (ptr1); break; + case DW_FORM_implicit_const: value1 = t1->values[i]; break; + default: abort (); + } + switch (form2) + { + case DW_FORM_data1: value2 = read_8 (ptr2); break; + case DW_FORM_data2: value2 = read_16 (ptr2); break; + case DW_FORM_data4: value2 = read_32 (ptr2); break; + case DW_FORM_data8: value2 = read_64 (ptr2); break; + case DW_FORM_udata: value2 = read_uleb128 (ptr2); break; + case DW_FORM_sdata: value2 = read_sleb128 (ptr2); break; + case DW_FORM_implicit_const: value2 = t2->values[j]; break; + default: abort (); + } + if (value1 != value2) + FAIL; + i++; + j++; + continue; + default: + break; + } + + switch (form1) + { + case DW_FORM_ref_addr: + if (likely (!op_multifile && !rd_multifile && !fi_multifile)) + { + if (form1 != form2) + FAIL; + break; + } + /* FALLTHRU */ + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + switch (form2) + { + case DW_FORM_ref_addr: + if (likely (!op_multifile && !rd_multifile && !fi_multifile)) + FAIL; + break; + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + break; + default: + FAIL; + } + break; + default: + if (form1 != form2) + FAIL; + break; + } + + switch (form1) + { + case DW_FORM_addr: + ptr1 += ptr_size; + ptr2 += ptr_size; + break; + case DW_FORM_flag_present: + break; + case DW_FORM_implicit_const: + if ((!ignore_locus || old_ptr1) && t1->values[i] != t2->values[j]) + FAIL; + break; + case DW_FORM_flag: + case DW_FORM_data1: + ++ptr1; + ++ptr2; + break; + case DW_FORM_data2: + ptr1 += 2; + ptr2 += 2; + break; + case DW_FORM_data4: + case DW_FORM_sec_offset: + ptr1 += 4; + ptr2 += 4; + break; + case DW_FORM_data8: + case DW_FORM_ref_sig8: + ptr1 += 8; + ptr2 += 8; + break; + case DW_FORM_data16: + ptr1 += 16; + ptr2 += 16; + break; + case DW_FORM_sdata: + case DW_FORM_udata: + skip_leb128 (ptr1); + skip_leb128 (ptr2); + break; + case DW_FORM_strp: + if (unlikely (op_multifile || rd_multifile || fi_multifile)) + { + value1 = read_32 (ptr1); + value2 = read_32 (ptr2); + if (fi_multifile) + { + if (strcmp ((char *) (cu1->cu_kind == CU_ALT + ? alt_data[DEBUG_STR] + : debug_sections[DEBUG_STR].data) + + value1, + (char *) (cu2->cu_kind == CU_ALT + ? alt_data[DEBUG_STR] + : debug_sections[DEBUG_STR].data) + + value2) != 0) + FAIL; + i++; + j++; + continue; + } + if (strcmp ((char *) debug_sections[DEBUG_STR].data + value1, + (char *) debug_sections[DEBUG_STR].data + value2) + != 0) + FAIL; + i++; + j++; + continue; + } + ptr1 += 4; + ptr2 += 4; + break; + case DW_FORM_line_strp: + ptr1 += 4; + ptr2 += 4; + break; + case DW_FORM_string: + ptr1 = (unsigned char *) strchr ((char *)ptr1, '\0') + 1; + ptr2 = (unsigned char *) strchr ((char *)ptr2, '\0') + 1; + break; + case DW_FORM_indirect: + abort (); + case DW_FORM_block1: + len = *ptr1++; + ptr1 += len; + len = *ptr2++; + ptr2 += len; + break; + case DW_FORM_block2: + len = read_16 (ptr1); + ptr1 += len; + len = read_16 (ptr2); + ptr2 += len; + break; + case DW_FORM_block4: + len = read_32 (ptr1); + ptr1 += len; + len = read_32 (ptr2); + ptr2 += len; + break; + case DW_FORM_block: + case DW_FORM_exprloc: + len = read_uleb128 (ptr1); + ptr1 += len; + len = read_uleb128 (ptr2); + ptr2 += len; + break; + case DW_FORM_ref_addr: + if (likely (!op_multifile && !rd_multifile && !fi_multifile)) + { + ptr1 += cu1->cu_version == 2 ? ptr_size : 4; + ptr2 += cu2->cu_version == 2 ? ptr_size : 4; + break; + } + /* FALLTHRU */ + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + switch (form1) + { + case DW_FORM_ref_addr: + value1 = read_size (ptr1, cu1->cu_version == 2 + ? ptr_size : 4) + - cu1->cu_offset; + ptr1 += cu1->cu_version == 2 ? ptr_size : 4; + break; + case DW_FORM_ref_udata: + value1 = read_uleb128 (ptr1); + break; + case DW_FORM_ref1: + value1 = read_8 (ptr1); + break; + case DW_FORM_ref2: + value1 = read_16 (ptr1); + break; + case DW_FORM_ref4: + value1 = read_32 (ptr1); + break; + case DW_FORM_ref8: + value1 = read_64 (ptr1); + break; + default: abort (); + } + ref1 = off_htab_lookup (cu1, cu1->cu_offset + value1); + switch (form2) + { + case DW_FORM_ref_addr: + value2 = read_size (ptr2, cu2->cu_version == 2 + ? ptr_size : 4) + - cu2->cu_offset; + ptr2 += cu2->cu_version == 2 ? ptr_size : 4; + break; + case DW_FORM_ref_udata: + value2 = read_uleb128 (ptr2); + break; + case DW_FORM_ref1: + value2 = read_8 (ptr2); + break; + case DW_FORM_ref2: + value2 = read_16 (ptr2); + break; + case DW_FORM_ref4: + value2 = read_32 (ptr2); + break; + case DW_FORM_ref8: + value2 = read_64 (ptr2); + break; + default: abort (); + } + ref2 = off_htab_lookup (cu2, cu2->cu_offset + value2); + assert (ref1 != NULL && ref2 != NULL); + if (unlikely (op_multifile || low_mem)) + { + if (die1->die_collapsed_children && ref1->die_collapsed_child) + { + expand_child (die1, true); + ref1 = off_htab_lookup (cu1, cu1->cu_offset + value1); + } + assert (ref2->die_collapsed_child == 0); + } + if (likely (!ref1->die_collapsed_child) + && die_cu (ref1) == cu1 + && ref1->u.p1.die_enter >= top_die1->u.p1.die_enter + && ref1->u.p1.die_exit <= top_die1->u.p1.die_exit) + { + /* A reference into a subdie of the DIE being compared. */ + if (die_cu (ref2) != cu2 + || ref1->u.p1.die_enter - top_die1->u.p1.die_enter + != ref2->u.p1.die_enter - top_die2->u.p1.die_enter + || top_die1->u.p1.die_exit - ref1->u.p1.die_exit + != top_die2->u.p1.die_exit - ref2->u.p1.die_exit) + FAIL; + } + else + { + dw_die_ref reft1 = ref1, reft2 = ref2; + dw_cu_ref refcu1, refcu2; + while (reft1->die_toplevel == 0) + reft1 = reft1->die_parent; + while (reft2->die_toplevel == 0) + reft2 = reft2->die_parent; + if (unlikely (ref1->die_collapsed_child)) + { + if (ref1->die_tag + != ref2->u.p1.die_enter - reft2->u.p1.die_enter) + FAIL; + } + else if (ref1->u.p1.die_enter - reft1->u.p1.die_enter + != ref2->u.p1.die_enter - reft2->u.p1.die_enter) + FAIL; + refcu1 = die_cu (reft1); + refcu2 = die_cu (reft2); + if (unlikely (refcu1->cu_chunk == refcu2->cu_chunk) + && likely (!fi_multifile)) + { + if (reft1->die_dup + && die_cu (reft1->die_dup)->cu_chunk + == refcu1->cu_chunk) + reft1 = reft1->die_dup; + if (reft2->die_dup + && die_cu (reft2->die_dup)->cu_chunk + == refcu2->cu_chunk) + reft2 = reft2->die_dup; + if (reft2->die_offset < reft1->die_offset) + { + dw_die_ref tem = reft1; + reft1 = reft2; + reft2 = tem; + } + if (reft1->die_dup == NULL && reft2->die_dup != NULL) + { + dw_die_ref tem = reft1; + reft1 = reft2; + reft2 = tem; + } + } + /* If reft1 (die1 or whatever refers to it is already + in the hash table) already has a dup, follow to that + dup. Don't do the same for reft2, {{top_,}die,reft,child}2 + should always be from the current CU. */ + if (reft1->die_dup) + reft1 = reft1->die_dup; + refcu1 = die_cu (reft1); + refcu2 = die_cu (reft2); + if (die_eq_1 (refcu1, refcu2, reft1, reft2, reft1, reft2) == 0) + FAIL; + } + i++; + j++; + continue; + default: + abort (); + } + + if ((!ignore_locus || old_ptr1) + && (ptr1 - old_ptr1 != ptr2 - old_ptr2 + || memcmp (old_ptr1, old_ptr2, ptr1 - old_ptr1))) + FAIL; + i++; + j++; + } + + if (unlikely (op_multifile || low_mem)) + { + if (die1->die_collapsed_children) + expand_child (die1, true); + assert (die2->die_collapsed_children == 0); + } + + for (child1 = die1->die_child, child2 = die2->die_child; + child1 && child2; + child1 = child1->die_sib, child2 = child2->die_sib) + if (die_eq_1 (cu1, cu2, top_die1, top_die2, child1, child2) == 0) + FAIL; + + if (child1 || child2) + { + fail: + return 0; + } + + if (unlikely (fi_multifile)) + assert (cu1->cu_kind == CU_ALT && cu2->cu_kind != CU_ALT); + return 1; +} + +/* Wrapper around die_eq_1, used as equality function in + dup_htab hash table. If zero (non-match) is returned and + any toplevel DIEs have been pushed to the vector in ob obstack, + undo the optimistic assignment of die_dup and die_nextdup. */ +static int +die_eq (const void *p, const void *q) +{ + dw_die_ref die1 = (dw_die_ref) p; + dw_die_ref die2 = (dw_die_ref) q; + dw_die_ref *arr; + unsigned int i, count; + int ret; + + if (die1->u.p1.die_hash != die2->u.p1.die_hash + || die1->u.p1.die_ref_hash != die2->u.p1.die_ref_hash) + return 0; + ret = die_eq_1 (die_cu (die1), die_cu (die2), die1, die2, die1, die2); + count = obstack_object_size (&ob) / sizeof (void *); + arr = (dw_die_ref *) obstack_finish (&ob); + if (!ret) + for (i = count; i;) + { + dw_die_ref die; + i -= 2; + die = arr[i]->die_dup; + if (likely (arr[i + 1] == NULL)) + { + die->die_nextdup = arr[i]->die_nextdup; + arr[i]->die_nextdup = NULL; + arr[i]->die_dup = NULL; + } + else + { + dw_die_ref next; + + assert (die->die_nextdup == arr[i]); + for (next = arr[i]->die_nextdup; + next != arr[i + 1]; + next = next->die_nextdup) + { + assert (next->die_dup == die); + next->die_dup = arr[i]; + } + assert (next->die_dup == die); + next->die_dup = arr[i]; + die->die_nextdup = next->die_nextdup; + next->die_nextdup = NULL; + arr[i]->die_dup = NULL; + } + arr[i]->die_remove = 0; + } + obstack_free (&ob, (void *) arr); + return ret; +} + +/* Hash table for finding of matching toplevel DIEs (and all + its children together with it). */ +static htab_t dup_htab; + +/* After read_multifile dup_htab is moved to this variable. */ +static htab_t alt_dup_htab; + +/* First CU, start of the linked list of CUs, and the tail + of that list. Initially this contains just the original + CUs, later on newly created partial units are added + to the beginning of the list and optionally .debug_types + CUs are added to its tail. */ +static dw_cu_ref first_cu, last_cu; + +/* After read_multifile first_cu is copied to this variable. */ +static dw_cu_ref alt_first_cu; + +/* Compute approximate size of DIE and all its children together. */ +static unsigned long +calc_sizes (dw_die_ref die) +{ + unsigned long ret = die->die_size; + dw_die_ref child; + if (wr_multifile ? die->die_no_multifile : die->die_remove) + return 0; + for (child = die->die_child; child; child = child->die_sib) + ret += calc_sizes (child); + return ret; +} + +/* Verify the duplicate chains starting at DIE. If ORDERED, also check that + the duplicate chain is in the correct order. */ +static void +verify_dups (dw_die_ref die, bool ordered) +{ + dw_die_ref d, prev; + + assert (die->die_dup == NULL); + assert (die->die_collapsed_children == 0); + assert (die->die_remove == 0); + + for (prev = die, d = prev->die_nextdup; + d; + prev = d, d = prev->die_nextdup) + { + if (ordered) + assert (die_cu (prev)->cu_chunk <= die_cu (d)->cu_chunk); + assert (d->die_offset != -1U); + assert (d->die_dup == die); + assert (d->die_remove != d->die_op_type_referenced); + assert (d->die_tag == die->die_tag); + } +} + +/* Walk toplevel DIEs in tree rooted by PARENT, and see if they + match previously processed DIEs. */ +static int +find_dups (dw_die_ref parent) +{ + void **slot; + dw_die_ref child; + + if (stats_p && parent->die_root) + stats->root_cnt++; + + for (child = parent->die_child; child; child = child->die_sib) + { + if (child->die_ck_state == CK_KNOWN) + { + if (stats_p) + stats->lower_toplevel_with_checksum++; + if (child->die_dup != NULL) + continue; + slot = htab_find_slot_with_hash (dup_htab, child, + child->u.p1.die_ref_hash, + INSERT); + if (slot == NULL) + dwz_oom (); + if (*slot == NULL) + *slot = child; + } + else if (child->die_named_namespace) + { + if (stats_p) + stats->namespace_cnt++; + if (find_dups (child)) + return 1; + } + else if (stats_p) + stats->lower_toplevel++; + } + return 0; +} + +/* Like find_dups, but for the last multifile optimization phase, + where it only looks at duplicates in the common .debug_info + section. */ +static int +find_dups_fi (dw_die_ref parent) +{ + dw_die_ref child; + + for (child = parent->die_child; child; child = child->die_sib) + { + if (child->die_ck_state == CK_KNOWN) + { + if (child->die_dup != NULL) + continue; + htab_find_with_hash (alt_dup_htab, child, child->u.p1.die_ref_hash); + } + else if (child->die_named_namespace) + if (find_dups_fi (child)) + return 1; + } + return 0; +} + +/* Return value of DW_AT_name for DIE, or for its specification or abstract + origin. */ +static const char * +get_name (dw_die_ref die) +{ + if (die->die_collapsed_child) + return NULL; + const char *name = get_AT_string (die, DW_AT_name); + if (name) + return name; + dw_cu_ref cu = die_cu (die); + bool present; + enum dwarf_form form; + unsigned int value = get_AT_int (die, DW_AT_specification, &present, &form); + if (present) + { + dw_die_ref ref; + if (form != DW_FORM_ref_addr) + value = cu->cu_offset + value; + ref = off_htab_lookup (cu, value); + if (ref) + return get_name (ref); + } + value = get_AT_int (die, DW_AT_abstract_origin, &present, &form); + if (present) + { + dw_die_ref ref; + if (form != DW_FORM_ref_addr) + value = cu->cu_offset + value; + ref = off_htab_lookup (die_cu (die), value); + if (ref) + return get_name (ref); + } + return NULL; +} + +/* Dump type of DIE to stderr. */ +static void +dump_type (dw_die_ref die) +{ + bool present; + enum dwarf_form form; + if (die->die_collapsed_child) + return; + unsigned int value = get_AT_int (die, DW_AT_type, &present, &form); + if (!present) + return; + + dw_cu_ref cu = die_cu (die); + if (cu == NULL) + return; + + dw_die_ref ref; + if (form != DW_FORM_ref_addr) + value = cu->cu_offset + value; + fprintf (stderr, " (type: %x", value); + ref = off_htab_lookup (cu, value); + if (ref != NULL && !ref->die_collapsed_child) + { + const char *type_name = get_name (ref); + if (type_name) + fprintf (stderr, " %s", type_name); + fprintf (stderr, " %s", get_DW_TAG_name (ref->die_tag) + 7); + dump_type (ref); + } + fprintf (stderr, ")"); +} + +/* Dump DIE to stderr with INDENT. */ +static void +dump_die_with_indent (int indent, dw_die_ref die) +{ + if (die == NULL) + fprintf (stderr, "%*s null", indent, ""); + else if (die->die_offset == -1U) + { + fprintf (stderr, "%*s -1 %s", indent, "", + get_DW_TAG_name (die->die_tag) + 7); + dw_die_ref d = die->die_nextdup; + while (d) + { + const char *name = get_name (d); + fprintf (stderr, " -> %x %s %s", d->die_offset, name ? name : "", + get_DW_TAG_name (d->die_tag) + 7); + d = d->die_nextdup; + } + } + else if (die->die_collapsed_child) + { + fprintf (stderr, "%*s %x %c", indent, "", die->die_offset, + die->die_ck_state == CK_KNOWN ? 'O' : 'X'); + } + else + { + const char *name = get_name (die); + fprintf (stderr, "%*s %x %c %x", indent, "", die->die_offset, + die->die_ck_state == CK_KNOWN ? 'O' : 'X', + (unsigned) die->u.p1.die_hash); + if (odr && die->die_odr_state != ODR_NONE + && die->die_odr_state != ODR_UNKNOWN) + fprintf (stderr, "(%x)", (unsigned) die->u.p1.die_hash2); + fprintf (stderr, " %x %s %s", (unsigned) die->u.p1.die_ref_hash, + name ? name : "", get_DW_TAG_name (die->die_tag) + 7); + dump_type (die); + } + fprintf (stderr, "\n"); +} + +/* Dump DIE to stderr. */ +static void +dump_die (dw_die_ref die) +{ + dump_die_with_indent (0, die); +} + +static void +dump_dups (dw_die_ref die) +{ + dw_die_ref d; + for (d = die; d; d = d->die_nextdup) + dump_die (d); +} + +/* Dump DIE tree at tree depth DEPTH. */ +static void +dump_dies (int depth, dw_die_ref die) +{ + dw_die_ref child; + dump_die_with_indent (depth, die); + for (child = die->die_child; child; child = child->die_sib) + dump_dies (depth + 1, child); +} + +/* Hash table for .debug_str. Depending on multifile optimization + phase this hash table has 3 different hash/equality functions. + The first set is used to record tail optimized strings, during + write_multifile the whole .debug_str section is written as is, + plus then all the strings which are just suffixes of other + strings. E.g. if .debug_str section contains "foobar" string + and .debug_info section refers to the whole "foobar" string + as well as "bar" by referring to "foobar" + 3. + The second set is used during op_multifile and fi_multifile, + noting each string and in addition to that how many times it + has been seen (0, 1 or more than 1). If 0 then it isn't present + in the hash table, 1 has lowest bit of new_off clear, more than 1 + the LSB of new_off is set. + The final set is used during finalize_strp and afterwards, it is + then used to map strings to their location in the new .debug_str + section. */ +static htab_t strp_htab; +/* Current offset in .debug_str when adding the tail optimized strings. + This is initially the size of .debug_str section in the object, + and as unique tail optimized strings are found, this is increased + each time. */ +static unsigned int max_strp_off; + +/* At the end of read_multifile strp_htab is moved to this variable, + which is used to find strings in the shared .debug_str section. */ +static htab_t alt_strp_htab; + +/* Structure describing strings in strp_htab. */ +struct strp_entry +{ + /* Original .debug_str offset. */ + unsigned int off; + /* New .debug_str offset, or when using strp_{hash,eq}2 + this is initially iterative hash of the string with the + LSB bit used for whether the string has been seen just once + or more than once. */ + unsigned int new_off; +}; +ALIGN_STRUCT (strp_entry) + +/* Hash function in strp_htab used for discovery of tail optimized + strings. */ +static hashval_t +strp_hash (const void *p) +{ + struct strp_entry *s = (struct strp_entry *)p; + + return s->off; +} + +/* Corresponding equality function in strp_htab. */ +static int +strp_eq (const void *p, const void *q) +{ + struct strp_entry *s1 = (struct strp_entry *)p; + struct strp_entry *s2 = (struct strp_entry *)q; + + return s1->off == s2->off; +} + +/* Hash function in strp_htab used to find what strings are + used by more than one object. */ +static hashval_t +strp_hash2 (const void *p) +{ + struct strp_entry *s = (struct strp_entry *)p; + + return s->new_off & ~1U; +} + +/* Corresponding equality function in strp_htab. */ +static int +strp_eq2 (const void *p, const void *q) +{ + struct strp_entry *s1 = (struct strp_entry *)p; + struct strp_entry *s2 = (struct strp_entry *)q; + + return strcmp ((char *) debug_sections[DEBUG_STR].data + s1->off, + (char *) debug_sections[DEBUG_STR].data + s2->off) == 0; +} + +/* Hash function in strp_htab used from finalize_strp onwards, + mapping strings into strings in the new .debug_str section. */ +static hashval_t +strp_hash3 (const void *p) +{ + return hash (p, strlen (p)); +} + +/* Corresponding equality function in strp_htab. */ +static int +strp_eq3 (const void *p, const void *q) +{ + return strcmp (p, q) == 0; +} + +/* Called for each DW_FORM_strp offset seen during initial + .debug_{info,types,macro} parsing. Before fi_multifile phase + this records just tail optimized strings, during fi_multifile + it checks whether the string is already in the shared .debug_str + section and if not, notes that it will need to be added to the + new local .debug_str section. */ +static void +note_strp_offset (unsigned int off) +{ + void **slot; + struct strp_entry se; + + if (unlikely (fi_multifile)) + { + unsigned char *p; + unsigned int len; + hashval_t hash; + + p = debug_sections[DEBUG_STR].data + off; + len = strlen ((char *) p); + hash = hash (p, len); + if (alt_strp_htab) + { + if (htab_find_with_hash (alt_strp_htab, p, hash)) + return; + } + if (strp_htab == NULL) + { + unsigned int strp_count = debug_sections[DEBUG_STR].size / 64; + + if (strp_count < 100) + strp_count = 100; + strp_htab = htab_try_create (strp_count, strp_hash2, strp_eq2, NULL); + if (strp_htab == NULL) + dwz_oom (); + } + + se.off = off; + se.new_off = hash | 1; + slot = htab_find_slot_with_hash (strp_htab, &se, se.new_off & ~1U, INSERT); + if (slot == NULL) + dwz_oom (); + if (*slot == NULL) + { + struct strp_entry *s = pool_alloc (strp_entry, sizeof (*s)); + *s = se; + *slot = (void *) s; + } + return; + } + if (off >= debug_sections[DEBUG_STR].size || off == 0) + return; + if (debug_sections[DEBUG_STR].data[off - 1] == '\0') + return; + if (strp_htab == NULL) + { + if (multifile == NULL) + return; + strp_htab = htab_try_create (50, strp_hash, strp_eq, NULL); + if (strp_htab == NULL) + dwz_oom (); + max_strp_off = debug_sections[DEBUG_STR].size; + } + se.off = off; + slot = htab_find_slot_with_hash (strp_htab, &se, off, INSERT); + if (slot == NULL) + dwz_oom (); + if (*slot == NULL) + { + struct strp_entry *s = pool_alloc (strp_entry, sizeof (*s)); + s->off = off; + s->new_off = max_strp_off; + max_strp_off += strlen ((char *) debug_sections[DEBUG_STR].data + + off) + 1; + if (max_strp_off < s->new_off) + { + htab_delete (strp_htab); + strp_htab = NULL; + max_strp_off = 0; + multifile = NULL; + error (0, 0, ".debug_str too large for multi-file optimization"); + } + *slot = (void *) s; + } +} + +/* Map offset in original .debug_str section into + offset in new .debug_str, either the shared .debug_str + or new local .debug_str. */ +static unsigned +lookup_strp_offset (unsigned int off) +{ + struct strp_entry *s, se; + + if (unlikely (op_multifile || fi_multifile)) + { + unsigned char *p; + unsigned int len; + hashval_t hash; + + p = debug_sections[DEBUG_STR].data + off; + len = strlen ((char *) p); + hash = hash (p, len); + if (alt_strp_htab) + { + unsigned char *q = (unsigned char *) + htab_find_with_hash (alt_strp_htab, p, hash); + if (q != NULL) + return q - alt_data[DEBUG_STR]; + } + assert (strp_htab); + p = (unsigned char *) htab_find_with_hash (strp_htab, p, hash); + assert (p != NULL); + return p - debug_sections[DEBUG_STR].new_data; + } + if (off >= debug_sections[DEBUG_STR].size || off == 0) + return off + multi_str_off; + if (debug_sections[DEBUG_STR].data[off - 1] == '\0') + return off + multi_str_off; + se.off = off; + s = (struct strp_entry *) htab_find_with_hash (strp_htab, &se, off); + return s->new_off + multi_str_off; +} + +/* Note .debug_str offset during write_macro or compute_abbrevs, + return either DW_FORM_strp if the string will be in the local + .debug_str section, or DW_FORM_strp_sup / DW_FORM_GNU_strp_alt if it + will be in the shared .debug_str section. */ +static enum dwarf_form +note_strp_offset2 (unsigned int off) +{ + hashval_t hash; + struct strp_entry se; + unsigned char *p, *q; + + if (likely (fi_multifile)) + { + unsigned int len; + + if (alt_strp_htab) + { + p = debug_sections[DEBUG_STR].data + off; + len = strlen ((char *) p); + hash = hash (p, len); + if (htab_find_with_hash (alt_strp_htab, p, hash)) + return dwarf_5 ? DW_FORM_strp_sup : DW_FORM_GNU_strp_alt; + } + return DW_FORM_strp; + } + if (off >= debug_sections[DEBUG_STR].size) + return DW_FORM_strp; + p = debug_sections[DEBUG_STR].data + off; + q = (unsigned char *) strchr ((char *) p, '\0'); + hash = hash (p, q - p); + se.off = off; + se.new_off = hash & ~1U; + struct strp_entry *s = (struct strp_entry *) + htab_find_with_hash (strp_htab, &se, se.new_off); + assert (s != NULL); + s->new_off |= 1; + return DW_FORM_strp; +} + +/* Helper to record all strp_entry entries from strp_htab. + Called through htab_traverse. */ +static int +list_strp_entries (void **slot, void *data) +{ + struct strp_entry ***end = (struct strp_entry ***) data; + **end = (struct strp_entry *) *slot; + (*end)++; + return 1; +} + +/* Adapted from bfd/merge.c strrevcmp. */ +static int +strrevcmp (const void *p, const void *q) +{ + struct strp_entry *s1 = *(struct strp_entry **)p; + struct strp_entry *s2 = *(struct strp_entry **)q; + unsigned int len1 = s1->new_off & ~1U; + unsigned int len2 = s2->new_off & ~1U; + unsigned int len; + unsigned char *p1 = debug_sections[DEBUG_STR].data + s1->off; + unsigned char *p2 = debug_sections[DEBUG_STR].data + s2->off; + + if (p1[len1]) + len1++; + if (p2[len2]) + len2++; + p1 += len1; + p2 += len2; + len = len1; + if (len2 < len) + len = len2; + while (len) + { + p1--; + p2--; + if (*p1 != *p2) + { + if (*p1 < *p2) + return -1; + return 1; + } + len--; + } + if (len1 < len2) + return 1; + if (len1 > len2) + return -1; + assert (s1->off == s2->off); + return 0; +} + +/* Compute new .debug_str section, from strp_htab content, + replace strp_htab hash table with a new one, which maps strings + to new .debug_str locations. */ +static unsigned int * +finalize_strp (bool build_tail_offset_list) +{ + unsigned int count, new_count, i, *tail_offset_list = NULL; + unsigned int strp_index = 0, tail_offset_list_count = 0, k; + struct strp_entry **arr, **end; + unsigned char *p; + + if (strp_htab == NULL) + { + debug_sections[DEBUG_STR].new_data = NULL; + debug_sections[DEBUG_STR].new_size = 0; + return NULL; + } + count = htab_elements (strp_htab); + arr = (struct strp_entry **) + obstack_alloc (&ob, count * sizeof (struct strp_entry *)); + end = arr; + htab_traverse (strp_htab, list_strp_entries, (void *) &end); + for (i = 0; i < count; i++) + { + unsigned int len = strlen ((char *) debug_sections[DEBUG_STR].data + + arr[i]->off); + arr[i]->new_off = (len & ~1U) | (arr[i]->new_off & 1); + } + qsort (arr, count, sizeof (struct strp_entry *), strrevcmp); + htab_delete (strp_htab); + strp_htab = NULL; + new_count = count; + for (i = 0; i < count; i++) + if ((arr[i]->new_off & 1) == 0) + { + arr[i]->off = -1U; + arr[i]->new_off = -1U; + new_count--; + } + else + { + unsigned int len1, len2, lastlen, j; + unsigned char *p1, *p2; + len1 = arr[i]->new_off & ~1U; + p1 = debug_sections[DEBUG_STR].data + arr[i]->off; + if (p1[len1]) + len1++; + lastlen = len1; + arr[i]->new_off = strp_index; + strp_index += len1 + 1; + for (j = i + 1; j < count; j++) + { + len2 = arr[j]->new_off & ~1U; + p2 = debug_sections[DEBUG_STR].data + arr[j]->off; + if (p2[len2]) + len2++; + if (len2 >= lastlen) + break; + if (memcmp (p1 + len1 - len2, p2, len2 + 1) != 0) + break; + arr[j]->new_off = arr[i]->new_off + len1 - len2; + lastlen = len2; + tail_offset_list_count++; + } + i = j - 1; + } + debug_sections[DEBUG_STR].new_data = malloc (strp_index); + if (debug_sections[DEBUG_STR].new_data == NULL) + dwz_oom (); + debug_sections[DEBUG_STR].new_size = strp_index; + strp_htab = htab_try_create (new_count < 32 ? 32 : new_count, + strp_hash3, strp_eq3, NULL); + if (strp_htab == NULL) + dwz_oom (); + if (build_tail_offset_list && tail_offset_list_count++ != 0) + { + tail_offset_list + = mmap (NULL, tail_offset_list_count * sizeof (int), + PROT_READ | PROT_WRITE, MAP_ANONYMOUS | MAP_PRIVATE, -1, 0); + if (tail_offset_list == MAP_FAILED) + dwz_oom (); + } + for (i = 0, k = 0, p = debug_sections[DEBUG_STR].new_data; i < count; i++) + if (arr[i]->off == -1U && arr[i]->new_off == -1U) + continue; + else + { + unsigned int len = strlen ((char *) debug_sections[DEBUG_STR].data + + arr[i]->off) + 1; + unsigned int j; + void **slot; + + memcpy (p, debug_sections[DEBUG_STR].data + arr[i]->off, len); + slot = htab_find_slot_with_hash (strp_htab, p, + hash (p, len - 1), + INSERT); + if (slot == NULL) + dwz_oom (); + assert (*slot == NULL); + *slot = (void *) p; + for (j = i + 1; j < count; j++) + if (arr[j]->new_off >= arr[i]->new_off + len) + break; + else + { + unsigned char *q = p + arr[j]->new_off - arr[i]->new_off; + unsigned int l = len + arr[i]->new_off - arr[j]->new_off; + if (tail_offset_list != NULL) + tail_offset_list[k++] = arr[j]->new_off; + slot = htab_find_slot_with_hash (strp_htab, q, + hash (q, l - 1), + INSERT); + if (slot == NULL) + dwz_oom (); + assert (*slot == NULL); + *slot = (void *) q; + } + p += len; + i = j - 1; + } + assert (p == debug_sections[DEBUG_STR].new_data + strp_index); + if (tail_offset_list != NULL) + { + tail_offset_list[k++] = 0; + assert (k == tail_offset_list_count); + } + obstack_free (&ob, (void *) arr); + return tail_offset_list; +} + +enum mark_refs_mode +{ + MARK_REFS_FOLLOW_DUPS = 1, + MARK_REFS_RETURN_VAL = 2, + MARK_REFS_REFERENCED = 4 +}; + +/* Mark all DIEs referenced from DIE by setting die_ref_seen to 1, + unless already marked. */ +static bool +mark_refs (dw_cu_ref cu, dw_die_ref top_die, dw_die_ref die, int mode) +{ + struct abbrev_tag *t; + unsigned int i; + unsigned char *ptr; + dw_die_ref child; + + t = die->die_abbrev; + for (i = 0; i < t->nattr; ++i) + if (t->attr[i].attr != DW_AT_sibling) + switch (t->attr[i].form) + { + case DW_FORM_ref_addr: + if (unlikely (op_multifile)) + i = -2U; + break; + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + case DW_FORM_indirect: + i = -2U; + break; + } + if (i == -1U) + { + if (unlikely (cu->cu_kind == CU_TYPES)) + ptr = debug_sections[DEBUG_TYPES].data; + else + ptr = debug_sections[DEBUG_INFO].data; + ptr += die->die_offset; + skip_leb128 (ptr); + for (i = 0; i < t->nattr; ++i) + { + uint32_t form = t->attr[i].form; + size_t len = 0; + uint64_t value; + dw_die_ref ref, reft; + + while (form == DW_FORM_indirect) + form = read_uleb128 (ptr); + + switch (form) + { + case DW_FORM_ref_addr: + if (unlikely (op_multifile)) + { + value = read_size (ptr, cu->cu_version == 2 + ? ptr_size : 4); + ptr += cu->cu_version == 2 ? ptr_size : 4; + assert (t->attr[i].attr != DW_AT_sibling); + ref = off_htab_lookup (cu, value); + if ((mode & MARK_REFS_REFERENCED) != 0) + ref->die_referenced = 1; + goto finish_ref; + } + ptr += cu->cu_version == 2 ? ptr_size : 4; + break; + case DW_FORM_addr: + ptr += ptr_size; + break; + case DW_FORM_flag_present: + case DW_FORM_implicit_const: + break; + case DW_FORM_flag: + case DW_FORM_data1: + ++ptr; + break; + case DW_FORM_data2: + ptr += 2; + break; + case DW_FORM_data4: + case DW_FORM_sec_offset: + case DW_FORM_strp: + case DW_FORM_line_strp: + ptr += 4; + break; + case DW_FORM_data8: + case DW_FORM_ref_sig8: + ptr += 8; + break; + case DW_FORM_data16: + ptr += 16; + break; + case DW_FORM_sdata: + case DW_FORM_udata: + skip_leb128 (ptr); + break; + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + switch (form) + { + case DW_FORM_ref_udata: value = read_uleb128 (ptr); break; + case DW_FORM_ref1: value = read_8 (ptr); break; + case DW_FORM_ref2: value = read_16 (ptr); break; + case DW_FORM_ref4: value = read_32 (ptr); break; + case DW_FORM_ref8: value = read_64 (ptr); break; + default: abort (); + } + if (t->attr[i].attr == DW_AT_sibling) + break; + ref = off_htab_lookup (cu, cu->cu_offset + value); + if ((mode & MARK_REFS_REFERENCED) != 0) + ref->die_referenced = 1; + if (!ref->die_collapsed_child + && ref->u.p1.die_enter >= top_die->u.p1.die_enter + && ref->u.p1.die_exit <= top_die->u.p1.die_exit) + break; + finish_ref: + reft = ref; + while (!reft->die_root + && reft->die_parent->die_tag != DW_TAG_compile_unit + && reft->die_parent->die_tag != DW_TAG_partial_unit + && !reft->die_parent->die_named_namespace) + reft = reft->die_parent; + if ((mode & MARK_REFS_FOLLOW_DUPS) && reft->die_dup != NULL) + { + reft = reft->die_dup; + if (die_cu (reft)->cu_kind == CU_PU) + break; + } + if (reft->die_ref_seen == 0) + { + if ((mode & MARK_REFS_RETURN_VAL)) + return false; + reft->die_ref_seen = 1; + mark_refs (die_cu (reft), reft, reft, mode); + } + break; + case DW_FORM_string: + ptr = (unsigned char *) strchr ((char *)ptr, '\0') + 1; + break; + case DW_FORM_indirect: + abort (); + case DW_FORM_block1: + len = *ptr++; + break; + case DW_FORM_block2: + len = read_16 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block4: + len = read_32 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block: + case DW_FORM_exprloc: + len = read_uleb128 (ptr); + form = DW_FORM_block1; + break; + default: + abort (); + } + + if (form == DW_FORM_block1) + ptr += len; + } + } + + for (child = die->die_child; child; child = child->die_sib) + if (!mark_refs (cu, top_die, child, mode)) + return false; + return true; +} + +/* Remove completely unneeded children of DIE and remove unreferenced DIEs + from offset hash tables. */ +static void +remove_dies (dw_cu_ref cu, dw_die_ref die, bool remove) +{ + dw_die_ref child, next; + if (die->die_toplevel && die->die_ref_seen == 0 && !low_mem) + remove = true; + for (child = die->die_child; child; child = next) + { + next = child->die_sib; + remove_dies (cu, child, remove); + } + if (die->die_referenced == 0) + { + htab_t h = cu->cu_kind == CU_TYPES ? types_off_htab : off_htab; + void **slot = htab_find_slot_with_hash (h, die, off_hash (die), + NO_INSERT); + if (slot != NULL) + htab_clear_slot (h, slot); + } + if (!remove) + return; + if (die->die_toplevel == 0) + { + memset (die, '\0', offsetof (struct dw_die, die_dup)); + die->die_sib = die_nontoplevel_freelist; + die_nontoplevel_freelist = die; + } + else + die->die_child = NULL; +} + +/* Remove unneeded children DIEs. During phase 0 die_ref_seen + of toplevel DIEs is computed, during phase 1 mark_refs is called + to find referenced DIEs, during phase 2 unneeded children DIEs + are removed. */ +static void +remove_unneeded (dw_cu_ref cu, dw_die_ref die, unsigned int phase) +{ + dw_die_ref child; + for (child = die->die_child; child; child = child->die_sib) + { + if (child->die_named_namespace) + { + remove_unneeded (cu, child, phase); + if (phase == 2) + child->die_ref_seen = 0; + } + else + switch (phase) + { + case 0: + child->die_ref_seen = child->die_dup == NULL; + break; + case 1: + if (child->die_dup == NULL || low_mem) + mark_refs (cu, child, child, MARK_REFS_REFERENCED); + break; + case 2: + remove_dies (cu, child, false); + child->die_ref_seen = 0; + break; + } + } +} + +/* Entries in meta_abbrev_htab, mapping .debug_abbrev section offsets + to abbrev hash tables. */ +struct meta_abbrev_entry +{ + /* .debug_abbrev offset. */ + unsigned int abbrev_off; + /* Corresponding hash table. */ + htab_t abbrev_htab; +}; + +/* Hash table for mapping of .debug_abbrev section offsets to + abbrev hash tables. */ +static htab_t meta_abbrev_htab; +/* Dummy entry used during OOM handling. */ +static struct meta_abbrev_entry meta_abbrev_fallback; + +/* Hash function for meta_abbrev_htab. */ +static hashval_t +meta_abbrev_hash (const void *p) +{ + struct meta_abbrev_entry *m = (struct meta_abbrev_entry *)p; + + return m->abbrev_off; +} + +/* Equality function for meta_abbrev_htab. */ +static int +meta_abbrev_eq (const void *p, const void *q) +{ + struct meta_abbrev_entry *m1 = (struct meta_abbrev_entry *)p; + struct meta_abbrev_entry *m2 = (struct meta_abbrev_entry *)q; + + return m1->abbrev_off == m2->abbrev_off; +} + +/* Delete function for meta_abbrev_htab. */ +static void +meta_abbrev_del (void *p) +{ + struct meta_abbrev_entry *m = (struct meta_abbrev_entry *)p; + + if (m->abbrev_htab != NULL) + htab_delete (m->abbrev_htab); +} + +/* Collapse children of TOP_DIE to decrease memory usage. */ +static void +collapse_child (dw_cu_ref cu, dw_die_ref top_die, dw_die_ref die, + unsigned int *tick) +{ + dw_die_ref child, next; + bool has_children = die->die_child != NULL; + unsigned int tick_diff = *tick; + for (child = die->die_child; child; child = next) + { + next = child->die_sib; + (*tick)++; + collapse_child (cu, top_die, child, tick); + } + if (has_children) + (*tick)++; + if (top_die == die) + { + die->die_child = NULL; + die->die_collapsed_children = 1; + } + else if (die->die_referenced) + { + die->die_parent = top_die; + if (tick_diff <= 0xffff && !die->die_intercu_referenced) + { + dw_die_ref ref; + void **slot; + if (die_collapsed_child_freelist) + { + ref = die_collapsed_child_freelist; + die_collapsed_child_freelist = ref->die_parent; + } + else + ref = pool_alloc (dw_die, offsetof (struct dw_die, die_child)); + memcpy (ref, die, offsetof (struct dw_die, die_child)); + ref->die_collapsed_child = 1; + ref->die_tag = tick_diff; + slot = htab_find_slot_with_hash (cu->cu_kind == CU_TYPES + ? types_off_htab : off_htab, + ref, off_hash (ref), NO_INSERT); + assert (slot != NULL); + *slot = (void *) ref; + memset (die, '\0', offsetof (struct dw_die, die_dup)); + die->die_sib = die_nontoplevel_freelist; + die_nontoplevel_freelist = die; + } + else + { + die->die_child = NULL; + die->die_sib = NULL; + die->die_ref_seen = tick_diff; + } + } + else + { + memset (die, '\0', offsetof (struct dw_die, die_dup)); + die->die_sib = die_nontoplevel_freelist; + die_nontoplevel_freelist = die; + } +} + +/* Collapse children of all toplevel DIEs that can be collapsed. */ +static void +collapse_children (dw_cu_ref cu, dw_die_ref die) +{ + dw_die_ref child; + for (child = die->die_child; child; child = child->die_sib) + if (child->die_named_namespace) + collapse_children (cu, child); + else if (child->die_child == NULL) + continue; + else if (child->die_nextdup == NULL + || (child->die_dup != NULL + && (die_cu (child->die_dup)->cu_kind != CU_PU + || child->die_dup->die_nextdup != child))) + { + unsigned int tick = 0; + collapse_child (cu, child, child, &tick); + } +} + +/* Count the number of DIEs in the .debug_info section, and see if we run into + some limit. */ +static int +try_debug_info (DSO *dso) +{ + unsigned char *ptr, *endcu, *endsec; + unsigned int value; + htab_t abbrev = NULL; + unsigned int last_abbrev_offset = 0; + struct abbrev_tag tag, *t; + unsigned int ndies; + unsigned ret = 1; + int kind = DEBUG_INFO; + bool low_mem_die_limit_hit = false; + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "try_debug_info\n"); + } + + if (tracing) + fprintf (stderr, "Counting DIEs\n"); + + ndies = 0; + ptr = debug_sections[kind].data; + endsec = ptr + debug_sections[kind].size; + while (ptr < endsec) + { + unsigned int culen; + int cu_version; + + /* Note header is one bigger with DWARF version 5. */ + if (ptr + (kind == DEBUG_TYPES ? 23 : 11) > endsec) + { + error (0, 0, "%s: %s CU header too small", dso->filename, + debug_sections[kind].name); + goto fail; + } + + endcu = ptr + 4; + culen = read_32 (ptr); + if (culen >= 0xfffffff0) + { + error (0, 0, "%s: 64-bit DWARF not supported", dso->filename); + goto fail; + } + endcu += culen; + + if (endcu > endsec) + { + error (0, 0, "%s: %s too small", dso->filename, + debug_sections[kind].name); + goto fail; + } + + cu_version = read_16 (ptr); + if (kind == DEBUG_TYPES && (cu_version < 2 || cu_version > 4)) + { + error (0, 0, "%s: DWARF version %d in .debug_types unhandled", + dso->filename, cu_version); + goto fail; + } + else if (cu_version < 2 || cu_version > 5) + { + error (0, 0, "%s: DWARF version %d in .debug_info unhandled", + dso->filename, cu_version); + goto fail; + } + + if (cu_version == 5) + { + value = read_8 (ptr); + if (value != DW_UT_compile && value != DW_UT_partial) + error (0, 0, "%s: DWARF CU type %s unhandled", dso->filename, + get_DW_UT_str (value)); + } + else + { + value = read_32 (ptr); + if (value >= debug_sections[DEBUG_ABBREV].size) + { + if (debug_sections[DEBUG_ABBREV].data == NULL) + error (0, 0, "%s: .debug_abbrev not present", dso->filename); + else + error (0, 0, "%s: DWARF CU abbrev offset too large", + dso->filename); + goto fail; + } + } + + if (ptr_size == 0) + { + ptr_size = read_8 (ptr); + if (ptr_size != 4 && ptr_size != 8) + { + error (0, 0, "%s: Invalid DWARF pointer size %d", + dso->filename, ptr_size); + goto fail; + } + } + else if (read_8 (ptr) != ptr_size) + { + error (0, 0, "%s: DWARF pointer size differs between CUs", + dso->filename); + goto fail; + } + + if (cu_version == 5) + { + /* Above we only checked for the smaller version 4 header size. */ + if (ptr + 4 > endsec) + { + error (0, 0, "%s: %s CU version 5 header too small", + dso->filename, debug_sections[kind].name); + goto fail; + } + value = read_32 (ptr); + if (value >= debug_sections[DEBUG_ABBREV].size) + { + if (debug_sections[DEBUG_ABBREV].data == NULL) + error (0, 0, "%s: .debug_abbrev not present", dso->filename); + else + error (0, 0, "%s: DWARF CU abbrev offset too large", + dso->filename); + goto fail; + } + } + + if (abbrev == NULL || value != last_abbrev_offset) + { + if (abbrev) + htab_delete (abbrev); + abbrev + = read_abbrev (dso, debug_sections[DEBUG_ABBREV].data + value); + if (abbrev == NULL) + { + error (0, 0, "%s: Couldn't read abbrev at offset 0x%x", + dso->filename, value); + goto fail; + } + } + last_abbrev_offset = value; + + while (ptr < endcu) + { + tag.entry = read_uleb128 (ptr); + if (tag.entry == 0) + continue; + if (ndies == max_die_limit) + { + error (0, 0, "%s: Too many DIEs, not optimizing", + dso->filename); + goto fail; + } + /* If we reach the DIE limit, signal the dwz caller that it + should retry with low_mem. */ + if (likely (!low_mem) && ndies == low_mem_die_limit) + { + if (tracing) + fprintf (stderr, "Hit low-mem die-limit\n"); + if (estimate_nr_dies () > max_die_limit) + /* Keep going, we still might hit the max die-limit. */ + low_mem_die_limit_hit = true; + else + { + ret = 2; + goto fail; + } + } + ndies++; + t = htab_find_with_hash (abbrev, &tag, tag.entry); + if (t == NULL) + { + error (0, 0, "%s: Could not find DWARF abbreviation %d", + dso->filename, tag.entry); + goto fail; + } + ptr = skip_attrs_1 (cu_version, t, ptr); + } + } + + if (low_mem_die_limit_hit) + ret = 2; + else + ret = 0; + + fail: + if (abbrev) + htab_delete (abbrev); + + return ret; +} + +/* Read language attribute encoded using FORM from location PTR, return + pointer to location after the attribute. Assign the attribute value + to *LANG. */ +static unsigned char * +read_lang (unsigned char *ptr, enum dwarf_form form, + enum dwarf_source_language *lang) +{ + bool error_p = false; + *lang = read_u16 (ptr, form, error_p); + if (unlikely (error_p)) + { + *lang = 0; + error (0, 0, "Invalid DW_AT_language attribute, ignoring"); + } + return ptr; +} + +/* First phase of the DWARF compression. Parse .debug_info section + (for kind == DEBUG_INFO) or .debug_types section (for kind == DEBUG_TYPES) + for each CU in it construct internal representation for the CU + and its DIE tree, compute checksums of DIEs and look for duplicates. */ +static int +read_debug_info (DSO *dso, int kind, unsigned int *die_count) +{ + unsigned char *ptr, *endcu, *endsec; + unsigned int value; + htab_t abbrev = NULL; + unsigned int last_abbrev_offset = 0; + unsigned int last_debug_line_off = 0; + struct dw_file *cu_files = NULL; + unsigned int cu_nfiles = 0; + bool note_strp_forms = multifile != NULL && !op_multifile + && !rd_multifile && !low_mem; + struct abbrev_tag tag, *t; + unsigned int cu_chunk = 0; + dw_cu_ref cu_tail = NULL, cu_collapse = NULL; + unsigned int cu_kind = rd_multifile ? CU_ALT + : kind == DEBUG_TYPES ? CU_TYPES : CU_NORMAL; + void *to_free = NULL; + int ret = 1; + unsigned int ndies; + bool low_mem_phase1 = low_mem && kind == DEBUG_INFO; + struct dw_cu cu_buf; + struct dw_die die_buf; + bool lang_p = odr || uni_lang_p; + + odr_active_p = false; + if (odr) + odr_phase = 1; + + unsigned int estimated_nr_dies = estimate_nr_dies (); + if (kind == DEBUG_INFO + && multifile_mode == 0 + && die_count_method == estimate) + { + bool do_count = (estimated_nr_dies > max_die_limit + || estimated_nr_dies > low_mem_die_limit); + if (tracing) + fprintf (stderr, "Using die count estimate %u to decide whether to" + " count DIEs: %s\n", estimated_nr_dies, + do_count ? "yes" : "no"); + if (do_count) + { + int try_ret = try_debug_info (dso); + if (try_ret != 0) + return try_ret; + } + } + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "read_debug_info %s%s\n", + kind == DEBUG_INFO ? ".debug_info" : ".debug_types", + low_mem && kind == DEBUG_INFO ? " (low-mem)" : ""); + } + + if (likely (!fi_multifile && kind != DEBUG_TYPES)) + { + dup_htab = htab_try_create (100000, die_hash, die_eq, NULL); + if (dup_htab == NULL) + dwz_oom (); + } + if (unlikely (meta_abbrev_htab == NULL + && (op_multifile || rd_multifile || fi_multifile || low_mem))) + { + meta_abbrev_htab + = htab_try_create (500, meta_abbrev_hash, meta_abbrev_eq, + meta_abbrev_del); + if (meta_abbrev_htab == NULL) + dwz_oom (); + to_free = obstack_alloc (&ob2, 1); + } + + low_mem_phase2: + ndies = 0; + ptr = debug_sections[kind].data; + endsec = ptr + debug_sections[kind].size; + while (ptr < endsec) + { + unsigned int cu_offset = ptr - debug_sections[kind].data; + unsigned int tick = 0, culen; + int cu_version; + dw_cu_ref cu; + dw_die_ref *diep, parent, die; + bool present; + unsigned int debug_line_off; + unsigned int type_offset = 0; + + /* Note header is one bigger with DWARF version 5. */ + if (ptr + (kind == DEBUG_TYPES ? 23 : 11) > endsec) + { + error (0, 0, "%s: %s CU header too small", dso->filename, + debug_sections[kind].name); + goto fail; + } + + endcu = ptr + 4; + culen = read_32 (ptr); + if (culen >= 0xfffffff0) + { + error (0, 0, "%s: 64-bit DWARF not supported", dso->filename); + goto fail; + } + endcu += culen; + + if (endcu > endsec) + { + error (0, 0, "%s: %s too small", dso->filename, + debug_sections[kind].name); + goto fail; + } + + cu_version = read_16 (ptr); + if (kind == DEBUG_TYPES && (cu_version < 2 || cu_version > 4)) + { + error (0, 0, "%s: DWARF version %d in .debug_types unhandled", + dso->filename, cu_version); + goto fail; + } + else if (cu_version < 2 || cu_version > 5) + { + error (0, 0, "%s: DWARF version %d in .debug_info unhandled", + dso->filename, cu_version); + goto fail; + } + + if (cu_version == 5) + { + value = read_8 (ptr); + if (value != DW_UT_compile && value != DW_UT_partial) + { + error (0, 0, "%s: DWARF CU type %s unhandled", dso->filename, + get_DW_UT_str (value)); + goto fail; + } + } + else + { + value = read_32 (ptr); + if (value >= debug_sections[DEBUG_ABBREV].size) + { + if (debug_sections[DEBUG_ABBREV].data == NULL) + error (0, 0, "%s: .debug_abbrev not present", dso->filename); + else + error (0, 0, "%s: DWARF CU abbrev offset too large", + dso->filename); + goto fail; + } + } + + if (ptr_size == 0) + { + ptr_size = read_8 (ptr); + if (ptr_size != 4 && ptr_size != 8) + { + error (0, 0, "%s: Invalid DWARF pointer size %d", + dso->filename, ptr_size); + goto fail; + } + } + else if (read_8 (ptr) != ptr_size) + { + error (0, 0, "%s: DWARF pointer size differs between CUs", + dso->filename); + goto fail; + } + + if (cu_version == 5) + { + /* Above we only checked for the smaller version 4 header size. */ + if (ptr + 4 > endsec) + { + error (0, 0, "%s: %s CU version 5 header too small", + dso->filename, debug_sections[kind].name); + goto fail; + } + value = read_32 (ptr); + if (value >= debug_sections[DEBUG_ABBREV].size) + { + if (debug_sections[DEBUG_ABBREV].data == NULL) + error (0, 0, "%s: .debug_abbrev not present", dso->filename); + else + error (0, 0, "%s: DWARF CU abbrev offset too large", + dso->filename); + goto fail; + } + } + + if (unlikely (op_multifile)) + { + if (ptr == endcu) + { + dw_cu_ref cuf = cu_tail ? cu_tail->cu_next : first_cu; + /* Inside of optimize_multifile, DIE hashes are computed + only after all the CUs from a particular DSO or + executable have been parsed, as we follow + DW_FORM_ref_addr then. */ + for (cu = cuf; cu; cu = cu->cu_next) + if (checksum_die (dso, cu, NULL, cu->cu_die)) + goto fail; + + for (cu = cuf; cu; cu = cu->cu_next) + checksum_ref_die (cu, NULL, cu->cu_die, NULL, NULL); + + if (dump_dies_p) + for (cu = cuf; cu; cu = cu->cu_next) + dump_dies (0, cu->cu_die); + + for (cu = cuf; cu; cu = cu->cu_next) + if (find_dups (cu->cu_die)) + goto fail; + + for (cu = cuf; cu; cu = cu->cu_next) + remove_unneeded (cu, cu->cu_die, 0); + for (cu = cuf; cu; cu = cu->cu_next) + remove_unneeded (cu, cu->cu_die, 1); + for (cu = cuf; cu; cu = cu->cu_next) + remove_unneeded (cu, cu->cu_die, 2); + + if (cu_collapse == NULL) + cu_collapse = first_cu; + while (cu_collapse->cu_chunk < cu_chunk) + { + collapse_children (cu_collapse, cu_collapse->cu_die); + cu_collapse = cu_collapse->cu_next; + } + + cu_tail = last_cu; + cu_chunk++; + continue; + } + } + else + cu_chunk++; + + if (unlikely (meta_abbrev_htab != NULL)) + { + struct meta_abbrev_entry m, *mp; + void **slot; + m.abbrev_off = value; + slot = htab_find_slot_with_hash (meta_abbrev_htab, &m, + m.abbrev_off, INSERT); + if (slot == NULL) + dwz_oom (); + else if (*slot != NULL) + abbrev = ((struct meta_abbrev_entry *) *slot)->abbrev_htab; + else + { + *slot = (void *) &meta_abbrev_fallback; + abbrev + = read_abbrev (dso, debug_sections[DEBUG_ABBREV].data + value); + if (abbrev == NULL) + goto fail; + mp = (struct meta_abbrev_entry *) + obstack_alloc (&ob2, sizeof (*mp)); + mp->abbrev_off = value; + mp->abbrev_htab = abbrev; + *slot = (void *) mp; + } + } + else if (abbrev == NULL || value != last_abbrev_offset) + { + if (abbrev) + htab_delete (abbrev); + abbrev + = read_abbrev (dso, debug_sections[DEBUG_ABBREV].data + value); + if (abbrev == NULL) + { + error (0, 0, "%s: Couldn't read abbrev at offset 0x%x", + dso->filename, value); + + goto fail; + } + } + last_abbrev_offset = value; + + if (unlikely (kind == DEBUG_TYPES)) + { + ptr += 8; + type_offset = read_32 (ptr); + } + + if (unlikely (low_mem_phase1)) + cu = &cu_buf; + else + cu = pool_alloc (dw_cu, sizeof (struct dw_cu)); + memset (cu, '\0', sizeof (*cu)); + cu->cu_kind = cu_kind; + cu->cu_offset = cu_offset; + cu->cu_version = cu_version; + cu->cu_chunk = cu_chunk; + if (unlikely (op_multifile || low_mem)) + cu->cu_abbrev = abbrev; + diep = &cu->cu_die; + parent = NULL; + if (unlikely (low_mem_phase1)) + ; + else if (first_cu == NULL) + first_cu = last_cu = cu; + else + { + last_cu->cu_next = cu; + last_cu = cu; + } + + while (ptr < endcu) + { + unsigned int i; + unsigned int die_offset = ptr - debug_sections[kind].data; + + tag.entry = read_uleb128 (ptr); + if (tag.entry == 0) + { + if (unlikely (low_mem_phase1)) + continue; + if (parent) + { + diep = &parent->die_sib; + parent->u.p1.die_exit = tick++; + if (parent->die_root == 0) + parent = parent->die_parent; + else + parent = NULL; + } + else + diep = NULL; + continue; + } + if (diep == NULL) + { + error (0, 0, "%s: Wrong %s DIE tree", dso->filename, + debug_sections[kind].name); + goto fail; + } + t = htab_find_with_hash (abbrev, &tag, tag.entry); + if (t == NULL) + { + error (0, 0, "%s: Could not find DWARF abbreviation %d", + dso->filename, tag.entry); + goto fail; + } + if (likely (!op_multifile && !rd_multifile && !fi_multifile) + && likely (kind == DEBUG_INFO)) + { + if (ndies == max_die_limit) + { + error (0, 0, "%s: Too many DIEs, not optimizing", + dso->filename); + goto fail; + } + /* If we reach the DIE limit, silently signal the dwz + caller that it should retry with low_mem. */ + if (likely (!low_mem) && ndies == low_mem_die_limit) + { + if (tracing) + fprintf (stderr, "Hit low-mem die-limit\n"); + ret = 2; + goto fail; + } + } + ndies++; + if (unlikely (low_mem_phase1)) + die = &die_buf; + else if (parent == NULL + || parent->die_root + || parent->die_named_namespace) + { + die = pool_alloc (dw_die, sizeof (struct dw_die)); + memset (die, '\0', sizeof (struct dw_die)); + die->die_toplevel = 1; + } + else + { + if (die_nontoplevel_freelist) + { + die = die_nontoplevel_freelist; + die_nontoplevel_freelist = die->die_sib; + } + else + die = pool_alloc (dw_die, offsetof (struct dw_die, die_dup)); + memset (die, '\0', offsetof (struct dw_die, die_dup)); + } + *diep = die; + die->die_tag = t->tag; + die->die_abbrev = t; + die->die_offset = die_offset; + if (parent) + die->die_parent = parent; + else + { + die->die_root = 1; + die->die_parent = (dw_die_ref) cu; + } + die->u.p1.die_enter = tick; + die->u.p1.die_exit = tick++; + if (likely (!low_mem_phase1)) + { + if (t->children) + { + diep = &die->die_child; + parent = die; + } + else + diep = &die->die_sib; + } + for (i = 0; i < t->nattr; ++i) + { + uint32_t form = t->attr[i].form; + size_t len = 0; + + while (form == DW_FORM_indirect) + { + form = read_uleb128 (ptr); + if (ptr > endcu) + { + error (0, 0, "%s: Attributes extend beyond end of CU", + dso->filename); + goto fail; + } + } + + /* Get length of expr/blocks first. Canonicalize all, + except exprloc, to DW_FORM_block1. */ + switch (form) + { + case DW_FORM_block1: + len = *ptr++; + break; + case DW_FORM_block2: + len = read_16 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block4: + len = read_32 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block: + len = read_uleb128 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_exprloc: + len = read_uleb128 (ptr); + break; + default: + break; + } + + if (unlikely (low_mem_phase1) + && add_locexpr_dummy_dies (dso, cu, die, ptr, form, + t->attr[i].attr, len)) + goto fail; + + switch (form) + { + case DW_FORM_ref_addr: + if (unlikely (low_mem_phase1)) + { + unsigned int offset + = read_size (ptr, cu->cu_version == 2 ? ptr_size : 4); + add_dummy_die (cu, offset); + } + ptr += cu->cu_version == 2 ? ptr_size : 4; + break; + case DW_FORM_addr: + ptr += ptr_size; + break; + case DW_FORM_flag_present: + break; + case DW_FORM_implicit_const: + if (lang_p + && (die->die_tag == DW_TAG_compile_unit + || die->die_tag == DW_TAG_partial_unit) + && t->attr[i].attr == DW_AT_language) + cu->lang = t->values[i]; + break; + case DW_FORM_data1: + if (lang_p + && (die->die_tag == DW_TAG_compile_unit + || die->die_tag == DW_TAG_partial_unit) + && t->attr[i].attr == DW_AT_language) + cu->lang = *ptr; + /* FALLTHRU */ + case DW_FORM_ref1: + case DW_FORM_flag: + ++ptr; + break; + case DW_FORM_data2: + if (lang_p + && (die->die_tag == DW_TAG_compile_unit + || die->die_tag == DW_TAG_partial_unit) + && t->attr[i].attr == DW_AT_language) + cu->lang = do_read_16 (ptr); + /* FALLTHRU */ + case DW_FORM_ref2: + ptr += 2; + break; + case DW_FORM_data4: + if (lang_p + && (die->die_tag == DW_TAG_compile_unit + || die->die_tag == DW_TAG_partial_unit) + && t->attr[i].attr == DW_AT_language) + read_lang (ptr, form, &cu->lang); + /* FALLTHRU */ + case DW_FORM_ref4: + case DW_FORM_sec_offset: + ptr += 4; + break; + case DW_FORM_data8: + if (lang_p + && (die->die_tag == DW_TAG_compile_unit + || die->die_tag == DW_TAG_partial_unit) + && t->attr[i].attr == DW_AT_language) + read_lang (ptr, form, &cu->lang); + /* FALLTHRU */ + case DW_FORM_ref8: + case DW_FORM_ref_sig8: + ptr += 8; + break; + case DW_FORM_data16: + ptr += 16; + break; + case DW_FORM_sdata: + case DW_FORM_udata: + if (lang_p + && (die->die_tag == DW_TAG_compile_unit + || die->die_tag == DW_TAG_partial_unit) + && t->attr[i].attr == DW_AT_language) + { + ptr = read_lang (ptr, form, &cu->lang); + break; + } + /* FALLTHRU */ + case DW_FORM_ref_udata: + skip_leb128 (ptr); + break; + case DW_FORM_strp: + if (t->attr[i].attr == DW_AT_name + && (die->die_tag == DW_TAG_namespace + || die->die_tag == DW_TAG_module) + && !die->die_root + && (die->die_parent->die_root + || die->die_parent->die_named_namespace)) + die->die_named_namespace = 1; + if (note_strp_forms) + note_strp_offset (read_32 (ptr)); + else + ptr += 4; + break; + case DW_FORM_line_strp: + if (t->attr[i].attr == DW_AT_name + && (die->die_tag == DW_TAG_namespace + || die->die_tag == DW_TAG_module) + && !die->die_root + && (die->die_parent->die_root + || die->die_parent->die_named_namespace)) + die->die_named_namespace = 1; + /* Don't note strp, different string table. */ + ptr += 4; + break; + case DW_FORM_string: + ptr = (unsigned char *) strchr ((char *)ptr, '\0') + 1; + if (t->attr[i].attr == DW_AT_name + && (die->die_tag == DW_TAG_namespace + || die->die_tag == DW_TAG_module) + && !die->die_root + && (die->die_parent->die_root + || die->die_parent->die_named_namespace)) + die->die_named_namespace = 1; + break; + case DW_FORM_indirect: + abort (); + /* All expr/blocks lengths already handled above. + Just canonicalize exprloc to block1 too. */ + case DW_FORM_exprloc: + form = DW_FORM_block1; + break; + case DW_FORM_block1: + break; + case DW_FORM_block2: + case DW_FORM_block4: + case DW_FORM_block: + abort (); + default: + error (0, 0, "%s: Unknown DWARF %s at DIE [%x]", + dso->filename, get_DW_FORM_str (form), die_offset); + goto fail; + } + + if (ptr > endcu) + { + error (0, 0, "%s: Attributes extend beyond end of CU " + "for DIE [%x]", + dso->filename, die_offset); + goto fail; + } + + if (form == DW_FORM_block1) + { + if (len >= (size_t) (endcu - ptr)) + { + error (0, 0, "%s: Attributes extend beyond end of CU " + "for DIE [%x]", + dso->filename, die_offset); + goto fail; + } + + if (t->attr[i].attr > DW_AT_loclists_base + && (t->attr[i].attr < DW_AT_MIPS_fde + || t->attr[i].attr > DW_AT_MIPS_has_inlines) + && (t->attr[i].attr < DW_AT_sf_names + || t->attr[i].attr > DW_AT_body_end) + && (t->attr[i].attr < DW_AT_GNU_call_site_value + || t->attr[i].attr + > DW_AT_GNU_call_site_target_clobbered)) + { + error (0, 0, "%s: Unknown DWARF %s with " + "block DW_FORM for DIE [%x]", + dso->filename, get_DW_AT_str (t->attr[i].attr), + die_offset); + goto fail; + } + + ptr += len; + } + } + die->die_size = (ptr - debug_sections[kind].data) + - die_offset; + if (unlikely (low_mem)) + { + if (low_mem_phase1) + continue; + if (off_htab != NULL && kind == DEBUG_INFO) + { + void **slot + = htab_find_slot_with_hash (off_htab, die, off_hash (die), + INSERT); + if (slot == NULL) + dwz_oom (); + if (*slot != NULL) + { + dw_die_ref ref = (dw_die_ref) *slot; + assert (ref->die_collapsed_child); + die->die_referenced = 1; + die->die_intercu_referenced = 1; + memset (ref, '\0', offsetof (struct dw_die, die_child)); + ref->die_parent = die_collapsed_child_freelist; + die_collapsed_child_freelist = ref; + } + *slot = (void *) die; + continue; + } + } + + off_htab_add_die (cu, die, die_count); + } + + if (unlikely (low_mem_phase1)) + continue; + + if (cu->cu_die == NULL + || (cu->cu_die->die_tag != DW_TAG_compile_unit + && cu->cu_die->die_tag != DW_TAG_partial_unit + && cu->cu_die->die_tag != DW_TAG_type_unit) + || cu->cu_die->die_sib != NULL) + { + error (0, 0, "%s: %s section chunk doesn't contain a single" + " compile_unit or partial_unit", dso->filename, + debug_sections[kind].name); + goto fail; + } + + cu->cu_comp_dir = get_AT_string (cu->cu_die, DW_AT_comp_dir); + if (skip_producers_p + && skip_producer (get_AT_string (cu->cu_die, DW_AT_producer))) + { + cu->cu_die->die_remove = 1; + continue; + } + enum dwarf_form form; + debug_line_off + = get_AT_int (cu->cu_die, DW_AT_stmt_list, &present, &form); + if (present) + { + if (!(form == DW_FORM_sec_offset || form == DW_FORM_data4)) + { + error (0, 0, "%s: DW_AT_stmt_list not DW_FORM_sec_offset or" + " DW_FORM_data4", dso->filename); + goto fail; + } + + if (cu_files != NULL && last_debug_line_off == debug_line_off) + { + cu->cu_nfiles = cu_nfiles; + cu->cu_files = cu_files; + } + else + { + if (read_debug_line (dso, cu, debug_line_off)) + goto fail; + cu_nfiles = cu->cu_nfiles; + cu_files = cu->cu_files; + last_debug_line_off = debug_line_off; + } + } + + if (likely (!op_multifile && !rd_multifile && !fi_multifile) + && likely (kind == DEBUG_INFO)) + { + if (checksum_die (dso, cu, NULL, cu->cu_die)) + goto fail; + checksum_ref_die (cu, NULL, cu->cu_die, NULL, NULL); + if (odr) + { + dw_die_ref die; + FOREACH_LOW_TOPLEVEL_DIE_IN_CU (die, cu) + { + if (die->die_ck_state != CK_KNOWN) + continue; + if (die_odr_state (die) != ODR_NONE) + die->u.p1.die_ref_hash = die->u.p1.die_hash; + else + die->die_ref_hash_computed = 0; + } + checksum_ref_die (cu, NULL, cu->cu_die, NULL, NULL); + } + + if (dump_dies_p) + dump_dies (0, cu->cu_die); + + if (find_dups (cu->cu_die)) + goto fail; + } + if (unlikely (kind == DEBUG_TYPES)) + { + dw_die_ref ref = off_htab_lookup (cu, cu->cu_offset + type_offset); + if (ref == NULL) + { + error (0, 0, "%s: Couldn't find DIE at [%x] " + "referenced by type_offset from cu DIE at [%x]", + dso->filename, cu->cu_offset + type_offset, + cu->cu_die->die_offset); + goto fail; + } + if (unlikely (low_mem)) + { + ref->die_referenced = 1; + ref->die_intercu_referenced = 1; + } + } + if (unlikely (low_mem)) + { + remove_unneeded (cu, cu->cu_die, 1); + remove_unneeded (cu, cu->cu_die, 2); + collapse_children (cu, cu->cu_die); + } + } + + if (unlikely (low_mem_phase1)) + { + low_mem_phase1 = false; + cu_chunk = 0; + goto low_mem_phase2; + } + + if (unlikely (low_mem)) + ; + else if (unlikely (meta_abbrev_htab != NULL)) + { + dw_cu_ref cu; + + if (unlikely (op_multifile)) + for (cu = first_cu; cu; cu = cu->cu_next) + cu->cu_abbrev = NULL; + htab_delete (meta_abbrev_htab); + meta_abbrev_htab = NULL; + obstack_free (&ob2, to_free); + abbrev = NULL; + } + else if (abbrev) + htab_delete (abbrev); + + if (unlikely (kind == DEBUG_TYPES)) + return 0; + + if (unlikely (rd_multifile || fi_multifile)) + { + dw_cu_ref cu; + + /* Inside of read_multifile, DIE hashes are computed + only after all the PUs are parsed, as we follow + DW_FORM_ref_addr then. */ + for (cu = first_cu; cu; cu = cu->cu_next) + if (checksum_die (dso, cu, NULL, cu->cu_die)) + goto fail; + + for (cu = first_cu; cu; cu = cu->cu_next) + checksum_ref_die (cu, NULL, cu->cu_die, NULL, NULL); + + if (dump_dies_p) + for (cu = first_cu; cu; cu = cu->cu_next) + dump_dies (0, cu->cu_die); + + if (rd_multifile) + { + for (cu = first_cu; cu; cu = cu->cu_next) + if (find_dups (cu->cu_die)) + goto fail; + } + else + for (cu = first_cu; cu; cu = cu->cu_next) + if (find_dups_fi (cu->cu_die)) + goto fail; + + return 0; + } + + if (tracing) + { + if (op_multifile) + fprintf (stderr, "Die count: %u\n", ndies); + else + fprintf (stderr, "Die count: %u, %.2f%% of estimate\n", ndies, + (double)ndies / ((double)estimated_nr_dies / 100)); + } + if (tracing) + htab_report (off_htab, "off_htab post-parsing"); + if (stats_p) + stats->die_count = ndies; + if (die_count) + *die_count = ndies; + htab_delete (dup_htab); + dup_htab = NULL; + return 0; +fail: + if (unlikely (meta_abbrev_htab != NULL)) + { + dw_cu_ref cu; + + for (cu = first_cu; cu; cu = cu->cu_next) + cu->cu_abbrev = NULL; + htab_delete (meta_abbrev_htab); + meta_abbrev_htab = NULL; + obstack_free (&ob2, to_free); + } + else if (abbrev) + htab_delete (abbrev); + if (dup_htab && kind == DEBUG_INFO) + { + htab_delete (dup_htab); + dup_htab = NULL; + } + return ret; +} + +/* Compare function called from qsort, which should ensure that + dup candidate dies with the same set of referrer CUs are + adjacent. */ +static int +partition_cmp (const void *p, const void *q) +{ + dw_die_ref die1 = *(dw_die_ref *) p; + dw_die_ref die2 = *(dw_die_ref *) q; + dw_die_ref ref1, ref2; + dw_cu_ref last_cu1 = NULL, last_cu2 = NULL; + ref1 = die1; + ref2 = die2; + if (odr_active_p && odr_mode != ODR_BASIC) + { + while (ref1 && die_odr_state (ref1) == ODR_DECL) + ref1 = ref1->die_nextdup; + if (ref1 == NULL) + ref1 = die1; + while (ref2 && die_odr_state (ref2) == ODR_DECL) + ref2 = ref2->die_nextdup; + if (ref2 == NULL) + ref2 = die2; + } + for (;; ref1 = ref1->die_nextdup, ref2 = ref2->die_nextdup) + { + dw_cu_ref ref1cu = NULL; + dw_cu_ref ref2cu = NULL; + while (ref1 && (ref1cu = die_cu (ref1)) == last_cu1) + ref1 = ref1->die_nextdup; + while (ref2 && (ref2cu = die_cu (ref2)) == last_cu2) + ref2 = ref2->die_nextdup; + if (ref1 == NULL || ref2 == NULL) + break; + last_cu1 = ref1cu; + last_cu2 = ref2cu; + if (last_cu1->cu_offset < last_cu2->cu_offset) + return -1; + else if (last_cu1->cu_offset > last_cu2->cu_offset) + return 1; + } + if (ref1) + return -1; + if (ref2) + return 1; + /* The rest is just to keep sort stable. */ + if (die1->die_offset < die2->die_offset) + return -1; + if (die1->die_offset > die2->die_offset) + return 1; + return 0; +} + +/* Add duplicate chain for DIE to VEC. */ +static void +partition_found_dups (dw_die_ref die, struct obstack *vec) +{ + assert (die->die_ck_state == CK_KNOWN); + obstack_ptr_grow (vec, die); + if (unlikely (verify_dups_p)) + verify_dups (die, true); + + if (stats_p) + { + uint64_t length = 0; + for (; die; die = die->die_nextdup) + length++; + stats->dup_cnt += length; + stats->dup_chain_max_length = MAX (stats->dup_chain_max_length, length); + stats->dup_chain_cnt++; + } +} + +/* Sort duplication chain for HEAD, assuming the chain was formed by + die_eq. */ +static void +sort_dups (dw_die_ref head) +{ + dw_die_ref prev = NULL, die, next; + /* Sort the die_nextdup list by increasing die_cu ()->cu_chunk. + When it is originally added, child has the lowest + cu_offset, then the DIEs are sorted in the linked list + from highest cu_offset down to lowest or second lowest. */ + for (die = head->die_nextdup; die; prev = die, die = next) + { + next = die->die_nextdup; + die->die_nextdup = prev; + } + head->die_nextdup = prev; +} + +/* Merge duplicate chains D and D2, and return the head of the merged +chain. */ +static dw_die_ref +merge_dups (dw_die_ref d, dw_die_ref d2) +{ + if (d == NULL) + return d2; + if (d2 == NULL) + return d; + + dw_die_ref tail = NULL; + dw_die_ref head = NULL; + while (true) + { + dw_die_ref next; + if (d && d2) + { + if (d->die_offset < d2->die_offset) + { + next = d; + d = d->die_nextdup; + } + else + { + next = d2; + d2 = d2->die_nextdup; + } + } + else if (d) + { + next = d; + d = d->die_nextdup; + } + else if (d2) + { + next = d2; + d2 = d2->die_nextdup; + } + else + break; + if (!head) + head = next; + if (tail) + tail->die_nextdup = next; + tail = next; + } + + for (d = head; d; d = d->die_nextdup) + if (d == head) + d->die_dup = NULL; + else + d->die_dup = head; + + if (unlikely (verify_dups_p)) + verify_dups (head, true); + return head; +} + +static void +mark_singletons (dw_cu_ref cu, dw_die_ref top_die, dw_die_ref die, + struct obstack *vec) +{ + struct abbrev_tag *t; + unsigned int i; + unsigned char *ptr; + dw_die_ref child; + bool found; + + t = die->die_abbrev; + + found = false; + for (i = 0; i < t->nattr; ++i) + { + struct abbrev_attr *attr = &t->attr[i]; + if (attr->attr == DW_AT_sibling) + continue; + switch (attr->form) + { + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + case DW_FORM_indirect: + found = true; + break; + } + } + if (!found) + goto handle_children; + + if (unlikely (cu->cu_kind == CU_TYPES)) + ptr = debug_sections[DEBUG_TYPES].data; + else + ptr = debug_sections[DEBUG_INFO].data; + ptr += die->die_offset; + skip_leb128 (ptr); + for (i = 0; i < t->nattr; ++i) + { + struct abbrev_attr *attr = &t->attr[i]; + uint32_t form = attr->form; + uint64_t value; + dw_die_ref ref, reft; + + while (form == DW_FORM_indirect) + form = read_uleb128 (ptr); + + switch (form) + { + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + switch (form) + { + case DW_FORM_ref_udata: value = read_uleb128 (ptr); break; + case DW_FORM_ref1: value = read_8 (ptr); break; + case DW_FORM_ref2: value = read_16 (ptr); break; + case DW_FORM_ref4: value = read_32 (ptr); break; + case DW_FORM_ref8: value = read_64 (ptr); break; + default: abort (); + } + if (t->attr[i].attr == DW_AT_sibling) + break; + ref = off_htab_lookup (cu, cu->cu_offset + value); + if (!ref->die_collapsed_child + && ref->u.p1.die_enter >= top_die->u.p1.die_enter + && ref->u.p1.die_exit <= top_die->u.p1.die_exit) + break; + reft = ref; + while (!reft->die_root + && reft->die_parent->die_tag != DW_TAG_compile_unit + && reft->die_parent->die_tag != DW_TAG_partial_unit + && !reft->die_parent->die_named_namespace) + reft = reft->die_parent; + if (reft->die_dup != NULL || reft->die_nextdup != NULL) + break; + if (reft->die_ref_seen) + break; + reft->die_ref_seen = 1; + partition_found_dups (reft, vec); + mark_singletons (die_cu (reft), reft, reft, vec); + break; + default: + ptr = skip_attr_no_dw_form_indirect (cu->cu_version, form, ptr); + break; + } + } + + handle_children: + for (child = die->die_child; child; child = child->die_sib) + mark_singletons (cu, top_die, child, vec); +} + +/* Split maximal duplicate chain DIE into smaller chains that contain + structurally equal defs, and combine the decls with one of those. + Return the first chain, and call partition_found_dups for the others. */ +static dw_die_ref +split_dups (dw_die_ref die, struct obstack *vec) +{ + dw_die_ref res = NULL; + + /* Count the DIEs in the duplicate chain. */ + unsigned count = 0; + dw_die_ref d; + for (d = die; d; d = d->die_nextdup) + count++; + assert (count >= 2); + + /* Break up the duplicate chain. */ + dw_die_ref arr[count]; + unsigned int i; + for (d = die, i = 0; d; d = d->die_nextdup, i++) + arr[i] = d; + for (i = 0; i < count; i++) + { + d = arr[i]; + d->die_nextdup = NULL; + d->die_dup = NULL; + } + + /* Build decls duplicate chain. */ + dw_die_ref tail = NULL; + dw_die_ref head = NULL; + for (i = 0; i < count; i++) + { + d = arr[i]; + if (die_odr_state (d) != ODR_DECL) + continue; + if (!head) + head = d; + if (tail) + tail->die_nextdup = d; + if (d != head) + d->die_dup = head; + tail = d; + } + dw_die_ref decls = head; + + /* Build def duplicate chains. */ + unsigned int j; + dw_die_ref d2; + for (i = 0; i < count; i++) + { + d = arr[i]; + if (d->die_dup || d->die_nextdup + || die_odr_state (d) == ODR_DECL) + continue; + tail = d; + for (j = i + 1; j < count; j++) + { + d2 = arr[j]; + if (d2->die_dup || d2->die_nextdup + || die_odr_state (d2) == ODR_DECL) + continue; + die_eq (d, d2); + } + sort_dups (d); + } + + if (odr_mode != ODR_BASIC) + { + /* Find the first duplicate chain containing defs. */ + dw_die_ref def = NULL; + for (i = 0; i < count; i++) + { + d = arr[i]; + if (die_odr_state (d) == ODR_DECL + || d->die_dup != NULL) + continue; + def = d; + break; + } + + /* Merge the def chain with the decls. */ + merge_dups (def, decls); + } + + for (i = 0; i < count; i++) + { + d = arr[i]; + if (d->die_dup == NULL) + /* If DIE is now either: + - no longer part of a duplicate chain, or + - head of a duplicate chain, + don't remove it. */ + d->die_remove = 0; + } + + /* Notice the new duplicate chains. */ + for (i = 0; i < count; i++) + { + d = arr[i]; + if (d->die_dup != NULL) + continue; + if (res == NULL) + res = d; + else + partition_found_dups (d, vec); + } + return res; +} + +/* Search for duplicate removal reference DIE candidates + in tree rooted by PARENT. */ +static void +partition_find_dups (struct obstack *vec, dw_die_ref parent) +{ + dw_die_ref child; + for (child = parent->die_child; child; child = child->die_sib) + { + if (child->die_nextdup != NULL + && child->die_dup == NULL + && child->die_offset != -1U) + { + dw_die_ref die; + + if (unlikely (op_multifile)) + { + /* If all the dups are from the same DSO or executable, + there is nothing in it to optimize in between different + objects. */ + unsigned int cu_chunk = die_cu (child)->cu_chunk; + for (die = child->die_nextdup; die; die = die->die_nextdup) + if (die_cu (die)->cu_chunk != cu_chunk) + break; + if (die == NULL) + continue; + } + sort_dups (child); + partition_found_dups (child, vec); + } + else if (child->die_named_namespace) + partition_find_dups (vec, child); + } +} + +/* Reorder duplicate chain DIE to make sure it doesn't start with a decl. */ +static dw_die_ref +reorder_dups (dw_die_ref die) +{ + unsigned decl_count = 0; + unsigned def_count = 0; + dw_die_ref d; + + if (die_odr_state (die) == ODR_NONE) + return die; + + for (d = die; d; d = d->die_nextdup) + { + if (die_odr_state (d) == ODR_DECL) + decl_count++; + else + def_count++; + } + if (def_count == 0 || decl_count == 0) + return die; + + if (die_odr_state (die) != ODR_DECL) + return die; + + dw_die_ref def = NULL; + dw_die_ref prev = NULL; + for (d = die; d; prev = d, d = d->die_nextdup) + { + if (die_odr_state (d) == ODR_DECL) + continue; + def = d; + break; + } + + assert (!die->die_remove); + assert (def->die_remove); + def->die_remove = 0; + die->die_remove = 1; + def->die_ref_seen = die->die_ref_seen; + dw_die_ref next = def->die_nextdup; + if (prev) + prev->die_nextdup = next; + def->die_nextdup = die; + for (d = def; d; prev = d, d = d->die_nextdup) + { + if (d == def) + d->die_dup = NULL; + else + d->die_dup = def; + } + + if (unlikely (verify_dups_p)) + verify_dups (def, false); + return def; +} + +/* Copy DIE tree of DIE, as children of new DIE PARENT. */ +static dw_die_ref +copy_die_tree (dw_die_ref parent, dw_die_ref die) +{ + dw_die_ref child, new_child, *diep; + dw_die_ref new_die; + if (die->die_toplevel) + { + new_die = pool_alloc (dw_die, sizeof (struct dw_die)); + memset (new_die, '\0', sizeof (*new_die)); + new_die->die_toplevel = 1; + die->die_dup = new_die; + new_die->die_nextdup = die; + if (!die->die_op_type_referenced) + die->die_remove = 1; + } + else + { + new_die = pool_alloc (dw_die, offsetof (struct dw_die, die_dup)); + memset (new_die, '\0', offsetof (struct dw_die, die_dup)); + } + new_die->die_parent = parent; + new_die->die_tag = die->die_tag; + new_die->die_offset = -1U; + new_die->die_size = die->die_size; + diep = &new_die->die_child; + for (child = die->die_child; child; child = child->die_sib) + { + new_child = copy_die_tree (new_die, child); + *diep = new_child; + diep = &new_child->die_sib; + } + return new_die; +} + +/* If all DIEs in the duplication chain DIE are in CUs with the same + language, return that language. Otherwise, return 0. */ +static enum dwarf_source_language +partition_lang (dw_die_ref die) +{ + enum dwarf_source_language lang; + dw_die_ref d; + + if (die == NULL) + return 0; + + lang = die_cu (die)->lang; + switch (lang) + { + case DW_LANG_C_plus_plus: + case DW_LANG_C_plus_plus_03: + case DW_LANG_C_plus_plus_11: + case DW_LANG_C_plus_plus_14: + break; + default: + return 0; + } + + for (d = die->die_nextdup; d; d = d->die_nextdup) + if (die_cu (d)->lang != lang) + return 0; + + return lang; +} + +/* Return how many bytes we need to encode VAL. */ +static unsigned int +nr_bytes_for (uint64_t val) +{ + unsigned int n; + + if (val == 0) + return 1; + + for (n = 0; val > 0; n++) + val = val >> 8; + + return n; +} + +/* Return true if duplicate chains REF1 and REF2 have the same set of + referrer CUs. If so, return the number of unique referrer CUs + in *CNT. */ +static inline unsigned int FORCE_INLINE +same_ref_cus_p (dw_die_ref ref1, dw_die_ref ref2, size_t *cnt) +{ + dw_cu_ref last_cu1 = NULL, last_cu2 = NULL; + + *cnt = 0; + + if (odr_active_p && odr_mode != ODR_BASIC) + { + dw_die_ref orig_ref1 = ref1, orig_ref2 = ref2; + while (ref1 && die_odr_state (ref1) == ODR_DECL) + ref1 = ref1->die_nextdup; + if (ref1 == NULL) + ref1 = orig_ref1; + while (ref2 && die_odr_state (ref2) == ODR_DECL) + ref2 = ref2->die_nextdup; + if (ref2 == NULL) + ref2 = orig_ref2; + } + for (;; ref1 = ref1->die_nextdup, ref2 = ref2->die_nextdup) + { + dw_cu_ref ref1cu = NULL; + dw_cu_ref ref2cu = NULL; + + while (ref1 && (ref1cu = die_cu (ref1)) == last_cu1) + ref1 = ref1->die_nextdup; + while (ref2 && (ref2cu = die_cu (ref2)) == last_cu2) + ref2 = ref2->die_nextdup; + if (ref1 == NULL || ref2 == NULL) + break; + + last_cu1 = ref1cu; + last_cu2 = ref2cu; + + if (last_cu1 != last_cu2) + break; + else + (*cnt)++; + } + + if (ref1 || ref2) + return false; + + return true; +} + +/* Return the number of unique referrer CUs in duplicate chain REF. */ +static inline size_t FORCE_INLINE +cnt_ref_cus (dw_die_ref ref) +{ + dw_cu_ref last_cu1 = NULL; + size_t cnt = 0; + + for (;; ref = ref->die_nextdup) + { + dw_cu_ref refcu = NULL; + while (ref && (refcu = die_cu (ref)) == last_cu1) + ref = ref->die_nextdup; + if (ref == NULL) + break; + last_cu1 = refcu; + cnt++; + } + + return cnt; +} + +/* Helper function of partition_dups_1. Decide what DIEs matching in + multiple CUs might be worthwhile to be moved into partial units, + construct those partial units. */ +static bool +partition_dups_1 (dw_die_ref *arr, size_t nr_partitions, size_t *partitions, + dw_cu_ref *first_partial_cu, + dw_cu_ref *last_partial_cu, + bool second_phase) +{ + size_t i, j, cnt; + bool ret = false; + size_t idx = 0; + for (idx = 0; idx < nr_partitions * 2; idx += 2) + { + i = partitions[idx]; + cnt = partitions[idx + 1]; + j = partitions[idx + 2]; + + if (arr[i]->die_dup != NULL) + continue; + + dw_die_ref ref; + size_t size = 0, k, orig_size, new_size, namespaces = 0; + unsigned int force = 0; + enum dwarf_source_language part_lang + = gen_cu_p ? partition_lang (arr[i]) : 0; + for (k = i; k < j; k++) + { + if (second_phase && arr[k]->die_ref_seen) + force++; + size += calc_sizes (arr[k]); + for (ref = arr[k]->die_parent; + ref->die_named_namespace && ref->die_dup == NULL; + ref = ref->die_parent) + { + ref->die_dup = arr[k]; + namespaces++; + } + } + /* If during second_phase there are some DIEs we want to force + into a partial unit because they are referenced from something + already forced into a partial unit, but also some DIEs with + the same set of referrers, try to see if we can put also those + into the partial unit. They can be put there only if they + don't refer to DIEs that won't be put into partial units. */ + if (unlikely (partition_dups_opt) + && second_phase && force && force < j - i) + { + /* First optimistically assume all such DIEs can be put there, + thus mark all such DIEs as going to be included, so that + even if one of those DIEs references another one from those + DIEs it can be included. */ + for (k = i; k < j; k++) + { + assert (arr[k]->die_ref_seen < 2); + if (arr[k]->die_ref_seen == 0) + arr[k]->die_ref_seen = 2; + } + for (k = i; k < j; k++) + if (arr[k]->die_ref_seen == 2 + && !mark_refs (die_cu (arr[k]), arr[k], arr[k], + (MARK_REFS_FOLLOW_DUPS | MARK_REFS_RETURN_VAL))) + break; + /* If that is not possible and some DIEs couldn't be included, + fallback to assume other DIEs won't be included. */ + if (k < j) + { + for (k = i; k < j; k++) + if (arr[k]->die_ref_seen == 2) + arr[k]->die_ref_seen = 0; + for (k = i; k < j; k++) + if (arr[k]->die_ref_seen == 0) + { + arr[k]->die_ref_seen = 2; + if (!mark_refs (die_cu (arr[k]), arr[k], arr[k], + (MARK_REFS_FOLLOW_DUPS + | MARK_REFS_RETURN_VAL))) + arr[k]->die_ref_seen = 0; + } + } + } + if (namespaces) + { + for (k = i; k < j; k++) + for (ref = arr[k]->die_parent; ref->die_named_namespace; + ref = ref->die_parent) + ref->die_dup = NULL; + } + orig_size = size * cnt; + /* Estimated size of CU header and DW_TAG_partial_unit + with DW_AT_stmt_list and DW_AT_comp_dir attributes + 21 (also child end byte). With DW_AT_language c++, 22. */ + size_t pu_size + = (/* CU Header: unit length (initial length). + 32-bit DWARF: 4 bytes, 64-bit DWARF: 12 bytes. */ + 4 + /* CU Header: version (uhalf). + 2 bytes. */ + + 2 + /* CU Header: debug_abbrev_offset (section offset). + 32-bit DWARF: 4 bytes, 64-bit DWARF: 8 bytes. */ + + 4 + /* CU Header: address_size (ubyte). + 1 byte. */ + + 1 + /* DWARF5 CU header: unit_type (ubyte). */ + + (die_cu (arr[i])->cu_version >= 5 ? 1 : 0) + /* CU Root DIE: abbreviation code (unsigned LEB128). + 1 or more bytes. Optimistically assume 1. */ + + 1 + /* CU Root DIE: DW_AT_stmt_list (lineptr). + 32-bit DWARF: 4 bytes, 64-bit DWARF: 8 bytes. */ + + 4 + /* CU Root DIE: DW_AT_comp_dir (string). + DW_FORM_strp: 32-bit DWARF: 4 bytes, 64-bit DWARF: 8 bytes. + DW_FORM_string: 1 or more bytes. + Assume 4 bytes. */ + + 4 + /* CU Root DIE: DW_AT_language (constant). + 1 or 2 bytes. */ + + ((uni_lang_p || part_lang) + ? nr_bytes_for (die_cu (arr[i])->lang) + : 0) + /* CU root DIE children terminator: abbreviation code 0 + (unsigned LEB128). + 1 byte. */ + + 1); + /* DW_TAG_imported_unit with DW_AT_import attribute + (5 or 9 bytes (the latter for DWARF2 and ptr_size 8)). */ + size_t import_size + = (die_cu (arr[i])->cu_version == 2 ? 1 + ptr_size : 5); + /* For DW_TAG_namespace or DW_TAG_module needed as + parents of the DIEs conservatively assume 10 bytes + for the abbrev index, DW_AT_name attribute and + DW_AT_sibling attribute and child end. */ + size_t namespace_size = 10; + new_size = (/* Size of DIEs. */ + size + /* Size of PU. */ + + pu_size + /* Size of imports. */ + + (part_lang != 0 ? 0 : import_size * cnt) + /* Size of namespace DIEs. */ + + namespace_size * namespaces); + if (!second_phase) + force = ((deduplication_mode == dm_inter_cu) + && (ignore_size || orig_size > new_size)); + if (force) + { + dw_die_ref die, *diep; + dw_cu_ref refcu = die_cu (arr[i]); + dw_cu_ref partial_cu = pool_alloc (dw_cu, sizeof (struct dw_cu)); + memset (partial_cu, '\0', sizeof (*partial_cu)); + if (stats_p) + { + if (!second_phase) + stats->pu_ph1_cnt++; + else + stats->pu_ph2_cnt++; + } + partial_cu->cu_kind = CU_PU; + partial_cu->cu_offset = *last_partial_cu == NULL + ? 0 : (*last_partial_cu)->cu_offset + 1; + if (dump_pus_p) + fprintf (stderr, "Partial unit (%s) @ 0x%x:\n", + second_phase ? "phase two" : "phase one", + partial_cu->cu_offset); + partial_cu->cu_version = refcu->cu_version; + if (uni_lang_p) + partial_cu->lang = refcu->lang; + if (*first_partial_cu == NULL) + *first_partial_cu = *last_partial_cu = partial_cu; + else + { + (*last_partial_cu)->cu_next = partial_cu; + *last_partial_cu = partial_cu; + } + die = pool_alloc (dw_die, sizeof (struct dw_die)); + memset (die, '\0', sizeof (*die)); + die->die_toplevel = 1; + partial_cu->cu_die = die; + die->die_tag = DW_TAG_partial_unit; + die->die_offset = -1U; + die->die_root = 1; + die->die_parent = (dw_die_ref) partial_cu; + die->die_nextdup = refcu->cu_die; + die->die_size = 9; + diep = &die->die_child; + for (k = i; k < j; k++) + { + dw_die_ref child; + if (second_phase && !arr[k]->die_ref_seen) + continue; + if (dump_pus_p) + dump_die (arr[k]); + child = copy_die_tree (die, arr[k]); + if (stats_p) + stats->pu_toplevel_die_cnt++; + for (ref = arr[k]->die_nextdup; ref; ref = ref->die_nextdup) + ref->die_dup = child; + if (unlikely (verify_dups_p)) + verify_dups (child, odr_mode == ODR_BASIC); + if (part_lang != 0) + { + die->die_tag = DW_TAG_compile_unit; + partial_cu->lang = part_lang; + } + if (namespaces) + { + for (ref = arr[k]->die_parent; + ref->die_named_namespace && ref->die_dup == NULL; + ref = ref->die_parent) + { + dw_die_ref namespc + = pool_alloc (dw_die, sizeof (struct dw_die)); + memset (namespc, '\0', sizeof (struct dw_die)); + namespc->die_toplevel = 1; + namespc->die_tag = ref->die_tag; + namespc->die_offset = -1U; + namespc->die_nextdup = ref; + namespc->die_child = child; + namespc->die_parent = die; + namespc->die_size = 9; + namespc->die_named_namespace = 1; + child->die_parent = namespc; + ref->die_dup = namespc; + child = namespc; + } + if (ref->die_dup != NULL) + { + dw_die_ref *diep2; + for (diep2 = &ref->die_dup->die_child->die_sib; + *diep2; diep2 = &(*diep2)->die_sib) + ; + *diep2 = child; + child->die_parent = ref->die_dup; + continue; + } + } + *diep = child; + diep = &child->die_sib; + } + if (namespaces) + { + for (k = i; k < j; k++) + { + if (second_phase && !arr[k]->die_ref_seen) + continue; + for (ref = arr[k]->die_parent; + ref->die_named_namespace; ref = ref->die_parent) + ref->die_dup = NULL; + } + } + } + else if (!second_phase) + ret = true; + if (second_phase) + { + dw_die_ref next; + for (k = i; k < j; k++) + { + if (arr[k]->die_dup != NULL) + continue; + for (ref = arr[k]; ref; ref = next) + { + dw_cu_ref refcu = die_cu (ref); + next = ref->die_nextdup; + ref->die_dup = NULL; + ref->die_nextdup = NULL; + ref->die_remove = 0; + /* If there are dups within a single CU + (arguably a bug in the DWARF producer), + keep them linked together, but don't link + DIEs across different CUs. */ + while (deduplication_mode != dm_none + && next && refcu == die_cu (next)) + { + dw_die_ref cur = next; + next = cur->die_nextdup; + cur->die_dup = ref; + cur->die_nextdup = ref->die_nextdup; + ref->die_nextdup = cur; + } + } + } + } + } + return ret; +} + +/* Partition the duplicate chains in array ARR with size VEC_SIZE, and store + the partitions on obstack ob2, with for each partition two entries: + the start and the number of unique reffer CUs. */ +static void +calculate_partitions (dw_die_ref *arr, size_t vec_size) +{ + size_t i, j; + for (i = 0; i < vec_size; i = j) + { + size_t cnt = 0; + for (j = i + 1; j < vec_size; j++) + { + size_t this_cnt; + if (!same_ref_cus_p (arr[i], arr[j], &this_cnt)) + break; + cnt = this_cnt; + } + if (cnt == 0) + cnt = cnt_ref_cus (arr[i]); + obstack_grow (&ob2, &i, sizeof (size_t)); + obstack_grow (&ob2, &cnt, sizeof (size_t)); + } + + /* Add element to mark end of partition list. This allows us to do + 'j = partitions[idx + 2]' for all partitions. */ + obstack_grow (&ob2, &j, sizeof (size_t)); + size_t zero = 0; + obstack_grow (&ob2, &zero, sizeof (size_t)); +} + +static inline void FORCE_INLINE +reset_die_ref_seen (void) +{ + dw_die_ref die; + dw_cu_ref cu; + FOREACH_CU_NORMAL_LOW_TOPLEVEL_DIE (cu, die) + die->die_ref_seen = 0; +} + +/* If the duplicate chain DIE consists of a singleton ODR_DEF die merged with + the ODR_DECL chain, return the singleton ODR_DEF die. Otherwise, return + NULL. */ +static inline dw_die_ref FORCE_INLINE +merged_singleton (dw_die_ref die) +{ + dw_die_ref res = NULL; + dw_die_ref d; + size_t decl_cnt = 0; + + for (d = die; d; d = d->die_nextdup) + switch (die_odr_state (d)) + { + case ODR_DEF: + if (res) + { + if (die_cu (res) == die_cu (d)) + continue; + else + return NULL; + } + else + res = d; + break; + case ODR_DECL: + decl_cnt++; + break; + default: + return NULL; + } + + if (decl_cnt == 0) + return NULL; + + return res; +} + +/* Decide what DIEs matching in multiple CUs might be worthwhile + to be moved into partial units, construct those partial units. */ +static int +partition_dups (void) +{ + dw_cu_ref cu, first_partial_cu = NULL, last_partial_cu = NULL; + size_t vec_size, i; + unsigned char *to_free; + dw_die_ref *arr; + + if (unlikely (fi_multifile)) + return 0; + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "partition_dups\n"); + } + + to_free = obstack_alloc (&ob2, 1); + + if (odr_active_p) + odr_phase = 2; + + for (cu = first_cu; cu; cu = cu->cu_next) + partition_find_dups (&ob2, cu->cu_die); + vec_size = obstack_object_size (&ob2) / sizeof (void *); + + if (odr_active_p) + { + arr = (dw_die_ref *) obstack_base (&ob2); + if (progress_p) + { + report_progress (); + fprintf (stderr, "partition_dups split_dups\n"); + } + for (i = 0; i < vec_size; i++) + { + dw_die_ref die = arr[i]; + if (die_odr_state (die) == ODR_NONE) + continue; + die = split_dups (die, &ob2); + assert (die != NULL); + if (unlikely (verify_dups_p)) + verify_dups (die, true); + arr = (dw_die_ref *) obstack_base (&ob2); + arr[i] = die; + } + + vec_size = obstack_object_size (&ob2) / sizeof (void *); + + reset_die_ref_seen (); + for (i = 0; i < vec_size; i++) + { + dw_die_ref die = arr[i]; + if (die->die_dup == NULL + && die->die_nextdup == NULL) + die->die_ref_seen = 1; + } + for (i = 0; i < vec_size; i++) + { + dw_die_ref die = arr[i]; + if (die->die_dup == NULL + && die->die_nextdup == NULL) + mark_singletons (die_cu (die), die, die, &ob2); + else if (odr_mode != ODR_BASIC + && die_odr_state (die) != ODR_NONE) + { + dw_die_ref s = merged_singleton (die); + if (s) + mark_singletons (die_cu (s), s, s, &ob2); + } + else if (cnt_ref_cus (die) == 1) + mark_singletons (die_cu (die), die, die, &ob2); + + arr = (dw_die_ref *) obstack_base (&ob2); + } + + vec_size = obstack_object_size (&ob2) / sizeof (void *); + } + + if (odr_active_p) + odr_phase = 3; + + if (stats_p) + print_dups_stats (); + + if (vec_size != 0) + { + arr = (dw_die_ref *) obstack_finish (&ob2); + if (odr_active_p) + for (i = 0; i < vec_size; ++i) + { + assert (arr[i] != NULL); + if (unlikely (verify_dups_p)) + verify_dups (arr[i], true); + } + if (dump_dups_p) + { + for (i = 0; i < vec_size; ++i) + { + fprintf (stderr, "duplicate chain:\n"); + dump_dups (arr[i]); + } + } + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "partition_dups qsort\n"); + } + qsort (arr, vec_size, sizeof (dw_die_ref), partition_cmp); + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "partition_dups after qsort\n"); + } + + size_t *partitions = (size_t *) obstack_base (&ob2); + calculate_partitions (arr, vec_size); + size_t nr_partitions + = (obstack_object_size (&ob2) / sizeof (size_t)) / 2 - 1; + partitions = (size_t *) obstack_finish (&ob2); + if (stats_p) + stats->part_cnt += nr_partitions; + + if (odr_active_p && odr_mode != ODR_BASIC) + for (i = 0; i < vec_size; ++i) + arr[i] = reorder_dups (arr[i]); + if (partition_dups_1 (arr, nr_partitions, partitions, &first_partial_cu, + &last_partial_cu, false)) + { + for (i = 0; i < vec_size; i++) + arr[i]->die_ref_seen = arr[i]->die_dup != NULL; + for (i = 0; i < vec_size; i++) + if (arr[i]->die_dup != NULL) + mark_refs (die_cu (arr[i]), arr[i], arr[i], + MARK_REFS_FOLLOW_DUPS); + partition_dups_1 (arr, nr_partitions, partitions, &first_partial_cu, + &last_partial_cu, true); + for (i = 0; i < vec_size; i++) + arr[i]->die_ref_seen = 0; + } + } + if (first_partial_cu) + { + last_partial_cu->cu_next = first_cu; + first_cu = first_partial_cu; + } + obstack_free (&ob2, to_free); + + if (stats_p) + print_part_stats (); + + return 0; +} + +/* The create_import_tree function below and all its helper + data structures and functions attempt to optimize the size of + DW_TAG_imported_unit DIEs, from the initial assumption that + each CU that needs to include some newly created DW_TAG_partial_unit + will contain DW_TAG_imported_unit for each such partial unit (PU) + (so basically a bipartite graph with CUs and PUs as nodes + and DW_TAG_imported_unit DIEs as edges) into a tree, where some + of the partial units may also include DW_TAG_imported_unit + DIEs, or when beneficial new PUs are created to hold some + DW_TAG_imported_unit DIEs. */ + +struct import_edge; + +/* Structure describing details about a CU or PU (i.e. a node + in the graph). */ +struct import_cu +{ + /* Corresponding CU. CU->u1.cu_icu points back to this + structure while in create_import_tree. */ + dw_cu_ref cu; + /* Linked list of incoming resp. outgoing edges. */ + struct import_edge *incoming, *outgoing; + /* The tail of the linked list of incoming edges. */ + struct import_edge *incoming_tail; + /* Next import_cu (used to chain PUs together). */ + struct import_cu *next; + /* Number of incoming resp. outgoing edges. */ + unsigned int incoming_count, outgoing_count; + /* Index. Lowest indexes are assigned to partition_dups + created PUs (sorted by decreasing number of incoming + edges at the start), then referencing CUs + (similarly, sorted by decreasing number of outgoing + edges at the start), then optionally any PUs + created by create_import_tree. */ + unsigned int idx; +}; + +/* An edge in a linked list. */ +struct import_edge +{ + struct import_cu *icu; + struct import_edge *next; +}; + +/* Called through qsort to sort an array of edges by decreasing + incoming resp. outgoing_count (this is called when the graph + is bipartite, so CUs only have non-zero outgoing_count + and PUs only have non-zero incoming_count). */ +static int +import_edge_cmp (const void *p, const void *q) +{ + struct import_edge *e1 = (struct import_edge *) p; + struct import_edge *e2 = (struct import_edge *) q; + if (e1->icu->incoming_count > e2->icu->incoming_count) + return -1; + if (e1->icu->incoming_count < e2->icu->incoming_count) + return 1; + if (e1->icu->outgoing_count > e2->icu->outgoing_count) + return -1; + if (e1->icu->outgoing_count < e2->icu->outgoing_count) + return 1; + /* The rest is just to keep qsort stable. */ + if (e1->icu->cu->cu_offset < e2->icu->cu->cu_offset) + return -1; + if (e1->icu->cu->cu_offset > e2->icu->cu->cu_offset) + return 1; + return 0; +} + +/* Called through qsort to sort an array of CUs/PUs by decreasing + incoming resp. outgoing_count (this is called when the graph + is bipartite, so CUs only have non-zero outgoing_count + and PUs only have non-zero incoming_count). */ +static int +import_cu_cmp (const void *p, const void *q) +{ + struct import_cu *c1 = *(struct import_cu **) p; + struct import_cu *c2 = *(struct import_cu **) q; + if (c1->incoming_count > c2->incoming_count) + return -1; + if (c1->incoming_count < c2->incoming_count) + return 1; + if (c1->outgoing_count > c2->outgoing_count) + return -1; + if (c1->outgoing_count < c2->outgoing_count) + return 1; + /* The rest is just to keep qsort stable. */ + if (c1->cu->cu_offset < c2->cu->cu_offset) + return -1; + if (c1->cu->cu_offset > c2->cu->cu_offset) + return 1; + return 0; +} + +/* Freelist for removed edges. */ +static struct import_edge *edge_freelist; + +/* Prepare edge E to add to edge_freelist. */ +static inline void FORCE_INLINE +prepare_free_edge (struct import_edge *e UNUSED) +{ +#if DEVEL + e->icu = (void *)(uintptr_t)-1; +#endif +} + +/* Add edge E to edge_freelist. */ +static inline void FORCE_INLINE +free_edge (struct import_edge *e) +{ + prepare_free_edge (e); + e->next = edge_freelist; + edge_freelist = e; +} + +/* Add edge list starting at HEAD and ending at TAIL to edge_freelist. + Assume that prepare_free_edge has been called on all elements. */ +static inline void FORCE_INLINE +free_edges (struct import_edge *head, struct import_edge *tail) +{ +#if DEVEL + if (verify_edge_freelist) + { + struct import_edge *e; + for (e = head; e; e = e->next) + { + assert (e->icu == (void *)(uintptr_t)-1); + if (e == tail) + break; + } + assert (e != NULL); + } +#endif + tail->next = edge_freelist; + edge_freelist = head; +} + +/* Detach an edge from edge_freelist, and return it. */ +static inline struct import_edge * FORCE_INLINE +edge_from_freelist (void) +{ +#if DEVEL + assert (edge_freelist); +#endif + struct import_edge *e = edge_freelist; + edge_freelist = edge_freelist->next; +#if DEVEL + e->next = (void *)(uintptr_t)-1; +#endif + return e; +} + +/* Return edge_freelist, and set it to NULL. */ +static inline struct import_edge * FORCE_INLINE +first_edge_from_freelist (void) +{ +#if DEVEL + assert (edge_freelist); +#endif + struct import_edge *e = edge_freelist; +#if DEVEL + edge_freelist = NULL; +#endif + return e; +} + +/* Set edge_freelist to TAIL->next and return HEAD. Assume HEAD was returned + by first_edge_from_freelist, and TAIL is reachable from HEAD. */ +static inline struct import_edge * FORCE_INLINE +last_edge_from_freelist (struct import_edge *head, struct import_edge *tail) +{ +#if DEVEL + assert (!edge_freelist); + if (verify_edge_freelist) + { + struct import_edge *e; + for (e = head; e; e = e->next) + { + if (e == tail) + break; + } + assert (e != NULL); + } +#endif + edge_freelist = tail->next; + tail->next = NULL; + return head; +} + +/* Remove edges in linked list EP that refer to CUS, which + is an array of CUCOUNT CUs/PUs. If ADD is true, additionally + add a new edge at the end of the linked list and return it. */ +static struct import_edge * +remove_import_edges (struct import_edge **ep, struct import_edge **ep_tail, + struct import_cu **cus, unsigned int cucount, bool add) +{ + unsigned int i = 0; + struct import_edge *e, *efirst = NULL, *prev = NULL; + while (*ep) + if (i < cucount && (*ep)->icu == cus[i]) + { + e = *ep; + *ep = e->next; + if (efirst == NULL) + efirst = e; + else + free_edge (e); + i++; + if (ep_tail && *ep_tail == e) + *ep_tail = prev; + if (i == cucount && !add) + return NULL; + } + else + { + if (ep_tail) + prev = *ep; + ep = &(*ep)->next; + } + assert (i == cucount); + *ep = efirst; + efirst->next = NULL; + if (ep_tail) + *ep_tail = efirst; + return efirst; +} + +static void +dump_edges_1 (struct import_cu *ipu) +{ + fprintf (stderr, "idx: %u\n", ipu->idx); + fprintf (stderr, "cu: 0x%x\n", ipu->cu->cu_offset); + struct import_edge *e1; + for (e1 = ipu->incoming; e1; e1 = e1->next) + fprintf (stderr, "incoming: %u\n", e1->icu->idx); + for (e1 = ipu->outgoing; e1; e1 = e1->next) + fprintf (stderr, "outgoing: %u\n", e1->icu->idx); +} + +static void +dump_edges (const char *msg, struct import_cu **ipus, unsigned int npus, + unsigned int ncus) +{ + struct import_cu *ipu; + unsigned int i; + fprintf (stderr, "PRINT_EDGES: %s\n", msg); + fprintf (stderr, "PUs\n"); + for (ipu = ipus[0]; ipu; ipu = ipu->next) + dump_edges_1 (ipu); + fprintf (stderr, "CUs\n"); + for (i = 0; i < ncus; i++) + dump_edges_1 (ipus[i + npus]); +} + +/* Enumerate the different kinds of nodes in the import_cu/import_edge + graph. */ +enum node_kind { NODE_CU, NODE_PU_INITIAL, NODE_PU_NEW }; + +/* Return the node kind for node IDX, given that: + - [0, NPUS - 1] are initial PUs, + - [NPUS, NPUS + NCUS - 1] are CUs, and + - [NPUS + NCUS, ] are new PUs. */ +static enum node_kind +get_node_kind (unsigned int idx, unsigned int npus, unsigned int ncus) +{ + if (idx < npus) + return NODE_PU_INITIAL; + if (idx < npus + ncus) + return NODE_CU; + return NODE_PU_NEW; +} + +/* Verify an edge from SRC to DEST during create_import_tree phase PHASE. */ +static void +verify_edge (enum node_kind src, enum node_kind dest, unsigned int phase) +{ + if (phase == 1) + { + assert (src == NODE_CU && dest == NODE_PU_INITIAL); + return; + } + + assert (IMPLIES (src == NODE_CU, dest != NODE_CU)); + + if (phase == 2) + { + assert (IMPLIES (src == NODE_PU_NEW, dest == NODE_PU_INITIAL)); + assert (src != NODE_PU_INITIAL); + } + else + assert (IMPLIES (src == NODE_PU_NEW, dest != NODE_CU)); +} + +/* Helper function for debugging create_import_tree. Verify + various invariants for CU/PU IPU. */ +static void +verify_edges_1 (struct import_cu *ipu, unsigned int *ic, unsigned int *oc, + enum node_kind kind, unsigned int npus, unsigned int ncus, + unsigned int phase) +{ + struct import_edge *e1, *e2; + unsigned int last_idx, count; + enum node_kind kind2; + + for (last_idx = 0, count = 0, e1 = ipu->incoming; + e1; + last_idx = e1->icu->idx, count++, e1 = e1->next) + { + /* Verify that incoming edges are in ascending idx order. */ + assert (count == 0 || e1->icu->idx > last_idx); + + /* Verify that each incoming edge has a corresponding outgoing edge. */ + for (e2 = e1->icu->outgoing; e2; e2 = e2->next) + if (e2->icu == ipu) + break; + assert (e2); + + kind2 = get_node_kind (e1->icu->idx, npus, ncus); + verify_edge (kind2, kind, phase); + + if (count == ipu->incoming_count - 1) + assert (ipu->incoming_tail == e1); + } + + /* Verify the number of incoming edges. */ + assert (ipu->incoming_count == count); + + for (last_idx = 0, count = 0, e1 = ipu->outgoing; + e1; + last_idx = e1->icu->idx, count++, e1 = e1->next) + { + /* Verify that outgoing edges are in ascending idx order. */ + assert (count == 0 || e1->icu->idx > last_idx); + + /* Verify that each outgoing edge has a corresponding incoming edge. */ + for (e2 = e1->icu->incoming; e2; e2 = e2->next) + if (e2->icu == ipu) + break; + assert (e2); + + kind2 = get_node_kind (e1->icu->idx, npus, ncus); + verify_edge (kind, kind2, phase); + } + + /* Verify the number of outgoing edges. */ + assert (ipu->outgoing_count == count); + + *ic += ipu->incoming_count; + *oc += ipu->outgoing_count; +} + +/* Helper function for debugging create_import_tree. Call verify_edges_1 + on all CUs and PUs. */ +static void +verify_edges (struct import_cu **ipus, unsigned int npus, unsigned int ncus, + unsigned int phase) +{ + struct import_cu *ipu; + unsigned int i, ic, oc; + + ic = 0; + oc = 0; + + /* Verify initial PUs. */ + ipu = NULL; + for (i = 0; i < npus; ++i) + { + ipu = ipus[i]; + assert (ipu->cu != NULL); + if (i < npus - 1) + assert (ipu->next == ipus[i + 1]); + assert (ipu->incoming != NULL); + if (phase <= 2) + assert (ipu->outgoing == NULL); + verify_edges_1 (ipu, &ic, &oc, NODE_PU_INITIAL, npus, ncus, phase); + } + + /* Verify new PUs. */ + assert (ipu != NULL); + for (ipu = ipu->next; ipu; ipu = ipu->next) + { + assert (phase != 1); + assert (ipu->cu == NULL); + assert (ipu->incoming != NULL); + assert (ipu->outgoing != NULL); + verify_edges_1 (ipu, &ic, &oc, NODE_PU_NEW, npus, ncus, phase); + } + + /* Verify CUs. */ + for (i = 0; i < ncus; i++) + { + ipu = ipus[npus + i]; + assert (ipu->cu != NULL); + assert (ipu->next == NULL); + assert (ipu->incoming == NULL); + assert (ipu->outgoing != NULL); + verify_edges_1 (ipu, &ic, &oc, NODE_CU, npus, ncus, phase); + } + + /* Verify that the overall number of incoming and outgoing edges is + equal. */ + assert (ic == oc); +} + +#define BITVECTOR_TYPE unsigned int + +/* Return a bitvector containing NBITS bits. */ +static inline BITVECTOR_TYPE * +bitvector_alloc (unsigned nbits) +{ + size_t nbytes = (nbits / 8) + 1; + size_t size = nbytes + sizeof (BITVECTOR_TYPE); + BITVECTOR_TYPE *res = (BITVECTOR_TYPE *)malloc (size); + if (res == NULL) + dwz_oom (); + memset (res, 0, size); + return res; +} + +/* Set bit IDX in bitvector VECTOR. */ +static inline void FORCE_INLINE +bitvector_set_bit (BITVECTOR_TYPE *vector, unsigned idx) +{ + unsigned div = idx / (sizeof (BITVECTOR_TYPE) * 8); + unsigned mod = idx % (sizeof (BITVECTOR_TYPE) * 8); + vector[div] |= (1U << mod); +} + +/* Test bit IDX in bitvector VECTOR. */ +static inline bool FORCE_INLINE +bitvector_bit_p (BITVECTOR_TYPE *vector, unsigned idx) +{ + unsigned div = idx / (sizeof (BITVECTOR_TYPE) * 8); + unsigned mod = idx % (sizeof (BITVECTOR_TYPE) * 8); + return (vector[div] & (1U << mod)) != 0; +} + +/* Clear at least bits [A, B] in VECTOR, possibly more. */ +static inline void FORCE_INLINE +bitvector_clear_bits (BITVECTOR_TYPE *vector, unsigned int a, unsigned int b) +{ + unsigned int range_min = a / (sizeof (BITVECTOR_TYPE) * 8); + unsigned int range_max = b / (sizeof (BITVECTOR_TYPE) * 8); + memset (&vector[range_min], 0, + (range_max - range_min + 1) * sizeof (BITVECTOR_TYPE)); +} + +/* Function to optimize the size of DW_TAG_imported_unit DIEs by + creating an inclusion tree, instead of each CU importing all + PUs it needs directly, by optionally creating new PUs or + adding DW_TAG_imported_unit to the already created PUs. + At the end this function constructs any new PUs needed, and + adds DW_TAG_imported_unit DIEs to them as well as the CUs + and partition_dups created PUs. */ +static int +create_import_tree (void) +{ + dw_cu_ref pu, cu, last_partial_cu = NULL; + unsigned int i, new_pu_version = 2, min_cu_version, npus, ncus; + struct import_cu **ipus, *ipu, *icu; + unsigned int cu_off; + unsigned int puidx; + struct import_cu *last_pu, *pu_freelist = NULL; + unsigned char *to_free; + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "create_import_tree phase 1\n"); + } + + /* size doesn't count anything already created before this + function (partial units etc.) or already preexisting, just + initially the cumulative sizes of DW_TAG_imported_unit DIEs + that would need to be added, and if some new DW_TAG_partial_unit + CUs are going to be created as a result of this routine, that size + too. DW_TAG_imported_unit has size 5 (for DWARF3+) or 1 + ptr_size + (DWARF2), DW_TAG_partial_unit has size 13/14 (11 CU header + 1 byte + abbrev number + 1 byte child end + 1 byte for DWARF5 unit_type). */ + unsigned int size = 0; + /* Size of DW_TAG_imported_unit if the same everywhere, otherwise + (mixing DWARF2 and DWARF3+ with ptr_size != 4) 0. */ + unsigned int edge_cost = 0; + /* Number of bytes needed for outgoing edges of PUs created by + this function (which all have DWARF version new_pu_version). */ + unsigned int new_edge_cost; + + /* If no PUs were created, there is nothing to do here. */ + if (first_cu == NULL || (fi_multifile ? alt_first_cu == NULL + : first_cu->cu_kind != CU_PU)) + return 0; + + edge_freelist = NULL; + to_free = obstack_alloc (&ob2, 1); + min_cu_version = first_cu->cu_version; + /* First construct a bipartite graph between CUs and PUs. */ + for (pu = fi_multifile ? alt_first_cu : first_cu, npus = 0; + pu && pu->cu_kind != CU_NORMAL; pu = pu->cu_next) + { + dw_die_ref die, rdie; + dw_cu_ref prev_cu; + + if (pu->cu_die->die_tag == DW_TAG_compile_unit) + continue; + + last_partial_cu = pu; + for (rdie = pu->cu_die->die_child; + rdie->die_named_namespace; rdie = rdie->die_child) + ; + if (unlikely (fi_multifile) && rdie->die_nextdup == NULL) + { + pu->u1.cu_icu = NULL; + continue; + } + npus++; + if (pu->cu_version > new_pu_version) + new_pu_version = pu->cu_version; + if (pu->cu_version < min_cu_version) + min_cu_version = pu->cu_version; + ipu = (struct import_cu *) obstack_alloc (&ob2, sizeof (*ipu)); + memset (ipu, 0, sizeof (*ipu)); + ipu->cu = pu; + pu->u1.cu_icu = ipu; + assert (rdie->die_toplevel); + dw_die_ref firstdie = NULL; + dw_cu_ref firstdiecu = NULL; + for (die = rdie->die_nextdup, prev_cu = NULL; + die; die = die->die_nextdup) + { + dw_cu_ref diecu = die_cu (die); + if (firstdie == NULL) + { + firstdie = die; + firstdiecu = die_cu (firstdie); + } + if (diecu == prev_cu || (die != firstdie && diecu == firstdiecu)) + continue; + ipu->incoming_count++; + size += 1 + (diecu->cu_version == 2 ? ptr_size : 4); + prev_cu = diecu; + } + ipu->incoming = (struct import_edge *) + obstack_alloc (&ob2, + ipu->incoming_count + * sizeof (*ipu->incoming)); + firstdie = NULL; + firstdiecu = NULL; + for (die = rdie->die_nextdup, i = 0, prev_cu = NULL; + die; die = die->die_nextdup) + { + dw_cu_ref diecu = die_cu (die); + if (firstdie == NULL) + { + firstdie = die; + firstdiecu = die_cu (firstdie); + } + if (diecu == prev_cu || (die != firstdie && diecu == firstdiecu)) + continue; + icu = diecu->u1.cu_icu; + if (icu == NULL) + { + icu = (struct import_cu *) + obstack_alloc (&ob2, sizeof (*ipu)); + memset (icu, 0, sizeof (*icu)); + icu->cu = diecu; + diecu->u1.cu_icu = icu; + } + ipu->incoming[i++].icu = icu; + icu->outgoing_count++; + prev_cu = diecu; + } + ipu->incoming_tail = &ipu->incoming[ipu->incoming_count - 1]; + } + if (npus == 0) + { + obstack_free (&ob2, to_free); + return 0; + } + for (cu = fi_multifile ? first_cu : pu, ncus = 0; cu; cu = cu->cu_next) + if (cu->u1.cu_icu) + { + ncus++; + if (cu->cu_version > new_pu_version) + new_pu_version = cu->cu_version; + if (cu->cu_version < min_cu_version) + min_cu_version = cu->cu_version; + cu->u1.cu_icu->outgoing + = (struct import_edge *) + obstack_alloc (&ob2, + cu->u1.cu_icu->outgoing_count + * sizeof (*cu->u1.cu_icu->outgoing)); + cu->u1.cu_icu->outgoing_count = 0; + } + if (ptr_size == 4 || min_cu_version > 2) + edge_cost = 5; + else if (new_pu_version == 2) + edge_cost = 1 + ptr_size; + new_edge_cost = new_pu_version == 2 ? 1 + ptr_size : 5; + for (pu = fi_multifile ? alt_first_cu : first_cu; + pu && pu->cu_kind != CU_NORMAL; pu = pu->cu_next) + { + ipu = pu->u1.cu_icu; + if (ipu == NULL) + continue; + for (i = 0; i < ipu->incoming_count; i++) + { + icu = ipu->incoming[i].icu; + icu->outgoing[icu->outgoing_count++].icu = ipu; + } + } + ipus = (struct import_cu **) + obstack_alloc (&ob2, (npus + ncus) * sizeof (*ipus)); + for (pu = fi_multifile ? alt_first_cu : first_cu, npus = 0; + pu && pu->cu_kind != CU_NORMAL; pu = pu->cu_next) + { + ipu = pu->u1.cu_icu; + if (ipu == NULL) + continue; + qsort (ipu->incoming, ipu->incoming_count, sizeof (*ipu->incoming), + import_edge_cmp); + for (i = 0; i < ipu->incoming_count; i++) + { + ipu->incoming[i].next + = i != ipu->incoming_count - 1 ? &ipu->incoming[i + 1] : NULL; + } + ipus[npus++] = ipu; + } + for (cu = fi_multifile ? first_cu : pu, ncus = 0; cu; cu = cu->cu_next) + if (cu->u1.cu_icu) + { + icu = cu->u1.cu_icu; + qsort (icu->outgoing, icu->outgoing_count, sizeof (*icu->outgoing), + import_edge_cmp); + for (i = 0; i < icu->outgoing_count - 1; i++) + icu->outgoing[i].next = &icu->outgoing[i + 1]; + icu->outgoing[i].next = NULL; + ipus[npus + ncus] = icu; + ncus++; + } + qsort (ipus, npus, sizeof (*ipus), import_cu_cmp); + qsort (ipus + npus, ncus, sizeof (*ipus), import_cu_cmp); + for (puidx = 0; puidx < npus; puidx++) + { + ipus[puidx]->idx = puidx; + if (puidx + 1 < npus) + ipus[puidx]->next = ipus[puidx + 1]; + } + for (; puidx < npus + ncus; puidx++) + ipus[puidx]->idx = puidx; + last_pu = ipus[npus - 1]; + if (unlikely (dump_edges_p)) + dump_edges ("phase 1", ipus, npus, ncus); + if (unlikely (verify_edges_p)) + verify_edges (ipus, npus, ncus, 1); + if (!import_opt_p) + goto opt_done; + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "create_import_tree phase 2\n"); + } + /* Now, for the above constructed bipartite graph, find K x,2 components + where x >= 5 (for DWARF3 and above or ptr_size 4, for DWARF2 and + ptr_size 8 it can be even x == 4) and add a new PU node, where all + CUs from the component will point to the new PU node and that new PU + will point to all the destination PUs. In theory with DWARF2 + and ptr_size 1 we could need x >= 9. + + The example below demonstrates the type of transformation. The + transformation is an optimization if the benefit of reducing the number + of imports (in other words, edges) is bigger than the cost of adding an + extra PU. OTOH, the transformation can be done in the presence of + additional incoming edges for PU_3 and PU_4. + + Before: After: + + CU_1---------->PU_3 CU_1 PU_3 + \ ^ ^ \ ^ + \ / / \ / + \ / / \ / + x----o / \ / + / \ / \ / + / \ / \ / + / \ / v / + CU_2 x CU_2----->PU_5 + \ / \ ^ \ + \ / \ / \ + \ / \ / \ + x----o \ / \ + / \ \ / \ + / \ \ / \ + / v v / v + CU_3---------->PU_4 CU_3 PU_4 + */ + for (i = 0; i < npus - 1; i++) + { + struct import_cu *pudst[2], *pusrc[10]; + struct import_edge *e1, *e2, *e3, *e4; + struct import_edge *e1next, *e2next, *e3next; + pudst[0] = ipus[i]; + for (e1 = pudst[0]->incoming; e1; e1 = e1next) + { + e1next = e1->next; + if (e1->icu->cu == NULL) + break; + for (e2 = e1->icu->outgoing; e2; e2 = e2next) + { + unsigned int srccount, dstcount, cost; + struct import_cu *npu = NULL; + struct import_edge **ep = NULL; + + e2next = e2->next; + if (e2->icu->idx <= pudst[0]->idx) + continue; + if (e2->icu->cu == NULL) + break; + + pudst[1] = e2->icu; + pusrc[0] = e1->icu; + srccount = 1; + cost = edge_cost; + if (!edge_cost) + cost = pusrc[0]->cu->cu_version == 2 ? 1 + ptr_size : 5; + for (e3 = e1next; e3; e3 = e3next) + { + e3next = e3->next; + if (e3->icu->cu == NULL) + break; + dstcount = 0; + for (e4 = e3->icu->outgoing; e4; e4 = e4->next) + { + if (e4->icu == pudst[0]) + dstcount++; + else if (e4->icu == pudst[1]) + { + dstcount++; + break; + } + else if (e4->icu->idx > pudst[1]->idx) + break; + } + if (dstcount != 2) + continue; + if (npu == NULL) + { + unsigned int header_size; + pusrc[srccount] = e3->icu; + header_size = (pusrc[srccount]->cu->cu_version >= 5 + ? 14 : 13); /* DWARF5 unit_type byte. */ + cost += edge_cost; + if (!edge_cost) + cost += pusrc[srccount]->cu->cu_version == 2 + ? 1 + ptr_size : 5; + srccount++; + if (ignore_size || ((dstcount - 1) * cost + > (header_size + + dstcount * new_edge_cost))) + { + unsigned int j; + + e2next = NULL; + if (pu_freelist) + { + npu = pu_freelist; + pu_freelist = pu_freelist->next; + } + else + npu = (struct import_cu *) + obstack_alloc (&ob2, sizeof (*npu)); + memset (npu, 0, sizeof (*npu)); + npu->incoming_count = srccount; + npu->outgoing_count = dstcount; + npu->idx = puidx++; + last_pu->next = npu; + last_pu = npu; + for (j = 0; j < srccount; j++) + { + if (e1next && e1next->icu == pusrc[j]) + e1next = e1next->next; + remove_import_edges (&pusrc[j]->outgoing, NULL, + pudst, dstcount, true)->icu + = npu; + pusrc[j]->outgoing_count -= dstcount - 1; + } + for (j = 0; j < dstcount; j++) + { + remove_import_edges (&pudst[j]->incoming, + &pudst[j]->incoming_tail, + pusrc, srccount, true)->icu + = npu; + pudst[j]->incoming_count -= srccount - 1; + } + npu->incoming = first_edge_from_freelist (); + for (j = 0, e4 = npu->incoming; j < srccount; j++) + { + e4->icu = pusrc[j]; + if (j == srccount - 1) + { + npu->incoming + = last_edge_from_freelist (npu->incoming, + e4); + npu->incoming_tail = e4; + ep = &e4->next; + } + else + e4 = e4->next; + } + npu->outgoing = first_edge_from_freelist (); + for (j = 0, e4 = npu->outgoing; j < dstcount; j++) + { + e4->icu = pudst[j]; + if (j == dstcount - 1) + npu->outgoing + = last_edge_from_freelist (npu->outgoing, e4); + else + e4 = e4->next; + } + size -= (dstcount - 1) * cost; + size += 13 + dstcount * new_edge_cost; + } + } + else + { + unsigned int j; + + pusrc[srccount] = e3->icu; + cost = edge_cost; + if (!edge_cost) + cost = pusrc[srccount]->cu->cu_version == 2 + ? 1 + ptr_size : 5; + if (e1next && e1next->icu == pusrc[srccount]) + e1next = e1next->next; + remove_import_edges (&pusrc[srccount]->outgoing, NULL, + pudst, dstcount, true)->icu = npu; + pusrc[srccount]->outgoing_count -= dstcount - 1; + for (j = 0; j < dstcount; j++) + { + remove_import_edges (&pudst[j]->incoming, + &pudst[j]->incoming_tail, + pusrc + srccount, 1, false); + pudst[j]->incoming_count--; + } + *ep = edge_from_freelist (); + npu->incoming_count++; + (*ep)->icu = pusrc[srccount]; + (*ep)->next = NULL; + npu->incoming_tail = *ep; + ep = &(*ep)->next; + size -= (dstcount - 1) * cost; + } + } + } + } + } + if (unlikely (dump_edges_p)) + dump_edges ("phase 2", ipus, npus, ncus); + if (unlikely (verify_edges_p)) + verify_edges (ipus, npus, ncus, 2); + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "create_import_tree phase 3\n"); + } + /* Try to merge PUs which have the same set of referrers if + beneficial. + + The example below demonstrates the type of transformation. The + transformation is an optimization because it reduces the number of import + statements (in other words, edges) as well as the number of PUs. It can + however not be done if PU_3 or PU_4 have additional incoming edges. + + Before: After: + + CU_1----->PU_3 CU_1 + \ ^ \ + \ / \ + \ / v + x PU_3_4 + / \ ^ + / \ / + / v / + CU_2----->PU_4 CU_2 + + Or, if one PU has a subset of referrers of the other, attempt to replace + all the incoming edges from the referrers intersection to the PU with + larger number of incoming edges by an edge from the other PU. + + The example below demonstrates the type of transformation. The + transformation is an optimization because it reduces the number of import + statements (in other words, edges). It can however not be done if PU_3 + has additional incoming edges. + + Before: After: + + CU_1----->PU_3 CU_1------>PU_3 + \ ^ ^ | + \ / / | + \ / / | + x / | + / \ / | + / \ / | + / \ / | + CU_2 \ CU_2 o + \ \ | + \ o | + \ | | + \ | | + \ | | + \ | | + v v v + CU_3----->PU_4 CU_3------>PU_4 + */ + /* Flag used during PU merging, set for PUs already considered + for merging for the given first PU. */ + BITVECTOR_TYPE *seen = bitvector_alloc (puidx); + unsigned int min_seen = UINT_MAX; + unsigned int max_seen = 0; + for (ipu = ipus[0]; ipu; ipu = ipu->next) + { + struct import_edge *e1, *e2, *e3, *e4, **e1p, **ep, *prev; + for (e1p = &ipu->incoming, e1 = *e1p; + e1; e1 = *e1p != e1 ? *e1p : (e1p = &e1->next, e1->next)) + { + for (e2 = e1->icu->outgoing; e2; e2 = e2->next) + { + unsigned int size_inc, size_dec; + struct import_cu *ipu2 = e2->icu, *ipusub, *ipusup; + /* True if IPU's src set might be a subset + of IPU2's src set. */ + bool maybe_subset; + /* True if IPU's src set might be a superset + of IPU2's src set. */ + bool maybe_superset; + unsigned int intersection; + + if (ipu2->idx <= ipu->idx || bitvector_bit_p (seen, ipu2->idx)) + continue; + bitvector_set_bit (seen, ipu2->idx); + min_seen = MIN (min_seen, ipu2->idx); + max_seen = MAX (max_seen, ipu2->idx); + maybe_subset = (e1 == ipu->incoming + && ipu->incoming_count <= ipu2->incoming_count); + maybe_superset = ipu->incoming_count >= ipu2->incoming_count; + if (maybe_superset) + { + /* If the referrer nodes of ipu are a superset of the + referrer nodes of ipu2, then ipu's last referrer node + should have index larger or equal to the last referrer + node of ipu2. */ + maybe_superset + = (ipu->incoming_tail->icu->idx + >= ipu2->incoming_tail->icu->idx); + } + if (maybe_subset) + { + /* If the referrer nodes of ipu are a subset of the + referrer nodes of ipu2, then ipu's last referrer node + should have index smaller or equal to the last referrer + node of ipu2. */ + maybe_subset + = (ipu->incoming_tail->icu->idx + <= ipu2->incoming_tail->icu->idx); + } + e3 = e1; + e4 = ipu2->incoming; + intersection = 0; + while ((maybe_subset || maybe_superset) && e3 && e4) + { + if (e3->icu == e4->icu) + { + intersection++; + e3 = e3->next; + e4 = e4->next; + continue; + } + if (e3->icu->idx < e4->icu->idx) + { + maybe_subset = false; + e3 = e3->next; + continue; + } + maybe_superset = false; + e4 = e4->next; + } + if (e3) + maybe_subset = false; + if (e4) + maybe_superset = false; + if ((!maybe_superset && !maybe_subset) || intersection < 2) + continue; + if (maybe_superset && maybe_subset) + { + if (unlikely (fi_multifile) && ipu2->idx < npus + ncus) + continue; + if (odr_active_p && odr_mode != ODR_BASIC + && ipu2->idx < npus + ncus) + continue; + /* If IPU and IPU2 have the same set of src nodes, then + (if beneficial, with edge_cost != 0 always), merge + IPU2 node into IPU, by removing all incoming edges + of IPU2 and moving over all outgoing edges of IPU2 + to IPU. */ + assert (ipu2->idx >= npus + ncus); + size_inc = 0; + if (edge_cost) + size_dec = 13 + ipu2->incoming_count * edge_cost; + else + { + size_dec = 13; + if (ipu->cu && ipu->cu->cu_version == 2) + { + if (ptr_size > 4) + size_inc = ipu2->outgoing_count * (ptr_size - 4); + else + size_dec += ipu2->outgoing_count * (4 - ptr_size); + } + for (e4 = ipu2->incoming; e4; e4 = e4->next) + size_dec += (e4->icu->cu + && e4->icu->cu->cu_version == 2) + ? 1 + ptr_size : 5; + } + if (!ignore_size || size_dec > size_inc) + { + struct import_cu **ipup; + for (e4 = ipu2->incoming, e3 = NULL; e4; e4 = e4->next) + { + remove_import_edges (&e4->icu->outgoing, NULL, &ipu2, + 1, false); + e4->icu->outgoing_count--; + prepare_free_edge (e4); + e3 = e4; + } + free_edges (ipu2->incoming, e3); + for (e4 = ipu2->outgoing; e4; e4 = e4->next) + { + for (ep = &e4->icu->incoming; *ep; ep = &(*ep)->next) + if ((*ep)->icu->idx >= ipu->idx) + break; + assert ((*ep)->icu != ipu); + if ((*ep)->icu == ipu2) + (*ep)->icu = ipu; + else + { + struct import_edge **ep2; + for (ep2 = &(*ep)->next; + *ep2; ep2 = &(*ep2)->next) + if ((*ep2)->icu == ipu2) + break; + e3 = *ep2; + *ep2 = e3->next; + e3->next = *ep; + *ep = e3; + e3->icu = ipu; + while (e4->icu->incoming_tail->next != NULL) + e4->icu->incoming_tail + = e4->icu->incoming_tail->next; + } + } + e3 = ipu->outgoing; + ep = &ipu->outgoing; + for (e4 = ipu2->outgoing; e3 && e4; ) + if (e3->icu->idx < e4->icu->idx) + { + *ep = e3; + ep = &e3->next; + e3 = e3->next; + } + else + { + assert (e3->icu != e4->icu); + *ep = e4; + ep = &e4->next; + e4 = e4->next; + } + if (e3) + *ep = e3; + else if (e4) + *ep = e4; + else + *ep = NULL; + ipu->outgoing_count += ipu2->outgoing_count; + size -= size_dec - size_inc; + if (ipu->idx >= npus + ncus) + ipup = &ipu->next; + else + ipup = &ipus[npus - 1]->next; + while (*ipup != ipu2) + ipup = &(*ipup)->next; + *ipup = ipu2->next; + ipu2->next = pu_freelist; + pu_freelist = ipu2; + continue; + } + } + if (maybe_superset) + { + ipusup = ipu; + ipusub = ipu2; + } + else + { + ipusub = ipu; + ipusup = ipu2; + } + /* If IPUSUB's src set is a subset of IPUSUP's src set + and intersection is at least 2, remove edges from + IPUSUB's src set to IPUSUP node and instead add + an edge from IPUSUB to IPUSUP. */ + size_inc = 0; + if (edge_cost) + size_dec = (ipusub->incoming_count - 1) * edge_cost; + else + { + size_inc = ipusub->cu && ipusub->cu->cu_version == 2 + ? 1 + ptr_size : 5; + size_dec = 0; + for (e3 = ipusub->incoming; e3; e3 = e3->next) + size_dec += (e3->icu->cu + && e3->icu->cu->cu_version == 2) + ? 1 + ptr_size : 5; + } + if (size_dec > size_inc + && (!fi_multifile || ipusub->idx >= npus + ncus)) + { + for (e3 = ipusub->incoming, ep = &ipusup->incoming, + prev = NULL; + e3; e3 = e3->next) + { + remove_import_edges (&e3->icu->outgoing, NULL, &ipusup, 1, + false); + e3->icu->outgoing_count--; + while ((*ep)->icu != e3->icu) + { + prev = *ep; + ep = &(*ep)->next; + } + e4 = *ep; + *ep = e4->next; + free_edge (e4); + if (ipusup->incoming_tail == e4) + ipusup->incoming_tail = prev; + } + for (ep = &ipusub->outgoing; *ep; ep = &(*ep)->next) + if ((*ep)->icu->idx >= ipusup->idx) + break; + assert (*ep == NULL || (*ep)->icu != ipusup); + e4 = edge_from_freelist (); + e4->icu = ipusup; + e4->next = *ep; + *ep = e4; + ipusub->outgoing_count++; + for (ep = &ipusup->incoming; *ep; ep = &(*ep)->next) + if ((*ep)->icu->idx >= ipusub->idx) + break; + assert (*ep == NULL || (*ep)->icu != ipusub); + e4 = edge_from_freelist (); + e4->icu = ipusub; + e4->next = *ep; + *ep = e4; + if (ipusup->incoming_tail->next == e4) + ipusup->incoming_tail = e4; + ipusup->incoming_count -= ipusub->incoming_count - 1; + size -= size_dec - size_inc; + if (ipusup == ipu) + break; + } + } + } + if (min_seen <= max_seen) + { + bitvector_clear_bits (seen, min_seen, max_seen); + min_seen = UINT_MAX; + max_seen = 0; + } + } + free (seen); + if (unlikely (dump_edges_p)) + dump_edges ("phase 3", ipus, npus, ncus); + if (unlikely (verify_edges_p)) + verify_edges (ipus, npus, ncus, 3); + opt_done: + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "create_import_tree phase 4 (create partial units)\n"); + } + /* Create DW_TAG_partial_unit (and containing dw_cu structures). */ + if (fi_multifile) + { + cu_off = 0; + last_partial_cu = NULL; + } + else + cu_off = last_partial_cu->cu_offset + 1; + for (ipu = ipus[npus - 1]->next; ipu; ipu = ipu->next) + { + dw_die_ref die; + dw_cu_ref partial_cu = pool_alloc (dw_cu, sizeof (struct dw_cu)); + memset (partial_cu, '\0', sizeof (*partial_cu)); + partial_cu->cu_kind = CU_PU; + partial_cu->cu_offset = cu_off++; + partial_cu->cu_version = new_pu_version; + partial_cu->u1.cu_icu = ipu; + if (unlikely (last_partial_cu == NULL)) + { + partial_cu->cu_next = first_cu; + first_cu = partial_cu; + } + else + { + partial_cu->cu_next = last_partial_cu->cu_next; + last_partial_cu->cu_next = partial_cu; + } + last_partial_cu = partial_cu; + die = pool_alloc (dw_die, sizeof (struct dw_die)); + memset (die, '\0', sizeof (struct dw_die)); + die->die_toplevel = 1; + partial_cu->cu_die = die; + die->die_tag = DW_TAG_partial_unit; + die->die_offset = -1U; + die->die_root = 1; + die->die_parent = (dw_die_ref) partial_cu; + die->die_size = 1; + ipu->cu = partial_cu; + } + /* Next add all needed DW_TAG_imported_unit DIEs. */ + for (cu = first_cu; cu; cu = cu->cu_next) + { + struct import_edge *e; + + icu = cu->u1.cu_icu; + if (icu == NULL) + continue; + for (e = icu->outgoing; e; e = e->next) + { + dw_die_ref *diep; + dw_die_ref die = pool_alloc (dw_die, sizeof (struct dw_die)); + memset (die, '\0', sizeof (*die)); + die->die_toplevel = 1; + die->die_tag = DW_TAG_imported_unit; + die->die_offset = -1U; + die->die_nextdup = e->icu->cu->cu_die; + die->die_parent = cu->cu_die; + assert (e->icu->cu->cu_die->die_tag == DW_TAG_partial_unit); + die->die_size = (cu->cu_version == 2 ? 1 + ptr_size : 5); + /* Put the new DW_TAG_imported_unit DIE after all typed DWARF + stack referenced base types and after all previously added + new DW_TAG_imported_unit DIEs. */ + for (diep = &die->die_parent->die_child; + *diep; diep = &(*diep)->die_sib) + if (!(*diep)->die_op_type_referenced + && ((*diep)->die_tag != DW_TAG_imported_unit + || (*diep)->die_offset != -1U)) + break; + die->die_sib = *diep; + *diep = die; + } + } + for (cu = first_cu; cu; cu = cu->cu_next) + cu->u1.cu_icu = NULL; + if (unlikely (fi_multifile)) + for (cu = alt_first_cu; cu; cu = cu->cu_next) + cu->u1.cu_icu = NULL; + obstack_free (&ob2, to_free); + return 0; +} + +/* Helper function for die_find_dup, when ORIG has collapsed children. */ +static dw_die_ref +die_find_collapsed_dup (dw_die_ref die, unsigned int *tick) +{ + dw_die_ref child, ret; + + for (child = die->die_child; child; child = child->die_sib) + if ((*tick)-- == 0) + return child; + else if (child->die_child == NULL) + continue; + else if ((ret = die_find_collapsed_dup (child, tick)) != NULL) + return ret; + (*tick)--; + return NULL; +} + +/* If DIE is equal to ORIG, return DUP, otherwise if DIE is + a child of ORIG, return corresponding child in DUP's subtree, + or return NULL. */ +static dw_die_ref +die_find_dup (dw_die_ref orig, dw_die_ref dup, dw_die_ref die) +{ + dw_die_ref orig_child, dup_child; + if (orig == die) + return dup; + if (orig->die_collapsed_children) + { + dw_die_ref ret; + unsigned int tick; + if (die->die_collapsed_child) + tick = die->die_tag - 1; + else + tick = die->die_ref_seen - 1; + assert (dup->die_collapsed_children == 0 + && die->die_parent == orig); + ret = die_find_collapsed_dup (dup, &tick); + assert (die->die_collapsed_child || ret->die_tag == die->die_tag); + return ret; + } + for (orig_child = orig->die_child, dup_child = dup->die_child; + orig_child; + orig_child = orig_child->die_sib, dup_child = dup_child->die_sib) + { + dw_die_ref ret = die_find_dup (orig_child, dup_child, die); + if (ret) + return ret; + } + return NULL; +} + +/* Return number of bytes needed to encode VAL using + uleb128. */ +static unsigned int +size_of_uleb128 (uint64_t val) +{ + unsigned int size; + for (size = 1; (val >>= 7) != 0; size++) + ; + return size; +} + +/* Return number of bytes needed to encode VAL using + sleb128. */ +static unsigned int +size_of_sleb128 (int64_t val) +{ + unsigned int size = 0; + unsigned char c; + do + { + c = val & 0x7f; + val >>= 7; + size++; + } + while ((val != 0 || (c & 0x40) != 0) + && (val != -1 || (c & 0x40) == 0)); + return size; +} + +/* Hash table mapping original file IDs to new ids. */ +static htab_t line_htab; +/* Current new maximum file ID. */ +static unsigned int max_line_id; + +struct line_entry +{ + /* File pointer. */ + struct dw_file *file; + /* Precomputed hash value. */ + unsigned int hash; + /* Corresponding new file ID. */ + unsigned int new_id; +}; +ALIGN_STRUCT (line_entry) + +/* Hash function in line_htab. */ +static hashval_t +line_hash (const void *p) +{ + struct line_entry *s = (struct line_entry *)p; + + return s->hash; +} + +/* Equality function in line_htab. */ +static int +line_eq (const void *p, const void *q) +{ + struct line_entry *s1 = (struct line_entry *)p; + struct line_entry *s2 = (struct line_entry *)q; + + if (s1->hash != s2->hash) + return 0; + if (s1->file == s2->file) + return 1; + if (strcmp (s1->file->file, s2->file->file) != 0) + return 0; + if ((s1->file->dir == NULL) ^ (s2->file->dir == NULL)) + return 0; + if (s1->file->dir && strcmp (s1->file->dir, s2->file->dir) != 0) + return 0; + return s1->file->time == s2->file->time && s1->file->size == s2->file->size; +} + +/* Map original file ID to new file ID. */ +static unsigned int +line_htab_lookup (dw_cu_ref cu, unsigned int id) +{ + void **slot; + struct line_entry le; + if (id == 0) + return 0; + assert (id <= cu->cu_nfiles); + le.file = &cu->cu_files[id - 1]; + hash_init_state (); + hash_update_state_object (le.file->time); + hash_update_state_object (le.file->size); + hash_update_state (le.file->file, strlen (le.file->file) + 1); + if (le.file->dir) + hash_update_state (le.file->dir, strlen (le.file->dir) + 1); + if (line_htab == NULL) + { + line_htab = htab_try_create (50, line_hash, line_eq, NULL); + if (line_htab == NULL) + dwz_oom (); + max_line_id = 1; + } + le.hash = hash_digest (); + slot = htab_find_slot_with_hash (line_htab, &le, le.hash, INSERT); + if (slot == NULL) + dwz_oom (); + if (*slot == NULL) + { + struct line_entry *l = pool_alloc (line_entry, sizeof (*l)); + l->file = le.file; + l->hash = le.hash; + l->new_id = max_line_id++; + *slot = (void *) l; + return l->new_id; + } + else + return ((struct line_entry *) *slot)->new_id; +} + +/* Hash table for finding duplicate .debug_macro opcode sequences. + This hash table is used with two different sets of hash/equality + callbacks. One is used either within handle_macro function (from within + optimize_multifile), or from handle_macro onwards (read_multifile). + The second set is used from read_macro onwards during fi_multifile. */ +static htab_t macro_htab; + +/* At the end of read_multifile macro_htab is copied to this variable. */ +static htab_t alt_macro_htab; + +struct macro_entry +{ + /* Start of the sequence. */ + unsigned char *ptr; + /* Precomputed hash value. LSB bit is used for a flag whether + a particular .debug_macro sequence is seen more than once. */ + unsigned int hash; + /* And it's length or 0 if non-shareable. */ + unsigned int len; +}; +ALIGN_STRUCT (macro_entry) + +/* Hash function in macro_htab. */ +static hashval_t +macro_hash (const void *p) +{ + struct macro_entry *m = (struct macro_entry *)p; + + return m->hash & ~1U; +} + +/* Equality function in macro_htab. */ +static int +macro_eq (const void *p, const void *q) +{ + struct macro_entry *m1 = (struct macro_entry *)p; + struct macro_entry *m2 = (struct macro_entry *)q; + unsigned char *p1, *p2, *s1, op; + unsigned int strp1, strp2; + + if (m1->hash != m2->hash || m1->len != m2->len) + return 0; + if (rd_multifile) + return 0; + + s1 = m1->ptr; + p2 = m2->ptr; + p1 = s1 + 3; + + while (1) + { + op = read_8 (p1); + if (op == 0) + break; + + switch (op) + { + case DW_MACRO_define: + case DW_MACRO_undef: + skip_leb128 (p1); + p1 = (unsigned char *) strchr ((char *) p1, '\0') + 1; + break; + case DW_MACRO_define_strp: + case DW_MACRO_undef_strp: + skip_leb128 (p1); + if (memcmp (s1, p2, p1 - s1) != 0) + return 0; + p2 += p1 - s1; + strp1 = read_32 (p1); + strp2 = read_32 (p2); + if (op_multifile) + { + if (strcmp ((char *) debug_sections[DEBUG_STR].data + strp1, + (char *) debug_sections[DEBUG_STR].data + strp2) + != 0) + return 0; + } + else if (lookup_strp_offset (strp2) != strp1) + return 0; + s1 = p1; + break; + default: + abort (); + } + } + return memcmp (s1, p2, p1 - s1) == 0; +} + +/* Hash function in macro_htab. */ +static hashval_t +macro_hash2 (const void *p) +{ + struct macro_entry *m = (struct macro_entry *)p; + + return m->ptr - debug_sections[DEBUG_MACRO].data; +} + +/* Equality function in macro_htab. */ +static int +macro_eq2 (const void *p, const void *q) +{ + struct macro_entry *m1 = (struct macro_entry *)p; + struct macro_entry *m2 = (struct macro_entry *)q; + return m1->ptr == m2->ptr; +} + +/* Parse .debug_macro section, either during write_multifile + or during fi_multifile phase. During write_multifile it + selects potentially shareable .debug_macro sequences and + writes them into debug_sections[DEBUG_MACRO].new_data + block it allocates. During fi_multifile it populates + macro_htab. In both cases it calls note_strp_offset + on DW_FORM_strp offsets. */ +static int +read_macro (DSO *dso) +{ + unsigned char *ptr, *endsec, *dst = NULL; + unsigned int version, flags, op, strp; + struct macro_entry me, *m; + + ptr = debug_sections[DEBUG_MACRO].data; + endsec = ptr + debug_sections[DEBUG_MACRO].size; + debug_sections[DEBUG_MACRO].new_size = 0; + if (!wr_multifile) + { + macro_htab = htab_try_create (50, macro_hash2, macro_eq2, NULL); + if (macro_htab == NULL) + dwz_oom (); + } + + while (ptr < endsec) + { + unsigned char *start = ptr, *s = ptr; + bool can_share = true; + hashval_t hash = 0; + unsigned int strp; + void **slot; + + if (ptr + 4 > endsec) + { + error (0, 0, "%s: .debug_macro header too small", dso->filename); + return 1; + } + + version = read_16 (ptr); + bool supported_version_p = version >= 4 && version <= 5; + if (!supported_version_p) + { + error (0, 0, "%s: Unhandled .debug_macro version %d", dso->filename, + version); + return 1; + } + flags = read_8 (ptr); + if ((flags & ~2U) != 0) + { + error (0, 0, "%s: Unhandled .debug_macro flags %d", dso->filename, + flags); + return 1; + } + if ((flags & 2) != 0) + { + ptr += 4; + can_share = false; + } + if (fi_multifile && alt_macro_htab == NULL) + can_share = false; + + op = -1U; + while (ptr < endsec) + { + op = read_8 (ptr); + if (op == 0) + break; + + switch (op) + { + case DW_MACRO_define: + case DW_MACRO_undef: + skip_leb128 (ptr); + ptr = (unsigned char *) strchr ((char *) ptr, '\0') + 1; + break; + case DW_MACRO_start_file: + skip_leb128 (ptr); + skip_leb128 (ptr); + can_share = false; + break; + case DW_MACRO_end_file: + can_share = false; + break; + case DW_MACRO_define_strp: + case DW_MACRO_undef_strp: + skip_leb128 (ptr); + strp = read_32 (ptr); + note_strp_offset (strp); + if (wr_multifile) + break; + if (can_share) + hash = iterative_hash (s, ptr - 4 - s, hash); + if (can_share) + { + unsigned char *p = debug_sections[DEBUG_STR].data + strp; + unsigned int len = strlen ((char *) p); + hash = iterative_hash (p, len, hash); + s = ptr; + } + break; + case DW_MACRO_import: + ptr += 4; + can_share = false; + break; + default: + error (0, 0, "%s: Unhandled .debug_macro opcode 0x%x", + dso->filename, op); + return 1; + } + } + if (op != 0) + { + error (0, 0, "%s: .debug_macro section not zero terminated", + dso->filename); + return 1; + } + if (wr_multifile) + { + if (can_share) + debug_sections[DEBUG_MACRO].new_size += ptr - start; + continue; + } + + me.ptr = start; + if (can_share) + { + hash = iterative_hash (s, ptr - s, hash); + me.hash = hash & ~1U; + me.len = ptr - start; + m = (struct macro_entry *) + htab_find_with_hash (alt_macro_htab, &me, me.hash); + if (m == NULL) + can_share = false; + else + me.hash = m->ptr - alt_data[DEBUG_MACRO]; + } + if (!can_share) + { + me.len = 0; + me.hash = debug_sections[DEBUG_MACRO].new_size; + debug_sections[DEBUG_MACRO].new_size += ptr - start; + } + slot + = htab_find_slot_with_hash (macro_htab, &me, + me.ptr - debug_sections[DEBUG_MACRO].data, + INSERT); + if (slot == NULL) + dwz_oom (); + else + { + assert (*slot == NULL); + m = pool_alloc (macro_entry, sizeof (*m)); + *m = me; + *slot = (void *) m; + } + } + + if (!wr_multifile) + return 0; + + debug_sections[DEBUG_MACRO].new_data + = (unsigned char *) malloc (debug_sections[DEBUG_MACRO].new_size); + if (debug_sections[DEBUG_MACRO].new_data == NULL) + dwz_oom (); + dst = debug_sections[DEBUG_MACRO].new_data; + for (ptr = debug_sections[DEBUG_MACRO].data; ptr < endsec; ) + { + unsigned char *start = ptr; + bool can_share = true; + + ptr += 2; + flags = read_8 (ptr); + if ((flags & 2) != 0) + { + ptr += 4; + can_share = false; + } + + while (1) + { + op = read_8 (ptr); + if (op == 0) + break; + + switch (op) + { + case DW_MACRO_define: + case DW_MACRO_undef: + skip_leb128 (ptr); + ptr = (unsigned char *) strchr ((char *) ptr, '\0') + 1; + break; + case DW_MACRO_start_file: + skip_leb128 (ptr); + skip_leb128 (ptr); + can_share = false; + break; + case DW_MACRO_end_file: + can_share = false; + break; + case DW_MACRO_define_strp: + case DW_MACRO_undef_strp: + skip_leb128 (ptr); + ptr += 4; + break; + case DW_MACRO_import: + ptr += 4; + can_share = false; + break; + default: + abort (); + } + } + if (can_share) + { + ptr = start + 3; + + while (1) + { + op = read_8 (ptr); + if (op == 0) + break; + + switch (op) + { + case DW_MACRO_define: + case DW_MACRO_undef: + skip_leb128 (ptr); + ptr = (unsigned char *) strchr ((char *) ptr, '\0') + 1; + break; + case DW_MACRO_define_strp: + case DW_MACRO_undef_strp: + skip_leb128 (ptr); + memcpy (dst, start, ptr - start); + dst += ptr - start; + strp = lookup_strp_offset (read_32 (ptr)); + write_32 (dst, strp); + start = ptr; + break; + default: + abort (); + } + } + memcpy (dst, start, ptr - start); + dst += ptr - start; + } + } + assert (dst == debug_sections[DEBUG_MACRO].new_data + + debug_sections[DEBUG_MACRO].new_size); + + return 0; +} + +/* Helper function for handle_macro, called through htab_traverse. + Write .debug_macro opcode sequence seen by more than one + executable or shared library. */ +static int +optimize_write_macro (void **slot, void *data) +{ + struct macro_entry *m = (struct macro_entry *) *slot; + unsigned char **pp = (unsigned char **) data; + unsigned char *s = m->ptr; + unsigned char *p = s + 3, *q, op; + unsigned int strp; + + if ((m->hash & 1) == 0) + return 1; + while (1) + { + op = read_8 (p); + if (op == 0) + break; + + switch (op) + { + case DW_MACRO_define: + case DW_MACRO_undef: + skip_leb128 (p); + p = (unsigned char *) strchr ((char *) p, '\0') + 1; + break; + case DW_MACRO_define_strp: + case DW_MACRO_undef_strp: + skip_leb128 (p); + memcpy (*pp, s, p - s); + *pp += p - s; + strp = read_32 (p); + q = *pp; + write_32 (q, lookup_strp_offset (strp)); + *pp += 4; + s = p; + break; + default: + abort (); + } + } + memcpy (*pp, s, p - s); + *pp += p - s; + return 1; +} + +/* Parse .debug_macro section, during optimize_multifile + or during read_multifile. It parses .debug_macro written + by write_multifile, so it only contains shareable sequences. + Find duplicate sequences, during optimize_multifile write them + into debug_sections[DEBUG_MACRO].new_data it allocates, + during read_multifile just populates macro_htab (soon to be + alt_macro_htab). */ +static void +handle_macro (void) +{ + unsigned char *ptr, *endsec, op; + unsigned char *to_free = NULL; + struct macro_entry me, *m; + + macro_htab = htab_try_create (50, macro_hash, macro_eq, NULL); + if (macro_htab == NULL) + dwz_oom (); + + endsec = debug_sections[DEBUG_MACRO].data + debug_sections[DEBUG_MACRO].size; + if (op_multifile) + { + debug_sections[DEBUG_MACRO].new_size = 0; + to_free = obstack_alloc (&ob, 1); + } + + for (ptr = debug_sections[DEBUG_MACRO].data; ptr < endsec; ) + { + unsigned char *start = ptr, *s = ptr, *p; + hashval_t hash = 0; + unsigned int len; + void **slot; + bool can_share = true; + + ptr += 3; + while (1) + { + op = read_8 (ptr); + if (op == 0) + break; + + switch (op) + { + case DW_MACRO_define: + case DW_MACRO_undef: + skip_leb128 (ptr); + ptr = (unsigned char *) strchr ((char *) ptr, '\0') + 1; + break; + case DW_MACRO_define_strp: + case DW_MACRO_undef_strp: + skip_leb128 (ptr); + hash = iterative_hash (s, ptr - s, hash); + p = debug_sections[DEBUG_STR].data + read_32 (ptr); + len = strlen ((char *) p); + hash = iterative_hash (p, len, hash); + if (op_multifile + /* This should only happen if there were multiple + same transparent units within a single object file. */ + && htab_find_with_hash (strp_htab, p, + hash (p, len)) == NULL) + can_share = false; + s = ptr; + break; + default: + abort (); + } + } + if (!can_share) + continue; + hash = iterative_hash (s, ptr - s, hash); + me.ptr = start; + me.hash = hash & ~1U; + me.len = ptr - start; + slot = htab_find_slot_with_hash (macro_htab, &me, me.hash, INSERT); + if (slot == NULL) + dwz_oom (); + else if (*slot != NULL) + { + m = (struct macro_entry *) *slot; + if (op_multifile && (m->hash & 1) == 0) + { + m->hash |= 1; + debug_sections[DEBUG_MACRO].new_size += me.len; + } + } + else if (op_multifile) + { + m = (struct macro_entry *) obstack_alloc (&ob, sizeof (*m)); + *m = me; + *slot = (void *) m; + } + else + { + m = pool_alloc (macro_entry, sizeof (*m)); + *m = me; + *slot = (void *) m; + } + } + + if (op_multifile) + { + if (debug_sections[DEBUG_MACRO].new_size) + { + unsigned char *p; + debug_sections[DEBUG_MACRO].new_data + = malloc (debug_sections[DEBUG_MACRO].new_size); + p = debug_sections[DEBUG_MACRO].new_data; + htab_traverse (macro_htab, optimize_write_macro, &p); + assert (p == debug_sections[DEBUG_MACRO].new_data + + debug_sections[DEBUG_MACRO].new_size); + htab_delete (macro_htab); + macro_htab = NULL; + } + obstack_free (&ob, (void *) to_free); + } +} + +/* Write new content of .debug_macro section during fi_multifile phase. */ +static void +write_macro (void) +{ + unsigned char *ptr, *endsec, *dst; + unsigned int op, strp; + struct macro_entry me, *m; + + endsec = debug_sections[DEBUG_MACRO].data + debug_sections[DEBUG_MACRO].size; + debug_sections[DEBUG_MACRO].new_data + = (unsigned char *) malloc (debug_sections[DEBUG_MACRO].new_size); + if (debug_sections[DEBUG_MACRO].new_data == NULL) + dwz_oom (); + dst = debug_sections[DEBUG_MACRO].new_data; + for (ptr = debug_sections[DEBUG_MACRO].data; ptr < endsec; ) + { + unsigned char *s = ptr; + unsigned char flags; + + me.ptr = ptr; + m = (struct macro_entry *) + htab_find_with_hash (macro_htab, &me, + me.ptr - debug_sections[DEBUG_MACRO].data); + if (m->len) + { + ptr += m->len; + continue; + } + + ptr += 2; + flags = read_8 (ptr); + if ((flags & 2) != 0) + ptr += 4; + + while (1) + { + op = read_8 (ptr); + if (op == 0) + break; + + switch (op) + { + case DW_MACRO_define: + case DW_MACRO_undef: + skip_leb128 (ptr); + ptr = (unsigned char *) strchr ((char *) ptr, '\0') + 1; + break; + case DW_MACRO_start_file: + skip_leb128 (ptr); + skip_leb128 (ptr); + break; + case DW_MACRO_end_file: + break; + case DW_MACRO_define_strp: + case DW_MACRO_undef_strp: + memcpy (dst, s, ptr - 1 - s); + dst += ptr - 1 - s; + s = ptr - 1; + skip_leb128 (ptr); + strp = read_32 (ptr); + switch (note_strp_offset2 (strp)) + { + case DW_FORM_GNU_strp_alt: + case DW_FORM_strp_sup: + *dst = op == DW_MACRO_define_strp + ? DW_MACRO_define_sup + : DW_MACRO_undef_sup; + dst++; + s++; + break; + default: + break; + } + memcpy (dst, s, ptr - 4 - s); + dst += ptr - 4 - s; + write_32 (dst, lookup_strp_offset (strp)); + s = ptr; + break; + case DW_MACRO_import: + memcpy (dst, s, ptr - 1 - s); + dst += ptr - 1 - s; + me.ptr = debug_sections[DEBUG_MACRO].data + read_32 (ptr); + m = (struct macro_entry *) + htab_find_with_hash (macro_htab, &me, + me.ptr + - debug_sections[DEBUG_MACRO].data); + if (m->len) + *dst = DW_MACRO_import_sup; + else + *dst = DW_MACRO_import; + dst++; + write_32 (dst, m->hash); + s = ptr; + break; + default: + abort (); + } + } + memcpy (dst, s, ptr - s); + dst += ptr - s; + } + assert (dst == debug_sections[DEBUG_MACRO].new_data + + debug_sections[DEBUG_MACRO].new_size); +} + +/* Compute new abbreviations for DIE (with reference DIE REF). + T is a temporary buffer. Fill in *NDIES - number of DIEs + in the tree, and record pairs of referrer/referree DIEs for + intra-CU references into obstack vector VEC. */ +static int +build_abbrevs_for_die (htab_t h, dw_cu_ref cu, dw_die_ref die, + dw_cu_ref refcu, dw_die_ref ref, + struct abbrev_tag *t, unsigned int *ndies, + struct obstack *vec, bool recompute) +{ + dw_die_ref child, ref_child, sib = NULL, origin = NULL; + unsigned int i, j; + uint64_t low_pc = 0; + void **slot; + + if (unlikely (recompute) && die->u.p2.die_new_abbrev != NULL) + { + if (cu->cu_intracu_form == DW_FORM_ref_udata) + die->die_ref_seen = 1; + else + { + die->die_size -= size_of_uleb128 (die->u.p2.die_new_abbrev->entry) + + die->u.p2.die_intracu_udata_size; + die->die_ref_seen = 0; + } + for (child = die->die_child; child; child = child->die_sib) + if (build_abbrevs_for_die (h, cu, child, NULL, NULL, t, ndies, vec, + true)) + return 1; + return 0; + } + + die->u.p2.die_new_abbrev = NULL; + die->u.p2.die_new_offset = 0; + die->u.p2.die_intracu_udata_size = 0; + die->die_ref_seen = 0; + + if (wr_multifile ? die->die_no_multifile : die->die_remove) + return 0; + t->entry = 0; + t->tag = die->die_tag; + t->children = die->die_child != NULL; + t->op_type_referenced = false; + t->nusers = 1; + if (die->die_offset == -1U) + { + if (ref != NULL) + ; + else if (die_safe_nextdup (die) && die->die_nextdup->die_dup == die) + { + ref = die->die_nextdup; + if (ref != NULL) + refcu = die_cu (ref); + } + if (ref == NULL) + origin = die->die_nextdup; + } + else + { + ref = die; + refcu = cu; + if (wr_multifile + && (die->die_root || die->die_named_namespace)) + origin = die; + } + if (die->die_child && die->die_sib) + for (sib = die->die_sib; sib; sib = sib->die_sib) + if (wr_multifile ? !sib->die_no_multifile : !sib->die_remove) + break; + if (ref != NULL && origin == NULL) + { + unsigned char *base + = cu->cu_kind == CU_TYPES + ? debug_sections[DEBUG_TYPES].data + : debug_sections[DEBUG_INFO].data; + unsigned char *ptr = base + ref->die_offset; + struct abbrev_tag *reft = ref->die_abbrev; + + skip_leb128 (ptr); + /* No longer count the abbrev uleb128 size in die_size. + We'll add it back after determining the new abbrevs. */ + if (unlikely (wr_multifile || op_multifile || fi_multifile) + || unlikely (recompute)) + i = -1U; + else + for (i = 0; i < reft->nattr; i++) + switch (reft->attr[i].form) + { + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + case DW_FORM_ref_udata: + case DW_FORM_indirect: + i = -2U; + break; + case DW_FORM_data4: + case DW_FORM_data8: + if (reft->attr[i].attr == DW_AT_high_pc) + i = -2U; + break; + case DW_FORM_addr: + if (reft->attr[i].attr == DW_AT_high_pc + && cu->cu_version >= 4) + i = -2U; + break; + default: + break; + } + if (i != -1U) + { + die->die_size -= ptr - (base + ref->die_offset); + /* If there are no references, size stays the same + and no need to walk the actual attribute values. */ + for (i = 0; i < reft->nattr; i++) + { + t->attr[i].attr = reft->attr[i].attr; + t->attr[i].form = reft->attr[i].form; + if (t->attr[i].form == DW_FORM_implicit_const) + t->values[i] = reft->values[i]; + } + t->nattr = reft->nattr; + } + else + { + die->die_size = 0; + /* Otherwise, we need to walk the actual attributes. */ + for (i = 0, j = 0; i < reft->nattr; ++i) + { + uint32_t form = reft->attr[i].form; + size_t len = 0; + dw_die_ref refd; + uint64_t value = 0; + unsigned char *orig_ptr = ptr; + + while (form == DW_FORM_indirect) + form = read_uleb128 (ptr); + + if (unlikely (wr_multifile || op_multifile) + && (reft->attr[i].attr == DW_AT_decl_file + || reft->attr[i].attr == DW_AT_call_file)) + { + switch (form) + { + case DW_FORM_data1: value = read_8 (ptr); break; + case DW_FORM_data2: value = read_16 (ptr); break; + case DW_FORM_data4: value = read_32 (ptr); break; + case DW_FORM_data8: value = read_64 (ptr); break; + case DW_FORM_udata: value = read_uleb128 (ptr); break; + case DW_FORM_sdata: value = read_sleb128 (ptr); break; + case DW_FORM_implicit_const: + value = reft->values[i]; + break; + default: + error (0, 0, "Unhandled %s for %s", + get_DW_FORM_str (form), + get_DW_AT_str (reft->attr[i].attr)); + return 1; + } + value = line_htab_lookup (refcu, value); + if (form != DW_FORM_implicit_const) + { + if (value <= 0xff) + { + form = DW_FORM_data1; + die->die_size++; + } + else if (value <= 0xffff) + { + form = DW_FORM_data2; + die->die_size += 2; + } + else if (value <= 0xffffffff) + { + form = DW_FORM_data4; + die->die_size += 4; + } + else + { + form = DW_FORM_data8; + die->die_size += 8; + } + } + t->attr[j].attr = reft->attr[i].attr; + t->attr[j].form = form; + if (form == DW_FORM_implicit_const) + t->values[j] = value; + j++; + continue; + } + + if (unlikely (fi_multifile) + && (reft->attr[i].attr == DW_AT_GNU_macros + || reft->attr[i].attr == DW_AT_macros) + && alt_macro_htab != NULL) + { + struct macro_entry me, *m; + + switch (form) + { + case DW_FORM_data4: + case DW_FORM_sec_offset: + value = read_32 (ptr); + break; + default: + error (0, 0, "Unhandled %s for %s", + get_DW_FORM_str (form), + get_DW_AT_str (reft->attr[i].attr)); + return 1; + } + me.ptr = debug_sections[DEBUG_MACRO].data + value; + m = (struct macro_entry *) + htab_find_with_hash (macro_htab, &me, value); + if (m->len) + { + error (0, 0, "%s referencing transparent include", + get_DW_AT_str (reft->attr[i].attr)); + return 1; + } + ptr -= 4; + } + + switch (form) + { + case DW_FORM_ref_addr: + if (unlikely (fi_multifile)) + { + dw_die_ref refdt; + value = read_size (ptr, + refcu->cu_version == 2 + ? ptr_size : 4); + ptr += refcu->cu_version == 2 ? ptr_size : 4; + refd = off_htab_lookup (NULL, value); + assert (refd != NULL); + refdt = refd; + while (refdt->die_toplevel == 0) + refdt = refdt->die_parent; + if (refdt->die_dup + && !refdt->die_op_type_referenced + && die_cu (refdt->die_dup)->cu_kind == CU_ALT) + { + t->attr[j].attr = reft->attr[i].attr; + t->attr[j++].form + = dwarf_5 ? DW_FORM_ref_sup4 : DW_FORM_GNU_ref_alt; + die->die_size += 4; + continue; + } + break; + } + ptr += refcu->cu_version == 2 ? ptr_size : 4; + break; + case DW_FORM_addr: + ptr += ptr_size; + if (reft->attr[i].attr == DW_AT_low_pc + && cu->cu_version >= 4) + low_pc = read_size (ptr - ptr_size, ptr_size); + else if (reft->attr[i].attr == DW_AT_high_pc + && low_pc) + { + uint64_t high_pc = read_size (ptr - ptr_size, ptr_size); + /* If both DW_AT_low_pc and DW_AT_high_pc attributes + are present and have DW_FORM_addr, attempt to shrink + the DIE by using DW_FORM_udata or DW_FORM_data4 + form for the latter in DWARF4+. Don't try + DW_FORM_data[12], that might increase .debug_abbrev + size too much or increase the uleb128 size of too + many abbrev numbers. */ + if (high_pc > low_pc) + { + unsigned int nform = 0; + unsigned int sz = size_of_uleb128 (high_pc - low_pc); + if (sz <= 4 && sz <= (unsigned) ptr_size) + nform = DW_FORM_udata; + else if (ptr_size > 4 + && high_pc - low_pc <= 0xffffffff) + { + nform = DW_FORM_data4; + sz = 4; + } + else if (sz <= (unsigned) ptr_size) + nform = DW_FORM_udata; + if (nform) + { + t->attr[j].attr = reft->attr[i].attr; + t->attr[j++].form = nform; + die->die_size += sz; + continue; + } + } + } + break; + case DW_FORM_flag_present: + case DW_FORM_implicit_const: + break; + case DW_FORM_flag: + case DW_FORM_data1: + ++ptr; + break; + case DW_FORM_data2: + ptr += 2; + break; + case DW_FORM_data4: + if (reft->attr[i].attr == DW_AT_high_pc) + { + uint32_t range_len = read_32 (ptr); + unsigned int sz = size_of_uleb128 (range_len); + if (sz <= 4) + { + t->attr[j].attr = reft->attr[i].attr; + t->attr[j++].form = DW_FORM_udata; + die->die_size += sz; + continue; + } + break; + } + ptr += 4; + break; + case DW_FORM_sec_offset: + ptr += 4; + break; + case DW_FORM_data8: + if (reft->attr[i].attr == DW_AT_high_pc) + { + unsigned int nform = 0; + uint64_t range_len = read_64 (ptr); + unsigned int sz = size_of_uleb128 (range_len); + if (sz <= 4) + nform = DW_FORM_udata; + else if (range_len <= 0xffffffff) + { + nform = DW_FORM_data4; + sz = 4; + } + else if (sz <= 8) + nform = DW_FORM_udata; + if (nform) + { + t->attr[j].attr = reft->attr[i].attr; + t->attr[j++].form = nform; + die->die_size += sz; + continue; + } + break; + } + ptr += 8; + break; + case DW_FORM_ref_sig8: + ptr += 8; + break; + case DW_FORM_data16: + ptr += 16; + break; + case DW_FORM_sdata: + case DW_FORM_udata: + skip_leb128 (ptr); + break; + case DW_FORM_strp: + if (unlikely (op_multifile || fi_multifile)) + { + form = note_strp_offset2 (read_32 (ptr)); + if (form != DW_FORM_strp) + { + t->attr[j].attr = reft->attr[i].attr; + t->attr[j++].form = form; + die->die_size += 4; + continue; + } + } + else + ptr += 4; + break; + case DW_FORM_line_strp: + /* Since we don't register the line_strp we cannot + change the form in the case of multifile. */ + ptr += 4; + break; + case DW_FORM_string: + ptr = (unsigned char *) strchr ((char *)ptr, '\0') + 1; + break; + case DW_FORM_indirect: + abort (); + case DW_FORM_block1: + len = *ptr++; + break; + case DW_FORM_block2: + len = read_16 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block4: + len = read_32 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_block: + case DW_FORM_exprloc: + len = read_uleb128 (ptr); + form = DW_FORM_block1; + break; + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + case DW_FORM_ref_udata: + switch (form) + { + case DW_FORM_ref1: value = read_8 (ptr); break; + case DW_FORM_ref2: value = read_16 (ptr); break; + case DW_FORM_ref4: value = read_32 (ptr); break; + case DW_FORM_ref8: value = read_64 (ptr); break; + case DW_FORM_ref_udata: value = read_uleb128 (ptr); break; + default: abort (); + } + if (reft->attr[i].attr == DW_AT_sibling) + { + if (sib == NULL) + continue; + form = DW_FORM_ref4; + refd = sib; + } + else + { + dw_die_ref refdt; + refd = off_htab_lookup (refcu, refcu->cu_offset + value); + assert (refd != NULL); + refdt = refd; + while (refdt->die_toplevel == 0) + refdt = refdt->die_parent; + if (refdt->die_dup && refdt->die_op_type_referenced) + { + if (cu == die_cu (refdt)) + form = DW_FORM_ref4; + else if (cu == die_cu (refdt->die_dup)) + { + form = DW_FORM_ref4; + refd = die_find_dup (refdt, refdt->die_dup, + refd); + } + else + form = DW_FORM_ref_addr; + } + else + { + if (refdt->die_dup) + refd = die_find_dup (refdt, refdt->die_dup, refd); + if (cu == die_cu (refd)) + form = DW_FORM_ref4; + else if (die_cu (refd)->cu_kind == CU_ALT) + form = (dwarf_5 + ? DW_FORM_ref_sup4 : DW_FORM_GNU_ref_alt); + else + form = DW_FORM_ref_addr; + } + } + if (form == DW_FORM_ref_addr) + die->die_size += cu->cu_version == 2 ? ptr_size : 4; + else if (form == DW_FORM_GNU_ref_alt + || form == DW_FORM_ref_sup4) + die->die_size += 4; + else + { + if (unlikely (recompute)) + form = cu->cu_intracu_form; + if (likely (!recompute) || form == DW_FORM_ref_udata) + { + obstack_ptr_grow (vec, die); + obstack_ptr_grow (vec, refd); + } + } + t->attr[j].attr = reft->attr[i].attr; + t->attr[j++].form = form; + continue; + default: + abort (); + } + + if (form == DW_FORM_block1) + ptr += len; + t->attr[j].attr = reft->attr[i].attr; + t->attr[j].form = reft->attr[i].form; + if (reft->attr[i].form == DW_FORM_implicit_const) + t->values[j] = reft->values[i]; + j++; + die->die_size += ptr - orig_ptr; + } + t->nattr = j; + } + } + else + switch (die->die_tag) + { + case DW_TAG_partial_unit: + case DW_TAG_compile_unit: + t->nattr = 0; + die->die_size = 0; + if (origin == NULL) + break; + refcu = die_cu (origin); + if (refcu->cu_nfiles) + { + t->attr[0].attr = DW_AT_stmt_list; + t->attr[0].form = cu->cu_version < 4 + ? DW_FORM_data4 : DW_FORM_sec_offset; + die->die_size += 4; + t->nattr++; + } + if (uni_lang_p || cu->cu_die->die_tag == DW_TAG_compile_unit) + { + unsigned int lang_size = nr_bytes_for (cu->lang); + die->die_size += lang_size; + t->attr[t->nattr].attr = DW_AT_language; + switch (lang_size) + { + case 1: + t->attr[t->nattr].form = DW_FORM_data1; + break; + case 2: + t->attr[t->nattr].form = DW_FORM_data2; + break; + default: + abort (); + } + t->nattr++; + } + if (refcu->cu_comp_dir) + { + enum dwarf_form form; + unsigned char *ptr = get_AT (origin, DW_AT_comp_dir, &form); + assert (ptr && (form == DW_FORM_string + || form == DW_FORM_strp + || form == DW_FORM_line_strp)); + if (form == DW_FORM_strp) + { + if (unlikely (op_multifile || fi_multifile)) + form = note_strp_offset2 (read_32 (ptr)); + die->die_size += 4; + } + else if (form == DW_FORM_line_strp) + die->die_size += 4; + else + die->die_size + += strlen (refcu->cu_comp_dir) + 1; + t->attr[t->nattr].attr = DW_AT_comp_dir; + t->attr[t->nattr].form = form; + t->nattr++; + } + break; + case DW_TAG_namespace: + case DW_TAG_module: + { + enum dwarf_form form; + unsigned char *ptr = get_AT (origin, DW_AT_name, &form); + assert (ptr && (form == DW_FORM_string + || form == DW_FORM_strp + || form == DW_FORM_line_strp)); + if (form == DW_FORM_strp) + { + if (unlikely (op_multifile || fi_multifile)) + form = note_strp_offset2 (read_32 (ptr)); + die->die_size = 4; + } + else if (form == DW_FORM_line_strp) + die->die_size += 4; + else + die->die_size = strlen ((char *) ptr) + 1; + t->attr[0].attr = DW_AT_name; + t->attr[0].form = form; + t->nattr = 1; + if (sib) + { + t->attr[1].attr = DW_AT_sibling; + t->attr[1].form = DW_FORM_ref4; + obstack_ptr_grow (vec, die); + obstack_ptr_grow (vec, sib); + t->nattr++; + } + break; + } + case DW_TAG_imported_unit: + t->attr[0].attr = DW_AT_import; + t->nattr = 1; + if (die_cu (die->die_nextdup)->cu_kind == CU_ALT) + { + t->attr[0].form = dwarf_5 ? DW_FORM_ref_sup4 : DW_FORM_GNU_ref_alt; + die->die_size = 4; + } + else + { + t->attr[0].form = DW_FORM_ref_addr; + die->die_size = cu->cu_version == 2 ? ptr_size : 4; + } + break; + default: + abort (); + } + compute_abbrev_hash (t); + slot = htab_find_slot_with_hash (h, t, t->hash, + recompute ? NO_INSERT : INSERT); + if (slot == NULL) + dwz_oom (); + if (unlikely (recompute)) + assert (*slot); + if (*slot) + { + if (likely (!recompute)) + ((struct abbrev_tag *)*slot)->nusers++; + die->u.p2.die_new_abbrev = (struct abbrev_tag *)*slot; + } + else + { + struct abbrev_tag *newt = pool_clone_abbrev (t); + *slot = newt; + die->u.p2.die_new_abbrev = newt; + } + (*ndies)++; + if (ref != NULL && ref != die) + { + for (child = die->die_child, ref_child = ref->die_child; + child; child = child->die_sib, ref_child = ref_child->die_sib) + if (build_abbrevs_for_die (h, cu, child, refcu, ref_child, + t, ndies, vec, recompute)) + return 1; + } + else + for (child = die->die_child; child; child = child->die_sib) + if (build_abbrevs_for_die (h, cu, child, NULL, NULL, t, ndies, vec, + recompute)) + return 1; + return 0; +} + +/* Build new abbreviations for CU. T, NDIES and VEC arguments like + for build_abbrevs_for_die. */ +static int +build_abbrevs (dw_cu_ref cu, struct abbrev_tag *t, unsigned int *ndies, + struct obstack *vec) +{ + htab_t h = htab_try_create (50, abbrev_hash, abbrev_eq2, NULL); + + if (h == NULL) + dwz_oom (); + + if (build_abbrevs_for_die (h, cu, cu->cu_die, NULL, NULL, t, ndies, vec, + false)) + { + htab_delete (h); + return 1; + } + + cu->cu_new_abbrev = h; + return 0; +} + +/* Helper to record all abbrevs from the hash table into ob obstack + vector. Called through htab_traverse. */ +static int +list_abbrevs (void **slot, void *data) +{ + struct obstack *obp = (struct obstack *) data; + obstack_ptr_grow (obp, *slot); + return 1; +} + +/* Comparison function for abbreviations. Used for CUs that + need 128 or more abbreviations. Use lowest numbers (i.e. sort earlier) + abbrevs used for typed DWARF stack referenced DIEs, then sort + by decreasing number of users (abbrev numbers are uleb128 encoded, + the bigger number of them that can be 1 byte encoded the better). */ +static int +abbrev_cmp (const void *p, const void *q) +{ + struct abbrev_tag *t1 = *(struct abbrev_tag **)p; + struct abbrev_tag *t2 = *(struct abbrev_tag **)q; + unsigned int i; + + if (t1->op_type_referenced && !t2->op_type_referenced) + return -1; + if (!t1->op_type_referenced && t2->op_type_referenced) + return 1; + if (t1->nusers > t2->nusers) + return -1; + if (t1->nusers < t2->nusers) + return 1; + /* The rest just so that we have a stable sort. */ + if (t1->tag < t2->tag) + return -1; + if (t1->tag > t2->tag) + return 1; + if (t1->nattr < t2->nattr) + return -1; + if (t1->nattr > t2->nattr) + return 1; + if (t1->children && !t2->children) + return -1; + if (!t1->children && t2->children) + return 1; + for (i = 0; i < t1->nattr; i++) + { + if (t1->attr[i].attr < t2->attr[i].attr) + return -1; + if (t1->attr[i].attr > t2->attr[i].attr) + return 1; + if (t1->attr[i].form < t2->attr[i].form) + return -1; + if (t1->attr[i].form > t2->attr[i].form) + return 1; + if (t1->attr[i].form == DW_FORM_implicit_const) + { + if (t1->values[i] < t2->values[i]) + return -1; + if (t1->values[i] > t2->values[i]) + return 1; + } + } + return 0; +} + +/* First phase of computation of u.p2.die_new_offset and + new CU sizes. */ +static unsigned int +init_new_die_offsets (dw_die_ref die, unsigned int off, + unsigned int intracusize) +{ + dw_die_ref child; + unsigned int i; + struct abbrev_tag *t = die->u.p2.die_new_abbrev; + if (wr_multifile ? die->die_no_multifile : die->die_remove) + return off; + die->u.p2.die_new_offset = off; + if (likely (die->die_ref_seen == 0)) + { + die->die_size += size_of_uleb128 (die->u.p2.die_new_abbrev->entry); + die->u.p2.die_intracu_udata_size = 0; + for (i = 0; i < t->nattr; ++i) + switch (t->attr[i].form) + { + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref_udata: + die->u.p2.die_intracu_udata_size += intracusize; + break; + default: + break; + } + die->die_size += die->u.p2.die_intracu_udata_size; + } + off += die->die_size; + for (child = die->die_child; child; child = child->die_sib) + off = init_new_die_offsets (child, off, intracusize); + if (die->die_child) + off++; + return off; +} + +/* Second phase of computation of u.p2.die_new_offset and + new CU sizes. This step is called possibly many times, + for deciding if DW_FORM_ref_udata is worthwhile. + init_new_die_offsets starts with assuming each uleb128 will + need maximum number of bytes for the CU of the given size, + each new invocation of this function (except the last) + will shrink one or more uleb128s. Each shrinking can create + new opportunities to shrink other uleb128s. */ +static unsigned int +update_new_die_offsets (dw_die_ref die, unsigned int off, + dw_die_ref **intracuvec) +{ + dw_die_ref child; + if (wr_multifile ? die->die_no_multifile : die->die_remove) + return off; + assert (off <= die->u.p2.die_new_offset); + die->u.p2.die_new_offset = off; + if ((*intracuvec)[0] == die) + { + unsigned int intracu_udata_size = 0; + assert (die->u.p2.die_intracu_udata_size); + while ((*intracuvec)[0] == die) + { + intracu_udata_size + += size_of_uleb128 ((*intracuvec)[1]->u.p2.die_new_offset); + *intracuvec += 2; + } + assert (die->u.p2.die_intracu_udata_size >= intracu_udata_size); + die->die_size -= die->u.p2.die_intracu_udata_size - intracu_udata_size; + die->u.p2.die_intracu_udata_size = intracu_udata_size; + } + else + assert (die->u.p2.die_intracu_udata_size == 0 || die->die_ref_seen); + off += die->die_size; + for (child = die->die_child; child; child = child->die_sib) + off = update_new_die_offsets (child, off, intracuvec); + if (die->die_child) + off++; + return off; +} + +/* Final phase of computation of u.p2.die_new_offset. Called when already + decided what intra-CU form will be used. Can return -1U if + a problem is detected and the tool should give up. */ +static unsigned int +finalize_new_die_offsets (dw_cu_ref cu, dw_die_ref die, unsigned int off, + unsigned int intracusize, dw_die_ref **intracuvec) +{ + dw_die_ref child; + unsigned int ref_seen = die->die_ref_seen; + if (wr_multifile ? die->die_no_multifile : die->die_remove) + return off; + die->u.p2.die_new_offset = off; + die->die_ref_seen = 0; + /* As we aren't adjusting sizes of exprloc, if in the new layout + a DIE referenced through DW_OP_call2 is placed after 64K into + the CU, punt. */ + if (die->die_op_call2_referenced && off >= 65536) + return -1U; + /* Similarly punt if + DW_OP_GNU_{{regval,const,deref}_type,convert,reinterpret} + references a DIE that needs more uleb128 bytes to encode + the new offset compared to uleb128 bytes to encode the old offset. + GCC emits DW_TAG_base_type dies referenced that way at the + beginning of the CU and we try to preserve that, so this shouldn't + trigger for GCC generated code. */ + if (die->die_op_type_referenced + && !wr_multifile + && size_of_uleb128 (off) + > size_of_uleb128 (die->die_offset - cu->cu_offset)) + return -1U; + if ((*intracuvec)[0] == die) + { + unsigned int intracu_udata_size = 0; + assert (die->u.p2.die_intracu_udata_size); + while ((*intracuvec)[0] == die) + { + intracu_udata_size += intracusize; + *intracuvec += 2; + } + if (intracusize != 0) + { + die->die_size + -= die->u.p2.die_intracu_udata_size - intracu_udata_size; + die->u.p2.die_intracu_udata_size = intracu_udata_size; + } + } + else + assert (die->u.p2.die_intracu_udata_size == 0 || ref_seen); + off += die->die_size; + for (child = die->die_child; child; child = child->die_sib) + { + off = finalize_new_die_offsets (cu, child, off, intracusize, intracuvec); + if (off == -1U) + return off; + } + if (die->die_child) + off++; + return off; +} + +/* Comparison function, called through qsort, to sort CUs + by increasing number of needed new abbreviations. */ +static int +cu_abbrev_cmp (const void *p, const void *q) +{ + dw_cu_ref cu1 = *(dw_cu_ref *)p; + dw_cu_ref cu2 = *(dw_cu_ref *)q; + unsigned int nabbrevs1 = htab_elements (cu1->cu_new_abbrev); + unsigned int nabbrevs2 = htab_elements (cu2->cu_new_abbrev); + + if (nabbrevs1 < nabbrevs2) + return -1; + if (nabbrevs1 > nabbrevs2) + return 1; + /* The rest is just to get stable sort. */ + if (cu1->cu_kind != CU_PU && cu2->cu_kind == CU_PU) + return -1; + if (cu1->cu_kind == CU_PU && cu2->cu_kind != CU_PU) + return 1; + if (cu1->cu_offset < cu2->cu_offset) + return -1; + if (cu1->cu_offset > cu2->cu_offset) + return 1; + return 0; +} + +/* Compute new abbreviations for all CUs, size the new + .debug_abbrev section and all new .debug_info CUs. */ +static int +compute_abbrevs (DSO *dso) +{ + unsigned long total_size = 0, types_size = 0, abbrev_size = 0; + dw_cu_ref cu, *cuarr; + struct abbrev_tag *t; + unsigned int ncus, nlargeabbrevs = 0, i, laststart; + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "compute_abbrevs\n"); + } + + t = (struct abbrev_tag *) + obstack_alloc (&ob2, + sizeof (*t) + + (max_nattr + 4) * sizeof (struct abbrev_attr) + + (max_nattr + 4) * sizeof (int64_t)); + t->values = (int64_t *) &t->attr[max_nattr + 4]; + for (cu = first_cu, ncus = 0; cu; cu = cu->cu_next) + { + unsigned int intracu, ndies = 0, tagsize = 0, nchildren = 0; + unsigned int nabbrevs, diesize, cusize, off, intracusize; + struct abbrev_tag **arr; + dw_die_ref *intracuarr, *intracuvec; + enum dwarf_form intracuform = DW_FORM_ref4; + dw_die_ref child, *lastotr, child_next, *last; + unsigned int headersz = (cu->cu_kind == CU_TYPES + ? 23 : (cu->cu_version >= 5 ? 12 : 11)); + + if (unlikely (fi_multifile) && cu->cu_die->die_remove) + continue; + if (unlikely (low_mem) && cu->cu_kind != CU_PU) + expand_children (cu->cu_die); + ncus++; + if (build_abbrevs (cu, t, &ndies, &ob2)) + return 1; + nabbrevs = htab_elements (cu->cu_new_abbrev); + htab_traverse (cu->cu_new_abbrev, list_abbrevs, &ob); + assert (obstack_object_size (&ob) == nabbrevs * sizeof (void *)); + arr = (struct abbrev_tag **) obstack_finish (&ob); + intracu = obstack_object_size (&ob2) / sizeof (void *) / 2; + obstack_ptr_grow (&ob2, NULL); + intracuarr = (dw_die_ref *) obstack_finish (&ob2); + if (nabbrevs >= 128) + { + unsigned int limit, uleb128_size; + + for (child = cu->cu_die->die_child; child; child = child->die_sib) + if (child->die_op_type_referenced && !wr_multifile) + { + child->u.p2.die_new_abbrev->op_type_referenced = 1; + /* If the old offset was close to uleb128 boundary, ensure + that DW_TAG_compile_unit gets small abbrev number + as well. */ + if (size_of_uleb128 (child->die_offset - cu->cu_offset) + < size_of_uleb128 (child->die_offset - cu->cu_offset + 1)) + cu->cu_die->u.p2.die_new_abbrev->op_type_referenced = 1; + } + qsort (arr, nabbrevs, sizeof (*arr), abbrev_cmp); + for (i = 0, limit = 128, uleb128_size = 1; i < nabbrevs; i++) + { + if (i + 1 == limit) + { + limit <<= 7; + uleb128_size++; + } + arr[i]->entry = i + 1; + tagsize += arr[i]->nusers * uleb128_size; + if (arr[i]->children) + nchildren += arr[i]->nusers; + } + nlargeabbrevs++; + } + else + { + tagsize = ndies; + for (i = 0; i < nabbrevs; i++) + { + arr[i]->entry = i + 1; + if (arr[i]->children) + nchildren += arr[i]->nusers; + } + } + + /* Move all base types with die_op_type_reference + to front, to increase the likelyhood that the offset + will fit. */ + for (last = &cu->cu_die->die_child, lastotr = last, child = *last; + child; child = child_next) + { + child_next = child->die_sib; + if (child->die_op_type_referenced) + { + if (lastotr != last) + { + child->die_sib = *lastotr; + *lastotr = child; + lastotr = &child->die_sib; + *last = child_next; + continue; + } + lastotr = &child->die_sib; + } + last = &child->die_sib; + } + + cu->u2.cu_largest_entry = nabbrevs; + diesize = calc_sizes (cu->cu_die); + cusize = headersz + tagsize + diesize + nchildren; + intracusize = size_of_uleb128 (cusize + intracu); + do + { + i = size_of_uleb128 (cusize + intracu * intracusize); + if (i == intracusize) + break; + intracusize = i; + } + while (1); + cu->initial_intracusize = intracusize; + off = init_new_die_offsets (cu->cu_die, headersz, intracusize); + do + { + intracuvec = intracuarr; + i = update_new_die_offsets (cu->cu_die, headersz, &intracuvec); + assert (*intracuvec == NULL); + if (i == off) + break; + assert (i < off); + off = i; + } + while (1); + if (cusize + intracu <= 256) + { + intracuform = DW_FORM_ref1; + intracusize = 1; + cusize += intracu; + } + else if (cusize + intracu * 2 <= 65536) + { + intracuform = DW_FORM_ref2; + intracusize = 2; + cusize += intracu * 2; + } + else + { + cusize += intracu * 4; + intracusize = 4; + } + if (off <= cusize) + { + intracuform = DW_FORM_ref_udata; + intracusize = 0; + cusize = off; + } + + intracuvec = intracuarr; + off = finalize_new_die_offsets (cu, cu->cu_die, headersz, intracusize, + &intracuvec); + if (off == -1U) + { + error (0, 0, "%s: DW_OP_call2 or typed DWARF stack referenced DIE" + " layed out at too big offset", dso->filename); + return 1; + } + assert (*intracuvec == NULL && off == cusize); + cu->cu_intracu_form = intracuform; + + if (intracuform != DW_FORM_ref4) + { + unsigned int j; + htab_empty (cu->cu_new_abbrev); + for (i = 0; i < nabbrevs; i++) + { + void **slot; + for (j = 0; j < arr[i]->nattr; j++) + if (arr[i]->attr[j].form == DW_FORM_ref4) + arr[i]->attr[j].form = intracuform; + compute_abbrev_hash (arr[i]); + slot = htab_find_slot_with_hash (cu->cu_new_abbrev, arr[i], + arr[i]->hash, INSERT); + if (slot == NULL) + dwz_oom (); + assert (slot != NULL && *slot == NULL); + *slot = arr[i]; + } + } + obstack_free (&ob, (void *) arr); + obstack_free (&ob2, (void *) intracuarr); + if (cu->cu_kind == CU_TYPES) + { + cu->cu_new_offset = types_size; + types_size += cusize; + } + else + { + cu->cu_new_offset = (wr_multifile ? multi_info_off : 0) + total_size; + total_size += cusize; + } + + if (unlikely (low_mem) && cu->cu_kind != CU_PU) + collapse_children (cu, cu->cu_die); + } + if (wr_multifile) + total_size += 11; /* See the end of write_info. */ + obstack_free (&ob2, (void *) t); + cuarr = (dw_cu_ref *) obstack_alloc (&ob2, ncus * sizeof (dw_cu_ref)); + for (cu = first_cu, i = 0; cu; cu = cu->cu_next) + if (cu->u1.cu_new_abbrev_owner == NULL + && (likely (!fi_multifile) + || cu->cu_kind != CU_NORMAL + || !cu->cu_die->die_remove)) + cuarr[i++] = cu; + assert (i == ncus); + qsort (cuarr, ncus, sizeof (dw_cu_ref), cu_abbrev_cmp); + /* For CUs with < 128 abbrevs, try to see if either all of the + abbrevs are at < 128 positions in >= 128 abbrev CUs, or + can be merged with some other small abbrev table to form + a < 128 abbrev table. */ + laststart = ncus - nlargeabbrevs; + for (i = ncus - 1; i != -1U; i--) + { + struct abbrev_tag **arr; + unsigned int nabbrevs, j, k, nattempts; + + if (cuarr[i]->u1.cu_new_abbrev_owner != NULL) + continue; + nabbrevs = htab_elements (cuarr[i]->cu_new_abbrev); + htab_traverse (cuarr[i]->cu_new_abbrev, list_abbrevs, &ob2); + assert (obstack_object_size (&ob2) == nabbrevs * sizeof (void *)); + arr = (struct abbrev_tag **) obstack_finish (&ob2); + if (nabbrevs >= 128) + { + nattempts = 0; + for (j = i + 1; j < ncus; j++) + { + unsigned int entry; + if (cuarr[j]->u1.cu_new_abbrev_owner) + continue; + if (++nattempts == 100) + break; + entry = cuarr[j]->u2.cu_largest_entry; + for (k = 0; k < nabbrevs; k++) + { + struct abbrev_tag *t + = htab_find_with_hash (cuarr[j]->cu_new_abbrev, + arr[k], arr[k]->hash); + if (t == NULL) + { + ++entry; + if (size_of_uleb128 (entry) + != size_of_uleb128 (arr[k]->entry)) + break; + } + else if (size_of_uleb128 (t->entry) + != size_of_uleb128 (arr[k]->entry)) + break; + } + if (k != nabbrevs) + continue; + entry = cuarr[j]->u2.cu_largest_entry; + for (k = 0; k < nabbrevs; k++) + { + void **slot + = htab_find_slot_with_hash (cuarr[j]->cu_new_abbrev, + arr[k], arr[k]->hash, + INSERT); + if (slot == NULL) + dwz_oom (); + if (*slot != NULL) + arr[k]->entry = ((struct abbrev_tag *) *slot)->entry; + else + { + struct abbrev_tag *newt; + arr[k]->entry = ++entry; + newt = pool_clone_abbrev (arr[k]); + *slot = newt; + } + } + cuarr[j]->u2.cu_largest_entry = entry; + cuarr[i]->u1.cu_new_abbrev_owner = cuarr[j]; + break; + } + obstack_free (&ob2, (void *) arr); + continue; + } + /* Don't search all CUs, that might be too expensive. So just search + 100 of >= 128 abbrev tables, if there are more than 100, different + set each time. We are looking for a full match (i.e. that + cuarr[i] abbrevs are a subset of cuarr[j] abbrevs, and all of them + are in the low positions. */ + for (j = laststart, nattempts = -1U; nlargeabbrevs; j++) + { + if (j == ncus) + j -= nlargeabbrevs; + if (nattempts != -1U && j == laststart) + break; + if (nattempts == -1U) + nattempts = 0; + if (cuarr[j]->u1.cu_new_abbrev_owner) + continue; + if (++nattempts == 100) + break; + for (k = 0; k < nabbrevs; k++) + { + struct abbrev_tag *t + = htab_find_with_hash (cuarr[j]->cu_new_abbrev, + arr[k], arr[k]->hash); + if (t == NULL || t->entry >= 128) + break; + } + if (k == nabbrevs) + { + for (k = 0; k < nabbrevs; k++) + { + struct abbrev_tag *t + = htab_find_with_hash (cuarr[j]->cu_new_abbrev, + arr[k], arr[k]->hash); + arr[k]->entry = t->entry; + } + cuarr[i]->u1.cu_new_abbrev_owner = cuarr[j]; + break; + } + } + if (nlargeabbrevs > 100) + laststart = j; + if (cuarr[i]->u1.cu_new_abbrev_owner == NULL) + { + unsigned int maxdups = 0, maxdupidx = 0; + /* Next search up to 100 of small abbrev CUs, looking + for best match. */ + nattempts = 0; + for (j = i + 1; j < ncus - nlargeabbrevs; j++) + { + unsigned int curdups = 0; + if (cuarr[j]->u1.cu_new_abbrev_owner) + continue; + if (++nattempts == 100) + break; + for (k = 0; k < nabbrevs; k++) + { + struct abbrev_tag *t + = htab_find_with_hash (cuarr[j]->cu_new_abbrev, + arr[k], arr[k]->hash); + if (t != NULL) + curdups++; + } + if (curdups > maxdups + && cuarr[j]->u2.cu_largest_entry - curdups + nabbrevs < 128) + { + maxdups = curdups; + maxdupidx = j; + if (maxdups == nabbrevs) + break; + } + } + if (maxdups) + { + unsigned int entry = cuarr[maxdupidx]->u2.cu_largest_entry; + j = maxdupidx; + for (k = 0; k < nabbrevs; k++) + { + void **slot + = htab_find_slot_with_hash (cuarr[j]->cu_new_abbrev, + arr[k], arr[k]->hash, + INSERT); + if (slot == NULL) + dwz_oom (); + if (*slot != NULL) + arr[k]->entry = ((struct abbrev_tag *) *slot)->entry; + else + { + struct abbrev_tag *newt; + arr[k]->entry = ++entry; + newt = pool_clone_abbrev (arr[k]); + *slot = newt; + } + } + cuarr[j]->u2.cu_largest_entry = entry; + cuarr[i]->u1.cu_new_abbrev_owner = cuarr[j]; + } + } + obstack_free (&ob2, (void *) arr); + } + obstack_free (&ob2, (void *) t); + for (cu = first_cu; cu; cu = cu->cu_next) + { + struct abbrev_tag **arr; + unsigned int nabbrevs, j; + + if (unlikely (fi_multifile) + && cu->cu_kind == CU_NORMAL + && cu->cu_die->die_remove) + continue; + if (cu->u1.cu_new_abbrev_owner != NULL) + { + cu->u2.cu_new_abbrev_offset = -1U; + if (cu->cu_new_abbrev) + htab_delete (cu->cu_new_abbrev); + cu->cu_new_abbrev = NULL; + continue; + } + cu->u2.cu_new_abbrev_offset + = (wr_multifile ? multi_abbrev_off : 0) + abbrev_size; + nabbrevs = htab_elements (cu->cu_new_abbrev); + htab_traverse (cu->cu_new_abbrev, list_abbrevs, &ob); + assert (obstack_object_size (&ob) == nabbrevs * sizeof (void *)); + arr = (struct abbrev_tag **) obstack_finish (&ob); + for (i = 0; i < nabbrevs; i++) + { + abbrev_size += size_of_uleb128 (arr[i]->entry); + abbrev_size += size_of_uleb128 (arr[i]->tag); + abbrev_size += 1; + for (j = 0; j < arr[i]->nattr; j++) + { + abbrev_size += size_of_uleb128 (arr[i]->attr[j].attr); + abbrev_size += size_of_uleb128 (arr[i]->attr[j].form); + if (arr[i]->attr[j].form == DW_FORM_implicit_const) + abbrev_size += size_of_sleb128 (arr[i]->values[j]); + } + abbrev_size += 2; + } + abbrev_size += 1; + obstack_free (&ob, (void *) arr); + } + for (cu = first_cu; cu; cu = cu->cu_next) + if (unlikely (fi_multifile) + && cu->cu_kind == CU_NORMAL + && cu->cu_die->die_remove) + continue; + else if (cu->u2.cu_new_abbrev_offset == -1U) + { + dw_cu_ref owner = cu; + unsigned int cu_new_abbrev_offset; + while (owner->u1.cu_new_abbrev_owner != NULL) + owner = owner->u1.cu_new_abbrev_owner; + cu_new_abbrev_offset = owner->u2.cu_new_abbrev_offset; + owner = cu; + while (owner->u1.cu_new_abbrev_owner != NULL) + { + owner->u2.cu_new_abbrev_offset = cu_new_abbrev_offset; + owner = owner->u1.cu_new_abbrev_owner; + } + } + debug_sections[DEBUG_INFO].new_size = total_size; + debug_sections[DEBUG_ABBREV].new_size = abbrev_size; + debug_sections[DEBUG_TYPES].new_size = types_size; + return 0; +} + +/* Comparison function, sort abbreviations by increasing + entry value. */ +static int +abbrev_entry_cmp (const void *p, const void *q) +{ + struct abbrev_tag *t1 = *(struct abbrev_tag **)p; + struct abbrev_tag *t2 = *(struct abbrev_tag **)q; + + if (t1->entry < t2->entry) + return -1; + if (t1->entry > t2->entry) + return 1; + return 0; +} + +/* Construct the new .debug_abbrev section + in malloced memory, store it as debug_sections[DEBUG_ABBREV].new_data. */ +static void +write_abbrev (void) +{ + dw_cu_ref cu; + unsigned char *abbrev = malloc (debug_sections[DEBUG_ABBREV].new_size); + unsigned char *ptr = abbrev; + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "write_abbrev\n"); + } + + if (abbrev == NULL) + dwz_oom (); + + debug_sections[DEBUG_ABBREV].new_data = abbrev; + for (cu = first_cu; cu; cu = cu->cu_next) + { + struct abbrev_tag **arr; + unsigned int nabbrevs, i, j; + + if (unlikely (fi_multifile) + && cu->cu_kind == CU_NORMAL + && cu->cu_die->die_remove) + continue; + if (cu->u1.cu_new_abbrev_owner != NULL) + continue; + nabbrevs = htab_elements (cu->cu_new_abbrev); + htab_traverse (cu->cu_new_abbrev, list_abbrevs, &ob); + assert (obstack_object_size (&ob) == nabbrevs * sizeof (void *)); + arr = (struct abbrev_tag **) obstack_finish (&ob); + qsort (arr, nabbrevs, sizeof (*arr), abbrev_entry_cmp); + for (i = 0; i < nabbrevs; i++) + { + write_uleb128 (ptr, arr[i]->entry); + write_uleb128 (ptr, arr[i]->tag); + *ptr++ = arr[i]->children ? DW_CHILDREN_yes : DW_CHILDREN_no; + for (j = 0; j < arr[i]->nattr; j++) + { + write_uleb128 (ptr, arr[i]->attr[j].attr); + write_uleb128 (ptr, arr[i]->attr[j].form); + if (arr[i]->attr[j].form == DW_FORM_implicit_const) + write_sleb128 (ptr, arr[i]->values[j]); + } + *ptr++ = 0; + *ptr++ = 0; + } + *ptr++ = 0; + obstack_free (&ob, (void *) arr); + if (likely (!low_mem)) + { + htab_delete (cu->cu_new_abbrev); + cu->cu_new_abbrev = NULL; + } + } + assert (abbrev + debug_sections[DEBUG_ABBREV].new_size == ptr); +} + +/* Adjust DWARF expression starting at PTR, LEN bytes long, referenced by + DIE, with REF being the original DIE. */ +static void +adjust_exprloc (dw_cu_ref cu, dw_die_ref die, dw_cu_ref refcu, + dw_die_ref ref, unsigned char *ptr, size_t len) +{ + unsigned char *end = ptr + len, *orig_ptr = NULL; + unsigned char op; + uint32_t leni; + GElf_Addr addr; + dw_die_ref refd, refdt; + + while (ptr < end) + { + op = *ptr++; + switch (op) + { + case DW_OP_addr: + ptr += ptr_size; + break; + case DW_OP_deref: + case DW_OP_dup: + case DW_OP_drop: + case DW_OP_over: + case DW_OP_swap: + case DW_OP_rot: + case DW_OP_xderef: + case DW_OP_abs: + case DW_OP_and: + case DW_OP_div: + case DW_OP_minus: + case DW_OP_mod: + case DW_OP_mul: + case DW_OP_neg: + case DW_OP_not: + case DW_OP_or: + case DW_OP_plus: + case DW_OP_shl: + case DW_OP_shr: + case DW_OP_shra: + case DW_OP_xor: + case DW_OP_eq: + case DW_OP_ge: + case DW_OP_gt: + case DW_OP_le: + case DW_OP_lt: + case DW_OP_ne: + case DW_OP_lit0 ... DW_OP_lit31: + case DW_OP_reg0 ... DW_OP_reg31: + case DW_OP_nop: + case DW_OP_push_object_address: + case DW_OP_form_tls_address: + case DW_OP_call_frame_cfa: + case DW_OP_stack_value: + case DW_OP_GNU_push_tls_address: + case DW_OP_GNU_uninit: + break; + case DW_OP_const1u: + case DW_OP_pick: + case DW_OP_deref_size: + case DW_OP_xderef_size: + case DW_OP_const1s: + ++ptr; + break; + case DW_OP_const2u: + case DW_OP_const2s: + case DW_OP_skip: + case DW_OP_bra: + ptr += 2; + break; + case DW_OP_call2: + case DW_OP_call4: + case DW_OP_GNU_parameter_ref: + if (op == DW_OP_call2) + addr = read_16 (ptr); + else + addr = read_32 (ptr); + refd = off_htab_lookup (refcu, refcu->cu_offset + addr); + assert (refd != NULL && !refd->die_remove); + if (op == DW_OP_call2) + { + assert (refd->u.p2.die_new_offset <= 65535); + ptr -= 2; + write_16 (ptr, refd->u.p2.die_new_offset); + } + else + { + ptr -= 4; + write_32 (ptr, refd->u.p2.die_new_offset); + } + break; + case DW_OP_const4u: + case DW_OP_const4s: + ptr += 4; + break; + case DW_OP_call_ref: + case DW_OP_GNU_implicit_pointer: + case DW_OP_implicit_pointer: + case DW_OP_GNU_variable_value: + addr = read_size (ptr, refcu->cu_version == 2 ? ptr_size : 4); + assert (cu->cu_version == refcu->cu_version); + refd = off_htab_lookup (NULL, addr); + assert (refd != NULL); + refdt = refd; + while (refdt->die_toplevel == 0) + refdt = refdt->die_parent; + if (refdt->die_dup && !refdt->die_op_type_referenced) + refd = die_find_dup (refdt, refdt->die_dup, refd); + write_size (ptr, cu->cu_version == 2 ? ptr_size : 4, + die_cu (refd)->cu_new_offset + + refd->u.p2.die_new_offset); + if (cu->cu_version == 2) + ptr += ptr_size; + else + ptr += 4; + if (op == DW_OP_GNU_implicit_pointer || op == DW_OP_implicit_pointer) + skip_leb128 (ptr); + break; + case DW_OP_const8u: + case DW_OP_const8s: + ptr += 8; + break; + case DW_OP_constu: + case DW_OP_plus_uconst: + case DW_OP_regx: + case DW_OP_piece: + case DW_OP_consts: + case DW_OP_breg0 ... DW_OP_breg31: + case DW_OP_fbreg: + skip_leb128 (ptr); + break; + case DW_OP_bregx: + case DW_OP_bit_piece: + skip_leb128 (ptr); + skip_leb128 (ptr); + break; + case DW_OP_implicit_value: + leni = read_uleb128 (ptr); + ptr += leni; + break; + case DW_OP_GNU_entry_value: + case DW_OP_entry_value: + leni = read_uleb128 (ptr); + assert ((uint64_t) (end - ptr) >= leni); + adjust_exprloc (cu, die, refcu, ref, ptr, leni); + ptr += leni; + break; + case DW_OP_GNU_convert: + case DW_OP_convert: + case DW_OP_GNU_reinterpret: + case DW_OP_reinterpret: + orig_ptr = ptr; + addr = read_uleb128 (ptr); + if (addr == 0) + break; + goto typed_dwarf; + case DW_OP_GNU_regval_type: + case DW_OP_regval_type: + skip_leb128 (ptr); + orig_ptr = ptr; + addr = read_uleb128 (ptr); + goto typed_dwarf; + case DW_OP_GNU_const_type: + case DW_OP_const_type: + orig_ptr = ptr; + addr = read_uleb128 (ptr); + goto typed_dwarf; + case DW_OP_GNU_deref_type: + case DW_OP_deref_type: + ++ptr; + orig_ptr = ptr; + addr = read_uleb128 (ptr); + typed_dwarf: + refd = off_htab_lookup (refcu, refcu->cu_offset + addr); + assert (refd != NULL && refd->die_op_type_referenced); + leni = ptr - orig_ptr; + assert (size_of_uleb128 (refd->u.p2.die_new_offset) <= leni); + ptr = orig_ptr; + write_uleb128 (ptr, refd->u.p2.die_new_offset); + /* If the new offset ends up being shorter uleb128 + encoded than the old, pad it up to make it still valid, + but not shortest, uleb128. Changing sizes of + exprloc would be a nightmare. Another alternative would + be to pad with DW_OP_nop after the op. */ + if (ptr < orig_ptr + leni) + { + ptr[-1] |= 0x80; + while (ptr < orig_ptr + leni - 1) + *ptr++ = 0x80; + *ptr++ = 0; + } + if (op == DW_OP_GNU_const_type || op == DW_OP_const_type) + ptr += *ptr + 1; + break; + default: + abort (); + } + } +} + +/* Write DW_TAG_unit_* DIE (with ORIGIN being the corresponding original DIE) to + memory starting at PTR, return pointer after the DIE. */ +static unsigned char * +write_unit_die (unsigned char *ptr, dw_die_ref die, dw_die_ref origin) +{ + struct abbrev_tag *t = die->u.p2.die_new_abbrev; + unsigned int i; + + for (i = 0; i < t->nattr; ++i) + { + struct abbrev_attr *attr = &t->attr[i]; + switch (attr->attr) + { + case DW_AT_stmt_list: + { + enum dwarf_form form; + unsigned char *p = get_AT (origin, DW_AT_stmt_list, &form); + assert (p && (form == DW_FORM_sec_offset + || form == DW_FORM_data4)); + if (wr_multifile) + write_32 (ptr, multi_line_off); + else if (op_multifile) + write_32 (ptr, 0); + else + { + memcpy (ptr, p, 4); + ptr += 4; + } + } + break; + case DW_AT_comp_dir: + { + enum dwarf_form form; + unsigned char *p = get_AT (origin, DW_AT_comp_dir, &form); + assert (p); + assert (form == attr->form + || (form == DW_FORM_strp + && (attr->form == DW_FORM_GNU_strp_alt + || attr->form == DW_FORM_strp_sup))); + if (form == DW_FORM_strp) + { + if (unlikely (wr_multifile || op_multifile || fi_multifile)) + { + unsigned int strp = lookup_strp_offset (read_32 (p)); + write_32 (ptr, strp); + } + else + { + memcpy (ptr, p, 4); + ptr += 4; + } + } + else if (form == DW_FORM_line_strp) + { + memcpy (ptr, p, 4); + ptr += 4; + } + else + { + size_t len = strlen ((char *) p) + 1; + memcpy (ptr, p, len); + ptr += len; + } + } + break; + case DW_AT_language: + { + enum dwarf_source_language lang = die_cu (die)->lang; + unsigned int lang_size = nr_bytes_for (lang); + write_size (ptr, lang_size, lang); + ptr += lang_size; + } + break; + default: + assert (false); + break; + } + } + + return ptr; +} + +/* Write DIE (with REF being the corresponding original DIE) to + memory starting at PTR, return pointer after the DIE. */ +static unsigned char * +write_die (unsigned char *ptr, dw_cu_ref cu, dw_die_ref die, + dw_cu_ref refcu, dw_die_ref ref, unsigned int *die_count) +{ + uint64_t low_pc = 0; + dw_die_ref child, sib = NULL, origin = NULL; + struct abbrev_tag *t; + + if (wr_multifile ? die->die_no_multifile : die->die_remove) + return ptr; + if (die_count) + (*die_count)++; + if (die->die_offset == -1U) + { + if (ref != NULL) + ; + else if (die_safe_nextdup (die) && die->die_nextdup->die_dup == die) + { + ref = die->die_nextdup; + refcu = die_cu (ref); + } + if (ref == NULL) + origin = die->die_nextdup; + } + else + { + ref = die; + refcu = cu; + if (wr_multifile + && (die->die_root || die->die_named_namespace)) + origin = die; + } + if (die->die_child && die->die_sib) + for (sib = die->die_sib; sib; sib = sib->die_sib) + if (wr_multifile ? !sib->die_no_multifile : !sib->die_remove) + break; + t = die->u.p2.die_new_abbrev; + write_uleb128 (ptr, t->entry); + if (ref != NULL && origin == NULL) + { + unsigned char *base + = cu->cu_kind == CU_TYPES + ? debug_sections[DEBUG_TYPES].data + : debug_sections[DEBUG_INFO].data; + unsigned char *inptr = base + ref->die_offset; + struct abbrev_tag *reft = ref->die_abbrev; + unsigned int i, j; + + skip_leb128 (inptr); + for (i = 0, j = 0; i < reft->nattr; ++i) + { + uint32_t form = reft->attr[i].form; + size_t len = 0; + uint64_t value; + unsigned char *orig_ptr = inptr; + + while (form == DW_FORM_indirect) + form = read_uleb128 (inptr); + + if (unlikely (wr_multifile || op_multifile) + && (reft->attr[i].attr == DW_AT_decl_file + || reft->attr[i].attr == DW_AT_call_file)) + { + switch (form) + { + case DW_FORM_data1: + value = read_8 (inptr); + break; + case DW_FORM_data2: + value = read_16 (inptr); + break; + case DW_FORM_data4: + value = read_32 (inptr); + break; + case DW_FORM_data8: + value = read_64 (inptr); + break; + case DW_FORM_udata: + value = read_uleb128 (inptr); + break; + case DW_FORM_sdata: + value = read_sleb128 (inptr); + break; + case DW_FORM_implicit_const: + /* DW_FORM_implicit_const should have been updated + already when computing abbrevs. */ + j++; + continue; + default: abort (); + } + value = line_htab_lookup (refcu, value); + switch (t->attr[j].form) + { + case DW_FORM_data1: write_8 (ptr, value); break; + case DW_FORM_data2: write_16 (ptr, value); break; + case DW_FORM_data4: write_32 (ptr, value); break; + case DW_FORM_data8: write_64 (ptr, value); break; + case DW_FORM_udata: write_uleb128 (ptr, value); break; + case DW_FORM_sdata: write_sleb128 (ptr, value); break; + default: abort (); + } + j++; + continue; + } + + if (unlikely (fi_multifile) + && (reft->attr[i].attr == DW_AT_GNU_macros + || reft->attr[i].attr == DW_AT_macros) + && alt_macro_htab != NULL) + { + struct macro_entry me, *m; + + memcpy (ptr, orig_ptr, inptr - orig_ptr); + ptr += inptr - orig_ptr; + value = read_32 (inptr); + me.ptr = debug_sections[DEBUG_MACRO].data + value; + m = (struct macro_entry *) + htab_find_with_hash (macro_htab, &me, value); + write_32 (ptr, m->hash); + j++; + continue; + } + + switch (form) + { + case DW_FORM_ref_addr: + { + dw_die_ref refd, refdt; + if (t->attr[j].form != DW_FORM_GNU_ref_alt + && t->attr[j].form != DW_FORM_ref_sup4) + { + memcpy (ptr, orig_ptr, inptr - orig_ptr); + ptr += inptr - orig_ptr; + } + value = read_size (inptr, refcu->cu_version == 2 + ? ptr_size : 4); + inptr += refcu->cu_version == 2 ? ptr_size : 4; + refd = off_htab_lookup (NULL, value); + if (refd == NULL || refd->die_tag == 0) + error (1, 0, "Couldn't find DIE at DW_FORM_ref_addr offset" + " 0x%" PRIx64, value); + assert (refd != NULL); + refdt = refd; + while (refdt->die_toplevel == 0) + refdt = refdt->die_parent; + if (refdt->die_dup && !refdt->die_op_type_referenced) + { + refd = die_find_dup (refdt, refdt->die_dup, refd); + if (t->attr[j].form == DW_FORM_GNU_ref_alt + || t->attr[j].form == DW_FORM_ref_sup4) + { + assert (die_cu (refd)->cu_kind == CU_ALT); + write_32 (ptr, refd->die_offset); + j++; + continue; + } + } + assert (refd->u.p2.die_new_offset + && t->attr[j].form != DW_FORM_GNU_ref_alt + && t->attr[j].form != DW_FORM_ref_sup4); + value = die_cu (refd)->cu_new_offset + + refd->u.p2.die_new_offset; + write_size (ptr, cu->cu_version == 2 ? ptr_size : 4, + value); + ptr += cu->cu_version == 2 ? ptr_size : 4; + if (unlikely (op_multifile)) + assert (die_cu (refd)->cu_kind == CU_PU); + j++; + continue; + } + case DW_FORM_addr: + inptr += ptr_size; + if (reft->attr[i].attr == DW_AT_low_pc) + low_pc = read_size (inptr - ptr_size, ptr_size); + if (reft->attr[i].attr == DW_AT_high_pc + && t->attr[j].form != reft->attr[i].form) + { + uint64_t high_pc = read_size (inptr - ptr_size, ptr_size); + switch (t->attr[j].form) + { + case DW_FORM_udata: + write_uleb128 (ptr, high_pc - low_pc); + break; + case DW_FORM_data4: + write_32 (ptr, high_pc - low_pc); + break; + default: + abort (); + } + j++; + continue; + } + break; + case DW_FORM_flag_present: + case DW_FORM_implicit_const: + break; + case DW_FORM_flag: + case DW_FORM_data1: + ++inptr; + break; + case DW_FORM_data2: + inptr += 2; + break; + case DW_FORM_data4: + if (reft->attr[i].attr == DW_AT_high_pc + && t->attr[j].form != reft->attr[i].form) + { + uint32_t range_len = read_32 (inptr); + switch (t->attr[j].form) + { + case DW_FORM_udata: + write_uleb128 (ptr, range_len); + break; + default: + abort (); + } + j++; + continue; + } + inptr += 4; + break; + case DW_FORM_sec_offset: + inptr += 4; + break; + case DW_FORM_data8: + if (reft->attr[i].attr == DW_AT_high_pc + && t->attr[j].form != reft->attr[i].form) + { + uint64_t range_len = read_64 (inptr); + switch (t->attr[j].form) + { + case DW_FORM_udata: + write_uleb128 (ptr, range_len); + break; + case DW_FORM_data4: + write_32 (ptr, range_len); + break; + default: + abort (); + } + j++; + continue; + } + inptr += 8; + break; + case DW_FORM_ref_sig8: + inptr += 8; + break; + case DW_FORM_data16: + inptr += 16; + break; + case DW_FORM_sdata: + case DW_FORM_udata: + skip_leb128 (inptr); + break; + case DW_FORM_strp: + if (unlikely (wr_multifile || op_multifile || fi_multifile)) + { + unsigned int strp = lookup_strp_offset (read_32 (inptr)); + memcpy (ptr, orig_ptr, inptr - 4 - orig_ptr); + ptr += inptr - 4 - orig_ptr; + write_32 (ptr, strp); + j++; + continue; + } + inptr += 4; + break; + case DW_FORM_line_strp: + inptr += 4; + break; + case DW_FORM_string: + inptr = (unsigned char *) strchr ((char *)inptr, '\0') + 1; + break; + case DW_FORM_indirect: + abort (); + case DW_FORM_block1: + len = *inptr++; + break; + case DW_FORM_block2: + len = read_16 (inptr); + form = DW_FORM_block1; + break; + case DW_FORM_block4: + len = read_32 (inptr); + form = DW_FORM_block1; + break; + case DW_FORM_block: + len = read_uleb128 (inptr); + form = DW_FORM_block1; + break; + case DW_FORM_exprloc: + len = read_uleb128 (inptr); + break; + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + case DW_FORM_ref_udata: + switch (form) + { + case DW_FORM_ref1: value = read_8 (inptr); break; + case DW_FORM_ref2: value = read_16 (inptr); break; + case DW_FORM_ref4: value = read_32 (inptr); break; + case DW_FORM_ref8: value = read_64 (inptr); break; + case DW_FORM_ref_udata: value = read_uleb128 (inptr); break; + default: abort (); + } + if (reft->attr[i].attr == DW_AT_sibling) + { + if (j == t->nattr + || t->attr[j].attr != DW_AT_sibling) + continue; + assert (sib); + value = sib->u.p2.die_new_offset; + } + else + { + dw_die_ref refdt, refd + = off_htab_lookup (refcu, refcu->cu_offset + value); + assert (refd != NULL); + refdt = refd; + while (refdt->die_toplevel == 0) + refdt = refdt->die_parent; + if (refdt->die_dup && refdt->die_op_type_referenced + && cu->cu_kind != CU_PU) + { + if (cu == die_cu (refdt->die_dup)) + refd = die_find_dup (refdt, refdt->die_dup, refd); + } + else if (refdt->die_dup) + refd = die_find_dup (refdt, refdt->die_dup, refd); + if (t->attr[j].form == DW_FORM_GNU_ref_alt + || t->attr[j].form == DW_FORM_ref_sup4) + { + value = refd->die_offset; + assert (die_cu (refd)->cu_kind == CU_ALT); + } + else + { + dw_cu_ref refdcu = die_cu (refd); + value = refd->u.p2.die_new_offset; + assert (IMPLIES (cu->cu_kind == CU_PU, + die_cu (refd)->cu_kind == CU_PU)); + assert (value && refdcu->cu_kind != CU_ALT); + if (t->attr[j].form == DW_FORM_ref_addr) + { + value += refdcu->cu_new_offset; + if (unlikely (op_multifile)) + assert (refdcu->cu_kind == CU_PU); + } + else + assert (refdcu == cu); + } + } + switch (t->attr[j].form) + { + case DW_FORM_ref1: write_8 (ptr, value); break; + case DW_FORM_ref2: write_16 (ptr, value); break; + case DW_FORM_ref4: write_32 (ptr, value); break; + case DW_FORM_ref_udata: write_uleb128 (ptr, value); break; + case DW_FORM_ref_addr: + write_size (ptr, cu->cu_version == 2 ? ptr_size : 4, + value); + ptr += cu->cu_version == 2 ? ptr_size : 4; + break; + case DW_FORM_GNU_ref_alt: + case DW_FORM_ref_sup4: + write_32 (ptr, value); + break; + case DW_FORM_ref_sup8: + write_64 (ptr, value); + break; + default: + abort (); + } + j++; + continue; + default: + abort (); + } + + if (form == DW_FORM_block1 || form == DW_FORM_exprloc) + inptr += len; + + memcpy (ptr, orig_ptr, inptr - orig_ptr); + ptr += inptr - orig_ptr; + + /* Old DWARF uses blocks instead of exprlocs. */ + if (form == DW_FORM_block1 && cu->cu_version < 4) + switch (reft->attr[i].attr) + { + case DW_AT_frame_base: + case DW_AT_location: + case DW_AT_data_member_location: + case DW_AT_vtable_elem_location: + case DW_AT_byte_size: + case DW_AT_bit_offset: + case DW_AT_bit_size: + case DW_AT_string_length: + case DW_AT_lower_bound: + case DW_AT_return_addr: + case DW_AT_bit_stride: + case DW_AT_upper_bound: + case DW_AT_count: + case DW_AT_segment: + case DW_AT_static_link: + case DW_AT_use_location: + case DW_AT_allocated: + case DW_AT_associated: + case DW_AT_data_location: + case DW_AT_byte_stride: + case DW_AT_rank: + case DW_AT_call_value: + case DW_AT_call_target: + case DW_AT_call_target_clobbered: + case DW_AT_call_data_location: + case DW_AT_call_data_value: + case DW_AT_GNU_call_site_value: + case DW_AT_GNU_call_site_data_value: + case DW_AT_GNU_call_site_target: + case DW_AT_GNU_call_site_target_clobbered: + adjust_exprloc (cu, die, refcu, ref, ptr - len, len); + default: + break; + } + else if (form == DW_FORM_exprloc) + adjust_exprloc (cu, die, refcu, ref, ptr - len, len); + j++; + } + assert (j == t->nattr); + } + else + switch (die->die_tag) + { + case DW_TAG_partial_unit: + case DW_TAG_compile_unit: + ptr = write_unit_die (ptr, die, origin); + break; + case DW_TAG_namespace: + case DW_TAG_module: + { + enum dwarf_form form; + unsigned char *p = get_AT (origin, DW_AT_name, &form); + assert (p && (form == t->attr[0].form + || (form == DW_FORM_strp + && (t->attr[0].form == DW_FORM_GNU_strp_alt + || t->attr[0].form == DW_FORM_strp_sup)))); + if (form == DW_FORM_strp) + { + if (unlikely (wr_multifile || op_multifile || fi_multifile)) + { + unsigned int strp = lookup_strp_offset (read_32 (p)); + write_32 (ptr, strp); + } + else + { + memcpy (ptr, p, 4); + ptr += 4; + } + } + else if (form == DW_FORM_line_strp) + { + memcpy (ptr, p, 4); + ptr += 4; + } + else + { + size_t len = strlen ((char *) p) + 1; + memcpy (ptr, p, len); + ptr += len; + } + if (t->nattr > 1) + { + assert (sib); + switch (t->attr[1].form) + { + case DW_FORM_ref1: + write_8 (ptr, sib->u.p2.die_new_offset); + break; + case DW_FORM_ref2: + write_16 (ptr, sib->u.p2.die_new_offset); + break; + case DW_FORM_ref4: + write_32 (ptr, sib->u.p2.die_new_offset); + break; + case DW_FORM_ref_udata: + write_uleb128 (ptr, sib->u.p2.die_new_offset); + break; + default: + abort (); + } + } + break; + } + case DW_TAG_imported_unit: + refcu = die_cu (origin); + if (t->attr[0].form == DW_FORM_GNU_ref_alt + || t->attr[0].form == DW_FORM_ref_sup4) + { + assert (refcu->cu_kind == CU_ALT); + write_32 (ptr, origin->die_offset); + break; + } + assert (refcu->cu_kind != CU_ALT); + write_size (ptr, cu->cu_version == 2 ? ptr_size : 4, + refcu->cu_new_offset + + origin->u.p2.die_new_offset); + ptr += cu->cu_version == 2 ? ptr_size : 4; + break; + default: + abort (); + } + if (ref != NULL && ref != die) + { + dw_die_ref ref_child; + for (child = die->die_child, ref_child = ref->die_child; + child; child = child->die_sib, ref_child = ref_child->die_sib) + ptr = write_die (ptr, cu, child, refcu, ref_child, die_count); + } + else + for (child = die->die_child; child; child = child->die_sib) + ptr = write_die (ptr, cu, child, NULL, NULL, die_count); + if (die->die_child) + write_8 (ptr, 0); + return ptr; +} + +/* Recompute abbrevs for CU. If any children were collapsed during + compute_abbrevs, their ->u.p2.die_new_abbrev and ->u.p2.die_new_offset + fields are no longer available and need to be computed again. */ +static void +recompute_abbrevs (dw_cu_ref cu, unsigned int cu_size) +{ + unsigned int headersz = (cu->cu_kind == CU_TYPES + ? 23 : (cu->cu_version >= 5 ? 12 : 11)); + struct abbrev_tag *t; + unsigned int ndies = 0, intracusize, off, i; + dw_die_ref *intracuarr, *intracuvec; + + t = (struct abbrev_tag *) + obstack_alloc (&ob2, + sizeof (*t) + + (max_nattr + 4) * sizeof (struct abbrev_attr) + + (max_nattr + 4) * sizeof (int64_t)); + t->values = (int64_t *) &t->attr[max_nattr + 4]; + + build_abbrevs_for_die (cu->u1.cu_new_abbrev_owner + ? cu->u1.cu_new_abbrev_owner->cu_new_abbrev + : cu->cu_new_abbrev, cu, cu->cu_die, NULL, NULL, t, + &ndies, &ob2, true); + + obstack_ptr_grow (&ob2, NULL); + intracuarr = (dw_die_ref *) obstack_finish (&ob2); + if (cu->cu_intracu_form != DW_FORM_ref_udata) + { + switch (cu->cu_intracu_form) + { + case DW_FORM_ref1: intracusize = 1; break; + case DW_FORM_ref2: intracusize = 2; break; + case DW_FORM_ref4: intracusize = 4; break; + default: abort (); + } + off = init_new_die_offsets (cu->cu_die, headersz, intracusize); + } + else + { + intracusize = cu->initial_intracusize; + + off = init_new_die_offsets (cu->cu_die, headersz, intracusize); + do + { + intracuvec = intracuarr; + i = update_new_die_offsets (cu->cu_die, headersz, &intracuvec); + assert (*intracuvec == NULL); + if (i == off) + break; + assert (i < off); + off = i; + } + while (1); + + intracuvec = intracuarr; + off = finalize_new_die_offsets (cu, cu->cu_die, headersz, 0, + &intracuvec); + assert (*intracuvec == NULL); + } + obstack_free (&ob2, (void *) t); + assert (off == cu_size); +} + +/* Construct new .debug_info section in malloced memory, + store it to debug_sections[DEBUG_INFO].new_data. */ +static void +write_info (unsigned int *die_count) +{ + dw_cu_ref cu, cu_next; + unsigned char *info = malloc (debug_sections[DEBUG_INFO].new_size); + unsigned char *ptr = info; + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "write_info\n"); + } + + if (info == NULL) + dwz_oom (); + if (die_count) + *die_count = 0; + debug_sections[DEBUG_INFO].new_data = info; + cu = first_cu; + if (unlikely (fi_multifile)) + while (cu + && cu->cu_kind == CU_NORMAL + && cu->cu_die->die_remove) + cu = cu->cu_next; + for (; cu; cu = cu_next) + { + unsigned long next_off = debug_sections[DEBUG_INFO].new_size; + /* Ignore .debug_types CUs. */ + if (cu->cu_kind == CU_TYPES) + break; + cu_next = cu->cu_next; + if (unlikely (fi_multifile)) + while (cu_next + && cu_next->cu_kind == CU_NORMAL + && cu_next->cu_die->die_remove) + cu_next = cu_next->cu_next; + if (cu_next && cu_next->cu_kind == CU_TYPES) + cu_next = NULL; + if (cu_next) + next_off = cu_next->cu_new_offset; + else if (wr_multifile) + next_off += multi_info_off - 11L; + if (unlikely (low_mem) + && cu->cu_kind != CU_PU + && expand_children (cu->cu_die)) + recompute_abbrevs (cu, next_off - cu->cu_new_offset); + /* Write CU header. */ + write_32 (ptr, next_off - cu->cu_new_offset - 4); + write_16 (ptr, cu->cu_version); + if (cu->cu_version >= 5) + { + *ptr++ = (cu->cu_die->die_tag == DW_TAG_compile_unit + ? DW_UT_compile : DW_UT_partial); + write_8 (ptr, ptr_size); + } + write_32 (ptr, cu->u2.cu_new_abbrev_offset); + if (cu->cu_version < 5) + write_8 (ptr, ptr_size); + ptr = write_die (ptr, cu, cu->cu_die, NULL, NULL, die_count); + assert (info + (next_off - (wr_multifile ? multi_info_off : 0)) == ptr); + if (unlikely (low_mem) && cu->cu_kind != CU_PU) + collapse_children (cu, cu->cu_die); + } + if (wr_multifile) + { + /* And terminate the contribution by the current object file. */ + write_32 (ptr, 7); + write_16 (ptr, 2); + write_32 (ptr, 0); + write_8 (ptr, ptr_size); + } + assert (info + debug_sections[DEBUG_INFO].new_size == ptr); +} + +/* Adjust .debug_loc range determined by *SLOT, called through + htab_traverse. */ +static int +adjust_loclist (void **slot, void *data) +{ + struct debug_loc_adjust *adj = (struct debug_loc_adjust *) *slot; + unsigned char *ptr, *endsec; + GElf_Addr low, high; + size_t len; + + (void)data; + + ptr = debug_sections[DEBUG_LOC].new_data + adj->start_offset; + endsec = ptr + debug_sections[DEBUG_LOC].size; + while (ptr < endsec) + { + low = read_size (ptr, ptr_size); + high = read_size (ptr + ptr_size, ptr_size); + ptr += 2 * ptr_size; + if (low == 0 && high == 0) + break; + + if (low == ~ (GElf_Addr) 0 || (ptr_size == 4 && low == 0xffffffff)) + continue; + + len = read_16 (ptr); + assert (ptr + len <= endsec); + + adjust_exprloc (adj->cu, adj->cu->cu_die, adj->cu, adj->cu->cu_die, + ptr, len); + + ptr += len; + } + + return 1; +} + +/* Adjust .debug_loclists range determined by *SLOT, called through + htab_traverse. */ +static int +adjust_loclists (void **slot, void *data) +{ + struct debug_loc_adjust *adj = (struct debug_loc_adjust *) *slot; + unsigned char *ptr, *endsec; + size_t len = 0; + + (void)data; + + ptr = debug_sections[DEBUG_LOCLISTS].new_data + adj->start_offset; + endsec = ptr + debug_sections[DEBUG_LOCLISTS].size; + +again: + while (ptr < endsec) + { + uint8_t lle = *ptr++; + switch (lle) + { + case DW_LLE_end_of_list: + goto done; + + case DW_LLE_base_addressx: + skip_leb128 (ptr); + goto again; + + case DW_LLE_startx_endx: + skip_leb128 (ptr); + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_startx_length: + skip_leb128 (ptr); + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_offset_pair: + skip_leb128 (ptr); + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_default_location: + len = read_uleb128 (ptr); + break; + + case DW_LLE_base_address: + ptr += ptr_size; + goto again; + + case DW_LLE_start_end: + ptr += 2 * ptr_size; + len = read_uleb128 (ptr); + break; + + case DW_LLE_start_length: + ptr += ptr_size; + skip_leb128 (ptr); + len = read_uleb128 (ptr); + break; + + case DW_LLE_GNU_view_pair: + /* Note we cannot check CU version here, but we'll get a + warning on the original parsing if CU version is not 5.*/ + skip_leb128 (ptr); + skip_leb128 (ptr); + goto again; + + default: + error (0, 0, "unhandled location list entry 0x%x", lle); + return 1; + } + + assert (ptr + len <= endsec); + + adjust_exprloc (adj->cu, adj->cu->cu_die, adj->cu, adj->cu->cu_die, + ptr, len); + + ptr += len; + } + +done: + return 1; +} + +/* Create new .debug_loc section in malloced memory if .debug_loc + needs to be adjusted. */ +static void +write_loc (void) +{ + unsigned char *loc; + if (loc_htab == NULL) + return; + loc = malloc (debug_sections[DEBUG_LOC].size); + if (loc == NULL) + dwz_oom (); + memcpy (loc, debug_sections[DEBUG_LOC].data, debug_sections[DEBUG_LOC].size); + debug_sections[DEBUG_LOC].new_data = loc; + htab_traverse (loc_htab, adjust_loclist, NULL); +} + +/* Create new .debug_loclists section in malloced memory if .debug_loclists + needs to be adjusted. */ +static void +write_loclists (void) +{ + unsigned char *loc; + if (loclists_htab == NULL) + return; + loc = malloc (debug_sections[DEBUG_LOCLISTS].size); + if (loc == NULL) + dwz_oom (); + memcpy (loc, debug_sections[DEBUG_LOCLISTS].data, + debug_sections[DEBUG_LOCLISTS].size); + debug_sections[DEBUG_LOCLISTS].new_data = loc; + htab_traverse (loclists_htab, adjust_loclists, NULL); +} + +/* Create new .debug_types section in malloced memory. */ +static void +write_types (void) +{ + dw_cu_ref cu; + unsigned char *types, *ptr, *inptr; + dw_die_ref ref; + + if (debug_sections[DEBUG_TYPES].data == NULL) + return; + types = malloc (debug_sections[DEBUG_TYPES].new_size); + if (types == NULL) + dwz_oom (); + debug_sections[DEBUG_TYPES].new_data = types; + ptr = types; + for (cu = first_cu; cu; cu = cu->cu_next) + { + unsigned long next_off = debug_sections[DEBUG_TYPES].new_size; + /* Ignore .debug_info CUs. */ + if (cu->cu_kind != CU_TYPES) + continue; + if (cu->cu_next) + next_off = cu->cu_next->cu_new_offset; + if (unlikely (low_mem) + && expand_children (cu->cu_die)) + recompute_abbrevs (cu, next_off - cu->cu_new_offset); + /* Write CU header. */ + write_32 (ptr, next_off - cu->cu_new_offset - 4); + write_16 (ptr, cu->cu_version); + write_32 (ptr, cu->u2.cu_new_abbrev_offset); + write_8 (ptr, ptr_size); + inptr = debug_sections[DEBUG_TYPES].data + cu->cu_offset + 19; + memcpy (ptr, inptr - 8, 8); + ptr += 8; + ref = off_htab_lookup (cu, cu->cu_offset + read_32 (inptr)); + assert (ref && die_safe_dup(ref) == NULL); + write_32 (ptr, ref->u.p2.die_new_offset); + ptr = write_die (ptr, cu, cu->cu_die, NULL, NULL, NULL); + assert (types + next_off == ptr); + if (unlikely (low_mem)) + collapse_children (cu, cu->cu_die); + } + assert (types + debug_sections[DEBUG_TYPES].new_size == ptr); +} + +/* Construct new .debug_aranges section in malloced memory, + store it to debug_sections[DEBUG_ARANGES].new_data. */ +static int +write_aranges (DSO *dso) +{ + dw_cu_ref cu, cufirst = NULL, cucur; + unsigned char *aranges, *ptr, *end; + + if (debug_sections[DEBUG_ARANGES].data == NULL) + return 0; + + aranges = malloc (debug_sections[DEBUG_ARANGES].size); + if (aranges == NULL) + dwz_oom (); + memcpy (aranges, debug_sections[DEBUG_ARANGES].data, + debug_sections[DEBUG_ARANGES].size); + debug_sections[DEBUG_ARANGES].new_data = aranges; + ptr = aranges; + end = aranges + debug_sections[DEBUG_ARANGES].size; + for (cu = first_cu; cu; cu = cu->cu_next) + if (cu->cu_kind != CU_PU) + break; + cufirst = cu; + while (ptr < end) + { + unsigned int culen, value, cuoff; + + if (end - ptr < 12) + { + error (0, 0, "%s: Corrupted .debug_aranges section", + dso->filename); + return 1; + } + culen = read_32 (ptr); + if (culen >= 0xfffffff0) + { + error (0, 0, "%s: 64-bit DWARF not supported", dso->filename); + return 1; + } + + value = read_16 (ptr); + if (value != 2) + { + error (0, 0, "%s: DWARF version %d in .debug_aranges unhandled", + dso->filename, value); + return 1; + } + + cuoff = read_32 (ptr); + cucur = cu; + /* Optimistically assume that .debug_aranges CU offsets only increase, + otherwise this might be too expensive and need a hash table. */ + for (; cu; cu = cu->cu_next) + { + if (cu->cu_kind == CU_TYPES) + { + cu = NULL; + break; + } + else if (cu->cu_offset == cuoff) + break; + } + if (cu == NULL) + { + for (cu = cufirst; cu != cucur; cu = cu->cu_next) + if (cu->cu_offset == cuoff) + break; + if (cu == cucur) + { + error (0, 0, "%s: Couldn't find CU for .debug_aranges " + "offset 0x%x", dso->filename, cuoff); + return 1; + } + } + if (unlikely (fi_multifile) + && cu->cu_kind == CU_NORMAL + && cu->cu_die->die_remove) + { + error (0, 0, "%s: Partial unit referenced in .debug_aranges", + dso->filename); + return 1; + } + ptr -= 4; + write_32 (ptr, cu->cu_new_offset); + ptr += culen - 6; + } + return 0; +} + +/* Helper function of write_gdb_index, called through qsort. + Sort an array of unsigned integer pairs, by increasing + first integer. The first integer is the TU offset + in the .gdb_index TU table, the second is its index in + the TU table from the start of that table. */ +static int +gdb_index_tu_cmp (const void *p, const void *q) +{ + unsigned int *t1 = (unsigned int *) p; + unsigned int *t2 = (unsigned int *) q; + + if (t1[0] < t2[0]) + return -1; + if (t1[0] > t2[0]) + return 1; + + if (t1[1] < t2[1]) + return -1; + if (t1[1] > t2[1]) + return 1; + return 0; +} + +/* Construct new .gdb_index section in malloced memory + if it needs adjustment. */ +static void +write_gdb_index (void) +{ + dw_cu_ref cu, cu_next, first_tu = NULL; + unsigned char *gdb_index, *ptr, *inptr, *end; + unsigned int ncus = 0, npus = 0, ntus = 0, ndelcus = 0, ver; + unsigned int culistoff, cutypesoff, addressoff, symboloff, constoff; + unsigned int *tuindices = NULL, tuidx = 0, *cumap = NULL, i, j, k; + bool fail = false; + + debug_sections[GDB_INDEX].new_size = 0; + if (likely (!op_multifile) + && (debug_sections[GDB_INDEX].data == NULL + || debug_sections[GDB_INDEX].size < 0x18)) + return; + inptr = (unsigned char *) debug_sections[GDB_INDEX].data; + if (unlikely (op_multifile)) + ver = multi_gdb_index_ver; + else + ver = buf_read_ule32 (inptr); + if (ver < 4 || ver > 8) + return; + + for (cu = first_cu; cu; cu = cu->cu_next) + if (cu->cu_kind == CU_PU) + npus++; + else if (cu->cu_kind == CU_NORMAL) + { + ncus++; + if (unlikely (fi_multifile) && cu->cu_die->die_remove) + ndelcus++; + } + else if (cu->cu_kind == CU_TYPES) + ntus++; + + /* Starting with version 7 CU indexes are limited to 24 bits, + so if we have more CUs, give up. */ + if (npus + ncus + ntus - ndelcus >= (1U << 24)) + return; + + if (unlikely (op_multifile)) + { + assert (ncus == 0 && ntus == 0); + debug_sections[GDB_INDEX].new_size + = 0x18 + npus * 16 + 16; + gdb_index = malloc (debug_sections[GDB_INDEX].new_size); + if (gdb_index == NULL) + dwz_oom (); + debug_sections[GDB_INDEX].new_data = gdb_index; + /* Write new header. */ + buf_write_le32 (gdb_index + 0x00, ver); + buf_write_le32 (gdb_index + 0x04, 0x18); + buf_write_le32 (gdb_index + 0x08, 0x18 + npus * 16); + buf_write_le32 (gdb_index + 0x0c, 0x18 + npus * 16); + buf_write_le32 (gdb_index + 0x10, 0x18 + npus * 16); + buf_write_le32 (gdb_index + 0x14, 0x18 + npus * 16 + 16); + ptr = gdb_index + 0x18; + /* Write new CU list. */ + for (cu = first_cu; cu; cu = cu->cu_next) + { + unsigned long next_off = debug_sections[DEBUG_INFO].new_size; + if (cu->cu_next) + next_off = cu->cu_next->cu_new_offset; + buf_write_le64 (ptr, cu->cu_new_offset); + buf_write_le64 (ptr + 8, next_off - cu->cu_new_offset); + ptr += 16; + } + /* Write an empty hash table (with two entries). */ + memset (ptr, '\0', 16); + return; + } + + culistoff = buf_read_ule32 (inptr + 0x04); + cutypesoff = buf_read_ule32 (inptr + 0x08); + addressoff = buf_read_ule32 (inptr + 0x0c); + symboloff = buf_read_ule32 (inptr + 0x10); + constoff = buf_read_ule32 (inptr + 0x14); + if (culistoff != 0x18 + || cutypesoff != 0x18 + ncus * 16 + || addressoff != cutypesoff + ntus * 24 + || symboloff < addressoff + || ((symboloff - addressoff) % 20) != 0 + || constoff < symboloff + || ((constoff - symboloff) & (constoff - symboloff - 1)) != 0 + || ((constoff - symboloff) & 7) != 0 + || debug_sections[GDB_INDEX].size < constoff) + return; + inptr += 0x18; + if (ndelcus) + cumap = (unsigned int *) + obstack_alloc (&ob2, ncus * sizeof (unsigned int)); + for (cu = first_cu, i = 0, j = 0; cu; cu = cu->cu_next) + if (cu->cu_kind == CU_NORMAL) + { + if (buf_read_ule64 (inptr) != cu->cu_offset) + { + if (cumap) + obstack_free (&ob2, (void *) cumap); + return; + } + inptr += 16; + if (cumap) + { + if (cu->cu_die->die_remove) + cumap[i++] = -1U; + else + cumap[i++] = j++; + } + } + else if (cu->cu_kind == CU_TYPES) + { + if (tuindices == NULL) + { + tuindices = (unsigned int *) + obstack_alloc (&ob2, ntus * 2 * sizeof (unsigned int)); + first_tu = cu; + } + tuindices[2 * tuidx] = buf_read_ule64 (inptr); + tuindices[2 * tuidx + 1] = tuidx * 24; + tuidx++; + inptr += 24; + } + if (ntus) + { + qsort (tuindices, ntus, 2 * sizeof (unsigned int), gdb_index_tu_cmp); + for (tuidx = 0, cu = first_tu; tuidx < ntus; tuidx++, cu = cu->cu_next) + if (tuindices[2 * tuidx] != cu->cu_offset) + { + if (cumap) + obstack_free (&ob2, (void *) cumap); + else + obstack_free (&ob2, (void *) tuindices); + return; + } + } + + if (multifile + && !fi_multifile + && !low_mem + && multi_gdb_index_ver < ver) + multi_gdb_index_ver = ver; + + debug_sections[GDB_INDEX].new_size + = debug_sections[GDB_INDEX].size + npus * 16 - ndelcus * 16; + gdb_index = malloc (debug_sections[GDB_INDEX].new_size); + if (gdb_index == NULL) + dwz_oom (); + debug_sections[GDB_INDEX].new_data = gdb_index; + /* Write new header. */ + buf_write_le32 (gdb_index + 0x00, ver); + buf_write_le32 (gdb_index + 0x04, culistoff); + buf_write_le32 (gdb_index + 0x08, cutypesoff + npus * 16 - ndelcus * 16); + buf_write_le32 (gdb_index + 0x0c, addressoff + npus * 16 - ndelcus * 16); + buf_write_le32 (gdb_index + 0x10, symboloff + npus * 16 - ndelcus * 16); + buf_write_le32 (gdb_index + 0x14, constoff + npus * 16 - ndelcus * 16); + ptr = gdb_index + 0x18; + /* Write new CU list. */ + for (cu = first_cu; cu; cu = cu_next) + { + unsigned long next_off = debug_sections[DEBUG_INFO].new_size; + if (cu->cu_kind == CU_TYPES) + break; + cu_next = cu->cu_next; + if (unlikely (fi_multifile)) + { + while (cu_next + && cu_next->cu_kind == CU_NORMAL + && cu_next->cu_die->die_remove) + cu_next = cu_next->cu_next; + if (cu->cu_die->die_remove) + continue; + } + if (cu_next && cu_next->cu_kind != CU_TYPES) + next_off = cu_next->cu_new_offset; + buf_write_le64 (ptr, cu->cu_new_offset); + buf_write_le64 (ptr + 8, next_off - cu->cu_new_offset); + ptr += 16; + } + /* Write new TU list. */ + for (tuidx = 0; cu; cu = cu->cu_next, tuidx++) + { + unsigned char *p; + unsigned int tuoff = tuindices[2 * tuidx + 1]; + dw_die_ref ref; + assert (cu->cu_kind == CU_TYPES); + buf_write_le64 (ptr + tuoff, cu->cu_new_offset); + p = debug_sections[DEBUG_TYPES].data + cu->cu_offset + 19; + ref = off_htab_lookup (cu, cu->cu_offset + read_32 (p)); + assert (ref && ref->die_dup == NULL); + buf_write_le64 (ptr + tuoff + 8, ref->u.p2.die_new_offset); + p -= 12; + buf_write_le64 (ptr + tuoff + 16, read_64 (p)); + } + ptr += ntus * 24; + end = inptr + (symboloff - addressoff); + /* Copy address area, adjusting all CU indexes. */ + while (inptr < end) + { + memcpy (ptr, inptr, 16); + i = buf_read_ule32 (inptr + 16); + if (cumap && i < ncus) + { + if (cumap[i] == -1U) + fail = true; + i = cumap[i] + npus; + } + else + i += npus - ndelcus; + buf_write_le32 (ptr + 16, i); + ptr += 20; + inptr += 20; + } + /* Copy the symbol hash table. */ + memcpy (ptr, inptr, constoff - symboloff); + /* Clear the const pool initially. */ + memset (ptr + (constoff - symboloff), '\0', + debug_sections[GDB_INDEX].size - constoff); + ptr = ptr + (constoff - symboloff); + end = inptr + (constoff - symboloff); + /* Finally copy over const objects into the const pool, strings as is, + CU vectors with CU indexes adjusted. */ + while (inptr < end) + { + unsigned int name = buf_read_ule32 (inptr); + unsigned int cuvec = buf_read_ule32 (inptr + 4); + + inptr += 8; + if (name == 0 && cuvec == 0) + continue; + if (name > debug_sections[GDB_INDEX].size - constoff - 1 + || cuvec > debug_sections[GDB_INDEX].size - constoff - 4) + { + fail: + free (gdb_index); + debug_sections[GDB_INDEX].new_size = 0; + return; + } + if (ptr[name] == '\0') + { + unsigned char *strend = end + name; + while (*strend != '\0') + { + if (strend + 1 + == end + (debug_sections[GDB_INDEX].size - constoff)) + goto fail; + strend++; + } + memcpy (ptr + name, end + name, strend + 1 - (end + name)); + } + if (buf_read_ule32 (ptr + cuvec) == 0) + { + unsigned int count = buf_read_ule32 (end + cuvec); + if (count * 4 + > debug_sections[GDB_INDEX].size - constoff - cuvec - 4) + goto fail; + buf_write_le32 (ptr + cuvec, count); + for (i = 0; i < count; i++) + { + j = buf_read_ule32 (end + cuvec + (i + 1) * 4); + if (ver >= 7) + k = j & ((1U << 24) - 1); + else + k = j; + if (cumap && k < ncus) + { + if (cumap[k] == -1U) + fail = true; + k = cumap[k] + npus; + } + else + k += npus - ndelcus; + if (ver >= 7) + j = (j & (~0U << 24)) | k; + else + j = k; + buf_write_le32 (ptr + cuvec + (i + 1) * 4, j); + } + } + } + if (cumap) + obstack_free (&ob2, (void *) cumap); + else if (tuindices) + obstack_free (&ob2, (void *) tuindices); + if (fail) + { + free (debug_sections[GDB_INDEX].new_data); + debug_sections[GDB_INDEX].new_data = NULL; + debug_sections[GDB_INDEX].new_size = 0; + } +} + +/* Return a string from section SEC at offset OFFSET. */ +static const char * +strptr (DSO *dso, int sec, off_t offset) +{ + Elf_Scn *scn; + Elf_Data *data; + + scn = dso->scn[sec]; + if (offset >= 0 && (GElf_Addr) offset < dso->shdr[sec].sh_size) + { + data = NULL; + while ((data = elf_rawdata (scn, data)) != NULL) + { + if (data->d_buf + && offset >= data->d_off + && offset < (off_t) (data->d_off + data->d_size)) + return (const char *) data->d_buf + (offset - data->d_off); + } + } + + return NULL; +} + +/* Initialize do_read_* and do_write_* callbacks based on + ENDIANITY. */ +static void +init_endian (int endianity) +{ + if (endianity == ELFDATA2LSB) + { + do_read_16 = buf_read_ule16; + do_read_32 = buf_read_ule32; + do_read_64 = buf_read_ule64; + do_write_16 = buf_write_le16; + do_write_32 = buf_write_le32; + do_write_64 = buf_write_le64; + } + else if (endianity == ELFDATA2MSB) + { + do_read_16 = buf_read_ube16; + do_read_32 = buf_read_ube32; + do_read_64 = buf_read_ube64; + do_write_16 = buf_write_be16; + do_write_32 = buf_write_be32; + do_write_64 = buf_write_be64; + } + else + abort (); +} + +/* Read DWARF sections from DSO. */ +static int +read_dwarf (DSO *dso, bool quieter, unsigned int *die_count) +{ + Elf_Data *data; + Elf_Scn *scn; + int i, j; + + for (i = 1; i < dso->ehdr.e_shnum; ++i) + if (! (dso->shdr[i].sh_flags & (SHF_ALLOC | SHF_WRITE | SHF_EXECINSTR)) + && dso->shdr[i].sh_size) + { + const char *name = strptr (dso, dso->ehdr.e_shstrndx, + dso->shdr[i].sh_name); + + if (strncmp (name, ".debug_", sizeof (".debug_") - 1) == 0 + || strcmp (name, ".gdb_index") == 0 + || strcmp (name, ".gnu_debugaltlink") == 0) + { + if (dso->shdr[i].sh_flags & SHF_COMPRESSED) + { + error (0, 0, + "%s: Found compressed %s section, not attempting dwz" + " compression", + dso->filename, name); + return 1; + } + for (j = 0; debug_sections[j].name; ++j) + if (strcmp (name, debug_sections[j].name) == 0) + { + if (debug_sections[j].data) + { + error (0, 0, "%s: Found two copies of %s section", + dso->filename, name); + return 1; + } + + scn = dso->scn[i]; + data = elf_rawdata (scn, NULL); + assert (data != NULL); + if (data->d_buf == NULL) + { + error (0, 0, "%s: Found empty %s section, not attempting" + " dwz compression", dso->filename, name); + return 1; + } + assert (elf_rawdata (scn, data) == NULL); + assert (data->d_off == 0); + assert (data->d_size == dso->shdr[i].sh_size); + debug_sections[j].data = data->d_buf; + debug_sections[j].size = data->d_size; + debug_sections[j].new_size = data->d_size; + debug_sections[j].sec = i; + break; + } + + if (debug_sections[j].name == NULL) + { + error (0, 0, "%s: Unknown debugging section %s", + dso->filename, name); + return 1; + } + } + } + + if (dso->ehdr.e_ident[EI_DATA] == ELFDATA2LSB + || dso->ehdr.e_ident[EI_DATA] == ELFDATA2MSB) + init_endian (dso->ehdr.e_ident[EI_DATA]); + else + { + error (0, 0, "%s: Wrong ELF data encoding", dso->filename); + return 1; + } + + if (debug_sections[DEBUG_INFO].data == NULL + && !rd_multifile) + { + if (!quieter) + error (0, 0, "%s: .debug_info section not present", + dso->filename); + return 3; + } + + if (debug_sections[DEBUG_SUP].data != NULL && !(dwarf_5 && rd_multifile)) + { + error (0, 0, "%s: .debug_sup section already present", + dso->filename); + return 1; + } + + if (debug_sections[GNU_DEBUGALTLINK].data != NULL) + { + error (0, 0, "%s: .gnu_debugaltlink section already present", + dso->filename); + return 1; + } + + int res; + res = read_debug_info (dso, DEBUG_INFO, die_count); + if (res == 0 && stats_p) + print_parse_stats (); + return res; +} + +/* Open an ELF file NAME. */ +static DSO * +fdopen_dso (int fd, const char *name) +{ + Elf *elf = NULL; + GElf_Ehdr ehdr; + int i; + DSO *dso = NULL; + + elf = elf_begin (fd, ELF_C_READ_MMAP, NULL); + if (elf == NULL) + { + error (0, 0, "cannot open ELF file: %s", elf_errmsg (-1)); + goto error_out; + } + + if (elf_kind (elf) != ELF_K_ELF) + { + error (0, 0, "\"%s\" is not an ELF file", name); + goto error_out; + } + + if (gelf_getehdr (elf, &ehdr) == NULL) + { + error (0, 0, "cannot get the ELF header: %s", + elf_errmsg (-1)); + goto error_out; + } + + if (ehdr.e_type != ET_DYN && ehdr.e_type != ET_EXEC + && (!rd_multifile || ehdr.e_type != ET_REL)) + { + error (0, 0, "\"%s\" is not a shared library", name); + goto error_out; + } + + /* Allocate DSO structure. */ + dso = (DSO *) + malloc (sizeof(DSO) + ehdr.e_shnum * sizeof(GElf_Shdr) + + ehdr.e_shnum * sizeof(Elf_Scn *) + + strlen (name) + 1); + if (!dso) + { + error (0, ENOMEM, "Could not open DSO"); + goto error_out; + } + + elf_flagelf (elf, ELF_C_SET, ELF_F_LAYOUT | ELF_F_PERMISSIVE); + + memset (dso, 0, sizeof(DSO)); + dso->elf = elf; + dso->ehdr = ehdr; + dso->scn = (Elf_Scn **) &dso->shdr[ehdr.e_shnum]; + + for (i = 0; i < ehdr.e_shnum; ++i) + { + dso->scn[i] = elf_getscn (elf, i); + gelf_getshdr (dso->scn[i], dso->shdr + i); + } + + dso->filename = (const char *) &dso->scn[ehdr.e_shnum]; + strcpy ((char *) &dso->scn[ehdr.e_shnum], name); + return dso; + +error_out: + free (dso); + if (elf) + elf_end (elf); + if (fd != -1) + close (fd); + return NULL; +} + +/* Implicit arg for compare_section_numbers. Could be passed in as explicit arg + when using qsort_r instead. */ +static DSO *compare_section_numbers_implicit_arg; + +/* Helper function for sort_section_numbers. */ +static int +compare_section_numbers (const void *p1, const void *p2) +{ + DSO *dso = compare_section_numbers_implicit_arg; + const int i1 = *(const int *)p1; + const int i2 = *(const int *)p2; + GElf_Off o1; + GElf_Off o2; + + /* Keep element 0 at 0. */ + if (i1 == 0 || i2 == 0) + { + if (i1 == i2) + return 0; + if (i1 == 0) + return -1; + if (i2 == 0) + return 1; + } + + /* Get file offsets. */ + o1 = (i1 == dso->ehdr.e_shnum + ? dso->ehdr.e_shoff + : dso->shdr[i1].sh_offset); + o2 = (i2 == dso->ehdr.e_shnum + ? dso->ehdr.e_shoff + : dso->shdr[i2].sh_offset); + + /* Compare file offsets. */ + if (o1 < o2) + return -1; + if (o1 > o2) + return 1; + + /* In case file offset is the same, keep the original relative order. */ + if (i1 < i2) + return -1; + if (i1 > i2) + return 1; + + return 0; +} + +/* Sort SORTED_SECTION_NUMBERS in file offset order. */ +static void +sort_section_numbers (DSO *dso, unsigned int *sorted_section_numbers) +{ + unsigned int i; + unsigned int nr_sections = dso->ehdr.e_shnum; + + /* Treat section header table as another section, with index + dso->ehdr.e_shnum. */ + nr_sections += 1; + + for (i = 0; i < nr_sections; ++i) + sorted_section_numbers[i] = i; + + compare_section_numbers_implicit_arg = dso; + qsort (sorted_section_numbers, nr_sections, + sizeof (sorted_section_numbers[0]), compare_section_numbers); + compare_section_numbers_implicit_arg = NULL; + + assert (sorted_section_numbers[0] == 0); +} + +/* Verify file offset and size of sections and section header table. */ +static void +verify_sections (DSO *dso, unsigned int *sorted_section_numbers, + GElf_Off *distance, int addsec, GElf_Off addsize, + GElf_Ehdr ehdr) +{ + int i, j; + int prev, update_prev; + GElf_Off offset, prev_offset, prev_size; + GElf_Off section_header_table_size + = dso->ehdr.e_shentsize * ehdr.e_shnum; + + prev = -1; + for (i = 1; i < (dso->ehdr.e_shnum + 1); ++i, prev = update_prev) + { + j = sorted_section_numbers[i]; + + if (j != dso->ehdr.e_shnum && dso->shdr[j].sh_type == SHT_NOBITS) + { + update_prev = prev; + continue; + } + update_prev = j; + + if (prev == -1) + continue; + + offset = (j == dso->ehdr.e_shnum + ? ehdr.e_shoff + : dso->shdr[j].sh_offset); + + prev_offset = (prev == dso->ehdr.e_shnum + ? ehdr.e_shoff + : dso->shdr[prev].sh_offset); + + prev_size = (prev == dso->ehdr.e_shnum + ? section_header_table_size + : (dso->shdr[prev].sh_type == SHT_NOBITS + ? 0 + : dso->shdr[prev].sh_size)); + + if (distance != NULL) + assert ((prev_offset + prev_size + distance[prev] + + (prev == addsec ? addsize : 0)) + == offset); + else + assert ((prev_offset + prev_size + (prev == addsec ? addsize : 0)) + <= offset); + } +} + +/* Calculate distance between sections and section header table. */ +static int +calculate_section_distance (DSO *dso, unsigned int *sorted_section_numbers, + GElf_Off *distance) +{ + int i, j; + int prev, update_prev; + GElf_Off offset, prev_offset, prev_size; + GElf_Off section_header_table_size + = dso->ehdr.e_shentsize * dso->ehdr.e_shnum; + + prev = -1; + for (i = 1; i < (dso->ehdr.e_shnum + 1); ++i, prev = update_prev) + { + j = sorted_section_numbers[i]; + + if (j != dso->ehdr.e_shnum && dso->shdr[j].sh_type == SHT_NOBITS) + { + update_prev = prev; + continue; + } + update_prev = j; + + if (prev == -1) + continue; + + offset = (j == dso->ehdr.e_shnum + ? dso->ehdr.e_shoff + : dso->shdr[j].sh_offset); + + prev_offset = (prev == dso->ehdr.e_shnum + ? dso->ehdr.e_shoff + : dso->shdr[prev].sh_offset); + + prev_size = (prev == dso->ehdr.e_shnum + ? section_header_table_size + : dso->shdr[prev].sh_size); + + if (prev_offset + prev_size > offset) + { + error (0, 0, "Section overlap detected"); + if (prev == dso->ehdr.e_shnum) + error (0, 0, "Section header table: [0x%llx, 0x%llx)", + (unsigned long long)prev_offset, + (unsigned long long)(prev_offset + prev_size)); + else + error (0, 0, "Section %d: [0x%llx, 0x%llx)", j, + (unsigned long long)prev_offset, + (unsigned long long)(prev_offset + prev_size)); + if (j == dso->ehdr.e_shnum) + error (0, 0, "Section header table: 0x%llx", + (unsigned long long)offset); + else + error (0, 0, "Section %d: 0x%llx", j, (unsigned long long)offset); + return 1; + } + + distance[prev] = offset - (prev_offset + prev_size); + } + + verify_sections (dso, sorted_section_numbers, distance, -1, 0, dso->ehdr); + + return 0; +} + +/* Store new ELF into FILE. debug_sections array contains + new_data/new_size pairs where needed. */ +static int +write_dso (DSO *dso, const char *file, struct stat *st, bool save_to_temp) +{ + Elf *elf = NULL; + GElf_Ehdr ehdr; + GElf_Off min_shoff = ~(GElf_Off) 0; + char *e_ident; + int fd, i, j, addsec = -1, ret; + GElf_Off off, diff, addsize = 0; + char *filename = NULL; + GElf_Word shstrtabadd = 0; + char *shstrtab = NULL; + bool remove_sections[SECTION_COUNT]; + GElf_Off distance[dso->ehdr.e_shnum + 1]; + /* Array of sections and section header table sorted by file offset. */ + unsigned int sorted_section_numbers[dso->ehdr.e_shnum + 1]; + GElf_Off old_sh_offset[dso->ehdr.e_shnum]; + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "write_dso\n"); + } + + for (i = 1; i < dso->ehdr.e_shnum; ++i) + old_sh_offset[i] = dso->shdr[i].sh_offset; + + memset (remove_sections, '\0', sizeof (remove_sections)); + ehdr = dso->ehdr; + + sort_section_numbers (dso, sorted_section_numbers); + if (calculate_section_distance (dso, sorted_section_numbers, distance)) + return 1; + + for (i = 0; debug_sections[i].name; i++) + if (debug_sections[i].new_size != debug_sections[i].size) + { + if (debug_sections[i].size == 0 + && debug_sections[i].sec == 0) + { + unsigned int len; + if (addsec == -1) + for (j = 0; debug_sections[j].name; j++) + if (debug_sections[j].new_size + && debug_sections[j].sec + && debug_sections[j].sec > addsec) + addsec = debug_sections[j].sec; + ehdr.e_shnum++; + if (ehdr.e_shoff < min_shoff) + min_shoff = ehdr.e_shoff; + for (j = 1; j < dso->ehdr.e_shnum; ++j) + { + if (dso->shdr[j].sh_offset > ehdr.e_shoff) + dso->shdr[j].sh_offset += ehdr.e_shentsize; + if (dso->shdr[j].sh_link > (unsigned int) addsec) + dso->shdr[j].sh_link++; + if ((dso->shdr[j].sh_type == SHT_REL + || dso->shdr[j].sh_type == SHT_RELA + || (dso->shdr[j].sh_flags & SHF_INFO_LINK)) + && dso->shdr[j].sh_info + > (unsigned int) addsec) + dso->shdr[j].sh_info++; + } + if (dso->ehdr.e_shstrndx > addsec) + ehdr.e_shstrndx++; + len = strlen (debug_sections[i].name) + 1; + dso->shdr[dso->ehdr.e_shstrndx].sh_size += len; + if (dso->shdr[dso->ehdr.e_shstrndx].sh_offset < min_shoff) + min_shoff = dso->shdr[dso->ehdr.e_shstrndx].sh_offset; + for (j = 1; j < dso->ehdr.e_shnum; ++j) + if (dso->shdr[j].sh_offset + > dso->shdr[dso->ehdr.e_shstrndx].sh_offset) + dso->shdr[j].sh_offset += len; + if (ehdr.e_shoff > dso->shdr[dso->ehdr.e_shstrndx].sh_offset) + ehdr.e_shoff += len; + shstrtabadd += len; + diff = debug_sections[i].new_size; + addsize += diff; + off = dso->shdr[addsec].sh_offset; + } + else + { + diff = (GElf_Off) debug_sections[i].new_size + - (GElf_Off) dso->shdr[debug_sections[i].sec].sh_size; + off = dso->shdr[debug_sections[i].sec].sh_offset; + } + if (off < min_shoff) + min_shoff = off; + for (j = 1; j < dso->ehdr.e_shnum; ++j) + if (dso->shdr[j].sh_offset > off) + dso->shdr[j].sh_offset += diff; + if (ehdr.e_shoff > off) + ehdr.e_shoff += diff; + dso->shdr[debug_sections[i].sec].sh_size + = debug_sections[i].new_size; + if (debug_sections[i].new_size == 0) + { + remove_sections[i] = true; + ehdr.e_shnum--; + if (ehdr.e_shoff < min_shoff) + min_shoff = ehdr.e_shoff; + for (j = 1; j < dso->ehdr.e_shnum; ++j) + { + if (dso->shdr[j].sh_offset > ehdr.e_shoff) + dso->shdr[j].sh_offset -= ehdr.e_shentsize; + if (dso->shdr[j].sh_link + > (unsigned int) debug_sections[i].sec) + dso->shdr[j].sh_link--; + if ((dso->shdr[j].sh_type == SHT_REL + || dso->shdr[j].sh_type == SHT_RELA + || (dso->shdr[j].sh_flags & SHF_INFO_LINK)) + && dso->shdr[j].sh_info + > (unsigned int) debug_sections[i].sec) + dso->shdr[j].sh_info--; + } + if (dso->ehdr.e_shstrndx > debug_sections[i].sec) + ehdr.e_shstrndx--; + } + } + + /* Verify that we did not change section layout, by checking that the + distances between sections and section header table remained the same. */ + verify_sections (dso, sorted_section_numbers, distance, addsec, addsize, + ehdr); + + if (min_shoff != ~(GElf_Off) 0) + { + for (j = 1; j < dso->ehdr.e_shnum; ++j) + if (dso->shdr[j].sh_offset >= min_shoff + && dso->shdr[j].sh_addralign > 1 + && (dso->shdr[j].sh_offset & (dso->shdr[j].sh_addralign - 1)) != 0) + break; + if (j < dso->ehdr.e_shnum + || (ehdr.e_shoff >= min_shoff + && (ehdr.e_shoff & (ehdr.e_ident[EI_CLASS] == ELFCLASS64 + ? 7 : 3)) != 0)) + { + /* Need to fix up sh_offset/e_shoff. Punt if all the sections + >= min_shoff aren't non-ALLOC. */ + GElf_Off last_shoff = 0; + int k = -1; + int l; + for (l = 1; l <= dso->ehdr.e_shnum; ++l) + { + j = sorted_section_numbers[l]; + if (j == dso->ehdr.e_shnum) + continue; + else if (!last_shoff + && (dso->shdr[j].sh_offset < min_shoff + || (dso->shdr[j].sh_offset == min_shoff + && (dso->shdr[j].sh_size == 0 + || dso->shdr[j].sh_type == SHT_NOBITS)))) + continue; + else if (dso->shdr[j].sh_type == SHT_NOBITS) + continue; + else if ((dso->shdr[j].sh_flags & SHF_ALLOC) != 0) + { + error (0, 0, "Allocatable section in %s after " + "non-allocatable ones", dso->filename); + return 1; + } + else + { + assert (dso->shdr[j].sh_offset >= last_shoff); + + if (k == -1) + k = l; + last_shoff = dso->shdr[j].sh_offset + dso->shdr[j].sh_size; + } + } + last_shoff = min_shoff; + for (l = k; l <= dso->ehdr.e_shnum; ++l) + { + j = sorted_section_numbers[l]; + if (j == dso->ehdr.e_shnum) + { + if (ehdr.e_ident[EI_CLASS] == ELFCLASS64) + ehdr.e_shoff = (last_shoff + 7) & -8; + else + ehdr.e_shoff = (last_shoff + 3) & -4; + last_shoff = ehdr.e_shoff + ehdr.e_shnum * ehdr.e_shentsize; + continue; + } + /* Ignore SHT_NOBITS sections. */ + if (dso->shdr[j].sh_type == SHT_NOBITS) + continue; + dso->shdr[j].sh_offset = last_shoff; + if (dso->shdr[j].sh_addralign > 1) + dso->shdr[j].sh_offset + = (last_shoff + dso->shdr[j].sh_addralign - 1) + & ~(dso->shdr[j].sh_addralign - (GElf_Off) 1); + last_shoff = dso->shdr[j].sh_offset + dso->shdr[j].sh_size; + if (addsec != -1 && j == addsec) + last_shoff += addsize; + } + } + } + + for (i = 1; i < dso->ehdr.e_shnum; ++i) + if (dso->shdr[i].sh_type == SHT_NOBITS) + dso->shdr[i].sh_offset = old_sh_offset[i]; + + verify_sections (dso, sorted_section_numbers, NULL, addsec, addsize, + ehdr); + + if (shstrtabadd != 0) + { + shstrtab = (char *) malloc (dso->shdr[dso->ehdr.e_shstrndx].sh_size); + if (shstrtab == NULL) + { + error (0, ENOMEM, "Failed to adjust .shstrtab for %s", + dso->filename); + return 1; + } + } + + if (file == NULL) + { + size_t len = strlen (dso->filename); + filename = alloca (len + sizeof (".#dwz#.XXXXXX")); + memcpy (filename, dso->filename, len); + memcpy (filename + len, ".#dwz#.XXXXXX", sizeof (".#dwz#.XXXXXX")); + fd = mkstemp (filename); + file = (const char *) filename; + if (fd == -1) + { + error (0, errno, "Failed to create temporary file for %s", + dso->filename); + free (shstrtab); + return 1; + } + } + else + { + fd = open (file, O_RDWR | O_CREAT, 0600); + if (fd == -1) + { + error (0, errno, "Failed to open %s for writing", file); + free (shstrtab); + return 1; + } + } + + elf = elf_begin (fd, ELF_C_WRITE, NULL); + if (elf == NULL) + { + error (0, 0, "cannot open ELF file: %s", elf_errmsg (-1)); + unlink (file); + close (fd); + free (shstrtab); + return 1; + } + + /* Some gelf_newehdr implementations don't return the resulting + ElfNN_Ehdr, so we have to do it the hard way instead of: + e_ident = (char *) gelf_newehdr (elf, gelf_getclass (dso->elf)); */ + switch (gelf_getclass (dso->elf)) + { + case ELFCLASS32: + e_ident = (char *) elf32_newehdr (elf); + break; + case ELFCLASS64: + e_ident = (char *) elf64_newehdr (elf); + break; + default: + e_ident = NULL; + break; + } + + if (e_ident == NULL + /* This is here just for the gelfx wrapper, so that gelf_update_ehdr + already has the correct ELF class. */ + || memcpy (e_ident, dso->ehdr.e_ident, EI_NIDENT) == NULL + || gelf_update_ehdr (elf, &ehdr) == 0 + || gelf_newphdr (elf, ehdr.e_phnum) == 0) + { + error (0, 0, "Could not create new ELF headers"); + unlink (file); + elf_end (elf); + close (fd); + free (shstrtab); + return 1; + } + elf_flagelf (elf, ELF_C_SET, ELF_F_LAYOUT | ELF_F_PERMISSIVE); + for (i = 0; i < ehdr.e_phnum; ++i) + { + GElf_Phdr *phdr, phdr_mem; + phdr = gelf_getphdr (dso->elf, i, &phdr_mem); + gelf_update_phdr (elf, i, phdr); + } + + for (i = 1; i < dso->ehdr.e_shnum; ++i) + { + Elf_Scn *scn; + Elf_Data *data1, *data2; + + for (j = 0; debug_sections[j].name; j++) + if (i == debug_sections[j].sec) + break; + if (debug_sections[j].name && remove_sections[j]) + continue; + scn = elf_newscn (elf); + elf_flagscn (scn, ELF_C_SET, ELF_F_DIRTY); + gelf_update_shdr (scn, &dso->shdr[i]); + data1 = elf_getdata (dso->scn[i], NULL); + data2 = elf_newdata (scn); + memcpy (data2, data1, sizeof (*data1)); + if (debug_sections[j].name + && debug_sections[j].new_data != NULL) + { + data2->d_buf = debug_sections[j].new_data; + data2->d_size = dso->shdr[i].sh_size; + } + if (i == dso->ehdr.e_shstrndx && shstrtabadd) + { + memcpy (shstrtab, data1->d_buf, + dso->shdr[dso->ehdr.e_shstrndx].sh_size + - shstrtabadd); + data2->d_buf = shstrtab; + data2->d_size = dso->shdr[i].sh_size; + } + if (i == addsec) + { + GElf_Word sh_name = dso->shdr[dso->ehdr.e_shstrndx].sh_size + - shstrtabadd; + GElf_Shdr shdr; + + off = dso->shdr[i].sh_offset + dso->shdr[i].sh_size; + for (j = 0; debug_sections[j].name; j++) + if (debug_sections[j].new_size + && debug_sections[j].size == 0 + && debug_sections[j].sec == 0) + { + scn = elf_newscn (elf); + elf_flagscn (scn, ELF_C_SET, ELF_F_DIRTY); + memset (&shdr, '\0', sizeof (shdr)); + shdr.sh_name = sh_name; + sh_name += strlen (debug_sections[j].name) + 1; + strcpy (shstrtab + shdr.sh_name, debug_sections[j].name); + shdr.sh_type = SHT_PROGBITS; + shdr.sh_offset = off; + shdr.sh_size = debug_sections[j].new_size; + shdr.sh_addralign = 1; + off += shdr.sh_size; + gelf_update_shdr (scn, &shdr); + data2 = elf_newdata (scn); + data2->d_buf = debug_sections[j].new_data; + data2->d_type = ELF_T_BYTE; + data2->d_version = EV_CURRENT; + data2->d_size = shdr.sh_size; + data2->d_off = 0; + data2->d_align = 1; + } + } + } + + if (elf_update (elf, ELF_C_WRITE_MMAP) == -1) + { + error (0, 0, "%s: elf_update failed", dso->filename); + unlink (file); + elf_end (elf); + close (fd); + free (shstrtab); + return 1; + } + + if (elf_end (elf) < 0) + { + error (0, 0, "elf_end failed: %s", elf_errmsg (elf_errno ())); + unlink (file); + elf_end (elf); + close (fd); + free (shstrtab); + return 1; + } + + free (shstrtab); + ret = fchown (fd, st->st_uid, st->st_gid); + fchmod (fd, st->st_mode & 07777); + close (fd); + + if (filename != NULL && rename (filename, dso->filename)) + { + error (0, errno, "Failed to rename temporary file over %s", + dso->filename); + unlink (file); + /* | (ret & 1) to silence up __wur warning for fchown. */ + return 1 | (ret & 1); + } + if (save_to_temp) + { + const char *prefix = "dwz."; + size_t buf_len = strlen (prefix) + strlen (dso->filename) + 1; + char *buf = (char *)alloca (buf_len); + size_t offset = 0; + strcpy (&buf[offset], prefix); + offset += strlen (prefix); + strcpy (&buf[offset], dso->filename); + offset += strlen (dso->filename); + assert (offset == buf_len - 1); + assert (buf[offset] == '\0'); + unlink (buf); + if (link (dso->filename, buf) != 0) + { + error (0, errno, "Failed to link file: %s", dso->filename); + return 1; + } + } + return 0; +} + +/* Free memory and clear global variables. */ +static void +cleanup (void) +{ + dw_cu_ref cu; + unsigned int i; + + for (cu = first_cu; cu; cu = cu->cu_next) + { + if (cu->cu_new_abbrev) + htab_delete (cu->cu_new_abbrev); + cu->cu_new_abbrev = NULL; + } + if (off_htab != NULL) + { + if (tracing) + htab_report (off_htab, "off_htab final"); + htab_delete (off_htab); + } + off_htab = NULL; + if (types_off_htab != NULL) + htab_delete (types_off_htab); + types_off_htab = NULL; + if (loc_htab != NULL) + htab_delete (loc_htab); + loc_htab = NULL; + if (loclists_htab != NULL) + htab_delete (loclists_htab); + loclists_htab = NULL; + if (dup_htab != NULL) + htab_delete (dup_htab); + dup_htab = NULL; + if (strp_htab != NULL) + htab_delete (strp_htab); + strp_htab = NULL; + if (line_htab != NULL) + htab_delete (line_htab); + line_htab = NULL; + if (macro_htab != NULL) + htab_delete (macro_htab); + macro_htab = NULL; + if (meta_abbrev_htab != NULL) + htab_delete (meta_abbrev_htab); + meta_abbrev_htab = NULL; + + for (i = 0; i < SAVED_SECTIONS; ++i) + { + free (saved_new_data[i]); + saved_new_data[i] = NULL; + } + + obstack_free (&ob2, NULL); + obstack_free (&ob, NULL); + memset (&ob2, '\0', sizeof (ob2)); + memset (&ob, '\0', sizeof (ob2)); + die_nontoplevel_freelist = NULL; + die_collapsed_child_freelist = NULL; + pool_destroy (NULL); + first_cu = NULL; + last_cu = NULL; + ptr_size = 0; + max_nattr = 0; + do_read_16 = NULL; + do_read_32 = NULL; + do_read_64 = NULL; + do_write_16 = NULL; + do_write_32 = NULL; + do_write_64 = NULL; + edge_freelist = NULL; + multifile_mode = 0; + max_strp_off = 0; + max_line_id = 0; +} + +/* Propagate the die_no_multifile property along the duplicate chain of which + DIE is a member. If the property was changed on any die, set *CHANGED to + true. */ +static void +propagate_multifile_duplicate_chain (dw_die_ref die, bool *changed) +{ + dw_die_ref dup = first_dup (die); + if (!dup) + return; + + while (dup && dup->die_offset == -1U) + dup = dup->die_nextdup; + if (dup != die) + return; + + bool any_no_multifile = false; + bool any_multifile = false; + bool prop_needed = false; + dw_die_ref d; + for (d = dup; d && !prop_needed; d = d->die_nextdup) + { + if (d->die_no_multifile) + any_no_multifile = true; + else + any_multifile = true; + prop_needed = any_no_multifile && any_multifile; + } + if (!prop_needed) + return; + + *changed = true; + + for (d = dup; d; d = d->die_nextdup) + d->die_no_multifile = 1; +} + +/* Propagate the die_no_multifile property backwards along the outgoing + references of DIE, which is a member of CU and of the subtree of lower + toplevel die TOP_DIE. If the property was changed on any die, set *CHANGED + to true. */ +static void +propagate_multifile_refs_backward (dw_cu_ref cu, dw_die_ref top_die, + dw_die_ref die, bool *changed) +{ + struct abbrev_tag *t = die->die_abbrev; + unsigned int i; + unsigned char *ptr; + dw_die_ref child; + + if (die->die_offset == -1U) + return; + + ptr = debug_sections[DEBUG_INFO].data + die->die_offset; + skip_leb128 (ptr); + for (i = 0; i < t->nattr; ++i) + { + uint32_t form = t->attr[i].form; + uint64_t value; + dw_die_ref ref, reft; + + while (form == DW_FORM_indirect) + form = read_uleb128 (ptr); + + switch (form) + { + case DW_FORM_ref_addr: + value = read_size (ptr, cu->cu_version == 2 ? ptr_size : 4); + ptr += cu->cu_version == 2 ? ptr_size : 4; + ref = off_htab_lookup (cu, value); + goto finish_ref; + break; + case DW_FORM_ref_udata: + case DW_FORM_ref1: + case DW_FORM_ref2: + case DW_FORM_ref4: + case DW_FORM_ref8: + switch (form) + { + case DW_FORM_ref_udata: value = read_uleb128 (ptr); break; + case DW_FORM_ref1: value = read_8 (ptr); break; + case DW_FORM_ref2: value = read_16 (ptr); break; + case DW_FORM_ref4: value = read_32 (ptr); break; + case DW_FORM_ref8: value = read_64 (ptr); break; + default: abort (); + } + if (t->attr[i].attr == DW_AT_sibling) + break; + ref = off_htab_lookup (cu, cu->cu_offset + value); + finish_ref: + reft = ref; + while (!reft->die_root + && reft->die_parent->die_tag != DW_TAG_compile_unit + && reft->die_parent->die_tag != DW_TAG_partial_unit + && !reft->die_parent->die_named_namespace) + reft = reft->die_parent; + if (reft->die_root) + ; + else if (reft->die_ck_state == CK_KNOWN + && !top_die->die_no_multifile && reft->die_no_multifile) + { + top_die->die_no_multifile = 1; + *changed = true; + } + break; + default: + ptr = skip_attr_no_dw_form_indirect (cu->cu_version, form, ptr); + } + } + + for (child = die->die_child; child; child = child->die_sib) + propagate_multifile_refs_backward (cu, top_die, child, changed); +} + +/* Do propagation of the die_no_multifile property that was not covered in + checksum_die and checksum_ref_die. */ +static void +propagate_multifile (void) +{ + bool changed; + dw_cu_ref cu; + dw_die_ref die; + + changed = false; + + FOREACH_CU_NORMAL_LOW_TOPLEVEL_DIE (cu, die) + propagate_multifile_duplicate_chain (die, &changed); + + if (!changed) + return; + + do + { + changed = false; + + FOREACH_CU_NORMAL_LOW_TOPLEVEL_DIE (cu, die) + propagate_multifile_refs_backward (cu, die, die, &changed); + + FOREACH_CU_NORMAL_LOW_TOPLEVEL_DIE (cu, die) + propagate_multifile_duplicate_chain (die, &changed); + } + while (changed); +} + +/* Returns true if DIE contains any toplevel children that can be + potentially shared between different executables or shared libraries. */ +static bool +check_multifile (dw_die_ref die) +{ + dw_die_ref child; + + die->die_no_multifile = 1; + for (child = die->die_child; child; child = child->die_sib) + if (child->die_named_namespace) + { + if (check_multifile (child)) + die->die_no_multifile = 0; + } + else if (child->die_offset == -1U) + { + if (child->die_nextdup && child->die_nextdup->die_dup == child) + { + if (child->die_nextdup->die_ck_state == CK_KNOWN + && child->die_nextdup->die_no_multifile == 0) + { + child->die_no_multifile = 0; + die->die_no_multifile = 0; + } + else + child->die_no_multifile = 1; + } + else + child->die_no_multifile = 1; + } + else + { + child->die_op_type_referenced = 0; + if (child->die_dup == NULL + && child->die_ck_state == CK_KNOWN + && child->die_no_multifile == 0) + die->die_no_multifile = 0; + else + child->die_no_multifile = 1; + } + return die->die_no_multifile == 0; +} + +/* Helper function for write_multifile_strp to sort strp_entry + by increasing new_off. */ +static int +strp_off_cmp (const void *p, const void *q) +{ + struct strp_entry *s1 = *(struct strp_entry **)p; + struct strp_entry *s2 = *(struct strp_entry **)q; + if (s1->new_off < s2->new_off) + return -1; + if (s1->new_off > s2->new_off) + return 1; + return 0; +} + +/* Write tail optimized strings into the temporary .debug_str file. */ +static int +write_multifile_strp (void) +{ + unsigned int count = htab_elements (strp_htab), i, buf_alloc, buf_size; + struct strp_entry **arr = (struct strp_entry **) + obstack_alloc (&ob, count * sizeof (*arr)); + struct strp_entry **end = arr; + unsigned char *buf; + int ret = 0; + + htab_traverse (strp_htab, list_strp_entries, (void *) &end); + assert (arr + count == end); + qsort (arr, count, sizeof (struct strp_entry *), strp_off_cmp); + buf_alloc = max_strp_off - debug_sections[DEBUG_STR].size; + if (buf_alloc > 131072) + buf_alloc = 131072; + buf = (unsigned char *) obstack_alloc (&ob, buf_alloc); + buf_size = 0; + for (i = 0; i < count; i++) + { + unsigned char *p = debug_sections[DEBUG_STR].data + arr[i]->off; + unsigned int len = strlen ((char *) p) + 1; + if (buf_alloc - buf_size < len) + { + if (buf_size + && write (multi_str_fd, buf, buf_size) != (ssize_t) buf_size) + { + ret = 1; + break; + } + buf_size = 0; + if (buf_alloc < len) + { + if (write (multi_str_fd, p, len) != (ssize_t) len) + { + ret = 1; + break; + } + continue; + } + } + memcpy (buf + buf_size, p, len); + buf_size += len; + } + if (buf_size + && ret == 0 + && write (multi_str_fd, buf, buf_size) != (ssize_t) buf_size) + ret = 1; + obstack_free (&ob, (void *) arr); + return ret; +} + +/* Hold some statistics on the line entries so we know whether to emit + time and/or sizes. Used by list_line_entries used by + write_multifile_line. */ +struct line_stats +{ + struct line_entry ***end; + bool has_time; + bool has_size; +}; + +/* Helper to find the end of the line_htab entries and other stats. + Called through htab_traverse. */ +static int +list_line_entries (void **slot, void *data) +{ + struct line_stats *stats = (struct line_stats *) data; + struct line_entry *entry = (struct line_entry *) *slot; + struct line_entry ***end = stats->end; + **end = entry; + (*end)++; + if (entry->file->time != 0) + stats->has_time = true; + if (entry->file->size != 0) + stats->has_size = true; + return 1; +} + +/* Helper function for write_multifile_strp to sort line_entry + by increasing new_id. */ +static int +line_id_cmp (const void *p, const void *q) +{ + struct line_entry *s1 = *(struct line_entry **)p; + struct line_entry *s2 = *(struct line_entry **)q; + if (s1->new_id < s2->new_id) + return -1; + if (s1->new_id > s2->new_id) + return 1; + return 0; +} + +/* Write a minimal .debug_line entry. If not op_multifile, write it + into the temporary .debug_line file (if line_htab is non-NULL, fill + its directory and file table from it, otherwise emit an entry + with no directories or files), if op_multifile, store the entry + into debug_sections[DEBUG_LINE].new_data which it allocates. */ +static int +write_multifile_line (void) +{ + unsigned int filecnt = 0, dircnt = 0, filetbllen = 0, dirtbllen = 0; + unsigned int header_len, len, i, j; + unsigned char *line, *ptr; + struct line_entry **filearr = NULL; + struct line_stats line_stats; + unsigned int *diridx = NULL, *dirarr = NULL; + unsigned char buf[45]; /* Max header_len, see below. */ + int ret = 0; + + line_stats.has_time = line_stats.has_size = false; + if (line_htab) + { + struct line_entry **end; + filecnt = htab_elements (line_htab); + filearr = (struct line_entry **) + obstack_alloc (&ob, filecnt * sizeof (*filearr)); + end = filearr; + line_stats.end = &end; + htab_traverse (line_htab, list_line_entries, (void *) &line_stats); + assert (filearr + filecnt == end); + diridx = (unsigned int *) + obstack_alloc (&ob, filecnt * sizeof (*diridx)); + qsort (filearr, filecnt, sizeof (struct line_entry *), line_id_cmp); + for (i = 0; i < filecnt; i++) + { + unsigned int direntrylen = 0; + const char *file = filearr[i]->file->file; + if (filearr[i]->file->dir == NULL) + { + const char *r = strrchr (file, '/'), *s; + + j = 0; + direntrylen = r ? r - file : 0; + while (direntrylen && file[direntrylen - 1] == '/') + direntrylen--; + if (direntrylen) + { + direntrylen++; + for (j = 0; j < dircnt; j++) + if (filearr[dirarr[j]]->file->dir == NULL + && strncmp (filearr[dirarr[j]]->file->file, + file, direntrylen) == 0) + { + s = filearr[dirarr[j]]->file->file + direntrylen; + while (*s == '/') + s++; + if (strchr (s, '/')) + continue; + break; + } + j++; + file = r + 1; + } + } + else + { + for (j = 0; j < dircnt; j++) + if (filearr[dirarr[j]]->file->dir + && strcmp (filearr[dirarr[j]]->file->dir, + filearr[i]->file->dir) == 0) + break; + j++; + direntrylen = strlen (filearr[i]->file->dir) + 1; + } + if (j <= dircnt) + diridx[i] = j; + else + { + obstack_int_grow (&ob, i); + diridx[i] = ++dircnt; + dirarr = (unsigned int *) obstack_base (&ob); + dirtbllen += direntrylen; + } + filetbllen += strlen (file) + 1; + filetbllen += size_of_uleb128 (diridx[i]); + if (lowest_line_version < 5 || line_stats.has_time) + filetbllen += size_of_uleb128 (filearr[i]->file->time); + if (lowest_line_version < 5 || line_stats.has_size) + filetbllen += size_of_uleb128 (filearr[i]->file->size); + } + dirarr = (unsigned int *) obstack_finish (&ob); + } + + /* standard .debug_line "header" length (both version 2 and 5): + unit_length (4) + version (2) + header_length (4) + + min_instr_length (1) + default_is_stmt (1) + line_base (1) + + line_range (1) + opcode_base (1) = 15 + + version 2 adds 2 bytes, one zero byte to terminate dir and file lists. + + version 5 adds at least 11 bytes, max_ops_per_instr (1) + + address_size (1) + segment_size (1) + dir_entry_format_cnt (1) + + format_pair (2), file_entry_format_cnt (1) + file_format_pairs + (4). Plus dircnt (uleb128) + format_pair (2) if has_time + + format_pair (2) if has_size) + filecnt (uleb128). + + version 5 also has 2 extra 6 byte "<dwz>" string entries for dir + and file entry zero, plus one for the zero file entry dir idx. + */ + header_len = 15; + if (lowest_line_version < 5) + header_len += 2; + else + { + header_len += 11; + header_len += size_of_uleb128 (dircnt + 1); + header_len += size_of_uleb128 (filecnt + 1); + if (line_stats.has_time) + header_len += 2; + if (line_stats.has_size) + header_len += 2; + header_len += 2 * 6 + 1; + } + len = header_len + filetbllen + dirtbllen; + if (unlikely (op_multifile)) + { + debug_sections[DEBUG_LINE].new_size = len; + debug_sections[DEBUG_LINE].new_data = malloc (len); + if (debug_sections[DEBUG_LINE].new_data == NULL) + dwz_oom (); + line = debug_sections[DEBUG_LINE].new_data; + } + else + { + if (multi_line_off + len < multi_line_off) + { + if (line_htab) + obstack_free (&ob, (void *) filearr); + return 1; + } + + if (len == header_len) + { + line = buf; + assert (sizeof (buf) >= header_len); + } + else + line = (unsigned char *) obstack_alloc (&ob, len); + } + ptr = line; + write_32 (ptr, len - 4); /* Total length. */ + if (lowest_line_version < 5) + write_16 (ptr, 2); /* DWARF version. */ + else + { + write_16 (ptr, 5); /* DWARF version. */ + write_8 (ptr, multi_ptr_size); /* Address size. */ + write_8 (ptr, 0); /* Segment size. */ + } + write_32 (ptr, /* Header length. */ + len - (lowest_line_version < 5 ? 10 : 12)); + write_8 (ptr, 1); /* Minimum insn length. */ + if (lowest_line_version >= 5) + write_8 (ptr, 1); /* Maximum ops per instr. */ + write_8 (ptr, 1); /* Default is_stmt. */ + write_8 (ptr, 0); /* Line base. */ + write_8 (ptr, 1); /* Line range. */ + write_8 (ptr, 1); /* Opcode base. */ + + if (lowest_line_version >= 5) + { + write_8 (ptr, 1); /* Dir entry format count. */ + write_uleb128 (ptr, DW_LNCT_path); + write_uleb128 (ptr, DW_FORM_string); + write_uleb128 (ptr, dircnt + 1); /* Dir cnt. */ + memcpy (ptr, "<dwz>", 6); /* Zero entry empty dir path. */ + ptr += 6; + } + + for (i = 0; i < dircnt; i++) + { + unsigned int l; + if (filearr[dirarr[i]]->file->dir) + { + l = strlen (filearr[dirarr[i]]->file->dir) + 1; + memcpy (ptr, filearr[dirarr[i]]->file->dir, l); + } + else + { + const char *file = filearr[dirarr[i]]->file->file; + const char *r = strrchr (file, '/'); + + while (r && r > file && r[-1] == '/') + r--; + l = r - file + 1; + memcpy (ptr, file, l - 1); + ptr[l - 1] = '\0'; + } + ptr += l; + } + if (lowest_line_version < 5) + write_8 (ptr, 0); /* Terminate dir table. */ + else + { + unsigned int format_cnt = 2 + line_stats.has_size + line_stats.has_time; + write_8 (ptr, format_cnt); /* File entry format count. */ + write_uleb128 (ptr, DW_LNCT_path); + write_uleb128 (ptr, DW_FORM_string); + write_uleb128 (ptr, DW_LNCT_directory_index); + write_uleb128 (ptr, DW_FORM_udata); + if (line_stats.has_time) + { + write_uleb128 (ptr, DW_LNCT_timestamp); + write_uleb128 (ptr, DW_FORM_udata); + } + if (line_stats.has_size) + { + write_uleb128 (ptr, DW_LNCT_size); + write_uleb128 (ptr, DW_FORM_udata); + } + write_uleb128 (ptr, filecnt + 1); /* File names cnt. */ + memcpy (ptr, "<dwz>", 6); /* Zero entry empty file path. */ + ptr += 6; + write_8 (ptr, 0); /* Zero entry zero diridx. */ + if (line_stats.has_time) + write_8 (ptr, 0); + if (line_stats.has_size) + write_8 (ptr, 0); + } + + for (i = 0; i < filecnt; i++) + { + const char *file = filearr[i]->file->file; + unsigned int l; + if (diridx[i] && filearr[i]->file->dir == NULL) + file = strrchr (file, '/') + 1; + l = strlen (file) + 1; + memcpy (ptr, file, l); + ptr += l; + write_uleb128 (ptr, diridx[i]); + if (lowest_line_version < 5 || line_stats.has_time) + write_uleb128 (ptr, filearr[i]->file->time); + if (lowest_line_version < 5 || line_stats.has_size) + write_uleb128 (ptr, filearr[i]->file->size); + } + if (lowest_line_version < 5) + write_8 (ptr, 0); /* Terminate file table. */ + assert (ptr == line + len); + + if (likely (!op_multifile)) + { + if (write (multi_line_fd, line, len) != (ssize_t) len) + ret = 1; + else + multi_line_off += len; + if (line_htab) + obstack_free (&ob, (void *) filearr); + else if (line != buf) + obstack_free (&ob, (void *) line); + } + else if (line_htab) + obstack_free (&ob, (void *) filearr); + return ret; +} + +#if DEVEL +/* In struct dw_die we have a union u with fields p1 and p2. The p1 field is + used during phase 1, after which the space is reused for the p2 field + during phase 2. Clear the p2 field to get rid of values stored to p1 + during phase 1. */ +static int +clear_p2_field (void) +{ + dw_cu_ref cu; + dw_die_ref die; + + FOREACH_DIE (cu, die) + { + assert (die->die_collapsed_child == 0); + die->u.p2.die_new_abbrev = NULL; + die->u.p2.die_new_offset = 0; + die->u.p2.die_intracu_udata_size = 0; + } + + return 0; +} +#endif + +/* Helper structure for file state. */ +struct file_result +{ + /* -3: Uninitialized. + -2: Already processed under different name. + -1: Ignore. + 0: Processed, changed. + 1: Processed, unchanged. */ + int res; + int ret; + size_t hardlink_to; + unsigned int die_count; + bool skip_multifile; + bool low_mem_p; +}; + +/* Collect potentially shareable DIEs, strings and .debug_macro + opcode sequences into temporary .debug_* files. */ +static int +write_multifile_1 (DSO *dso, struct file_result *res) +{ + dw_cu_ref cu; + bool any_cus = false; + unsigned int i; + int ret = 0; + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "write_multifile\n"); + } + + if (multi_ehdr.e_ident[0] == '\0') + multi_ehdr = dso->ehdr; + + if (multifile_force_ptr_size && ptr_size != multifile_force_ptr_size) + { + error (0, 0, "File %s skipped for multi-file optimization, different" + " pointer size", dso->filename); + res->skip_multifile = true; + return 1; + } + else if (multi_ptr_size == 0) + multi_ptr_size = ptr_size; + else if (ptr_size != multi_ptr_size) + { + error (0, 0, "Multi-file optimization not allowed for different" + " pointer sizes"); + multifile = NULL; + return 1; + } + else + { + /* Same ptr_size. */ + } + + int endianity = (do_read_32 == buf_read_ule32 + ? ELFDATA2LSB + : ELFDATA2MSB); + if (multifile_force_endian && endianity != multifile_force_endian) + { + error (0, 0, "File %s skipped for multi-file optimization, different" + " endianity", dso->filename); + res->skip_multifile = true; + return 1; + } + else if (multi_endian == 0) + multi_endian = endianity; + else if (multi_endian != endianity) + { + error (0, 0, "Multi-file optimization not allowed for different" + " endianity"); + multifile = NULL; + return 1; + } + else + { + /* Same endianity. */ + } + +#if DEVEL + clear_p2_field (); +#endif + + for (i = 0; i < SAVED_SECTIONS; i++) + { + saved_new_data[i] = debug_sections[i].new_data; + saved_new_size[i] = debug_sections[i].new_size; + debug_sections[i].new_data = NULL; + debug_sections[i].new_size = debug_sections[i].size; + } + propagate_multifile (); + for (cu = first_cu; cu && cu->cu_kind != CU_TYPES; cu = cu->cu_next) + { + cu->u1.cu_new_abbrev_owner = NULL; + cu->u2.cu_new_abbrev_offset = 0; + cu->cu_new_offset = 0; + any_cus |= check_multifile (cu->cu_die); + } + if (any_cus) + { + dw_cu_ref *cup; + + for (cup = &first_cu; *cup && (*cup)->cu_kind != CU_TYPES; ) + { + if ((*cup)->cu_new_abbrev) + htab_delete ((*cup)->cu_new_abbrev); + + if ((*cup)->cu_die->die_no_multifile == 0) + cup = &(*cup)->cu_next; + else + *cup = (*cup)->cu_next; + } + *cup = NULL; + multifile_mode = MULTIFILE_MODE_WR; + if (tracing) + fprintf (stderr, "Write-multifile %s\n", dso->filename); + if (compute_abbrevs (NULL)) + ret = 1; + else if (debug_sections[DEBUG_MACRO].data && read_macro (dso)) + ret = 1; + else if ((unsigned int) (multi_info_off + + debug_sections[DEBUG_INFO].new_size) + < multi_info_off + || (unsigned int) (multi_abbrev_off + + debug_sections[DEBUG_ABBREV].new_size) + < multi_abbrev_off + || (unsigned int) (multi_str_off + + (max_strp_off ? max_strp_off + : debug_sections[DEBUG_ABBREV].size)) + < multi_str_off + || (unsigned int) (multi_macro_off + + debug_sections[DEBUG_MACRO].new_size) + < multi_macro_off) + { + error (0, 0, "Multifile temporary files too large"); + multifile = NULL; + ret = 1; + } + else + { + const char *mfile; + write_abbrev (); + write_info (NULL); + /* Any error in this is fatal for multifile handling of further + files. */ + mfile = multifile; + multifile = NULL; + if (write (multi_abbrev_fd, debug_sections[DEBUG_ABBREV].new_data, + debug_sections[DEBUG_ABBREV].new_size) + != (ssize_t) debug_sections[DEBUG_ABBREV].new_size + || write (multi_info_fd, debug_sections[DEBUG_INFO].new_data, + debug_sections[DEBUG_INFO].new_size) + != (ssize_t) debug_sections[DEBUG_INFO].new_size + || write (multi_str_fd, debug_sections[DEBUG_STR].data, + debug_sections[DEBUG_STR].size) + != (ssize_t) debug_sections[DEBUG_STR].size + || (debug_sections[DEBUG_MACRO].new_data + && write (multi_macro_fd, + debug_sections[DEBUG_MACRO].new_data, + debug_sections[DEBUG_MACRO].new_size) + != (ssize_t) debug_sections[DEBUG_MACRO].new_size) + || (strp_htab != NULL && write_multifile_strp ()) + || write_multifile_line ()) + { + error (0, 0, "Error writing multi-file temporary files"); + ret = 1; + } + else + { + multi_info_off += debug_sections[DEBUG_INFO].new_size; + multi_abbrev_off += debug_sections[DEBUG_ABBREV].new_size; + multi_str_off += max_strp_off ? max_strp_off + : debug_sections[DEBUG_STR].size; + multi_macro_off += debug_sections[DEBUG_MACRO].new_size; + multifile = mfile; + } + } + } + multifile_mode = 0; + for (i = 0; i < SAVED_SECTIONS; i++) + { + free (debug_sections[i].new_data); + debug_sections[i].new_data = saved_new_data[i]; + debug_sections[i].new_size = saved_new_size[i]; + saved_new_data[i] = NULL; + } + return ret; +} + +struct pipe +{ + int readfd; + int writefd; +}; + +static bool write_multifile_parallel_p; +static int child_id; +static struct pipe *pipes; + +/* Get token. */ +static void +get_token (void) +{ + int n = child_id; + int readfd = pipes[n].readfd; + int writefd = pipes[n].writefd; + close (writefd); + char buf; + read (readfd, &buf, 1); + close (readfd); +} + +/* Pass token to child N. */ +static void +pass_token (int n) +{ + int readfd = pipes[n].readfd; + int writefd = pipes[n].writefd; + close (readfd); + char buf = '\0'; + write (writefd, &buf, 1); + close (writefd); +} + +/* Wrapper around write_multifile_1 that ensures write_multifile_1 is called + in file order. */ +static int +write_multifile (DSO *dso, struct file_result *res) +{ + int ret; + + if (write_multifile_parallel_p) + { + get_token (); + + multi_info_off = lseek (multi_info_fd, 0L, SEEK_END); + multi_abbrev_off = lseek (multi_abbrev_fd, 0L, SEEK_END); + multi_line_off = lseek (multi_line_fd, 0L, SEEK_END); + multi_str_off = lseek (multi_str_fd, 0L, SEEK_END); + multi_macro_off = lseek (multi_macro_fd, 0L, SEEK_END); + } + + ret = write_multifile_1 (dso, res); + + return ret; +} + +/* During fi_multifile phase, see what DIEs in a partial unit + contain no children worth keeping where all real DIEs have + dups in the shared .debug_info section and what remains is + just the DW_TAG_partial_unit, a single DW_TAG_imported_unit + and perhaps some empty named namespaces. Then all the + references to that partial unit can be replaced by references + to the shared partial unit DW_TAG_import_unit has been importing. */ +static bool +remove_empty_pu (dw_die_ref die) +{ + dw_die_ref child = die->die_child, dup = NULL; + if (!die->die_named_namespace) + { + if (die->die_tag != DW_TAG_partial_unit + || child == NULL + || child->die_tag != DW_TAG_imported_unit + || child->die_offset != -1U) + return false; + if (die->die_abbrev->nattr > 2) + return false; + if (die->die_abbrev->nattr + && die->die_abbrev->attr[0].attr != DW_AT_stmt_list) + return false; + if (die->die_abbrev->nattr == 2 + && die->die_abbrev->attr[1].attr != DW_AT_comp_dir) + return false; + dup = child->die_nextdup; + child = child->die_sib; + } + else + { + if (die->die_abbrev->nattr > 2) + return false; + if (die->die_abbrev->nattr + && die->die_abbrev->attr[0].attr != DW_AT_name) + return false; + if (die->die_abbrev->nattr == 2 + && die->die_abbrev->attr[1].attr != DW_AT_sibling) + return false; + } + for (; child; child = child->die_sib) + if (!child->die_named_namespace) + { + if (!child->die_remove) + /* Signal that DIE can't be removed, but + perhaps we could still remove_empty_pu + some named namespaces that are children of DIE. */ + dup = die; + if (dup == NULL && die->die_named_namespace) + dup = child->die_dup->die_parent; + } + else if (!remove_empty_pu (child)) + return false; + else if (dup == NULL && die->die_named_namespace) + dup = child->die_dup->die_parent; + if (dup == NULL || dup == die) + return false; + die->die_remove = 1; + assert (dup->die_tag == die->die_tag); + die->die_dup = dup; + return true; +} + +/* Call remove_empty_pu on all partial units. */ +static int +remove_empty_pus (void) +{ + dw_cu_ref cu; + for (cu = first_cu; cu; cu = cu->cu_next) + if (cu->cu_kind == CU_NORMAL + && cu->cu_die->die_tag == DW_TAG_partial_unit) + remove_empty_pu (cu->cu_die); + return 0; +} + +/* Handle compression of a single file FILE. If OUTFILE is + non-NULL, the result will be stored into that file, otherwise + the result will be written into a temporary file that is renamed + over FILE. */ +static int +dwz (const char *file, const char *outfile, struct file_result *res) +{ + DSO *dso; + int ret = 0, fd; + unsigned int i; + struct stat st; + + if (res->res == -1) + return 1; + + res->res = -1; + fd = open (file, O_RDONLY); + if (fd < 0) + { + error (0, errno, "Failed to open input file %s", file); + return 1; + } + if (fstat (fd, &st) < 0) + { + close (fd); + error (0, errno, "Failed to stat input file %s", file); + return 1; + } + + res->res = 1; + + if (tracing) + { + fprintf (stderr, "Compressing %s", file); + if (multifile_mode == 0) + ; + else if (low_mem) + fprintf (stderr, " in low-mem mode"); + else if (fi_multifile) + fprintf (stderr, " in finalize-multifile mode"); + else + abort (); + fprintf (stderr, "\n"); + } + + dso = fdopen_dso (fd, file); + if (dso == NULL) + return 1; + + obstack_alloc_failed_handler = dwz_oom; + if (setjmp (oom_buf)) + { + error (0, ENOMEM, "%s: Could not allocate memory", dso->filename); + + cleanup (); + ret = 1; + } + else + { + obstack_init (&ob); + obstack_init (&ob2); + + unsigned int *die_count = multifile ? &res->die_count : NULL; + ret = read_dwarf (dso, quiet && outfile == NULL, die_count); + if (ret) + cleanup (); + else if (partition_dups () + || create_import_tree () + || (unlikely (fi_multifile) + && (remove_empty_pus () + || read_macro (dso))) + || read_debug_info (dso, DEBUG_TYPES, NULL) +#if DEVEL + || clear_p2_field () +#endif + || compute_abbrevs (dso) + || (unlikely (fi_multifile) && (finalize_strp (false), 0))) + { + cleanup (); + ret = 1; + } + else if (!(ignore_size || force_p) + && ((debug_sections[DEBUG_INFO].new_size + + debug_sections[DEBUG_ABBREV].new_size + + debug_sections[DEBUG_STR].new_size + + debug_sections[DEBUG_MACRO].new_size + + debug_sections[DEBUG_TYPES].new_size) + >= (debug_sections[DEBUG_INFO].size + + debug_sections[DEBUG_ABBREV].size + + debug_sections[DEBUG_STR].size + + debug_sections[DEBUG_MACRO].size + + debug_sections[DEBUG_TYPES].size))) + { + if (!quiet || outfile != NULL) + error (0, 0, "%s: DWARF compression not beneficial " + "- old size %ld new size %ld", dso->filename, + (unsigned long) (debug_sections[DEBUG_INFO].size + + debug_sections[DEBUG_ABBREV].size + + debug_sections[DEBUG_STR].size + + debug_sections[DEBUG_MACRO].size + + debug_sections[DEBUG_TYPES].size), + (unsigned long) (debug_sections[DEBUG_INFO].new_size + + debug_sections[DEBUG_ABBREV].new_size + + debug_sections[DEBUG_STR].new_size + + debug_sections[DEBUG_MACRO].new_size + + debug_sections[DEBUG_TYPES].new_size)); + + if (multifile && !fi_multifile && !low_mem) + write_multifile (dso, res); + + cleanup (); + if (outfile != NULL) + ret = 1; + } + else if (write_aranges (dso)) + { + failure: + cleanup (); + ret = 1; + } + else + { + if (unlikely (fi_multifile)) + { + size_t len; + const char *name = multifile_name; + enum debug_section_kind sec_kind; + unsigned char *ptr; + if (multifile_name == NULL) + { + if (!multifile_relative) + name = multifile; + else + { + char *p1 = realpath (file, NULL); + char *p2 = realpath (multifile, NULL); + char *p3, *p4, *p5, *p6; + unsigned int dotdot = 0; + if (p1 == NULL || p2 == NULL) + { + if (p1) + free (p1); + else if (p2) + free (p2); + error (0, 0, "Could not compute relative multifile " + "pathname from %s to %s", + file, multifile); + goto failure; + } + p3 = p1; + p4 = p2; + do + { + p5 = strchr (p3, '/'); + p6 = strchr (p4, '/'); + if (p5 == NULL + || p6 == NULL + || p5 - p3 != p6 - p4 + || memcmp (p3, p4, p5 - p3) != 0) + break; + p3 = p5 + 1; + p4 = p6 + 1; + } + while (1); + while (p5 != NULL) + { + dotdot++; + p5 = strchr (p5 + 1, '/'); + } + len = strlen (p4); + p3 = (char *) malloc (dotdot * 3 + len + 1); + if (p3 == NULL) + dwz_oom (); + p5 = p3; + while (dotdot) + { + memcpy (p5, "../", 3); + p5 += 3; + dotdot--; + } + memcpy (p5, p4, len + 1); + free (p1); + free (p2); + name = p3; + } + } + len = strlen (name) + 1; + sec_kind = dwarf_5 ? DEBUG_SUP : GNU_DEBUGALTLINK; + debug_sections[sec_kind].new_size + = len + 0x14 + (dwarf_5 ? 4 : 0); + debug_sections[sec_kind].new_data + = malloc (debug_sections[sec_kind].new_size); + if (debug_sections[sec_kind].new_data == NULL) + dwz_oom (); + ptr = debug_sections[sec_kind].new_data; + if (dwarf_5) + { + write_16 (ptr, 5); + write_8 (ptr, 0); + } + memcpy (ptr, name, len); + ptr += len; + if (dwarf_5) + write_uleb128 (ptr, 0x14); + memcpy (ptr, multifile_sha1, 0x14); + if (name != multifile_name && name != multifile) + free ((void *) name); + write_macro (); + } + write_abbrev (); + write_info (die_count); + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "write_loc\n"); + } + write_loc (); + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "write_loclists\n"); + } + write_loclists (); + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "write_types\n"); + } + write_types (); + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "write_gdb_index\n"); + } + write_gdb_index (); + /* These sections are optional and it is unclear + how to adjust them. Just remove them. */ + debug_sections[DEBUG_PUBNAMES].new_data = NULL; + debug_sections[DEBUG_PUBNAMES].new_size = 0; + debug_sections[DEBUG_PUBTYPES].new_data = NULL; + debug_sections[DEBUG_PUBTYPES].new_size = 0; + debug_sections[DEBUG_GNU_PUBNAMES].new_data = NULL; + debug_sections[DEBUG_GNU_PUBNAMES].new_size = 0; + debug_sections[DEBUG_GNU_PUBTYPES].new_data = NULL; + debug_sections[DEBUG_GNU_PUBTYPES].new_size = 0; + + if (multifile && !fi_multifile && !low_mem) + write_multifile (dso, res); + + bool save_to_temp = save_temps && multifile && multifile_mode == 0; + cleanup (); + + if (write_dso (dso, outfile, &st, save_to_temp)) + ret = 1; + else + res->res = 0; + + if (unlikely (progress_p)) + report_progress (); + } + } + + for (i = 0; debug_sections[i].name; ++i) + { + debug_sections[i].data = NULL; + debug_sections[i].size = 0; + free (debug_sections[i].new_data); + debug_sections[i].new_data = NULL; + debug_sections[i].new_size = 0; + debug_sections[i].sec = 0; + } + + if (elf_end (dso->elf) < 0) + { + error (0, 0, "elf_end failed: %s", elf_errmsg (elf_errno ())); + ret = 1; + } + close (fd); + + free (dso); + if (ret == 3) + { + ret = (outfile != NULL) ? 1 : 0; + res->res = -1; + } + return ret; +} + +/* In order to free all malloced memory at the end of optimize_multifile, + communicate .debug_str tail optimized offset list from optimize_multifile + to read_multifile using an mmapped chunk of memory pointed by this + variable. */ +static unsigned int *strp_tail_off_list; + +/* Process temporary .debug_* files, see what can be beneficially shared + and write a new ET_REL file, containing the shared .debug_* sections. */ +static int +optimize_multifile (unsigned int *die_count) +{ + DSO dsobuf, *dso; + int fd = -1; + volatile int vfd = -1; + unsigned int i; + Elf *elf = NULL; + Elf *volatile velf = NULL; + GElf_Shdr shdr; + Elf_Scn *scn; + Elf_Data *data; + char *e_ident; + static const char shstrtab_gnu[] + = "\0.shstrtab\0.note.gnu.build-id\0.gdb_index\0" + ".debug_info\0.debug_abbrev\0.debug_line\0.debug_str\0.debug_macro"; + static const char shstrtab_dwarf5[] + = "\0.shstrtab\0.gdb_index\0" + ".debug_info\0.debug_abbrev\0.debug_line\0.debug_str\0.debug_macro\0" + ".debug_sup"; + const char *const shstrtab = dwarf_5 ? shstrtab_dwarf5 : shstrtab_gnu; + const size_t shstrtab_len = (dwarf_5 + ? sizeof shstrtab_dwarf5 + : sizeof shstrtab_gnu); + const char *p; + unsigned char note[0x24], *np, *supp; + struct sha1_ctx ctx; + + if (multi_ehdr.e_ident[0] == '\0' + || multi_ptr_size == 0 + || multi_endian == 0) + return -1; + + if (multi_line_off == 0) + { + init_endian (multi_endian); + if (write_multifile_line ()) + { + error (0, 0, "Error writing multi-file temporary files"); + return -1; + } + } + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "optimize_multifile\n"); + } + + debug_sections[DEBUG_INFO].size = multi_info_off; + debug_sections[DEBUG_INFO].data + = (multi_info_off + ? mmap (NULL, multi_info_off, PROT_READ, MAP_PRIVATE, multi_info_fd, 0) + : NULL); + debug_sections[DEBUG_ABBREV].size = multi_abbrev_off; + debug_sections[DEBUG_ABBREV].data + = (multi_abbrev_off + ? mmap (NULL, multi_abbrev_off, PROT_READ, MAP_PRIVATE, + multi_abbrev_fd, 0) + : NULL); + debug_sections[DEBUG_LINE].size = multi_line_off; + debug_sections[DEBUG_LINE].data + = mmap (NULL, multi_line_off, PROT_READ, MAP_PRIVATE, multi_line_fd, 0); + debug_sections[DEBUG_STR].size = multi_str_off; + debug_sections[DEBUG_STR].data + = multi_str_off + ? mmap (NULL, multi_str_off, PROT_READ, MAP_PRIVATE, multi_str_fd, 0) + : NULL; + debug_sections[DEBUG_MACRO].size = multi_macro_off; + debug_sections[DEBUG_MACRO].data + = multi_macro_off + ? mmap (NULL, multi_macro_off, PROT_READ, MAP_PRIVATE, multi_macro_fd, 0) + : NULL; + if (debug_sections[DEBUG_INFO].data == MAP_FAILED + || debug_sections[DEBUG_ABBREV].data == MAP_FAILED + || debug_sections[DEBUG_LINE].data == MAP_FAILED + || debug_sections[DEBUG_STR].data == MAP_FAILED + || debug_sections[DEBUG_MACRO].data == MAP_FAILED) + { + error (0, 0, "Error mmapping multi-file temporary files"); + fail: + cleanup (); + if (velf) + elf_end (velf); + if (vfd != -1) + { + unlink (multifile); + close (vfd); + } + if (debug_sections[DEBUG_INFO].data != MAP_FAILED) + munmap (debug_sections[DEBUG_INFO].data, + debug_sections[DEBUG_INFO].size); + if (debug_sections[DEBUG_ABBREV].data != MAP_FAILED) + munmap (debug_sections[DEBUG_ABBREV].data, + debug_sections[DEBUG_ABBREV].size); + if (debug_sections[DEBUG_LINE].data != MAP_FAILED) + munmap (debug_sections[DEBUG_LINE].data, + debug_sections[DEBUG_LINE].size); + if (debug_sections[DEBUG_STR].data != MAP_FAILED + && debug_sections[DEBUG_STR].data != NULL) + munmap (debug_sections[DEBUG_STR].data, + debug_sections[DEBUG_STR].size); + if (debug_sections[DEBUG_MACRO].data != MAP_FAILED + && debug_sections[DEBUG_MACRO].data != NULL) + munmap (debug_sections[DEBUG_MACRO].data, + debug_sections[DEBUG_MACRO].size); + return -1; + } + + init_endian (multi_endian); + ptr_size = multi_ptr_size; + memset (&dsobuf, '\0', sizeof (dsobuf)); + dso = &dsobuf; + dso->filename = multifile; + if (tracing) + fprintf (stderr, "Optimize-multifile\n"); + multifile_mode = MULTIFILE_MODE_OP; + + obstack_alloc_failed_handler = dwz_oom; + if (unoptimized_multifile) + { + for (i = 0; i < SAVED_SECTIONS; i++) + { + debug_sections[i].new_data = debug_sections[i].data; + debug_sections[i].new_size = debug_sections[i].size; + } + } + else if (setjmp (oom_buf)) + { + error (0, ENOMEM, "%s: Could not allocate memory", dso->filename); + goto fail; + } + else + { + dw_cu_ref *cup; + unsigned char *p, *q; + unsigned int strp_count; + + obstack_init (&ob); + obstack_init (&ob2); + + if (read_debug_info (dso, DEBUG_INFO, NULL) + || partition_dups ()) + goto fail; + +#if DEVEL + clear_p2_field (); +#endif + + for (cup = &first_cu; *cup && (*cup)->cu_kind == CU_PU; + cup = &(*cup)->cu_next) + ; + + *cup = NULL; + + strp_count = debug_sections[DEBUG_STR].size / 64; + if (strp_count < 64) + strp_count = 64; + strp_htab = htab_try_create (strp_count, + strp_hash2, strp_eq2, NULL); + if (strp_htab == NULL) + dwz_oom (); + + for (p = debug_sections[DEBUG_STR].data; + p < debug_sections[DEBUG_STR].data + debug_sections[DEBUG_STR].size; + p = q + 1) + { + void **slot; + struct strp_entry se; + hashval_t hash; + + q = (unsigned char *) strchr ((char *) p, '\0'); + hash = hash (p, q - p); + se.off = p - debug_sections[DEBUG_STR].data; + se.new_off = hash & ~1U; + slot = htab_find_slot_with_hash (strp_htab, &se, se.new_off, INSERT); + if (slot == NULL) + dwz_oom (); + if (*slot == NULL) + { + struct strp_entry *s = pool_alloc (strp_entry, sizeof (*s)); + *s = se; + *slot = (void *) s; + } + else + ((struct strp_entry *) *slot)->new_off |= 1; + } + + if (first_cu != NULL) + { + if (compute_abbrevs (dso)) + goto fail; + + strp_tail_off_list = finalize_strp (true); + + write_abbrev (); + write_info (die_count); + write_gdb_index (); + if (write_multifile_line ()) + goto fail; + } + else + strp_tail_off_list = finalize_strp (true); + + if (debug_sections[DEBUG_MACRO].data) + handle_macro (); + } + + np = note; + write_32 (np, sizeof ("GNU")); + write_32 (np, 0x14); + write_32 (np, NT_GNU_BUILD_ID); + + supp = NULL; + if (dwarf_5) + { + debug_sections[DEBUG_SUP].new_size = 0x14 + 5; + debug_sections[DEBUG_SUP].new_data + = malloc (debug_sections[DEBUG_SUP].new_size); + if (debug_sections[DEBUG_SUP].new_data == NULL) + dwz_oom (); + supp = debug_sections[DEBUG_SUP].new_data; + write_16 (supp, 5); + write_8 (supp, 1); + write_8 (supp, 0); + write_uleb128 (supp, 0x14); + } + + cleanup (); + fd = open (multifile, O_RDWR | O_CREAT, 0600); + vfd = fd; + if (fd < 0) + { + error (0, errno, "Failed to open multi-file common file %s", multifile); + goto fail; + } + + elf = elf_begin (fd, ELF_C_WRITE, NULL); + velf = elf; + if (elf == NULL) + { + error (0, 0, "cannot open ELF file: %s", elf_errmsg (-1)); + goto fail; + } + + multi_ehdr.e_type = ET_REL; + multi_ehdr.e_entry = 0; + multi_ehdr.e_phoff = 0; + multi_ehdr.e_phnum = 0; + multi_ehdr.e_shoff = multi_ehdr.e_ehsize; + multi_ehdr.e_shnum = 2; + if (!dwarf_5) + { + multi_ehdr.e_shoff += 0x24; + multi_ehdr.e_shnum++; + } + for (i = 0; debug_sections[i].name; i++) + if (debug_sections[i].new_size) + { + multi_ehdr.e_shoff += debug_sections[i].new_size; + multi_ehdr.e_shnum++; + } + multi_ehdr.e_shstrndx = multi_ehdr.e_shnum - 1; + + /* Some gelf_newehdr implementations don't return the resulting + ElfNN_Ehdr, so we have to do it the hard way instead of: + e_ident = (char *) gelf_newehdr (elf, gelf_getclass (dso->elf)); */ + switch (multi_ehdr.e_ident[EI_CLASS]) + { + case ELFCLASS32: + e_ident = (char *) elf32_newehdr (elf); + multi_ehdr.e_shoff = (multi_ehdr.e_shoff + 3) & -4; + break; + case ELFCLASS64: + e_ident = (char *) elf64_newehdr (elf); + multi_ehdr.e_shoff = (multi_ehdr.e_shoff + 7) & -8; + break; + default: + e_ident = NULL; + break; + } + + if (e_ident == NULL + /* This is here just for the gelfx wrapper, so that gelf_update_ehdr + already has the correct ELF class. */ + || memcpy (e_ident, multi_ehdr.e_ident, EI_NIDENT) == NULL + || gelf_update_ehdr (elf, &multi_ehdr) == 0) + { + error (0, 0, "Could not create new ELF headers"); + goto fail; + } + elf_flagelf (elf, ELF_C_SET, ELF_F_LAYOUT | ELF_F_PERMISSIVE); + + sha1_init_ctx (&ctx); + for (i = 0; debug_sections[i].name; i++) + { + if (debug_sections[i].new_size == 0) + continue; + sha1_process_bytes (debug_sections[i].new_data, + debug_sections[i].new_size, &ctx); + } + sha1_finish_ctx (&ctx, multifile_sha1); + + memcpy (np, "GNU", sizeof ("GNU")); + memcpy (np + 4, multifile_sha1, 0x14); + + if (dwarf_5) + memcpy (supp, multifile_sha1, 0x14); + + memset (&shdr, '\0', sizeof (shdr)); + shdr.sh_offset = multi_ehdr.e_ehsize; + if (!dwarf_5) + { + shdr.sh_type = SHT_NOTE; + shdr.sh_addralign = 4; + shdr.sh_size = 0x24; + scn = elf_newscn (elf); + elf_flagscn (scn, ELF_C_SET, ELF_F_DIRTY); + shdr.sh_name = (strchr (shstrtab + 1, '\0') + 1) - shstrtab; + gelf_update_shdr (scn, &shdr); + data = elf_newdata (scn); + data->d_buf = (char *) note; + data->d_type = ELF_T_BYTE; + data->d_version = EV_CURRENT; + data->d_size = shdr.sh_size; + data->d_off = 0; + data->d_align = 1; + } + + shdr.sh_type = SHT_PROGBITS; + shdr.sh_offset += shdr.sh_size; + shdr.sh_addralign = 1; + for (i = 0; debug_sections[i].name; i++) + { + if (debug_sections[i].new_size == 0) + continue; + scn = elf_newscn (elf); + elf_flagscn (scn, ELF_C_SET, ELF_F_DIRTY); + for (p = shstrtab + 1; p < shstrtab + shstrtab_len; + p = strchr (p, '\0') + 1) + if (strcmp (p, debug_sections[i].name) == 0) + { + shdr.sh_name = p - shstrtab; + break; + } + shdr.sh_size = debug_sections[i].new_size; + if (i == DEBUG_STR) + { + shdr.sh_flags = SHF_MERGE | SHF_STRINGS; + shdr.sh_entsize = 1; + } + else + { + shdr.sh_flags = 0; + shdr.sh_entsize = 0; + } + gelf_update_shdr (scn, &shdr); + data = elf_newdata (scn); + data->d_buf = debug_sections[i].new_data; + data->d_type = ELF_T_BYTE; + data->d_version = EV_CURRENT; + data->d_size = shdr.sh_size; + data->d_off = 0; + data->d_align = 1; + shdr.sh_offset += shdr.sh_size; + } + scn = elf_newscn (elf); + elf_flagscn (scn, ELF_C_SET, ELF_F_DIRTY); + shdr.sh_name = 1; + shdr.sh_offset = multi_ehdr.e_shoff + + multi_ehdr.e_shnum * multi_ehdr.e_shentsize; + shdr.sh_size = shstrtab_len; + shdr.sh_type = SHT_STRTAB; + shdr.sh_flags = 0; + shdr.sh_entsize = 0; + gelf_update_shdr (scn, &shdr); + data = elf_newdata (scn); + data->d_buf = (char *) shstrtab; + data->d_type = ELF_T_BYTE; + data->d_version = EV_CURRENT; + data->d_size = shdr.sh_size; + data->d_off = 0; + data->d_align = 1; + + if (elf_update (elf, ELF_C_WRITE_MMAP) == -1) + { + error (0, 0, "%s: elf_update failed", multifile); + goto fail; + } + + if (elf_end (elf) < 0) + { + error (0, 0, "elf_end failed: %s", elf_errmsg (elf_errno ())); + goto fail; + } + + fchmod (fd, 0644); + + if (dwarf_5) + { + free (debug_sections[DEBUG_SUP].new_data); + debug_sections[DEBUG_SUP].new_data = NULL; + } + munmap (debug_sections[DEBUG_INFO].data, debug_sections[DEBUG_INFO].size); + munmap (debug_sections[DEBUG_ABBREV].data, + debug_sections[DEBUG_ABBREV].size); + munmap (debug_sections[DEBUG_LINE].data, debug_sections[DEBUG_LINE].size); + if (debug_sections[DEBUG_STR].data) + munmap (debug_sections[DEBUG_STR].data, debug_sections[DEBUG_STR].size); + if (debug_sections[DEBUG_MACRO].data) + munmap (debug_sections[DEBUG_MACRO].data, + debug_sections[DEBUG_MACRO].size); + + for (i = 0; debug_sections[i].name; ++i) + { + debug_sections[i].data = NULL; + debug_sections[i].size = 0; + if (!unoptimized_multifile) + free (debug_sections[i].new_data); + debug_sections[i].new_data = NULL; + debug_sections[i].new_size = 0; + debug_sections[i].sec = 0; + } + + return fd; +} + +/* Parse the .debug_* sections from shared ET_REL file written + by optimize_multifile into data structures for fi_multifile + phase. */ +static DSO * +read_multifile (int fd, unsigned int die_count) +{ + DSO *dso, *volatile ret; + unsigned int i; + + if (unlikely (progress_p)) + { + report_progress (); + fprintf (stderr, "read_multifile\n"); + } + + if (tracing) + fprintf (stderr, "Read-multifile\n"); + + multifile_mode = MULTIFILE_MODE_RD; + dso = fdopen_dso (fd, multifile); + if (dso == NULL) + { + multifile_mode = 0; + return NULL; + } + + ret = dso; + obstack_alloc_failed_handler = dwz_oom; + if (setjmp (oom_buf)) + { + error (0, ENOMEM, "%s: Could not allocate memory", dso->filename); + + fail: + elf_end (dso->elf); + close (fd); + free (dso); + ret = NULL; + alt_off_htab = NULL; + } + else + { + obstack_init (&ob); + obstack_init (&ob2); + + if (read_dwarf (dso, false, &die_count)) + goto fail; + + if (debug_sections[DEBUG_STR].size) + { + unsigned char *p, *q; + unsigned int strp_count = debug_sections[DEBUG_STR].size / 64; + void **slot; + unsigned int *pi; + + if (strp_count < 100) + strp_count = 100; + strp_htab = htab_try_create (strp_count, strp_hash3, strp_eq3, NULL); + if (strp_htab == NULL) + dwz_oom (); + for (p = debug_sections[DEBUG_STR].data; + p < debug_sections[DEBUG_STR].data + + debug_sections[DEBUG_STR].size; p = q) + { + q = (unsigned char *) strchr ((char *) p, '\0') + 1; + slot = htab_find_slot_with_hash (strp_htab, p, + hash (p, q - p - 1), INSERT); + if (slot == NULL) + dwz_oom (); + assert (*slot == NULL); + *slot = (void *) p; + } + if (strp_tail_off_list) + { + for (pi = strp_tail_off_list; *pi; pi++) + { + p = debug_sections[DEBUG_STR].data + *pi; + q = (unsigned char *) strchr ((char *) p, '\0'); + slot = htab_find_slot_with_hash (strp_htab, p, + hash (p, q - p), INSERT); + if (slot == NULL) + dwz_oom (); + assert (*slot == NULL); + *slot = (void *) p; + } + pi++; + munmap (strp_tail_off_list, + (char *) pi - (char *) strp_tail_off_list); + } + } + + if (debug_sections[DEBUG_MACRO].data) + handle_macro (); + + alt_strp_htab = strp_htab; + strp_htab = NULL; + alt_off_htab = off_htab; + off_htab = NULL; + alt_dup_htab = dup_htab; + dup_htab = NULL; + alt_macro_htab = macro_htab; + macro_htab = NULL; + alt_first_cu = first_cu; + alt_pool = finalize_pool (); + alt_ob = ob; + alt_ob2 = ob2; + memset (&ob, '\0', sizeof (ob)); + memset (&ob2, '\0', sizeof (ob2)); + for (i = 0; i < SAVED_SECTIONS; i++) + { + alt_data[i] = debug_sections[i].data; + alt_size[i] = debug_sections[i].size; + } + } + + cleanup (); + + for (i = 0; debug_sections[i].name; ++i) + { + debug_sections[i].data = NULL; + debug_sections[i].size = 0; + debug_sections[i].new_data = NULL; + debug_sections[i].new_size = 0; + debug_sections[i].sec = 0; + } + + return ret; +} + +/* Clear all die_nextdup fields among toplevel children + of DIE. */ +static void +alt_clear_dups (dw_die_ref die) +{ + dw_die_ref child; + assert (die->die_dup == NULL); + die->die_nextdup = NULL; + for (child = die->die_child; child; child = child->die_sib) + { + assert (child->die_dup == NULL); + child->die_nextdup = NULL; + if (child->die_named_namespace) + alt_clear_dups (child); + } +} + +/* Create a temporary file using NAME. Return the corresponding file + descriptor if successful, otherwise return -1. */ +static int +make_temp_file (const char *name) +{ + const char *tmpdir = "/tmp/"; + const char *template_suffix = ".XXXXXX"; + int fd; + size_t buf_len, offset, name_len; + char *buf; + + if (save_temps) + { + FILE *f = fopen (name, "w+"); + if (f == NULL) + fd = -1; + else + fd = fileno (f); + return fd; + } + + name_len = strlen (name); + buf_len = (strlen (tmpdir) + + name_len + + strlen (template_suffix) + + 1); + if (buf_len < name_len) + return -1; + buf = (char *)malloc (buf_len); + if (buf == NULL) + return -1; + offset = 0; + + strcpy (&buf[offset], tmpdir); + offset += strlen (tmpdir); + + strcpy (&buf[offset], name); + offset += name_len; + + strcpy (&buf[offset], template_suffix); + offset += strlen (template_suffix); + + assert (offset == buf_len - 1); + assert (buf[offset] == '\0'); + + fd = mkstemp (buf); + if (fd == -1) + goto done; + + /* Unlink the filename, such that the file is disposed of once the file + descriptor is closed. */ + unlink (buf); + + done: + free (buf); + return fd; +} + +/* As dwz, but retry with MULTIFILE_MODE_LOW_MEM if the low_mem_die_limit + is hit. */ +static int +dwz_with_low_mem (const char *file, const char *outfile, + struct file_result *res) +{ + int ret; + + res->low_mem_p = false; + + ret = (low_mem_die_limit == 0 + ? 2 + : dwz (file, outfile, res)); + + if (ret == 2) + { + multifile_mode = MULTIFILE_MODE_LOW_MEM; + res->low_mem_p = true; + + ret = dwz (file, outfile, res); + } + + return ret; +} + +/* Initialize struct file_result RES. */ +static void +init_file_result (struct file_result *res) +{ + res->die_count = 0; + res->res = -3; + res->skip_multifile = false; + res->low_mem_p = false; +} + +/* Dwarf-compress FILE. If OUTFILE, write to result to OUTFILE, otherwise + modify FILE. */ +static int +dwz_one_file (const char *file, const char *outfile) +{ + struct file_result res; + + if (stats_p) + init_stats (file); + + init_file_result (&res); + + return dwz_with_low_mem (file, outfile, &res); +} + +/* Helper structure for hardlink discovery. */ +struct hl_stat +{ + dev_t dev; + ino_t ino; + nlink_t nlink; +}; + +/* Detect which FILES are hardlinks, and mark those in RESA. */ +static bool +detect_hardlinks (int nr_files, char *files[], struct file_result *resa) +{ + bool found = false; + struct hl_stat hl_stat[nr_files]; + int i; + + /* Try to open all files. */ + for (i = 0; i < nr_files; i++) + { + struct file_result *res = &resa[i]; + int fd; + struct stat st; + + const char *file = files[i]; + res->res = -1; + + fd = open (file, O_RDONLY); + if (fd < 0) + error (0, errno, "Failed to open input file %s", file); + else if (fstat (fd, &st) < 0) + error (0, errno, "Failed to stat input file %s", file); + else + { + res->res = 1; + hl_stat[i].dev = st.st_dev; + hl_stat[i].ino = st.st_ino; + hl_stat[i].nlink = st.st_nlink; + } + + close (fd); + } + + /* Detect hard links. */ + for (i = 0; i < nr_files; i++) + { + struct file_result *res = &resa[i]; + int n; + for (n = 0; n != i; n++) + if (resa[n].res >= 0 + && hl_stat[n].nlink > 1 + && hl_stat[n].dev == hl_stat[i].dev + && hl_stat[n].ino == hl_stat[i].ino) + break; + if (n == i) + continue; + res->res = -2; + res->hardlink_to = n; + found = true; + } + + return found; +} + +/* Update the FILES marked as hardlink in RESA. */ +static void +update_hardlinks (int nr_files, char *files[], struct file_result *resa) +{ + int i; + + /* Update hardlinks. */ + for (i = 0; i < nr_files; i++) + { + struct file_result *res = &resa[i]; + const char *file = files[i]; + size_t n; + if (res->res != -2) + continue; + n = res->hardlink_to; + + /* If a hardlink to this has been processed before + and we didn't change it, just assume the same + state. */ + if (resa[n].res == 1) + { + if (tracing) + fprintf (stderr, "Skipping hardlink %s to unchanged file\n", + file); + continue; + } + + /* If it changed, try to hardlink it again. */ + if (resa[n].res == 0) + { + size_t len = strlen (file); + char *filename = alloca (len + sizeof (".#dwz#.XXXXXX")); + int fd2; + if (tracing) + fprintf (stderr, "Updating hardlink %s to changed file\n", + file); + memcpy (filename, file, len); + memcpy (filename + len, ".#dwz#.XXXXXX", + sizeof (".#dwz#.XXXXXX")); + fd2 = mkstemp (filename); + if (fd2 >= 0) + { + close (fd2); + unlink (filename); + if (link (files[n], filename) == 0) + { + if (rename (filename, file) == 0) + ; + else + unlink (filename); + } + } + } + } +} + +/* Encode child process exit status. */ +static int +encode_child_exit_status (int thisret, struct file_result *res) +{ + assert (thisret == 0 || thisret == 1); + if (thisret == 0 && res->low_mem_p) + thisret = 2; + assert (res->res >= -3 && res->res <= 1); + return (thisret + + ((res->res + 3) << 2) + + ((res->skip_multifile ? 1 : 0) << 5)); +} + +/* Decode child process exit status. */ +static int +decode_child_exit_status (int state, struct file_result *res) +{ + int ret; + if (!WIFEXITED (state)) + error (1, 0, "Child dwz process got killed"); + int status = WEXITSTATUS (state); + ret = status & 0x3; + status >>= 2; + + res->low_mem_p = false; + if (ret == 2) + { + ret = 0; + res->low_mem_p = true; + } + + res->res = (int)(status & 0x7) - 3; + status >>= 3; + + res->skip_multifile = (status & 0x1) ? true : false; + + return ret; +} + +/* Wait on child exit with PID, update PIDS and RES. */ +static void +wait_child_exit (pid_t pid, pid_t *pids, int nr_pids, + struct file_result *resa) +{ + int state; + pid_t got_pid = waitpid (pid, &state, 0); + + int i; + for (i = 0; i < nr_pids; ++i) + if (pids[i] == got_pid) + { + pids[i] = 0; + break; + } + assert (i < nr_pids); + + resa[i].ret = decode_child_exit_status (state, &resa[i]); +} + +static int *workset; +static int workset_size = 0; +int current_multifile_owner = -1; +int current_multifile_owner_file_idx = -1; + +/* Wait on exit of chilren in PIDS, update RESA. */ +static void +wait_children_exit (pid_t *pids, int nr_files, struct file_result *resa) +{ + int i; + for (i = 0; i < nr_files; i++) + { + struct file_result *res = &resa[i]; + if (pids[i] == 0) + continue; + wait_child_exit (pids[i], &pids[i], 1, res); + if (current_multifile_owner_file_idx == -1 + || i < current_multifile_owner_file_idx) + continue; + assert (i == current_multifile_owner_file_idx); + current_multifile_owner++; + if (current_multifile_owner == workset_size) + continue; + current_multifile_owner_file_idx + = workset[current_multifile_owner]; + pass_token (current_multifile_owner); + } +} + +/* Dwarf-compress FILES. If HARDLINK, detect if some files are hardlinks and + if so, dwarf-compress just one, and relink the others. */ +static int +dwz_files_1 (int nr_files, char *files[], bool hardlink, + struct file_result *resa) +{ + int ret = 0; + int i, j; + const char *file; + int successcount = 0; + + for (i = 0; i < nr_files; ++i) + init_file_result (&resa[i]); + + if (multifile) + { + if (multifile_force_ptr_size) + multi_ptr_size = multifile_force_ptr_size; + if (multifile_force_endian) + multi_endian = multifile_force_endian; + + multi_info_fd = make_temp_file ("dwz.debug_info"); + multi_abbrev_fd = make_temp_file ("dwz.debug_abbrev"); + multi_line_fd = make_temp_file ("dwz.debug_line"); + multi_str_fd = make_temp_file ("dwz.debug_str"); + multi_macro_fd = make_temp_file ("dwz.debug_macro"); + if (multi_info_fd == -1 + || multi_abbrev_fd == -1 + || multi_line_fd == -1 + || multi_str_fd == -1 + || multi_macro_fd == -1) + { + error (0, 0, "Could not create multifile temporary files"); + multifile = NULL; + } + } + + if (hardlink) + hardlink = detect_hardlinks (nr_files, files, resa); + + workset = malloc (nr_files * sizeof (int)); + if (workset == NULL) + error (1, ENOMEM, "failed to allocate workset array"); + for (i = 0; i < nr_files; i++) + { + struct file_result *res = &resa[i]; + if (res->res == -2) + /* Skip hard links. */ + continue; + workset[workset_size] = i; + workset_size++; + } + + bool initial_parallel_p = max_forks > 1; + if (initial_parallel_p && multifile) + { + if (multifile_force_ptr_size != 0 && multifile_force_endian != 0) + { + write_multifile_parallel_p = true; + pipes = malloc (workset_size * 2 * sizeof (int)); + if (pipes == NULL) + error (1, ENOMEM, "failed to allocate pipes array"); + for (i = 0; i < workset_size; i++) + { + int fds[2]; + if (pipe (fds) != 0) + error (1, ENOMEM, "failed to initialize pipe"); + pipes[i].readfd = fds[0]; + pipes[i].writefd = fds[1]; + } + } + else + initial_parallel_p = false; + } + if (initial_parallel_p) + { + pid_t pids[nr_files]; + int nr_forks = 0; + for (i = 0; i < nr_files; i++) + pids[i] = 0; + for (j = 0; j < workset_size; j++) + { + int i = workset[j]; + + if (nr_forks == max_forks) + { + if (multifile == NULL) + wait_child_exit (-1, pids, i, resa); + else + { + int k = current_multifile_owner_file_idx; + wait_child_exit (pids[k], &pids[k], 1, &resa[k]); + current_multifile_owner++; + current_multifile_owner_file_idx + = workset[current_multifile_owner]; + pass_token (current_multifile_owner); + } + nr_forks--; + } + + pid_t fork_res = fork (); + assert (fork_res != -1); + if (fork_res == 0) + { + child_id = j; + file = files[i]; + struct file_result *res = &resa[i]; + int thisret = dwz_with_low_mem (file, NULL, res); + return encode_child_exit_status (thisret, res); + } + else + { + if (multifile && j == 0) + { + current_multifile_owner = j; + current_multifile_owner_file_idx + = workset[current_multifile_owner]; + pass_token (current_multifile_owner); + } + pids[i] = fork_res; + nr_forks++; + } + } + if (nr_forks > 0) + wait_children_exit (pids, nr_files, resa); + } + else + { + for (j = 0; j < workset_size; j++) + { + int i = workset[j]; + file = files[i]; + struct file_result *res = &resa[i]; + if (stats_p) + init_stats (file); + res->ret = dwz_with_low_mem (file, NULL, res); + } + } + + for (j = 0; j < workset_size; j++) + { + int i = workset[j]; + struct file_result *res = &resa[i]; + int thisret = res->ret; + if (thisret == 1) + ret = 1; + else if (!res->low_mem_p && !res->skip_multifile && res->res >= 0) + successcount++; + } + + if (hardlink) + update_hardlinks (nr_files, files, resa); + + if (multifile == NULL) + return ret; + + if (successcount < 2) + { + error (0, 0, "Too few files for multifile optimization"); + return ret; + } + + if (write_multifile_parallel_p) + { + multi_info_off = lseek (multi_info_fd, 0L, SEEK_END); + multi_abbrev_off = lseek (multi_abbrev_fd, 0L, SEEK_END); + multi_line_off = lseek (multi_line_fd, 0L, SEEK_END); + multi_str_off = lseek (multi_str_fd, 0L, SEEK_END); + multi_macro_off = lseek (multi_macro_fd, 0L, SEEK_END); + } + if (multi_info_off == 0 && multi_str_off == 0 && multi_macro_off == 0) + { + if (!quiet) + error (0, 0, "No suitable DWARF found for multifile optimization"); + return ret; + } + + if (write_multifile_parallel_p) + { + /* We reproduce here what happens when we run sequentially. This is a + kludge that probably needs to be replaced by IPC. */ + for (i = 0; i < nr_files; i++) + { + struct file_result *res = &resa[i]; + if (!res->low_mem_p && !res->skip_multifile && res->res >= 0) + { + int fd = open (files[i], O_RDONLY); + if (fd < 0) + return ret; + DSO *dso = fdopen_dso (fd, files[i]); + if (dso == NULL) + { + close (fd); + return ret; + } + assert (multi_ehdr.e_ident[0] == '\0'); + multi_ehdr = dso->ehdr; + break; + } + } + } + + unsigned int multifile_die_count = 0; + int multi_fd = optimize_multifile (&multifile_die_count); + DSO *dso; + if (multi_fd == -1) + return 1; + + dso = read_multifile (multi_fd, multifile_die_count); + if (dso == NULL) + { + ret = 1; + goto cleanup; + } + + workset_size = 0; + for (i = 0; i < nr_files; i++) + { + struct file_result *res = &resa[i]; + /* Don't process again files that couldn't + be processed successfully. Also skip hard links. */ + if (res->res == -1 || res->res == -2 + || res->skip_multifile) + continue; + workset[workset_size] = i; + workset_size++; + } + + bool finalize_multifile_parallel_p = max_forks > 1; + if (finalize_multifile_parallel_p) + { + pid_t pids[nr_files]; + int nr_forks = 0; + for (i = 0; i < nr_files; i++) + pids[i] = 0; + for (j = 0; j < workset_size; j++) + { + int i = workset[j]; + + if (nr_forks == max_forks) + { + wait_child_exit (-1, pids, i, resa); + nr_forks--; + } + + pid_t fork_res = fork (); + assert (fork_res != -1); + if (fork_res == 0) + { + file = files[i]; + struct file_result *res = &resa[i]; + multifile_mode = MULTIFILE_MODE_FI; + int thisret = dwz (file, NULL, res); + return encode_child_exit_status (thisret, res); + } + else + { + pids[i] = fork_res; + nr_forks++; + } + } + if (nr_forks > 0) + wait_children_exit (pids, nr_files, resa); + } + else + { + for (j = 0; j < workset_size; j++) + { + int i = workset[j]; + struct file_result *res = &resa[i]; + dw_cu_ref cu; + file = files[i]; + if (stats_p) + init_stats (file); + multifile_mode = MULTIFILE_MODE_FI; + for (cu = alt_first_cu; cu; cu = cu->cu_next) + alt_clear_dups (cu->cu_die); + res->ret = dwz (file, NULL, res); + } + } + + for (j = 0; j < workset_size; j++) + { + int i = workset[j]; + struct file_result *res = &resa[i]; + int thisret = res->ret; + ret |= thisret; + } + + if (hardlink) + update_hardlinks (nr_files, files, resa); + + elf_end (dso->elf); + close (multi_fd); + free (dso); + + cleanup: + cleanup (); + + strp_htab = alt_strp_htab; + off_htab = alt_off_htab; + dup_htab = alt_dup_htab; + macro_htab = alt_macro_htab; + ob = alt_ob; + ob2 = alt_ob2; + cleanup (); + pool_destroy (alt_pool); + + return ret; +} + +/* Wrapper around dwz_files_1 that takes care of malloc and free of resa. */ +static int +dwz_files (int nr_files, char *files[], bool hardlink) +{ + int ret; + struct file_result *resa + = (struct file_result *) malloc ((nr_files) * sizeof (*resa)); + if (resa == NULL) + error (1, ENOMEM, "failed to allocate result array"); + + ret = dwz_files_1 (nr_files, files, hardlink, resa); + + free (resa); + return ret; +} + +int +main (int argc, char *argv[]) +{ + int ret; + const char *outfile; + bool hardlink; + int nr_files; + char **files; + + state = XXH64_createState (); + + if (elf_version (EV_CURRENT) == EV_NONE) + error (1, 0, "library out of date"); + + outfile = NULL; + hardlink = false; + parse_args (argc, argv, &hardlink, &outfile); + nr_files = argc - optind; + files = &argv[optind]; + + if (nr_files <= 1) + { + const char *file = nr_files == 0 ? "a.out" : files[0]; + + if (multifile != NULL) + { + error (0, 0, "Too few files for multifile optimization"); + multifile = NULL; + } + + ret = dwz_one_file (file, outfile); + } + else + { + if (outfile != NULL) + error (1, 0, "-o option not allowed for multiple files"); + + ret = dwz_files (nr_files, files, hardlink); + } + + if (stats_p) + free (stats); + + return ret; +} |