/* corefile.c Copyright (C) 1999-2026 Free Software Foundation, Inc. This file is part of GNU Binutils. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, MA 02110-1301, USA. */ #include "config.h" #include "util.h" #include "bfd.h" #include "gp-gmon.h" #include "source.h" #include "symtab.h" #include "safe-ctype.h" #include /* For UINT_MAX. */ #include #include #include #include #include "gp-experiment.h" #include #define _(String) (String) bfd *core_bfd; static int core_num_syms; static asymbol **core_syms; asection *core_text_sect; void * core_text_space; /* Greatest common divisor of instruction sizes and alignments. */ static int insn_boundary; int offset_to_code; /* For mapping symbols to specific .o files during file ordering. */ static struct function_map * symbol_map; static unsigned int symbol_map_count; static int core_sym_class (asymbol *); static bool get_src_info (bfd_vma, const char **, const char **, int *); #define BUFSIZE (1024) /* This is BUFSIZE - 1 as a string. Suitable for use in fprintf/sscanf format strings. 
*/
#define STR_BUFSIZE "1023"

/* Open the object file AOUT_NAME through BFD and load what the rest of
   this file needs from it:

     - core_bfd and core_text_sect (".text", or "$CODE$" as a fallback);
     - core_syms / core_num_syms, the canonical symbol table with any
       synthetic symbols appended and a terminating null pointer;
     - insn_boundary and offset_to_code, chosen from the BFD
       architecture.

   WHOAMI is the program name used to prefix diagnostics.

   Returns 0 on success.  On failure a diagnostic is written to stderr
   and -1 is returned; in that case the BFD opened by this call is
   closed again and core_bfd / core_text_sect are reset to NULL, so no
   handle is leaked and no pointer into a closed BFD is left behind.  */

int
core_init (const char * aout_name, const char *whoami)
{
  /* bfd_get_symtab_upper_bound returns a long; keep the full width.  */
  long core_sym_bytes;
  asymbol *synthsyms;
  long synth_count;

  core_bfd = bfd_openr (aout_name, 0);

  if (!core_bfd)
    {
      perror (aout_name);
      return -1;
    }

  core_bfd->flags |= BFD_DECOMPRESS;

  if (!bfd_check_format (core_bfd, bfd_object))
    {
      fprintf (stderr, _("%s: %s: not in executable format\n"),
	       whoami, aout_name);
      goto fail_bfd;
    }

  /* Get core's text section.  */
  core_text_sect = bfd_get_section_by_name (core_bfd, ".text");
  if (!core_text_sect)
    {
      core_text_sect = bfd_get_section_by_name (core_bfd, "$CODE$");
      if (!core_text_sect)
	{
	  fprintf (stderr, _("%s: can't find .text section in %s\n"),
		   whoami, aout_name);
	  goto fail_bfd;
	}
    }

  /* Read core's symbol table.  */

  /* This will probably give us more than we need, but that's ok.  */
  core_sym_bytes = bfd_get_symtab_upper_bound (core_bfd);
  if (core_sym_bytes < 0)
    {
      fprintf (stderr, "%s: %s: %s\n", whoami, aout_name,
	       bfd_errmsg (bfd_get_error ()));
      goto fail_bfd;
    }

  core_syms = (asymbol **) xmalloc ((size_t) core_sym_bytes);
  core_num_syms = bfd_canonicalize_symtab (core_bfd, core_syms);

  if (core_num_syms < 0)
    {
      fprintf (stderr, "%s: %s: %s\n", whoami, aout_name,
	       bfd_errmsg (bfd_get_error ()));
      goto fail_syms;
    }

  synth_count = bfd_get_synthetic_symtab (core_bfd, core_num_syms, core_syms,
					  0, NULL, &synthsyms);
  if (synth_count > 0)
    {
      asymbol **symp;
      long new_size;
      long i;

      /* Room for the existing symbols, the synthetic ones and the
	 terminating null pointer.  */
      new_size = (core_num_syms + synth_count + 1) * sizeof (*core_syms);
      core_syms = (asymbol **) xrealloc (core_syms, new_size);
      symp = core_syms + core_num_syms;
      core_num_syms += synth_count;
      for (i = 0; i < synth_count; i++)
	*symp++ = synthsyms + i;
      *symp = 0;
    }

  insn_boundary = 1;
  offset_to_code = 0;

  switch (bfd_get_arch (core_bfd))
    {
    case bfd_arch_vax:
      offset_to_code = 2;
      break;

    case bfd_arch_mips:		/* and microMIPS */
    case bfd_arch_powerpc:	/* and VLE */
    case bfd_arch_riscv:	/* and RVC */
    case bfd_arch_sh:
      insn_boundary = 2;
      break;

    case bfd_arch_alpha:
      insn_boundary = 4;
      break;

    default:
      break;
    }

  return 0;

 fail_syms:
  /* The symbol array was allocated by this call and is unusable.  */
  free (core_syms);
  core_syms = NULL;
  core_num_syms = 0;

 fail_bfd:
  /* core_text_sect (if set) points into the BFD being closed.  */
  core_text_sect = NULL;
  bfd_close (core_bfd);
  core_bfd = NULL;
  return -1;
}

/*
Return class of symbol SYM. The returned class can be any of: 0 -> symbol is not interesting to us 'T' -> symbol is a global name 't' -> symbol is a local (static) name. */ static int core_sym_class (asymbol *sym) { symbol_info syminfo; const char *name; char sym_prefix; int i; if (sym->section == NULL || (sym->flags & BSF_DEBUGGING) != 0) return 0; bfd_get_symbol_info (core_bfd, sym, &syminfo); i = syminfo.type; if (i == 'T') return i; /* It's a global symbol. */ if (i == 'W') /* Treat weak symbols as text symbols. FIXME: a weak symbol may also be a data symbol. */ return 'T'; if (i != 't') { /* Not a static text symbol. */ DBG (AOUTDEBUG, printf ("[core_sym_class] %s is of class %c\n", sym->name, i)); return 0; } /* Can't zero-length name or funny characters in name, where `funny' includes: `.' (.o file names) and `$' (Pascal labels). */ if (!sym->name || sym->name[0] == '\0') return 0; for (name = sym->name; *name; ++name) { if (*name == '$') return 0; while (*name == '.') { /* Allow both nested subprograms (which end with ".NNN", where N is a digit) and GCC cloned functions (which contain ".clone"). Allow for multiple iterations of both - apparently GCC can clone clones and subprograms. */ int digit_seen = 0; #define CLONE_NAME ".clone." #define CLONE_NAME_LEN strlen (CLONE_NAME) #define CONSTPROP_NAME ".constprop." #define CONSTPROP_NAME_LEN strlen (CONSTPROP_NAME) if (strlen (name) > CLONE_NAME_LEN && strncmp (name, CLONE_NAME, CLONE_NAME_LEN) == 0) name += CLONE_NAME_LEN - 1; else if (strlen (name) > CONSTPROP_NAME_LEN && strncmp (name, CONSTPROP_NAME, CONSTPROP_NAME_LEN) == 0) name += CONSTPROP_NAME_LEN - 1; for (name++; *name; name++) if (digit_seen && *name == '.') break; else if (ISDIGIT (*name)) digit_seen = 1; else return 0; } } /* On systems where the C compiler adds an underscore to all names, static names without underscores seem usually to be labels in hand written assembler in the library. We don't want these names. 
This is certainly necessary on a Sparc running SunOS 4.1 (try profiling a program that does a lot of division). I don't know whether it has harmful side effects on other systems. Perhaps it should be made configurable. */ sym_prefix = bfd_get_symbol_leading_char (core_bfd); if ((sym_prefix && sym_prefix != sym->name[0]) /* GCC may add special symbols to help gdb figure out the file language. We want to ignore these, since sometimes they mask the real function. (dj@ctron) */ || !strncmp (sym->name, "__gnu_compiled", 14) || !strncmp (sym->name, "___gnu_compiled", 15)) { return 0; } return 't'; /* It's a static text symbol. */ } /* Get whatever source info we can get regarding address ADDR. */ static bool get_src_info (bfd_vma addr, const char **filename, const char **name, int *line_num) { const char *fname = 0, *func_name = 0; int l = 0; if (bfd_find_nearest_line (core_bfd, core_text_sect, core_syms, addr - core_text_sect->vma, &fname, &func_name, (unsigned int *) &l) && fname && func_name && l) { DBG (AOUTDEBUG, printf ("[get_src_info] 0x%lx -> %s:%d (%s)\n", (unsigned long) addr, fname, l, func_name)); *filename = fname; *name = func_name; *line_num = l; return true; } else { DBG (AOUTDEBUG, printf ("[get_src_info] no info for 0x%lx (%s:%d,%s)\n", (unsigned long) addr, fname ? fname : "", l, func_name ? func_name : "")); return false; } } static int search_mapped_symbol (const void * l, const void * r) { return strcmp ((const char *) l, ((const struct function_map *) r)->function_name); } Source_File *first_src_file = 0; Source_File * source_file_lookup_path (const char *path) { Source_File *sf; for (sf = first_src_file; sf; sf = sf->next) { if (FILENAME_CMP (path, sf->name) == 0) break; } if (!sf) { /* Create a new source file descriptor. */ sf = (Source_File *) xmalloc (sizeof (*sf)); memset (sf, 0, sizeof (*sf)); sf->name = xstrdup (path); sf->next = first_src_file; first_src_file = sf; } return sf; } /* Read in symbol table from core. 
One symbol per function is entered.

   WHOAMI prefixes the diagnostic printed when no usable symbol is
   found.  The symbols in core_syms are walked twice: the first walk
   counts the entries that will be created so the table can be
   allocated, the second walk fills them in.  A symbol that
   core_sym_class rejects is skipped.  When a symbol map is loaded, a
   mapped symbol is kept only if it is marked as the first function of
   its file, and the entry is then named after that file.  */

static void
core_create_function_syms (const char *whoami)
{
  Sym_Table *symtab = get_symtab_direct ();
  struct function_map *found = NULL;
  int core_has_func_syms;
  int cxxclass;
  long idx;

  /* For the flavours listed here an entry is flagged as a function
     only when the symbol carries BSF_FUNCTION; for every other
     flavour each accepted symbol is flagged as a function.  */
  switch (core_bfd->xvec->flavour)
    {
    case bfd_target_coff_flavour:
    case bfd_target_ecoff_flavour:
    case bfd_target_xcoff_flavour:
    case bfd_target_elf_flavour:
    case bfd_target_som_flavour:
      core_has_func_syms = 1;
      break;

    default:
      core_has_func_syms = 0;
      break;
    }

  /* Pass 1 - determine upper bound on number of function names.  */
  symtab->len = 0;

  for (idx = 0; idx < core_num_syms; idx++)
    {
      asymbol *sym = core_syms[idx];

      if (core_sym_class (sym) == 0)
	continue;

      /* Don't create a symtab entry for a function that has
	 a mapping to a file, unless it's the first function
	 in the file.  */
      if (symbol_map_count != 0)
	{
	  /* Note: some systems (SunOS 5.8) crash if bsearch base argument
	     is NULL.  */
	  found = (struct function_map *) bsearch
	    (sym->name, symbol_map, symbol_map_count,
	     sizeof (struct function_map), search_mapped_symbol);
	}

      if (found != NULL && !found->is_first)
	continue;

      ++symtab->len;
    }

  if (symtab->len == 0)
    {
      fprintf (stderr, _("%s: file has no symbols\n"), whoami);
      done (1);
    }

  symtab->base = (Sym *) xmalloc (symtab->len * sizeof (Sym));

  /* Pass 2 - create symbols.  */
  symtab->limit = symtab->base;

  for (idx = 0; idx < core_num_syms; idx++)
    {
      asymbol *sym = core_syms[idx];
      Sym *entry;
      const char *filename;
      const char *func_name;

      cxxclass = core_sym_class (sym);
      if (cxxclass == 0)
	{
	  DBG (AOUTDEBUG,
	       printf ("[core_create_function_syms] rejecting: 0x%lx %s\n",
		       (unsigned long) sym->value, sym->name));
	  continue;
	}

      if (symbol_map_count != 0)
	{
	  /* Note: some systems (SunOS 5.8) crash if bsearch base argument
	     is NULL.  */
	  found = (struct function_map *) bsearch
	    (sym->name, symbol_map, symbol_map_count,
	     sizeof (struct function_map), search_mapped_symbol);
	}

      if (found != NULL && !found->is_first)
	continue;

      /* The slot at symtab->limit is filled in place and only claimed
	 by the increment at the bottom of the loop.  */
      entry = symtab->limit;
      sym_init (entry);

      /* Symbol offsets are always section-relative.  */
      entry->addr = sym->value;
      if (sym->section)
	entry->addr += bfd_section_vma (sym->section);

      if (found != NULL)
	{
	  entry->name = found->file_name;
	  entry->mapped = 1;
	}
      else
	{
	  entry->name = sym->name;
	  entry->mapped = 0;
	}

      /* Lookup filename and line number, if we can.  */
      if (get_src_info (entry->addr, &filename, &func_name,
			&entry->line_num))
	{
	  entry->file = source_file_lookup_path (filename);

	  /* FIXME: Checking __osf__ here does not work with a cross
	     gprof.  */
#ifdef __osf__
	  /* Suppress symbols that are not function names.  This is
	     useful to suppress code-labels and aliases.

	     This is known to be useful under DEC's OSF/1.  Under SunOS 4.x,
	     labels do not appear in the symbol table info, so this isn't
	     necessary.  */

	  if (strcmp (entry->name, func_name) != 0)
	    {
	      /* The symbol's address maps to a different name, so
		 it can't be a function-entry point.  This happens
		 for labels, for example.  */
	      DBG (AOUTDEBUG,
		   printf ("[core_create_function_syms: rej %s (maps to %s)\n",
			   entry->name, func_name));
	      continue;
	    }
#endif
	}

      entry->is_func = (!core_has_func_syms
			|| (sym->flags & BSF_FUNCTION) != 0);
      entry->is_bb_head = true;

      if (cxxclass == 't')
	entry->is_static = true;

      DBG (AOUTDEBUG, printf ("[core_create_function_syms] %ld %s 0x%lx\n",
			      (long) (symtab->limit - symtab->base),
			      symtab->limit->name,
			      (unsigned long) symtab->limit->addr));
      ++symtab->limit;
    }

  /* Pass 1 only gave an upper bound; record how many were created.  */
  symtab->len = symtab->limit - symtab->base;
  symtab_finalize (symtab);
}

/* Initialize the symbol table by creating one entry per function
   symbol of the core file.  WHOAMI is passed through for use in
   diagnostics.  */

void
symtab_init (const char *whoami)
{
  core_create_function_syms (whoami);
}