blob: 46a81153921760c833e31258bca347483e842741 [file]
/* corefile.c
Copyright (C) 1999-2026 Free Software Foundation, Inc.
This file is part of GNU Binutils.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street - Fifth Floor, Boston, MA
02110-1301, USA. */
#include "config.h"
#include "util.h"
#include "bfd.h"
#include "gp-gmon.h"
#include "source.h"
#include "symtab.h"
#include "safe-ctype.h"
#include <limits.h> /* For UINT_MAX. */
#include <stdio.h>
#include <unistd.h>
#include <stdint.h>
#include <sys/mman.h>
#include "gp-experiment.h"
#include <filenames.h>
#define _(String) (String)
/* BFD handle for the file named by core_init's AOUT_NAME argument;
   opened there with bfd_openr.  */
bfd *core_bfd;
/* Number of entries in core_syms.  Set from bfd_canonicalize_symtab in
   core_init and increased by the number of synthetic symbols, if any.  */
static int core_num_syms;
/* Symbol pointer array filled in by bfd_canonicalize_symtab.  When
   synthetic symbols exist, core_init appends pointers to them and a
   terminating null pointer.  */
static asymbol **core_syms;
/* The ".text" section of core_bfd or, failing that, the "$CODE$"
   section; looked up in core_init.  */
asection *core_text_sect;
/* NOTE(review): not referenced by the code visible in this file;
   presumably storage for the text section contents -- confirm against
   other users of this symbol.  */
void * core_text_space;
/* Greatest common divisor of instruction sizes and alignments.
   core_init sets it from the BFD architecture (1 by default).  */
static int insn_boundary;
/* core_init sets this to 2 for bfd_arch_vax and to 0 for every other
   architecture.  NOTE(review): presumably the offset from a function's
   symbol address to its first instruction -- confirm with the users.  */
int offset_to_code;
/* For mapping symbols to specific .o files during file ordering.
   symbol_map is searched with bsearch, with symbol_map_count as the
   element count.  */
static struct function_map * symbol_map;
static unsigned int symbol_map_count;
/* Forward declarations of helpers defined later in this file.  */
static int core_sym_class (asymbol *);
static bool get_src_info
(bfd_vma, const char **, const char **, int *);
/* Buffer size.  NOTE(review): neither macro below is used by the code
   visible in this file.  */
#define BUFSIZE (1024)
/* This is BUFSIZE - 1 as a string.  Suitable for use in fprintf/sscanf
   format strings.  Must be kept in sync with BUFSIZE by hand.  */
#define STR_BUFSIZE "1023"
/* Open the file AOUT_NAME with BFD and set up the state the rest of
   this file works from: core_bfd, core_text_sect, the canonical symbol
   table in core_syms/core_num_syms (extended with any synthetic
   symbols), and the architecture dependent insn_boundary and
   offset_to_code values.

   WHOAMI is the program name used to prefix most diagnostics.

   Returns 0 on success.  On failure a message is written to stderr and
   -1 is returned; anything already stored in the globals is left as
   is.  */
int
core_init (const char * aout_name, const char *whoami)
{
  int symtab_bytes;
  asymbol *synth_syms;
  long num_synth;

  core_bfd = bfd_openr (aout_name, 0);
  if (core_bfd == NULL)
    {
      perror (aout_name);
      return -1;
    }

  core_bfd->flags |= BFD_DECOMPRESS;
  if (!bfd_check_format (core_bfd, bfd_object))
    {
      fprintf (stderr, _("%s: %s: not in executable format\n"), whoami, aout_name);
      return -1;
    }

  /* Locate the text section, trying the "$CODE$" name when there is no
     ".text".  */
  core_text_sect = bfd_get_section_by_name (core_bfd, ".text");
  if (core_text_sect == NULL)
    core_text_sect = bfd_get_section_by_name (core_bfd, "$CODE$");
  if (core_text_sect == NULL)
    {
      fprintf (stderr, _("%s: can't find .text section in %s\n"),
	       whoami, aout_name);
      return -1;
    }

  /* Read the symbol table.  The upper bound is probably more than is
     needed, but that's ok.  */
  symtab_bytes = bfd_get_symtab_upper_bound (core_bfd);
  if (symtab_bytes < 0)
    {
      fprintf (stderr, "%s: %s: %s\n", whoami, aout_name,
	       bfd_errmsg (bfd_get_error ()));
      return -1;
    }

  core_syms = (asymbol **) xmalloc (symtab_bytes);
  core_num_syms = bfd_canonicalize_symtab (core_bfd, core_syms);
  if (core_num_syms < 0)
    {
      fprintf (stderr, "%s: %s: %s\n", whoami, aout_name,
	       bfd_errmsg (bfd_get_error ()));
      return -1;
    }

  /* Append pointers to the synthetic symbols, if there are any, and
     terminate the enlarged array with a null pointer.  */
  num_synth = bfd_get_synthetic_symtab (core_bfd, core_num_syms, core_syms,
					0, NULL, &synth_syms);
  if (num_synth > 0)
    {
      long total = core_num_syms + num_synth;
      long bytes_needed = (total + 1) * sizeof (*core_syms);
      long k;

      core_syms = (asymbol **) xrealloc (core_syms, bytes_needed);
      for (k = 0; k < num_synth; k++)
	core_syms[core_num_syms + k] = &synth_syms[k];
      core_syms[total] = 0;
      core_num_syms = total;
    }

  /* Architecture specific settings; everything not listed keeps the
     defaults assigned here.  */
  insn_boundary = 1;
  offset_to_code = 0;
  switch (bfd_get_arch (core_bfd))
    {
    case bfd_arch_alpha:
      insn_boundary = 4;
      break;

    case bfd_arch_mips:		/* and microMIPS */
    case bfd_arch_powerpc:	/* and VLE */
    case bfd_arch_riscv:	/* and RVC */
    case bfd_arch_sh:
      insn_boundary = 2;
      break;

    case bfd_arch_vax:
      offset_to_code = 2;
      break;

    default:
      break;
    }

  return 0;
}
/* Return class of symbol SYM.  The returned class can be any of:
	0   -> symbol is not interesting to us
	'T' -> symbol is a global name
	't' -> symbol is a local (static) name.

   Symbols without a section or with BSF_DEBUGGING set are rejected up
   front.  The type letter reported by bfd_get_symbol_info then decides:
   'T' is returned as is, 'W' (weak) is reported as 'T', and anything
   other than 't' is rejected.  Only 't' symbols go through the name
   filtering below.  */
static int
core_sym_class (asymbol *sym)
{
  symbol_info syminfo;
  const char *name;
  char sym_prefix;
  int i;

  if (sym->section == NULL || (sym->flags & BSF_DEBUGGING) != 0)
    return 0;

  bfd_get_symbol_info (core_bfd, sym, &syminfo);
  i = syminfo.type;

  if (i == 'T')
    return i;			/* It's a global symbol.  */

  if (i == 'W')
    /* Treat weak symbols as text symbols.  FIXME: a weak symbol may
       also be a data symbol.  */
    return 'T';

  if (i != 't')
    {
      /* Not a static text symbol.  */
      DBG (AOUTDEBUG, printf ("[core_sym_class] %s is of class %c\n",
			      sym->name, i));
      return 0;
    }

  /* Can't have a zero-length name or funny characters in the name,
     where `funny' includes: `.' (.o file names) and `$' (Pascal
     labels).  */
  if (!sym->name || sym->name[0] == '\0')
    return 0;

  for (name = sym->name; *name; ++name)
    {
      if (*name == '$')
	return 0;

      while (*name == '.')
	{
	  /* Allow both nested subprograms (which end with ".NNN", where N is
	     a digit) and GCC cloned functions (which contain ".clone").
	     Allow for multiple iterations of both - apparently GCC can clone
	     clones and subprograms.  */
	  int digit_seen = 0;
#define CLONE_NAME ".clone."
#define CLONE_NAME_LEN strlen (CLONE_NAME)
#define CONSTPROP_NAME ".constprop."
#define CONSTPROP_NAME_LEN strlen (CONSTPROP_NAME)

	  /* Skip a ".clone." or ".constprop." marker, leaving NAME on the
	     marker's final '.' so the digit scan starts right after it.
	     The length test guarantees at least one character follows.  */
	  if (strlen (name) > CLONE_NAME_LEN
	      && strncmp (name, CLONE_NAME, CLONE_NAME_LEN) == 0)
	    name += CLONE_NAME_LEN - 1;
	  else if (strlen (name) > CONSTPROP_NAME_LEN
		   && strncmp (name, CONSTPROP_NAME, CONSTPROP_NAME_LEN) == 0)
	    name += CONSTPROP_NAME_LEN - 1;

	  /* Everything after the '.' must be digits, optionally followed
	     by another '.' that starts the next suffix.  */
	  for (name++; *name; name++)
	    {
	      if (digit_seen && *name == '.')
		break;
	      else if (ISDIGIT (*name))
		digit_seen = 1;
	      else
		return 0;
	    }
	}

      /* The suffix scan may have consumed the rest of the string.  Stop
	 here, otherwise the increment of the enclosing loop would step
	 past the terminating NUL and read beyond the end of the name.  */
      if (*name == '\0')
	break;
    }

  /* On systems where the C compiler adds an underscore to all
     names, static names without underscores seem usually to be
     labels in hand written assembler in the library.  We don't want
     these names.  This is certainly necessary on a Sparc running
     SunOS 4.1 (try profiling a program that does a lot of
     division).  I don't know whether it has harmful side effects on
     other systems.  Perhaps it should be made configurable.  */
  sym_prefix = bfd_get_symbol_leading_char (core_bfd);

  if ((sym_prefix && sym_prefix != sym->name[0])
      /* GCC may add special symbols to help gdb figure out the file
	 language.  We want to ignore these, since sometimes they mask
	 the real function.  (dj@ctron)  */
      || !strncmp (sym->name, "__gnu_compiled", 14)
      || !strncmp (sym->name, "___gnu_compiled", 15))
    {
      return 0;
    }

  return 't';			/* It's a static text symbol.  */
}
/* Look up source information for address ADDR via
   bfd_find_nearest_line on the text section.

   When a file name, a function name and a non-zero line number are all
   available they are stored through FILENAME, NAME and LINE_NUM and
   true is returned.  Otherwise false is returned and the three output
   locations are not written.  */
static bool
get_src_info (bfd_vma addr, const char **filename, const char **name,
	      int *line_num)
{
  const char *src_file = 0;
  const char *src_func = 0;
  int src_line = 0;
  bool located;

  located = bfd_find_nearest_line (core_bfd, core_text_sect, core_syms,
				   addr - core_text_sect->vma,
				   &src_file, &src_func,
				   (unsigned int *) &src_line);

  /* A partial answer is treated the same as no answer at all.  */
  if (!located || !src_file || !src_func || !src_line)
    {
      DBG (AOUTDEBUG, printf ("[get_src_info] no info for 0x%lx (%s:%d,%s)\n",
			      (unsigned long) addr,
			      src_file ? src_file : "<unknown>", src_line,
			      src_func ? src_func : "<unknown>"));
      return false;
    }

  DBG (AOUTDEBUG, printf ("[get_src_info] 0x%lx -> %s:%d (%s)\n",
			  (unsigned long) addr, src_file, src_line, src_func));
  *filename = src_file;
  *name = src_func;
  *line_num = src_line;
  return true;
}
/* Comparison callback for bsearch over an array of struct function_map.
   L is the key, a NUL-terminated symbol name; R points to the array
   element under test.  The result is that of strcmp between the key and
   the element's function_name.  */
static int
search_mapped_symbol (const void * l, const void * r)
{
  const char *wanted = (const char *) l;
  const struct function_map *entry = (const struct function_map *) r;

  return strcmp (wanted, entry->function_name);
}
/* Head of the singly linked list of source file descriptors; new
   descriptors are pushed at the front.  */
Source_File *first_src_file = 0;

/* Return the source file descriptor whose name matches PATH according
   to FILENAME_CMP.  If none exists yet, a zero-filled descriptor holding
   a private copy of PATH is created, linked in at the head of the list
   and returned.  */
Source_File *
source_file_lookup_path (const char *path)
{
  Source_File *entry = first_src_file;

  while (entry)
    {
      if (FILENAME_CMP (path, entry->name) == 0)
	return entry;
      entry = entry->next;
    }

  /* Not known yet: create a new source file descriptor.  */
  entry = (Source_File *) xmalloc (sizeof (*entry));
  memset (entry, 0, sizeof (*entry));
  entry->name = xstrdup (path);
  entry->next = first_src_file;
  first_src_file = entry;

  return entry;
}
/* Read in symbol table from core.
One symbol per function is entered. */
static void
core_create_function_syms (const char *whoami)
{
int cxxclass;
long i;
struct function_map * found = NULL;
int core_has_func_syms = 0;
Sym_Table *symtab = get_symtab_direct ();
switch (core_bfd->xvec->flavour)
{
default:
break;
case bfd_target_coff_flavour:
case bfd_target_ecoff_flavour:
case bfd_target_xcoff_flavour:
case bfd_target_elf_flavour:
case bfd_target_som_flavour:
core_has_func_syms = 1;
}
/* Pass 1 - determine upper bound on number of function names. */
symtab->len = 0;
for (i = 0; i < core_num_syms; ++i)
{
if (!core_sym_class (core_syms[i]))
continue;
/* Don't create a symtab entry for a function that has
a mapping to a file, unless it's the first function
in the file. */
if (symbol_map_count != 0)
{
/* Note: some systems (SunOS 5.8) crash if bsearch base argument
is NULL. */
found = (struct function_map *) bsearch
(core_syms[i]->name, symbol_map, symbol_map_count,
sizeof (struct function_map), search_mapped_symbol);
}
if (found == NULL || found->is_first)
++symtab->len;
}
if (symtab->len == 0)
{
fprintf (stderr, _("%s: file has no symbols\n"), whoami);
done (1);
}
symtab->base = (Sym *) xmalloc (symtab->len * sizeof (Sym));
/* Pass 2 - create symbols. */
symtab->limit = symtab->base;
for (i = 0; i < core_num_syms; ++i)
{
asection *sym_sec;
cxxclass = core_sym_class (core_syms[i]);
if (!cxxclass)
{
DBG (AOUTDEBUG,
printf ("[core_create_function_syms] rejecting: 0x%lx %s\n",
(unsigned long) core_syms[i]->value,
core_syms[i]->name));
continue;
}
if (symbol_map_count != 0)
{
/* Note: some systems (SunOS 5.8) crash if bsearch base argument
is NULL. */
found = (struct function_map *) bsearch
(core_syms[i]->name, symbol_map, symbol_map_count,
sizeof (struct function_map), search_mapped_symbol);
}
if (found && ! found->is_first)
continue;
sym_init (symtab->limit);
/* Symbol offsets are always section-relative. */
sym_sec = core_syms[i]->section;
symtab->limit->addr = core_syms[i]->value;
if (sym_sec)
symtab->limit->addr += bfd_section_vma (sym_sec);
if (found)
{
symtab->limit->name = found->file_name;
symtab->limit->mapped = 1;
}
else
{
symtab->limit->name = core_syms[i]->name;
symtab->limit->mapped = 0;
}
/* Lookup filename and line number, if we can. */
{
const char * filename;
const char * func_name;
if (get_src_info (symtab->limit->addr, & filename, & func_name,
& symtab->limit->line_num))
{
symtab->limit->file = source_file_lookup_path (filename);
/* FIXME: Checking __osf__ here does not work with a cross
gprof. */
#ifdef __osf__
/* Suppress symbols that are not function names. This is
useful to suppress code-labels and aliases.
This is known to be useful under DEC's OSF/1. Under SunOS 4.x,
labels do not appear in the symbol table info, so this isn't
necessary. */
if (strcmp (symtab->limit->name, func_name) != 0)
{
/* The symbol's address maps to a different name, so
it can't be a function-entry point. This happens
for labels, for example. */
DBG (AOUTDEBUG,
printf ("[core_create_function_syms: rej %s (maps to %s)\n",
symtab->limit->name, func_name));
continue;
}
#endif
}
}
symtab->limit->is_func = (!core_has_func_syms
|| (core_syms[i]->flags & BSF_FUNCTION) != 0);
symtab->limit->is_bb_head = true;
if (cxxclass == 't')
symtab->limit->is_static = true;
DBG (AOUTDEBUG, printf ("[core_create_function_syms] %ld %s 0x%lx\n",
(long) (symtab->limit - symtab->base),
symtab->limit->name,
(unsigned long) symtab->limit->addr));
++symtab->limit;
}
symtab->len = symtab->limit - symtab->base;
symtab_finalize (symtab);
}
/* Initialize the symbol table.

   This is a thin public wrapper: all of the work is done by
   core_create_function_syms, to which WHOAMI is forwarded unchanged
   (it is used there to prefix the "file has no symbols" diagnostic).  */
void
symtab_init (const char *whoami)
{
core_create_function_syms (whoami);
}