aboutsummaryrefslogtreecommitdiff
path: root/elf/sprof.c
diff options
context:
space:
mode:
authorUlrich Drepper <drepper@redhat.com>1998-03-02 18:02:11 +0000
committerUlrich Drepper <drepper@redhat.com>1998-03-02 18:02:11 +0000
commitae828bc6f9a3ff47cb92846f71a9a7f8c6d5c941 (patch)
treebb606d530a4fb73de56d29c0a3433f6fe7f4ac27 /elf/sprof.c
parentfb973e7f76fae77b6678921bc689960b65acf7ad (diff)
downloadglibc-ae828bc6f9a3ff47cb92846f71a9a7f8c6d5c941.tar
glibc-ae828bc6f9a3ff47cb92846f71a9a7f8c6d5c941.tar.gz
glibc-ae828bc6f9a3ff47cb92846f71a9a7f8c6d5c941.tar.bz2
glibc-ae828bc6f9a3ff47cb92846f71a9a7f8c6d5c941.zip
Update.
1998-03-02 17:55 Ulrich Drepper <drepper@cygnus.com> * sysdeps/i386/add_n.S: Change to use ENTRY and END macro. * sysdeps/i386/addmul_1.S: Likewise. * sysdeps/i386/lshift.S: Likewise. * sysdeps/i386/mul_1.S: Likewise. * sysdeps/i386/rshift.S: Likewise. * sysdeps/i386/sub_n.S: Likewise. * sysdeps/i386/submul_1.S: Likewise. * sysdeps/i386/i586/add_n.S: Likewise. * sysdeps/i386/i586/addmul_1.S: Likewise. * sysdeps/i386/i586/lshift.S: Likewise. * sysdeps/i386/i586/mul_1.S: Likewise. * sysdeps/i386/i586/rshift.S: Likewise. * sysdeps/i386/i586/sub_n.S: Likewise. * sysdeps/i386/i586/submul_1.S: Likewise. * sysdeps/i386/sysdep.h: Extend last change. * sysdeps/unix/sysv/linux/i386/sysdep.h: Follow Intel's advice to have only one exit point for functions. 1998-03-02 Ulrich Drepper <drepper@cygnus.com> * configure.in: Fix msgfmt test. Fix handling of //s in sysdeps search. 1998-03-02 13:28 Ulrich Drepper <drepper@cygnus.com> * Makerules: Generate libc.so with absolute paths for the used shared objects. * config.make.in: Add MAKEINFO definition. 1998-03-02 Ulrich Drepper <drepper@cygnus.com> * sysdeps/i386/sysdep.h (ASM_SIZE_DIRECTIVE): Add ; at the end. (ENTRY): Use STABS_FUN. (END): Use STABS_FUN_END. (STABS_FUN, STABS_FUN2, STABS_FUN_END): New macro to emit stabs info. * elf/Makefile: Add rules to build sprof program. * elf/sprof.c: New file. 1998-02-28 Andreas Jaeger <aj@arthur.rhein-neckar.de> * misc/syslog.c (openlog_internal): Insert missing closing brace. 1998-02-06 Andreas Jaeger <aj@arthur.rhein-neckar.de> * configure.in: Check for working msgfmt version (from GNU gettext 0.10 or later). 1998-03-02 Ulrich Drepper <drepper@cygnus.com> * configure.in: Avoid //s in sysdirs. Patch by Roland McGrath. * stdlib/a64l.c (a64l): Rewrite by Joe Keane <jgk@jgk.org>. 1998-03-02 07:17 H.J. Lu <hjl@gnu.org> * elf/dl-open.c (_dl_open): Update _dl_global_scope_end when setting _dl_global_scope for RTLD_GLOBAL. 1998-02-27 Andreas Schwab <schwab@issan.informatik.uni-dortmund.de> * sysdeps/unix/make-syscalls.sh: Fix last change so that all possible lists of object-suffixes are taken care of. 1998-03-02 10:16 Ulrich Drepper <drepper@cygnus.com> * timezone/private.h: Update from tzcode1998c. * timezone/zic.c: Likewise. * timezone/antarctica: Updated from tzdata1998c. * timezone/asia: Likewise. * timezone/australasia: Likewise. * timezone/europe: Likewise. * timezone/southamerica: Likewise. 1998-03-02 Ulrich Drepper <drepper@cygnus.com> * posix/glob.c (glob_in_dir): Add support for cases insensitive VMS. Patch by John W. Eaton <jwe@bevo.che.wisc.edu>.
Diffstat (limited to 'elf/sprof.c')
-rw-r--r--elf/sprof.c937
1 files changed, 937 insertions, 0 deletions
diff --git a/elf/sprof.c b/elf/sprof.c
new file mode 100644
index 0000000000..0d50806126
--- /dev/null
+++ b/elf/sprof.c
@@ -0,0 +1,937 @@
+/* Read and display shared object profiling data.
+ Copyright (C) 1997, 1998 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+ Contributed by Ulrich Drepper <drepper@cygnus.com>, 1997.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Library General Public License as
+ published by the Free Software Foundation; either version 2 of the
+ License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Library General Public License for more details.
+
+ You should have received a copy of the GNU Library General Public
+ License along with the GNU C Library; see the file COPYING.LIB. If not,
+ write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+ Boston, MA 02111-1307, USA. */
+
+#include <argp.h>
+#include <dlfcn.h>
+#include <elf.h>
+#include <endian.h>
+#include <error.h>
+#include <fcntl.h>
+#include <inttypes.h>
+#include <libintl.h>
+#include <link.h>
+#include <locale.h>
+#include <obstack.h>
+#include <search.h>
+#include <stab.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <unistd.h>
+#include <sys/gmon.h>
+#include <sys/gmon_out.h>
+#include <sys/mman.h>
+#include <sys/param.h>
+#include <sys/stat.h>
+
+/* Undefine the following line line in the production version. */
+/* #define _NDEBUG 1 */
+#include <assert.h>
+
+/* Get libc version number. */
+#include "../version.h"
+
+#define PACKAGE _libc_intl_domainname
+
+
+#include <endian.h>
+#if BYTE_ORDER == BIG_ENDIAN
+#define byteorder ELFDATA2MSB
+#define byteorder_name "big-endian"
+#elif BYTE_ORDER == LITTLE_ENDIAN
+#define byteorder ELFDATA2LSB
+#define byteorder_name "little-endian"
+#else
+#error "Unknown BYTE_ORDER " BYTE_ORDER
+#define byteorder ELFDATANONE
+#endif
+
+
+extern int __profile_frequency __P ((void));
+
+/* Name and version of program. */
+static void print_version (FILE *stream, struct argp_state *state);
+void (*argp_program_version_hook) (FILE *, struct argp_state *) = print_version;
+
+#define OPT_COUNT_TOTAL 1
+#define OPT_TEST 2
+
+/* Definitions of arguments for argp functions. */
+static const struct argp_option options[] =
+{
+ { NULL, 0, NULL, 0, N_("Output selection:") },
+ { "count-total", OPT_COUNT_TOTAL, NULL, 0,
+ N_("print number of invocations for each function") },
+ { "test", OPT_TEST, NULL, OPTION_HIDDEN, NULL },
+ { NULL, 0, NULL, 0, NULL }
+};
+
+/* Short description of program. */
+static const char doc[] = N_("Read and display shared object profiling data");
+
+/* Strings for arguments in help texts. */
+static const char args_doc[] = N_("SHOBJ [PROFDATA]");
+
+/* Prototype for option handler. */
+static error_t parse_opt (int key, char *arg, struct argp_state *state);
+
+/* Data structure to communicate with argp functions. */
+static struct argp argp =
+{
+ options, parse_opt, args_doc, doc, NULL, NULL
+};
+
+
+/* Operation modes. */
+static enum
+{
+ NONE = 0,
+ COUNT_TOTAL
+} mode;
+
+/* If nonzero the total number of invocations of a function is emitted. */
+int count_total;
+
+/* Nozero for testing. */
+int do_test;
+
+/* Strcuture describing calls. */
+struct here_fromstruct
+ {
+ struct here_cg_arc_record volatile *here;
+ uint16_t link;
+ };
+
+/* We define a special type to address the elements of the arc table.
+ This is basically the `gmon_cg_arc_record' format but it includes
+ the room for the tag and it uses real types. */
+struct here_cg_arc_record
+ {
+ uintptr_t from_pc;
+ uintptr_t self_pc;
+ uint32_t count;
+ } __attribute__ ((packed));
+
+/* Information about the stab debugging info. This should be in a
+ head but it is not. */
+#define STRDXOFF (0)
+#define TYPEOFF (4)
+#define OTHEROFF (5)
+#define DESCOFF (6)
+#define VALOFF (8)
+#define STABSIZE (12)
+
+
+struct known_symbol
+{
+ const char *name;
+ uintptr_t addr;
+ size_t size;
+};
+
+
+struct shobj
+{
+ const char *name; /* User-provided name. */
+
+ struct link_map *map;
+ const char *strtab; /* String table of shared object. */
+ const char *soname; /* Soname of shared object. */
+
+ uintptr_t lowpc;
+ uintptr_t highpc;
+ unsigned long int kcountsize;
+ size_t expected_size; /* Expected size of profiling file. */
+ size_t tossize;
+ size_t fromssize;
+ size_t fromlimit;
+ unsigned int hashfraction;
+ int s_scale;
+
+ void *stab_map;
+ size_t stab_mapsize;
+ const char *stab;
+ size_t stab_size;
+ const char *stabstr;
+ size_t stabstr_size;
+
+ struct obstack ob_str;
+ struct obstack ob_sym;
+};
+
+
+struct profdata
+{
+ void *addr;
+ off_t size;
+
+ char *hist;
+ uint16_t *kcount;
+ uint32_t narcs; /* Number of arcs in toset. */
+ struct here_cg_arc_record *data;
+ uint16_t *tos;
+ struct here_fromstruct *froms;
+};
+
+/* Search tree for symbols. */
+void *symroot;
+static const struct known_symbol **sortsym;
+static size_t symidx;
+
+/* Prototypes for local functions. */
+static struct shobj *load_shobj (const char *name);
+static void unload_shobj (struct shobj *shobj);
+static struct profdata *load_profdata (const char *name, struct shobj *shobj);
+static void unload_profdata (struct profdata *profdata);
+static void count_total_ticks (struct shobj *shobj, struct profdata *profdata);
+static void read_symbols (struct shobj *shobj);
+
+
+int
+main (int argc, char *argv[])
+{
+ const char *shobj;
+ const char *profdata;
+ struct shobj *shobj_handle;
+ struct profdata *profdata_handle;
+ int remaining;
+
+ setlocale (LC_ALL, "");
+
+ /* Initialize the message catalog. */
+ textdomain (_libc_intl_domainname);
+
+ /* Parse and process arguments. */
+ argp_parse (&argp, argc, argv, 0, &remaining, NULL);
+
+ if (argc - remaining == 0 || argc - remaining > 2)
+ {
+ /* We need exactly two non-option parameter. */
+ argp_help (&argp, stdout, ARGP_HELP_SEE | ARGP_HELP_EXIT_ERR,
+ program_invocation_short_name);
+ exit (1);
+ }
+
+ /* Get parameters. */
+ shobj = argv[remaining];
+ if (argc - remaining == 2)
+ profdata = argv[remaining + 1];
+ else
+ /* No filename for the profiling data given. We will determine it
+ from the soname of the shobj, later. */
+ profdata = NULL;
+
+ /* First see whether we can load the shared object. */
+ shobj_handle = load_shobj (shobj);
+ if (shobj_handle == NULL)
+ exit (1);
+
+ /* We can now determine the filename for the profiling data, if
+ nececessary. */
+ if (profdata == NULL)
+ {
+ char *newp;
+
+ if (shobj_handle->soname == NULL)
+ {
+ unload_shobj (shobj_handle);
+
+ error (EXIT_FAILURE, 0, _("\
+no filename for profiling data given and shared object `%s' has no soname"),
+ shobj);
+ }
+
+ newp = (char *) alloca (strlen (shobj_handle->soname)
+ + sizeof ".profile");
+ stpcpy (stpcpy (newp, shobj_handle->soname), ".profile");
+ profdata = newp;
+ }
+
+ /* Now see whether the profiling data file matches the given object. */
+ profdata_handle = load_profdata (profdata, shobj_handle);
+ if (profdata_handle == NULL)
+ {
+ unload_shobj (shobj_handle);
+
+ exit (1);
+ }
+
+ read_symbols (shobj_handle);
+
+ /* Do some work. */
+ switch (mode)
+ {
+ case COUNT_TOTAL:
+ count_total_ticks (shobj_handle, profdata_handle);
+ break;
+ case NONE:
+ /* Do nothing. */
+ break;
+ default:
+ assert (! "Internal error");
+ }
+
+ /* Free the resources. */
+ unload_shobj (shobj_handle);
+ unload_profdata (profdata_handle);
+
+ return 0;
+}
+
+
+/* Handle program arguments. */
+static error_t
+parse_opt (int key, char *arg, struct argp_state *state)
+{
+ switch (key)
+ {
+ case OPT_COUNT_TOTAL:
+ mode = COUNT_TOTAL;
+ break;
+ case OPT_TEST:
+ do_test = 1;
+ break;
+ default:
+ return ARGP_ERR_UNKNOWN;
+ }
+ return 0;
+}
+
+
+/* Print the version information. */
+static void
+print_version (FILE *stream, struct argp_state *state)
+{
+ fprintf (stream, "sprof (GNU %s) %s\n", PACKAGE, VERSION);
+ fprintf (stream, gettext ("\
+Copyright (C) %s Free Software Foundation, Inc.\n\
+This is free software; see the source for copying conditions. There is NO\n\
+warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.\n\
+"),
+ "1997, 1998");
+ fprintf (stream, gettext ("Written by %s.\n"), "Ulrich Drepper");
+}
+
+
+/* Note that we must not use `dlopen' etc. The shobj object must not
+ be loaded for use. */
+static struct shobj *
+load_shobj (const char *name)
+{
+ struct link_map *map = NULL;
+ struct shobj *result;
+ ElfW(Addr) mapstart = ~((ElfW(Addr)) 0);
+ ElfW(Addr) mapend = 0;
+ const ElfW(Phdr) *ph;
+ size_t textsize;
+ unsigned int log_hashfraction;
+ ElfW(Ehdr) *ehdr;
+ int fd;
+ ElfW(Shdr) *shdr;
+ void *ptr;
+ size_t pagesize = getpagesize ();
+ const char *shstrtab;
+ int idx;
+ ElfW(Shdr) *stab_entry;
+ ElfW(Shdr) *stabstr_entry;
+
+ /* Since we use dlopen() we must be prepared to work around the sometimes
+ strange lookup rules for the shared objects. If we have a file foo.so
+ in the current directory and the user specfies foo.so on the command
+ line (without specifying a directory) we should load the file in the
+ current directory even if a normal dlopen() call would read the other
+ file. We do this by adding a directory portion to the name. */
+ if (strchr (name, '/') == NULL)
+ {
+ char *load_name = (char *) alloca (strlen (name) + 3);
+ stpcpy (stpcpy (load_name, "./"), name);
+
+ map = (struct link_map *) dlopen (load_name, RTLD_LAZY);
+ }
+ if (map == NULL)
+ {
+ map = (struct link_map *) dlopen (name, RTLD_LAZY);
+ if (map == NULL)
+ {
+ error (0, errno, _("failed to load shared object `%s'"), name);
+ return NULL;
+ }
+ }
+
+ /* Prepare the result. */
+ result = (struct shobj *) calloc (1, sizeof (struct shobj));
+ if (result == NULL)
+ {
+ error (0, errno, _("cannot create internal descriptors"));
+ dlclose (map);
+ return NULL;
+ }
+ result->name = name;
+ result->map = map;
+
+ /* Compute the size of the sections which contain program code.
+ This must match the code in dl-profile.c (_dl_start_profile). */
+ for (ph = map->l_phdr; ph < &map->l_phdr[map->l_phnum]; ++ph)
+ if (ph->p_type == PT_LOAD && (ph->p_flags & PF_X))
+ {
+ ElfW(Addr) start = (ph->p_vaddr & ~(_dl_pagesize - 1));
+ ElfW(Addr) end = ((ph->p_vaddr + ph->p_memsz + _dl_pagesize - 1)
+ & ~(_dl_pagesize - 1));
+
+ if (start < mapstart)
+ mapstart = start;
+ if (end > mapend)
+ mapend = end;
+ }
+
+ result->lowpc = ROUNDDOWN ((uintptr_t) (mapstart + map->l_addr),
+ HISTFRACTION * sizeof (HISTCOUNTER));
+ result->highpc = ROUNDUP ((uintptr_t) (mapend + map->l_addr),
+ HISTFRACTION * sizeof (HISTCOUNTER));
+ if (do_test)
+ printf ("load addr: %0#*" PRIxPTR "\n"
+ "lower bound PC: %0#*" PRIxPTR "\n"
+ "upper bound PC: %0#*" PRIxPTR "\n",
+ __ELF_NATIVE_CLASS == 32 ? 10 : 18, map->l_addr,
+ __ELF_NATIVE_CLASS == 32 ? 10 : 18, result->lowpc,
+ __ELF_NATIVE_CLASS == 32 ? 10 : 18, result->highpc);
+
+ textsize = result->highpc - result->lowpc;
+ result->kcountsize = textsize / HISTFRACTION;
+ result->hashfraction = HASHFRACTION;
+ if ((HASHFRACTION & (HASHFRACTION - 1)) == 0)
+ /* If HASHFRACTION is a power of two, mcount can use shifting
+ instead of integer division. Precompute shift amount. */
+ log_hashfraction = __builtin_ffs (result->hashfraction
+ * sizeof (struct here_fromstruct)) - 1;
+ else
+ log_hashfraction = -1;
+ if (do_test)
+ printf ("hashfraction = %d\ndivider = %d\n",
+ result->hashfraction,
+ result->hashfraction * sizeof (struct here_fromstruct));
+ result->tossize = textsize / HASHFRACTION;
+ result->fromlimit = textsize * ARCDENSITY / 100;
+ if (result->fromlimit < MINARCS)
+ result->fromlimit = MINARCS;
+ if (result->fromlimit > MAXARCS)
+ result->fromlimit = MAXARCS;
+ result->fromssize = result->fromlimit * sizeof (struct here_fromstruct);
+
+ result->expected_size = (sizeof (struct gmon_hdr)
+ + 4 + sizeof (struct gmon_hist_hdr)
+ + result->kcountsize
+ + 4 + 4
+ + (result->fromssize
+ * sizeof (struct here_cg_arc_record)));
+
+ if (do_test)
+ {
+#define SCALE_1_TO_1 0x10000L
+
+ printf ("expected size: %Zd\n", result->expected_size);
+
+ if (result->kcountsize < result->highpc - result->lowpc)
+ {
+ size_t range = result->highpc - result->lowpc;
+ size_t quot = range / result->kcountsize;
+
+ if (quot >= SCALE_1_TO_1)
+ result->s_scale = 1;
+ else if (quot >= SCALE_1_TO_1 / 256)
+ result->s_scale = SCALE_1_TO_1 / quot;
+ else if (range > ULONG_MAX / 256)
+ result->s_scale = ((SCALE_1_TO_1 * 256)
+ / (range / (result->kcountsize / 256)));
+ else
+ result->s_scale = ((SCALE_1_TO_1 * 256)
+ / ((range * 256) / result->kcountsize));
+ }
+ else
+ result->s_scale = SCALE_1_TO_1;
+
+ printf ("s_scale: %d\n", result->s_scale);
+ }
+
+ /* Determine the string table. */
+ if (map->l_info[DT_STRTAB] == NULL)
+ result->strtab = NULL;
+ else
+ result->strtab = (const char *) (map->l_addr
+ + map->l_info[DT_STRTAB]->d_un.d_ptr);
+ if (do_test)
+ printf ("string table: %p\n", result->strtab);
+
+ /* Determine the soname. */
+ if (map->l_info[DT_SONAME] == NULL)
+ result->soname = NULL;
+ else
+ result->soname = result->strtab + map->l_info[DT_SONAME]->d_un.d_val;
+ if (do_test)
+ printf ("soname: %s\n", result->soname);
+
+ /* Now the hard part, we have to load the debugging data. For now
+ we support stabs only.
+
+ First load the section header table. */
+ ehdr = (ElfW(Ehdr) *) map->l_addr;
+
+ /* Make sure we are on the right party. */
+ if (ehdr->e_shentsize != sizeof (ElfW(Shdr)))
+ abort ();
+
+ /* And we need the shared object file descriptor again. */
+ fd = open (map->l_name, O_RDONLY);
+ if (fd == -1)
+ /* Dooh, this really shouldn't happen. We know the file is available. */
+ error (EXIT_FAILURE, errno, _("Reopening shared object `%s' failed"));
+
+ /* Now map the section header. */
+ ptr = mmap (NULL, (ehdr->e_phnum * sizeof (ElfW(Shdr))
+ + (ehdr->e_shoff & (pagesize - 1))), PROT_READ,
+ MAP_SHARED|MAP_FILE, fd, ehdr->e_shoff & ~(pagesize - 1));
+ if (ptr == MAP_FAILED)
+ error (EXIT_FAILURE, errno, _("mapping of section headers failed"));
+ shdr = (ElfW(Shdr) *) ((char *) ptr + (ehdr->e_shoff & (pagesize - 1)));
+
+ /* Get the section header string table. */
+ ptr = mmap (NULL, (shdr[ehdr->e_shstrndx].sh_size
+ + (shdr[ehdr->e_shstrndx].sh_offset & (pagesize - 1))),
+ PROT_READ, MAP_SHARED|MAP_FILE, fd,
+ shdr[ehdr->e_shstrndx].sh_offset & ~(pagesize - 1));
+ if (ptr == MAP_FAILED)
+ error (EXIT_FAILURE, errno,
+ _("mapping of section header string table failed"));
+ shstrtab = ((const char *) ptr
+ + (shdr[ehdr->e_shstrndx].sh_offset & (pagesize - 1)));
+
+ /* Search for the ".stab" and ".stabstr" section (and ".rel.stab" ?). */
+ stab_entry = NULL;
+ stabstr_entry = NULL;
+ for (idx = 0; idx < ehdr->e_shnum; ++idx)
+ /* We only have to look for sections which are not loaded. */
+ if (shdr[idx].sh_addr == 0)
+ {
+ if (strcmp (shstrtab + shdr[idx].sh_name, ".stab") == 0)
+ stab_entry = &shdr[idx];
+ else if (strcmp (shstrtab + shdr[idx].sh_name, ".stabstr") == 0)
+ stabstr_entry = &shdr[idx];
+ }
+
+ /* We don't need the sectin header string table anymore. */
+ munmap (ptr, (shdr[ehdr->e_shstrndx].sh_size
+ + (shdr[ehdr->e_shstrndx].sh_offset & (pagesize - 1))));
+
+ if (stab_entry == NULL || stabstr_entry == NULL)
+ {
+ fprintf (stderr, _("\
+*** The file `%s' is stripped: no detailed analysis possible\n"),
+ name);
+ result->stab = NULL;
+ result->stabstr = NULL;
+ }
+ else
+ {
+ if (stab_entry->sh_offset + stab_entry->sh_size
+ != stabstr_entry->sh_offset)
+ abort ();
+ if (stab_entry->sh_size % STABSIZE != 0)
+ abort ();
+
+ result->stab_map = mmap (NULL, (stab_entry->sh_size
+ + stabstr_entry->sh_size
+ + (stab_entry->sh_offset
+ & (pagesize - 1))),
+ PROT_READ, MAP_SHARED|MAP_FILE, fd,
+ stab_entry->sh_offset & ~(pagesize - 1));
+ if (result->stab_map == NULL)
+ error (EXIT_FAILURE, errno, _("failed to load stab data:"));
+
+ result->stab = ((const char *) result->stab_map
+ + (stab_entry->sh_offset & (pagesize - 1)));
+ result->stab_size = stab_entry->sh_size;
+ result->stabstr = result->stab + stab_entry->sh_size;
+ result->stabstr_size = stabstr_entry->sh_size;
+ result->stab_mapsize = (stab_entry->sh_size + stabstr_entry->sh_size
+ + (stab_entry->sh_offset & (pagesize - 1)));
+ }
+
+ /* Now we also don't need the sectio header table anymore. */
+ munmap ((char *) shdr - (ehdr->e_shoff & (pagesize - 1)),
+ (ehdr->e_phnum * sizeof (ElfW(Shdr))
+ + (ehdr->e_shoff & (pagesize - 1))));
+
+ /* Free the descriptor for the shared object. */
+ close (fd);
+
+ return result;
+}
+
+
+static void
+unload_shobj (struct shobj *shobj)
+{
+ munmap (shobj->stab_map, shobj->stab_mapsize);
+ dlclose (shobj->map);
+}
+
+
+static struct profdata *
+load_profdata (const char *name, struct shobj *shobj)
+{
+ struct profdata *result;
+ int fd;
+ struct stat st;
+ void *addr;
+ struct gmon_hdr gmon_hdr;
+ struct gmon_hist_hdr hist_hdr;
+ uint32_t *narcsp;
+ size_t fromlimit;
+ struct here_cg_arc_record *data;
+ struct here_fromstruct *froms;
+ uint16_t *tos;
+ size_t fromidx;
+ size_t idx;
+
+ fd = open (name, O_RDONLY);
+ if (fd == -1)
+ {
+ char *ext_name;
+
+ if (errno != ENOENT || strchr (name, '/') != NULL)
+ /* The file exists but we are not allowed to read it or the
+ file does not exist and the name includes a path
+ specification.. */
+ return NULL;
+
+ /* A file with the given name does not exist in the current
+ directory, try it in the default location where the profiling
+ files are created. */
+ ext_name = (char *) alloca (strlen (name) + sizeof "/var/tmp/");
+ stpcpy (stpcpy (ext_name, "/var/tmp/"), name);
+ name = ext_name;
+
+ fd = open (ext_name, O_RDONLY);
+ if (fd == -1)
+ {
+ /* Even this file does not exist. */
+ error (0, errno, _("cannot load profiling data"));
+ return NULL;
+ }
+ }
+
+ /* We have found the file, now make sure it is the right one for the
+ data file. */
+ if (fstat (fd, &st) < 0)
+ {
+ error (0, errno, _("while stat'ing profiling data file"));
+ close (fd);
+ return NULL;
+ }
+
+ if (st.st_size != shobj->expected_size)
+ {
+ error (0, 0, _("profiling data file `%s' does match shared object `%s'"),
+ name, shobj->name);
+ close (fd);
+ return NULL;
+ }
+
+ /* The data file is most probably the right one for our shared
+ object. Map it now. */
+ addr = mmap (NULL, st.st_size, PROT_READ, MAP_SHARED|MAP_FILE, fd, 0);
+ if (addr == MAP_FAILED)
+ {
+ error (0, errno, _("failed to mmap the profiling data file"));
+ close (fd);
+ return NULL;
+ }
+
+ /* We don't need the file desriptor anymore. */
+ if (close (fd) < 0)
+ {
+ error (0, errno, _("error while closing the profiling data file"));
+ munmap (addr, st.st_size);
+ return NULL;
+ }
+
+ /* Prepare the result. */
+ result = (struct profdata *) calloc (1, sizeof (struct profdata));
+ if (result == NULL)
+ {
+ error (0, errno, _("cannot create internal descriptor"));
+ munmap (addr, st.st_size);
+ return NULL;
+ }
+
+ /* Store the address and size so that we can later free the resources. */
+ result->addr = addr;
+ result->size = st.st_size;
+
+ /* Pointer to data after the header. */
+ result->hist = (char *) ((struct gmon_hdr *) addr + 1);
+ result->kcount = (uint16_t *) ((char *) result->hist + sizeof (uint32_t)
+ + sizeof (struct gmon_hist_hdr));
+
+ /* Compute pointer to array of the arc information. */
+ narcsp = (uint32_t *) ((char *) result->kcount + shobj->kcountsize
+ + sizeof (uint32_t));
+ result->narcs = *narcsp;
+ result->data = (struct here_cg_arc_record *) ((char *) narcsp
+ + sizeof (uint32_t));
+
+ /* Create the gmon_hdr we expect or write. */
+ memset (&gmon_hdr, '\0', sizeof (struct gmon_hdr));
+ memcpy (&gmon_hdr.cookie[0], GMON_MAGIC, sizeof (gmon_hdr.cookie));
+ *(int32_t *) gmon_hdr.version = GMON_SHOBJ_VERSION;
+
+ /* Create the hist_hdr we expect or write. */
+ *(char **) hist_hdr.low_pc = (char *) shobj->lowpc - shobj->map->l_addr;
+ *(char **) hist_hdr.high_pc = (char *) shobj->highpc - shobj->map->l_addr;
+ if (do_test)
+ printf ("low_pc = %p\nhigh_pc = %p\n",
+ hist_hdr.low_pc, hist_hdr.high_pc);
+ *(int32_t *) hist_hdr.hist_size = shobj->kcountsize / sizeof (HISTCOUNTER);
+ *(int32_t *) hist_hdr.prof_rate = __profile_frequency ();
+ strncpy (hist_hdr.dimen, "seconds", sizeof (hist_hdr.dimen));
+ hist_hdr.dimen_abbrev = 's';
+
+ /* Test whether the header of the profiling data is ok. */
+ if (memcmp (addr, &gmon_hdr, sizeof (struct gmon_hdr)) != 0
+ || *(uint32_t *) result->hist != GMON_TAG_TIME_HIST
+ || memcmp (result->hist + sizeof (uint32_t), &hist_hdr,
+ sizeof (struct gmon_hist_hdr)) != 0
+ || narcsp[-1] != GMON_TAG_CG_ARC)
+ {
+ free (result);
+ error (0, 0, _("`%s' is no correct profile data file for `%s'"),
+ name, shobj->name);
+ munmap (addr, st.st_size);
+ return NULL;
+ }
+
+ /* We are pretty sure now that this is a correct input file. Set up
+ the remaining information in the result structure and return. */
+ result->tos = (uint16_t *) calloc (shobj->tossize + shobj->fromssize, 1);
+ if (result->tos == NULL)
+ {
+ error (0, errno, _("cannot create internal descriptor"));
+ munmap (addr, st.st_size);
+ free (result);
+ return NULL;
+ }
+
+ result->froms = (struct here_fromstruct *) ((char *) result->tos
+ + shobj->tossize);
+ fromidx = 0;
+
+ /* Now we have to process all the arc count entries. */
+ fromlimit = shobj->fromlimit;
+ data = result->data;
+ froms = result->froms;
+ tos = result->tos;
+ for (idx = 0; idx < MIN (*narcsp, fromlimit); ++idx)
+ {
+ size_t to_index;
+ size_t newfromidx;
+ to_index = (data[idx].self_pc / (shobj->hashfraction * sizeof (*tos)));
+ newfromidx = fromidx++;
+ froms[newfromidx].here = &data[idx];
+ froms[newfromidx].link = tos[to_index];
+ tos[to_index] = newfromidx;
+ }
+
+ return result;
+}
+
+
+static void
+unload_profdata (struct profdata *profdata)
+{
+ free (profdata->tos);
+ munmap (profdata->addr, profdata->size);
+ free (profdata);
+}
+
+
+static void
+count_total_ticks (struct shobj *shobj, struct profdata *profdata)
+{
+ volatile uint16_t *kcount = profdata->kcount;
+ uint64_t sum = 0;
+ size_t idx;
+ size_t factor = 2 * (65536 / shobj->s_scale);
+
+ for (idx = shobj->kcountsize / sizeof (*kcount); idx > 0; )
+ {
+ --idx;
+ if (kcount[idx] != 0)
+ {
+ size_t n;
+
+ for (n = 0; n < symidx; ++n)
+ if (sortsym[n]->addr <= factor * idx
+ && sortsym[n]->addr + sortsym[n]->size > factor * idx)
+ break;
+
+ if (n < symidx)
+ printf ("idx = %d, count = %d, name = %s\n", idx, kcount[idx],
+ sortsym[n]->name);
+ else
+ printf ("idx = %d, N/A\n", idx);
+ }
+ sum += kcount[idx];
+ }
+
+ printf ("total ticks: %10" PRId64 "\n", sum);
+}
+
+
+static int
+symorder (const void *o1, const void *o2)
+{
+ const struct known_symbol *p1 = (struct known_symbol *) o1;
+ const struct known_symbol *p2 = (struct known_symbol *) o2;
+
+ return p1->addr - p2->addr;
+}
+
+
+static void
+printsym (const void *node, VISIT value, int level)
+{
+ if (value == leaf || value == postorder)
+ {
+ const struct known_symbol *sym = *(const struct known_symbol **) node;
+
+ printf ("Name: %30s, Start: %6x, Len: %5d\n",
+ sym->name, sym->addr, sym->size);
+
+ sortsym[symidx++] = sym;
+ }
+}
+
+
+static void
+read_symbols (struct shobj *shobj)
+{
+ void *load_addr = (void *) shobj->map->l_addr;
+ int n = 0;
+ int idx;
+ const char *last_name = NULL;
+ uintptr_t last_addr = 0;
+
+ /* Initialize the obstacks. */
+#define obstack_chunk_alloc malloc
+#define obstack_chunk_free free
+ obstack_init (&shobj->ob_str);
+ obstack_init (&shobj->ob_sym);
+
+ /* Process the stabs. */
+ for (idx = 0; idx < shobj->stab_size; idx += 12)
+ if (*(shobj->stab + idx + TYPEOFF) == N_FUN)
+ {
+ const char *str = (shobj->stabstr
+ + *((uint32_t *) (shobj->stab + idx + STRDXOFF)));
+
+ if (*str != '\0')
+ {
+ last_name = str;
+ last_addr = *((uint32_t *) (shobj->stab + idx + VALOFF));
+ }
+ else
+ {
+ const char *endp;
+ char *name0;
+ struct known_symbol *newsym;
+
+ if (last_name == NULL)
+ abort ();
+
+ endp = strchr (last_name, ':');
+
+ name0 = (char *) obstack_copy0 (&shobj->ob_str, last_name,
+ endp - last_name);
+ if (name0 != NULL)
+ newsym =
+ (struct known_symbol *) obstack_alloc (&shobj->ob_sym,
+ sizeof (*newsym));
+ else
+ /* Keep the stupid compiler happy. */
+ newsym = NULL;
+ if (name0 == NULL || newsym == NULL)
+ error (EXIT_FAILURE, errno, _("cannot allocate symbol data"));
+
+ newsym->name = name0;
+ newsym->addr = last_addr;
+ newsym->size = *((uint32_t *) (shobj->stab + idx + VALOFF));
+
+ tsearch (newsym, &symroot, symorder);
+ ++n;
+
+ last_name = NULL;
+ last_addr = 0;
+ }
+ }
+
+ if (shobj->stab == NULL)
+ {
+ /* Blarg, the binary is stripped. We have to rely on the
+ information contained in the dynamic section of the object. */
+ const ElfW(Sym) *symtab = (load_addr
+ + shobj->map->l_info[DT_SYMTAB]->d_un.d_ptr);
+ const char *strtab = (load_addr
+ + shobj->map->l_info[DT_STRTAB]->d_un.d_ptr);
+
+ /* We assume that the string table follows the symbol table,
+ because there is no way in ELF to know the size of the
+ dynamic symbol table!! */
+ while ((void *) symtab < (void *) strtab)
+ {
+ if (/*(ELFW(ST_TYPE)(symtab->st_info) == STT_FUNC
+ || ELFW(ST_TYPE)(symtab->st_info) == STT_NOTYPE)
+ &&*/ symtab->st_size != 0)
+ {
+ struct known_symbol *newsym;
+
+ newsym =
+ (struct known_symbol *) obstack_alloc (&shobj->ob_sym,
+ sizeof (*newsym));
+ if (newsym == NULL)
+ error (EXIT_FAILURE, errno, _("cannot allocate symbol data"));
+
+ newsym->name = &strtab[symtab->st_name];
+ newsym->addr = symtab->st_value;
+ newsym->size = symtab->st_size;
+
+ tsearch (newsym, &symroot, symorder);
+ ++n;
+ }
+ }
+
+ ++symtab;
+ }
+
+ sortsym = malloc (n * sizeof (struct known_symbol *));
+ if (sortsym == NULL)
+ abort ();
+
+ twalk (symroot, printsym);
+}