2014-04-30 20:25:10 +07:00
|
|
|
#include <asm/bug.h>
|
perf tools: Cache dso data file descriptor
Caching dso data file descriptors to avoid expensive re-opens
especially during DWARF unwind.
We keep dsos data file descriptors open until their count reaches
the half of the current fd open limit (RLIMIT_NOFILE). In this case
we close file descriptor of the first opened dso object.
We've got overall speedup (~27% for my workload) of report:
'perf report --stdio -i perf-test.data' (3 runs)
(perf-test.data size was around 12GB)
current code:
545,640,944,228 cycles ( +- 0.53% )
785,255,798,320 instructions ( +- 0.03% )
366.340910010 seconds time elapsed ( +- 3.65% )
after change:
435,895,036,114 cycles ( +- 0.26% )
636,790,271,176 instructions ( +- 0.04% )
266.481463387 seconds time elapsed ( +- 0.13% )
Acked-by: Namhyung Kim <namhyung@kernel.org>
Cc: Arnaldo Carvalho de Melo <acme@kernel.org>
Cc: Corey Ashford <cjashfor@linux.vnet.ibm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jean Pihet <jean.pihet@linaro.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1401892622-30848-7-git-send-email-jolsa@kernel.org
Signed-off-by: Jiri Olsa <jolsa@kernel.org>
2014-04-30 20:47:27 +07:00
|
|
|
#include <sys/time.h>
|
|
|
|
#include <sys/resource.h>
|
2012-10-28 04:18:32 +07:00
|
|
|
#include "symbol.h"
|
|
|
|
#include "dso.h"
|
2012-11-09 21:32:52 +07:00
|
|
|
#include "machine.h"
|
2015-04-09 22:53:55 +07:00
|
|
|
#include "auxtrace.h"
|
2012-10-28 04:18:32 +07:00
|
|
|
#include "util.h"
|
|
|
|
#include "debug.h"
|
|
|
|
|
|
|
|
char dso__symtab_origin(const struct dso *dso)
|
|
|
|
{
|
|
|
|
static const char origin[] = {
|
2013-09-18 20:56:14 +07:00
|
|
|
[DSO_BINARY_TYPE__KALLSYMS] = 'k',
|
|
|
|
[DSO_BINARY_TYPE__VMLINUX] = 'v',
|
|
|
|
[DSO_BINARY_TYPE__JAVA_JIT] = 'j',
|
|
|
|
[DSO_BINARY_TYPE__DEBUGLINK] = 'l',
|
|
|
|
[DSO_BINARY_TYPE__BUILD_ID_CACHE] = 'B',
|
|
|
|
[DSO_BINARY_TYPE__FEDORA_DEBUGINFO] = 'f',
|
|
|
|
[DSO_BINARY_TYPE__UBUNTU_DEBUGINFO] = 'u',
|
|
|
|
[DSO_BINARY_TYPE__OPENEMBEDDED_DEBUGINFO] = 'o',
|
|
|
|
[DSO_BINARY_TYPE__BUILDID_DEBUGINFO] = 'b',
|
|
|
|
[DSO_BINARY_TYPE__SYSTEM_PATH_DSO] = 'd',
|
|
|
|
[DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE] = 'K',
|
2014-11-04 08:14:27 +07:00
|
|
|
[DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP] = 'm',
|
2013-09-18 20:56:14 +07:00
|
|
|
[DSO_BINARY_TYPE__GUEST_KALLSYMS] = 'g',
|
|
|
|
[DSO_BINARY_TYPE__GUEST_KMODULE] = 'G',
|
2014-11-04 08:14:27 +07:00
|
|
|
[DSO_BINARY_TYPE__GUEST_KMODULE_COMP] = 'M',
|
2013-09-18 20:56:14 +07:00
|
|
|
[DSO_BINARY_TYPE__GUEST_VMLINUX] = 'V',
|
2012-10-28 04:18:32 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
if (dso == NULL || dso->symtab_type == DSO_BINARY_TYPE__NOT_FOUND)
|
|
|
|
return '!';
|
|
|
|
return origin[dso->symtab_type];
|
|
|
|
}
|
|
|
|
|
2013-12-17 03:03:18 +07:00
|
|
|
int dso__read_binary_type_filename(const struct dso *dso,
|
|
|
|
enum dso_binary_type type,
|
|
|
|
char *root_dir, char *filename, size_t size)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
|
|
|
char build_id_hex[BUILD_ID_SIZE * 2 + 1];
|
|
|
|
int ret = 0;
|
2014-07-29 20:21:58 +07:00
|
|
|
size_t len;
|
2012-10-28 04:18:32 +07:00
|
|
|
|
|
|
|
switch (type) {
|
|
|
|
case DSO_BINARY_TYPE__DEBUGLINK: {
|
|
|
|
char *debuglink;
|
|
|
|
|
2015-01-27 13:34:02 +07:00
|
|
|
len = __symbol__join_symfs(filename, size, dso->long_name);
|
|
|
|
debuglink = filename + len;
|
2013-12-11 02:02:50 +07:00
|
|
|
while (debuglink != filename && *debuglink != '/')
|
2012-10-28 04:18:32 +07:00
|
|
|
debuglink--;
|
|
|
|
if (*debuglink == '/')
|
|
|
|
debuglink++;
|
2016-01-20 18:56:32 +07:00
|
|
|
|
|
|
|
ret = -1;
|
|
|
|
if (!is_regular_file(filename))
|
|
|
|
break;
|
|
|
|
|
2015-01-27 13:34:02 +07:00
|
|
|
ret = filename__read_debuglink(filename, debuglink,
|
2014-02-20 08:32:55 +07:00
|
|
|
size - (debuglink - filename));
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
case DSO_BINARY_TYPE__BUILD_ID_CACHE:
|
|
|
|
/* skip the locally configured cache if a symfs is given */
|
|
|
|
if (symbol_conf.symfs[0] ||
|
2013-12-11 02:02:50 +07:00
|
|
|
(dso__build_id_filename(dso, filename, size) == NULL))
|
2012-10-28 04:18:32 +07:00
|
|
|
ret = -1;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case DSO_BINARY_TYPE__FEDORA_DEBUGINFO:
|
2014-07-29 20:21:58 +07:00
|
|
|
len = __symbol__join_symfs(filename, size, "/usr/lib/debug");
|
|
|
|
snprintf(filename + len, size - len, "%s.debug", dso->long_name);
|
2012-10-28 04:18:32 +07:00
|
|
|
break;
|
|
|
|
|
|
|
|
case DSO_BINARY_TYPE__UBUNTU_DEBUGINFO:
|
2014-07-29 20:21:58 +07:00
|
|
|
len = __symbol__join_symfs(filename, size, "/usr/lib/debug");
|
|
|
|
snprintf(filename + len, size - len, "%s", dso->long_name);
|
2012-10-28 04:18:32 +07:00
|
|
|
break;
|
|
|
|
|
2013-09-18 20:56:14 +07:00
|
|
|
case DSO_BINARY_TYPE__OPENEMBEDDED_DEBUGINFO:
|
|
|
|
{
|
2013-12-11 01:19:23 +07:00
|
|
|
const char *last_slash;
|
2013-09-18 20:56:14 +07:00
|
|
|
size_t dir_size;
|
|
|
|
|
|
|
|
last_slash = dso->long_name + dso->long_name_len;
|
|
|
|
while (last_slash != dso->long_name && *last_slash != '/')
|
|
|
|
last_slash--;
|
|
|
|
|
2014-07-29 20:21:58 +07:00
|
|
|
len = __symbol__join_symfs(filename, size, "");
|
2013-09-18 20:56:14 +07:00
|
|
|
dir_size = last_slash - dso->long_name + 2;
|
|
|
|
if (dir_size > (size - len)) {
|
|
|
|
ret = -1;
|
|
|
|
break;
|
|
|
|
}
|
2013-12-11 02:02:50 +07:00
|
|
|
len += scnprintf(filename + len, dir_size, "%s", dso->long_name);
|
|
|
|
len += scnprintf(filename + len , size - len, ".debug%s",
|
2013-09-18 20:56:14 +07:00
|
|
|
last_slash);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2012-10-28 04:18:32 +07:00
|
|
|
case DSO_BINARY_TYPE__BUILDID_DEBUGINFO:
|
|
|
|
if (!dso->has_build_id) {
|
|
|
|
ret = -1;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
build_id__sprintf(dso->build_id,
|
|
|
|
sizeof(dso->build_id),
|
|
|
|
build_id_hex);
|
2014-07-29 20:21:58 +07:00
|
|
|
len = __symbol__join_symfs(filename, size, "/usr/lib/debug/.build-id/");
|
|
|
|
snprintf(filename + len, size - len, "%.2s/%s.debug",
|
|
|
|
build_id_hex, build_id_hex + 2);
|
2012-10-28 04:18:32 +07:00
|
|
|
break;
|
|
|
|
|
2013-08-07 18:38:47 +07:00
|
|
|
case DSO_BINARY_TYPE__VMLINUX:
|
|
|
|
case DSO_BINARY_TYPE__GUEST_VMLINUX:
|
2012-10-28 04:18:32 +07:00
|
|
|
case DSO_BINARY_TYPE__SYSTEM_PATH_DSO:
|
2014-07-29 20:21:58 +07:00
|
|
|
__symbol__join_symfs(filename, size, dso->long_name);
|
2012-10-28 04:18:32 +07:00
|
|
|
break;
|
|
|
|
|
|
|
|
case DSO_BINARY_TYPE__GUEST_KMODULE:
|
2014-11-04 08:14:27 +07:00
|
|
|
case DSO_BINARY_TYPE__GUEST_KMODULE_COMP:
|
2014-07-29 20:21:58 +07:00
|
|
|
path__join3(filename, size, symbol_conf.symfs,
|
|
|
|
root_dir, dso->long_name);
|
2012-10-28 04:18:32 +07:00
|
|
|
break;
|
|
|
|
|
|
|
|
case DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE:
|
2014-11-04 08:14:27 +07:00
|
|
|
case DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP:
|
2014-07-29 20:21:58 +07:00
|
|
|
__symbol__join_symfs(filename, size, dso->long_name);
|
2012-10-28 04:18:32 +07:00
|
|
|
break;
|
|
|
|
|
2013-08-07 18:38:51 +07:00
|
|
|
case DSO_BINARY_TYPE__KCORE:
|
|
|
|
case DSO_BINARY_TYPE__GUEST_KCORE:
|
2013-12-11 02:02:50 +07:00
|
|
|
snprintf(filename, size, "%s", dso->long_name);
|
2013-08-07 18:38:51 +07:00
|
|
|
break;
|
|
|
|
|
2012-10-28 04:18:32 +07:00
|
|
|
default:
|
|
|
|
case DSO_BINARY_TYPE__KALLSYMS:
|
|
|
|
case DSO_BINARY_TYPE__GUEST_KALLSYMS:
|
|
|
|
case DSO_BINARY_TYPE__JAVA_JIT:
|
|
|
|
case DSO_BINARY_TYPE__NOT_FOUND:
|
|
|
|
ret = -1;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2014-11-04 08:14:27 +07:00
|
|
|
static const struct {
|
|
|
|
const char *fmt;
|
|
|
|
int (*decompress)(const char *input, int output);
|
|
|
|
} compressions[] = {
|
perf tools: Add gzip decompression support for kernel module
Now my Archlinux box shows module symbols correctly.
Before:
$ perf report --stdio
Failed to open /tmp/perf-3477.map, continuing without symbols
no symbols found in /usr/bin/date, maybe install a debug package?
No kallsyms or vmlinux with build-id 7b4ea0a49ae2111925857099aaf05c3246ff33e0 was found
[drm] with build id 7b4ea0a49ae2111925857099aaf05c3246ff33e0 not found, continuing without symbols
No kallsyms or vmlinux with build-id edd931629094b660ca9dec09a1b635c8d87aa2ee was found
[jbd2] with build id edd931629094b660ca9dec09a1b635c8d87aa2ee not found, continuing without symbols
No kallsyms or vmlinux with build-id a7b1eada671c34933e5610bb920b2ca4945a82c3 was found
[ext4] with build id a7b1eada671c34933e5610bb920b2ca4945a82c3 not found, continuing without symbols
No kallsyms or vmlinux with build-id d69511fa3e5840e770336ef45b06c83fef8d74e3 was found
[scsi_mod] with build id d69511fa3e5840e770336ef45b06c83fef8d74e3 not found, continuing without symbols
No kallsyms or vmlinux with build-id af0430af13461af058770ee9b87afc07922c2e77 was found
[libata] with build id af0430af13461af058770ee9b87afc07922c2e77 not found, continuing without symbols
No kallsyms or vmlinux with build-id aaeedff8160ce631a5f0333591c6ff291201d29f was found
[libahci] with build id aaeedff8160ce631a5f0333591c6ff291201d29f not found, continuing without symbols
No kallsyms or vmlinux with build-id c57907712becaf662dc4981824bb372c0441d605 was found
[mac80211] with build id c57907712becaf662dc4981824bb372c0441d605 not found, continuing without symbols
No kallsyms or vmlinux with build-id e0589077cc0ec8c3e4c40eb9f2d9e69d236bee8f was found
[iwldvm] with build id e0589077cc0ec8c3e4c40eb9f2d9e69d236bee8f not found, continuing without symbols
No kallsyms or vmlinux with build-id 2d86086bf136bf374a2f029cf85a48194f9b950b was found
[cfg80211] with build id 2d86086bf136bf374a2f029cf85a48194f9b950b not found, continuing without symbols
No kallsyms or vmlinux with build-id 4493c48599bdb3d91d0f8db5150e0be33fdd9221 was found
[iwlwifi] with build id 4493c48599bdb3d91d0f8db5150e0be33fdd9221 not found, continuing without symbols
...
#
# Overhead Command Shared Object Symbol
# ........ ............... ....................... ........................................................
#
0.03% swapper [ext4] [k] 0x000000000000fe2e
0.03% swapper [kernel.kallsyms] [k] account_entity_enqueue
0.03% swapper [ext4] [k] 0x000000000000fc2b
0.03% irq/50-iwlwifi [iwlwifi] [k] 0x000000000000200b
0.03% swapper [kernel.kallsyms] [k] ktime_add_safe
0.03% swapper [kernel.kallsyms] [k] elv_completed_request
0.03% swapper [libata] [k] 0x0000000000003997
0.03% swapper [libahci] [k] 0x0000000000001f25
0.03% swapper [kernel.kallsyms] [k] rb_next
0.03% swapper [kernel.kallsyms] [k] blk_finish_request
0.03% swapper [ext4] [k] 0x0000000000010248
0.00% perf [kernel.kallsyms] [k] native_write_msr_safe
After:
$ perf report --stdio
Failed to open /tmp/perf-3477.map, continuing without symbols
no symbols found in /usr/bin/tr, maybe install a debug package?
...
#
# Overhead Command Shared Object Symbol
# ........ ............... ........................... ......................................................
#
0.04% kworker/u16:3 [ext4] [k] ext4_read_block_bitmap
0.03% kworker/u16:0 [mac80211] [k] ieee80211_sta_reset_beacon_monitor
0.02% irq/50-iwlwifi [mac80211] [k] ieee80211_get_bssid
0.02% firefox [e1000e] [k] __ew32_prepare
0.02% swapper [libahci] [k] ahci_handle_port_interrupt
0.02% emacs libglib-2.0.so.0.4000.0 [.] g_mutex_unlock
0.02% swapper [e1000e] [k] e1000_clean_tx_irq
0.02% dwm [kernel.kallsyms] [k] __schedule
0.02% gnome-terminal- [vdso] [.] __vdso_clock_gettime
0.02% swapper [e1000e] [k] e1000_alloc_rx_buffers
0.02% irq/50-iwlwifi [mac80211] [k] ieee80211_rx
0.01% firefox [vdso] [.] __vdso_gettimeofday
0.01% irq/50-iwlwifi [iwlwifi] [k] iwl_pcie_rxq_restock.part.13
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Acked-by: Jiri Olsa <jolsa@redhat.com>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Namhyung Kim <namhyung.kim@lge.com>
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Stephane Eranian <eranian@google.com>
Link: http://lkml.kernel.org/r/87h9yexshi.fsf@sejong.aot.lge.com
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2014-10-31 14:51:38 +07:00
|
|
|
#ifdef HAVE_ZLIB_SUPPORT
|
|
|
|
{ "gz", gzip_decompress_to_file },
|
2015-01-29 19:29:39 +07:00
|
|
|
#endif
|
|
|
|
#ifdef HAVE_LZMA_SUPPORT
|
|
|
|
{ "xz", lzma_decompress_to_file },
|
perf tools: Add gzip decompression support for kernel module
Now my Archlinux box shows module symbols correctly.
Before:
$ perf report --stdio
Failed to open /tmp/perf-3477.map, continuing without symbols
no symbols found in /usr/bin/date, maybe install a debug package?
No kallsyms or vmlinux with build-id 7b4ea0a49ae2111925857099aaf05c3246ff33e0 was found
[drm] with build id 7b4ea0a49ae2111925857099aaf05c3246ff33e0 not found, continuing without symbols
No kallsyms or vmlinux with build-id edd931629094b660ca9dec09a1b635c8d87aa2ee was found
[jbd2] with build id edd931629094b660ca9dec09a1b635c8d87aa2ee not found, continuing without symbols
No kallsyms or vmlinux with build-id a7b1eada671c34933e5610bb920b2ca4945a82c3 was found
[ext4] with build id a7b1eada671c34933e5610bb920b2ca4945a82c3 not found, continuing without symbols
No kallsyms or vmlinux with build-id d69511fa3e5840e770336ef45b06c83fef8d74e3 was found
[scsi_mod] with build id d69511fa3e5840e770336ef45b06c83fef8d74e3 not found, continuing without symbols
No kallsyms or vmlinux with build-id af0430af13461af058770ee9b87afc07922c2e77 was found
[libata] with build id af0430af13461af058770ee9b87afc07922c2e77 not found, continuing without symbols
No kallsyms or vmlinux with build-id aaeedff8160ce631a5f0333591c6ff291201d29f was found
[libahci] with build id aaeedff8160ce631a5f0333591c6ff291201d29f not found, continuing without symbols
No kallsyms or vmlinux with build-id c57907712becaf662dc4981824bb372c0441d605 was found
[mac80211] with build id c57907712becaf662dc4981824bb372c0441d605 not found, continuing without symbols
No kallsyms or vmlinux with build-id e0589077cc0ec8c3e4c40eb9f2d9e69d236bee8f was found
[iwldvm] with build id e0589077cc0ec8c3e4c40eb9f2d9e69d236bee8f not found, continuing without symbols
No kallsyms or vmlinux with build-id 2d86086bf136bf374a2f029cf85a48194f9b950b was found
[cfg80211] with build id 2d86086bf136bf374a2f029cf85a48194f9b950b not found, continuing without symbols
No kallsyms or vmlinux with build-id 4493c48599bdb3d91d0f8db5150e0be33fdd9221 was found
[iwlwifi] with build id 4493c48599bdb3d91d0f8db5150e0be33fdd9221 not found, continuing without symbols
...
#
# Overhead Command Shared Object Symbol
# ........ ............... ....................... ........................................................
#
0.03% swapper [ext4] [k] 0x000000000000fe2e
0.03% swapper [kernel.kallsyms] [k] account_entity_enqueue
0.03% swapper [ext4] [k] 0x000000000000fc2b
0.03% irq/50-iwlwifi [iwlwifi] [k] 0x000000000000200b
0.03% swapper [kernel.kallsyms] [k] ktime_add_safe
0.03% swapper [kernel.kallsyms] [k] elv_completed_request
0.03% swapper [libata] [k] 0x0000000000003997
0.03% swapper [libahci] [k] 0x0000000000001f25
0.03% swapper [kernel.kallsyms] [k] rb_next
0.03% swapper [kernel.kallsyms] [k] blk_finish_request
0.03% swapper [ext4] [k] 0x0000000000010248
0.00% perf [kernel.kallsyms] [k] native_write_msr_safe
After:
$ perf report --stdio
Failed to open /tmp/perf-3477.map, continuing without symbols
no symbols found in /usr/bin/tr, maybe install a debug package?
...
#
# Overhead Command Shared Object Symbol
# ........ ............... ........................... ......................................................
#
0.04% kworker/u16:3 [ext4] [k] ext4_read_block_bitmap
0.03% kworker/u16:0 [mac80211] [k] ieee80211_sta_reset_beacon_monitor
0.02% irq/50-iwlwifi [mac80211] [k] ieee80211_get_bssid
0.02% firefox [e1000e] [k] __ew32_prepare
0.02% swapper [libahci] [k] ahci_handle_port_interrupt
0.02% emacs libglib-2.0.so.0.4000.0 [.] g_mutex_unlock
0.02% swapper [e1000e] [k] e1000_clean_tx_irq
0.02% dwm [kernel.kallsyms] [k] __schedule
0.02% gnome-terminal- [vdso] [.] __vdso_clock_gettime
0.02% swapper [e1000e] [k] e1000_alloc_rx_buffers
0.02% irq/50-iwlwifi [mac80211] [k] ieee80211_rx
0.01% firefox [vdso] [.] __vdso_gettimeofday
0.01% irq/50-iwlwifi [iwlwifi] [k] iwl_pcie_rxq_restock.part.13
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Acked-by: Jiri Olsa <jolsa@redhat.com>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Namhyung Kim <namhyung.kim@lge.com>
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Stephane Eranian <eranian@google.com>
Link: http://lkml.kernel.org/r/87h9yexshi.fsf@sejong.aot.lge.com
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2014-10-31 14:51:38 +07:00
|
|
|
#endif
|
|
|
|
{ NULL, NULL },
|
2014-11-04 08:14:27 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
bool is_supported_compression(const char *ext)
|
|
|
|
{
|
|
|
|
unsigned i;
|
|
|
|
|
|
|
|
for (i = 0; compressions[i].fmt; i++) {
|
|
|
|
if (!strcmp(ext, compressions[i].fmt))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2015-06-03 15:52:21 +07:00
|
|
|
bool is_kernel_module(const char *pathname, int cpumode)
|
2014-11-04 08:14:27 +07:00
|
|
|
{
|
2015-02-12 21:56:21 +07:00
|
|
|
struct kmod_path m;
|
2015-06-03 15:52:21 +07:00
|
|
|
int mode = cpumode & PERF_RECORD_MISC_CPUMODE_MASK;
|
|
|
|
|
|
|
|
WARN_ONCE(mode != cpumode,
|
|
|
|
"Internal error: passing unmasked cpumode (%x) to is_kernel_module",
|
|
|
|
cpumode);
|
|
|
|
|
|
|
|
switch (mode) {
|
|
|
|
case PERF_RECORD_MISC_USER:
|
|
|
|
case PERF_RECORD_MISC_HYPERVISOR:
|
|
|
|
case PERF_RECORD_MISC_GUEST_USER:
|
|
|
|
return false;
|
|
|
|
/* Treat PERF_RECORD_MISC_CPUMODE_UNKNOWN as kernel */
|
|
|
|
default:
|
|
|
|
if (kmod_path__parse(&m, pathname)) {
|
|
|
|
pr_err("Failed to check whether %s is a kernel module or not. Assume it is.",
|
|
|
|
pathname);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
2014-11-04 08:14:27 +07:00
|
|
|
|
2015-02-12 21:56:21 +07:00
|
|
|
return m.kmod;
|
2014-11-04 08:14:27 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
bool decompress_to_file(const char *ext, const char *filename, int output_fd)
|
|
|
|
{
|
|
|
|
unsigned i;
|
|
|
|
|
|
|
|
for (i = 0; compressions[i].fmt; i++) {
|
|
|
|
if (!strcmp(ext, compressions[i].fmt))
|
|
|
|
return !compressions[i].decompress(filename,
|
|
|
|
output_fd);
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool dso__needs_decompress(struct dso *dso)
|
|
|
|
{
|
|
|
|
return dso->symtab_type == DSO_BINARY_TYPE__SYSTEM_PATH_KMODULE_COMP ||
|
|
|
|
dso->symtab_type == DSO_BINARY_TYPE__GUEST_KMODULE_COMP;
|
|
|
|
}
|
|
|
|
|
perf tools: Add kmod_path__parse function
Provides united way of parsing kernel module path
into several components.
The new kmod_path__parse function and few defines:
int __kmod_path__parse(struct kmod_path *m, const char *path,
bool alloc_name, bool alloc_ext);
#define kmod_path__parse(__m, __p) __kmod_path__parse(__m, __p, false, false)
#define kmod_path__parse_name(__m, __p) __kmod_path__parse(__m, __p, true , false)
#define kmod_path__parse_ext(__m, __p) __kmod_path__parse(__m, __p, false, true)
parse kernel module @path and updates @m argument like:
@comp - true if @path contains supported compression suffix,
false otherwise
@kmod - true if @path contains '.ko' suffix in right position,
false otherwise
@name - if (@alloc_name && @kmod) is true, it contains strdup-ed base name
of the kernel module without suffixes, otherwise strudup-ed
base name of @path
@ext - if (@alloc_ext && @comp) is true, it contains strdup-ed string
the compression suffix
It returns 0 if there's no strdup error, -ENOMEM otherwise.
Signed-off-by: Jiri Olsa <jolsa@kernel.org>
Acked-by: Namhyung Kim <namhyung@kernel.org>
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Corey Ashford <cjashfor@linux.vnet.ibm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Stephane Eranian <eranian@google.com>
Link: http://lkml.kernel.org/n/tip-9t6eqg8j610r94l743hkntiv@git.kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2015-02-05 21:40:25 +07:00
|
|
|
/*
|
|
|
|
* Parses kernel module specified in @path and updates
|
|
|
|
* @m argument like:
|
|
|
|
*
|
|
|
|
* @comp - true if @path contains supported compression suffix,
|
|
|
|
* false otherwise
|
|
|
|
* @kmod - true if @path contains '.ko' suffix in right position,
|
|
|
|
* false otherwise
|
|
|
|
* @name - if (@alloc_name && @kmod) is true, it contains strdup-ed base name
|
|
|
|
* of the kernel module without suffixes, otherwise strudup-ed
|
|
|
|
* base name of @path
|
|
|
|
* @ext - if (@alloc_ext && @comp) is true, it contains strdup-ed string
|
|
|
|
* the compression suffix
|
|
|
|
*
|
|
|
|
* Returns 0 if there's no strdup error, -ENOMEM otherwise.
|
|
|
|
*/
|
|
|
|
int __kmod_path__parse(struct kmod_path *m, const char *path,
|
|
|
|
bool alloc_name, bool alloc_ext)
|
|
|
|
{
|
|
|
|
const char *name = strrchr(path, '/');
|
|
|
|
const char *ext = strrchr(path, '.');
|
2015-06-03 15:52:21 +07:00
|
|
|
bool is_simple_name = false;
|
perf tools: Add kmod_path__parse function
Provides united way of parsing kernel module path
into several components.
The new kmod_path__parse function and few defines:
int __kmod_path__parse(struct kmod_path *m, const char *path,
bool alloc_name, bool alloc_ext);
#define kmod_path__parse(__m, __p) __kmod_path__parse(__m, __p, false, false)
#define kmod_path__parse_name(__m, __p) __kmod_path__parse(__m, __p, true , false)
#define kmod_path__parse_ext(__m, __p) __kmod_path__parse(__m, __p, false, true)
parse kernel module @path and updates @m argument like:
@comp - true if @path contains supported compression suffix,
false otherwise
@kmod - true if @path contains '.ko' suffix in right position,
false otherwise
@name - if (@alloc_name && @kmod) is true, it contains strdup-ed base name
of the kernel module without suffixes, otherwise strudup-ed
base name of @path
@ext - if (@alloc_ext && @comp) is true, it contains strdup-ed string
the compression suffix
It returns 0 if there's no strdup error, -ENOMEM otherwise.
Signed-off-by: Jiri Olsa <jolsa@kernel.org>
Acked-by: Namhyung Kim <namhyung@kernel.org>
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Corey Ashford <cjashfor@linux.vnet.ibm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Stephane Eranian <eranian@google.com>
Link: http://lkml.kernel.org/n/tip-9t6eqg8j610r94l743hkntiv@git.kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2015-02-05 21:40:25 +07:00
|
|
|
|
|
|
|
memset(m, 0x0, sizeof(*m));
|
|
|
|
name = name ? name + 1 : path;
|
|
|
|
|
2015-06-03 15:52:21 +07:00
|
|
|
/*
|
|
|
|
* '.' is also a valid character for module name. For example:
|
|
|
|
* [aaa.bbb] is a valid module name. '[' should have higher
|
|
|
|
* priority than '.ko' suffix.
|
|
|
|
*
|
|
|
|
* The kernel names are from machine__mmap_name. Such
|
|
|
|
* name should belong to kernel itself, not kernel module.
|
|
|
|
*/
|
|
|
|
if (name[0] == '[') {
|
|
|
|
is_simple_name = true;
|
|
|
|
if ((strncmp(name, "[kernel.kallsyms]", 17) == 0) ||
|
|
|
|
(strncmp(name, "[guest.kernel.kallsyms", 22) == 0) ||
|
|
|
|
(strncmp(name, "[vdso]", 6) == 0) ||
|
|
|
|
(strncmp(name, "[vsyscall]", 10) == 0)) {
|
|
|
|
m->kmod = false;
|
|
|
|
|
|
|
|
} else
|
|
|
|
m->kmod = true;
|
|
|
|
}
|
|
|
|
|
perf tools: Add kmod_path__parse function
Provides united way of parsing kernel module path
into several components.
The new kmod_path__parse function and few defines:
int __kmod_path__parse(struct kmod_path *m, const char *path,
bool alloc_name, bool alloc_ext);
#define kmod_path__parse(__m, __p) __kmod_path__parse(__m, __p, false, false)
#define kmod_path__parse_name(__m, __p) __kmod_path__parse(__m, __p, true , false)
#define kmod_path__parse_ext(__m, __p) __kmod_path__parse(__m, __p, false, true)
parse kernel module @path and updates @m argument like:
@comp - true if @path contains supported compression suffix,
false otherwise
@kmod - true if @path contains '.ko' suffix in right position,
false otherwise
@name - if (@alloc_name && @kmod) is true, it contains strdup-ed base name
of the kernel module without suffixes, otherwise strudup-ed
base name of @path
@ext - if (@alloc_ext && @comp) is true, it contains strdup-ed string
the compression suffix
It returns 0 if there's no strdup error, -ENOMEM otherwise.
Signed-off-by: Jiri Olsa <jolsa@kernel.org>
Acked-by: Namhyung Kim <namhyung@kernel.org>
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Corey Ashford <cjashfor@linux.vnet.ibm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Stephane Eranian <eranian@google.com>
Link: http://lkml.kernel.org/n/tip-9t6eqg8j610r94l743hkntiv@git.kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2015-02-05 21:40:25 +07:00
|
|
|
/* No extension, just return name. */
|
2015-06-03 15:52:21 +07:00
|
|
|
if ((ext == NULL) || is_simple_name) {
|
perf tools: Add kmod_path__parse function
Provides united way of parsing kernel module path
into several components.
The new kmod_path__parse function and few defines:
int __kmod_path__parse(struct kmod_path *m, const char *path,
bool alloc_name, bool alloc_ext);
#define kmod_path__parse(__m, __p) __kmod_path__parse(__m, __p, false, false)
#define kmod_path__parse_name(__m, __p) __kmod_path__parse(__m, __p, true , false)
#define kmod_path__parse_ext(__m, __p) __kmod_path__parse(__m, __p, false, true)
parse kernel module @path and updates @m argument like:
@comp - true if @path contains supported compression suffix,
false otherwise
@kmod - true if @path contains '.ko' suffix in right position,
false otherwise
@name - if (@alloc_name && @kmod) is true, it contains strdup-ed base name
of the kernel module without suffixes, otherwise strudup-ed
base name of @path
@ext - if (@alloc_ext && @comp) is true, it contains strdup-ed string
the compression suffix
It returns 0 if there's no strdup error, -ENOMEM otherwise.
Signed-off-by: Jiri Olsa <jolsa@kernel.org>
Acked-by: Namhyung Kim <namhyung@kernel.org>
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Corey Ashford <cjashfor@linux.vnet.ibm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Stephane Eranian <eranian@google.com>
Link: http://lkml.kernel.org/n/tip-9t6eqg8j610r94l743hkntiv@git.kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2015-02-05 21:40:25 +07:00
|
|
|
if (alloc_name) {
|
|
|
|
m->name = strdup(name);
|
|
|
|
return m->name ? 0 : -ENOMEM;
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (is_supported_compression(ext + 1)) {
|
|
|
|
m->comp = true;
|
|
|
|
ext -= 3;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Check .ko extension only if there's enough name left. */
|
|
|
|
if (ext > name)
|
|
|
|
m->kmod = !strncmp(ext, ".ko", 3);
|
|
|
|
|
|
|
|
if (alloc_name) {
|
|
|
|
if (m->kmod) {
|
|
|
|
if (asprintf(&m->name, "[%.*s]", (int) (ext - name), name) == -1)
|
|
|
|
return -ENOMEM;
|
|
|
|
} else {
|
|
|
|
if (asprintf(&m->name, "%s", name) == -1)
|
|
|
|
return -ENOMEM;
|
|
|
|
}
|
|
|
|
|
|
|
|
strxfrchar(m->name, '-', '_');
|
|
|
|
}
|
|
|
|
|
|
|
|
if (alloc_ext && m->comp) {
|
|
|
|
m->ext = strdup(ext + 4);
|
|
|
|
if (!m->ext) {
|
|
|
|
free((void *) m->name);
|
|
|
|
return -ENOMEM;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2014-04-30 20:00:59 +07:00
|
|
|
/*
|
2014-04-30 20:25:10 +07:00
|
|
|
* Global list of open DSOs and the counter.
|
2014-04-30 20:00:59 +07:00
|
|
|
*/
|
|
|
|
static LIST_HEAD(dso__data_open);
|
2014-04-30 20:25:10 +07:00
|
|
|
static long dso__data_open_cnt;
|
2015-05-18 07:30:42 +07:00
|
|
|
static pthread_mutex_t dso__data_open_lock = PTHREAD_MUTEX_INITIALIZER;
|
2014-04-30 20:00:59 +07:00
|
|
|
|
|
|
|
static void dso__list_add(struct dso *dso)
|
|
|
|
{
|
|
|
|
list_add_tail(&dso->data.open_entry, &dso__data_open);
|
2014-04-30 20:25:10 +07:00
|
|
|
dso__data_open_cnt++;
|
2014-04-30 20:00:59 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void dso__list_del(struct dso *dso)
|
|
|
|
{
|
|
|
|
list_del(&dso->data.open_entry);
|
2014-04-30 20:25:10 +07:00
|
|
|
WARN_ONCE(dso__data_open_cnt <= 0,
|
|
|
|
"DSO data fd counter out of bounds.");
|
|
|
|
dso__data_open_cnt--;
|
2014-04-30 20:00:59 +07:00
|
|
|
}
|
|
|
|
|
2014-05-08 02:35:02 +07:00
|
|
|
static void close_first_dso(void);
|
|
|
|
|
|
|
|
static int do_open(char *name)
|
|
|
|
{
|
|
|
|
int fd;
|
2014-08-14 09:22:36 +07:00
|
|
|
char sbuf[STRERR_BUFSIZE];
|
2014-05-08 02:35:02 +07:00
|
|
|
|
|
|
|
do {
|
|
|
|
fd = open(name, O_RDONLY);
|
|
|
|
if (fd >= 0)
|
|
|
|
return fd;
|
|
|
|
|
2015-01-30 09:33:29 +07:00
|
|
|
pr_debug("dso open failed: %s\n",
|
2014-08-14 09:22:36 +07:00
|
|
|
strerror_r(errno, sbuf, sizeof(sbuf)));
|
2014-05-08 02:35:02 +07:00
|
|
|
if (!dso__data_open_cnt || errno != EMFILE)
|
|
|
|
break;
|
|
|
|
|
|
|
|
close_first_dso();
|
|
|
|
} while (1);
|
|
|
|
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2014-04-30 20:00:59 +07:00
|
|
|
static int __open_dso(struct dso *dso, struct machine *machine)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
|
|
|
int fd;
|
2013-12-17 03:03:18 +07:00
|
|
|
char *root_dir = (char *)"";
|
|
|
|
char *name = malloc(PATH_MAX);
|
2012-10-28 04:18:32 +07:00
|
|
|
|
|
|
|
if (!name)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
|
|
|
if (machine)
|
|
|
|
root_dir = machine->root_dir;
|
|
|
|
|
2013-12-18 02:14:07 +07:00
|
|
|
if (dso__read_binary_type_filename(dso, dso->binary_type,
|
2013-12-17 03:03:18 +07:00
|
|
|
root_dir, name, PATH_MAX)) {
|
2012-10-28 04:18:32 +07:00
|
|
|
free(name);
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
2014-05-08 02:35:02 +07:00
|
|
|
fd = do_open(name);
|
2012-10-28 04:18:32 +07:00
|
|
|
free(name);
|
|
|
|
return fd;
|
|
|
|
}
|
|
|
|
|
perf tools: Cache dso data file descriptor
Caching dso data file descriptors to avoid expensive re-opens
especially during DWARF unwind.
We keep dsos data file descriptors open until their count reaches
the half of the current fd open limit (RLIMIT_NOFILE). In this case
we close file descriptor of the first opened dso object.
We've got overall speedup (~27% for my workload) of report:
'perf report --stdio -i perf-test.data' (3 runs)
(perf-test.data size was around 12GB)
current code:
545,640,944,228 cycles ( +- 0.53% )
785,255,798,320 instructions ( +- 0.03% )
366.340910010 seconds time elapsed ( +- 3.65% )
after change:
435,895,036,114 cycles ( +- 0.26% )
636,790,271,176 instructions ( +- 0.04% )
266.481463387 seconds time elapsed ( +- 0.13% )
Acked-by: Namhyung Kim <namhyung@kernel.org>
Cc: Arnaldo Carvalho de Melo <acme@kernel.org>
Cc: Corey Ashford <cjashfor@linux.vnet.ibm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jean Pihet <jean.pihet@linaro.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1401892622-30848-7-git-send-email-jolsa@kernel.org
Signed-off-by: Jiri Olsa <jolsa@kernel.org>
2014-04-30 20:47:27 +07:00
|
|
|
static void check_data_close(void);
|
|
|
|
|
2014-05-08 02:09:59 +07:00
|
|
|
/**
|
|
|
|
* dso_close - Open DSO data file
|
|
|
|
* @dso: dso object
|
|
|
|
*
|
|
|
|
* Open @dso's data file descriptor and updates
|
|
|
|
* list/count of open DSO objects.
|
|
|
|
*/
|
2014-04-30 20:00:59 +07:00
|
|
|
static int open_dso(struct dso *dso, struct machine *machine)
|
|
|
|
{
|
|
|
|
int fd = __open_dso(dso, machine);
|
|
|
|
|
2014-07-17 15:43:09 +07:00
|
|
|
if (fd >= 0) {
|
2014-04-30 20:00:59 +07:00
|
|
|
dso__list_add(dso);
|
perf tools: Cache dso data file descriptor
Caching dso data file descriptors to avoid expensive re-opens
especially during DWARF unwind.
We keep dsos data file descriptors open until their count reaches
the half of the current fd open limit (RLIMIT_NOFILE). In this case
we close file descriptor of the first opened dso object.
We've got overall speedup (~27% for my workload) of report:
'perf report --stdio -i perf-test.data' (3 runs)
(perf-test.data size was around 12GB)
current code:
545,640,944,228 cycles ( +- 0.53% )
785,255,798,320 instructions ( +- 0.03% )
366.340910010 seconds time elapsed ( +- 3.65% )
after change:
435,895,036,114 cycles ( +- 0.26% )
636,790,271,176 instructions ( +- 0.04% )
266.481463387 seconds time elapsed ( +- 0.13% )
Acked-by: Namhyung Kim <namhyung@kernel.org>
Cc: Arnaldo Carvalho de Melo <acme@kernel.org>
Cc: Corey Ashford <cjashfor@linux.vnet.ibm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jean Pihet <jean.pihet@linaro.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1401892622-30848-7-git-send-email-jolsa@kernel.org
Signed-off-by: Jiri Olsa <jolsa@kernel.org>
2014-04-30 20:47:27 +07:00
|
|
|
/*
|
|
|
|
* Check if we crossed the allowed number
|
|
|
|
* of opened DSOs and close one if needed.
|
|
|
|
*/
|
|
|
|
check_data_close();
|
|
|
|
}
|
2014-04-30 20:00:59 +07:00
|
|
|
|
|
|
|
return fd;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void close_data_fd(struct dso *dso)
|
2014-04-28 21:43:43 +07:00
|
|
|
{
|
|
|
|
if (dso->data.fd >= 0) {
|
|
|
|
close(dso->data.fd);
|
|
|
|
dso->data.fd = -1;
|
2014-05-07 23:51:41 +07:00
|
|
|
dso->data.file_size = 0;
|
2014-04-30 20:00:59 +07:00
|
|
|
dso__list_del(dso);
|
2014-04-28 21:43:43 +07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-05-08 02:09:59 +07:00
|
|
|
/**
|
|
|
|
* dso_close - Close DSO data file
|
|
|
|
* @dso: dso object
|
|
|
|
*
|
|
|
|
* Close @dso's data file descriptor and updates
|
|
|
|
* list/count of open DSO objects.
|
|
|
|
*/
|
2014-04-30 20:00:59 +07:00
|
|
|
static void close_dso(struct dso *dso)
|
|
|
|
{
|
|
|
|
close_data_fd(dso);
|
|
|
|
}
|
|
|
|
|
perf tools: Cache dso data file descriptor
Caching dso data file descriptors to avoid expensive re-opens
especially during DWARF unwind.
We keep dsos data file descriptors open until their count reaches
the half of the current fd open limit (RLIMIT_NOFILE). In this case
we close file descriptor of the first opened dso object.
We've got overall speedup (~27% for my workload) of report:
'perf report --stdio -i perf-test.data' (3 runs)
(perf-test.data size was around 12GB)
current code:
545,640,944,228 cycles ( +- 0.53% )
785,255,798,320 instructions ( +- 0.03% )
366.340910010 seconds time elapsed ( +- 3.65% )
after change:
435,895,036,114 cycles ( +- 0.26% )
636,790,271,176 instructions ( +- 0.04% )
266.481463387 seconds time elapsed ( +- 0.13% )
Acked-by: Namhyung Kim <namhyung@kernel.org>
Cc: Arnaldo Carvalho de Melo <acme@kernel.org>
Cc: Corey Ashford <cjashfor@linux.vnet.ibm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jean Pihet <jean.pihet@linaro.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1401892622-30848-7-git-send-email-jolsa@kernel.org
Signed-off-by: Jiri Olsa <jolsa@kernel.org>
2014-04-30 20:47:27 +07:00
|
|
|
static void close_first_dso(void)
|
|
|
|
{
|
|
|
|
struct dso *dso;
|
|
|
|
|
|
|
|
dso = list_first_entry(&dso__data_open, struct dso, data.open_entry);
|
|
|
|
close_dso(dso);
|
|
|
|
}
|
|
|
|
|
|
|
|
static rlim_t get_fd_limit(void)
|
|
|
|
{
|
|
|
|
struct rlimit l;
|
|
|
|
rlim_t limit = 0;
|
|
|
|
|
|
|
|
/* Allow half of the current open fd limit. */
|
|
|
|
if (getrlimit(RLIMIT_NOFILE, &l) == 0) {
|
|
|
|
if (l.rlim_cur == RLIM_INFINITY)
|
|
|
|
limit = l.rlim_cur;
|
|
|
|
else
|
|
|
|
limit = l.rlim_cur / 2;
|
|
|
|
} else {
|
|
|
|
pr_err("failed to get fd limit\n");
|
|
|
|
limit = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return limit;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool may_cache_fd(void)
|
|
|
|
{
|
|
|
|
static rlim_t limit;
|
|
|
|
|
|
|
|
if (!limit)
|
|
|
|
limit = get_fd_limit();
|
|
|
|
|
|
|
|
if (limit == RLIM_INFINITY)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
return limit > (rlim_t) dso__data_open_cnt;
|
|
|
|
}
|
|
|
|
|
2014-05-08 02:09:59 +07:00
|
|
|
/*
|
|
|
|
* Check and close LRU dso if we crossed allowed limit
|
|
|
|
* for opened dso file descriptors. The limit is half
|
|
|
|
* of the RLIMIT_NOFILE files opened.
|
|
|
|
*/
|
perf tools: Cache dso data file descriptor
Caching dso data file descriptors to avoid expensive re-opens
especially during DWARF unwind.
We keep dsos data file descriptors open until their count reaches
the half of the current fd open limit (RLIMIT_NOFILE). In this case
we close file descriptor of the first opened dso object.
We've got overall speedup (~27% for my workload) of report:
'perf report --stdio -i perf-test.data' (3 runs)
(perf-test.data size was around 12GB)
current code:
545,640,944,228 cycles ( +- 0.53% )
785,255,798,320 instructions ( +- 0.03% )
366.340910010 seconds time elapsed ( +- 3.65% )
after change:
435,895,036,114 cycles ( +- 0.26% )
636,790,271,176 instructions ( +- 0.04% )
266.481463387 seconds time elapsed ( +- 0.13% )
Acked-by: Namhyung Kim <namhyung@kernel.org>
Cc: Arnaldo Carvalho de Melo <acme@kernel.org>
Cc: Corey Ashford <cjashfor@linux.vnet.ibm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jean Pihet <jean.pihet@linaro.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1401892622-30848-7-git-send-email-jolsa@kernel.org
Signed-off-by: Jiri Olsa <jolsa@kernel.org>
2014-04-30 20:47:27 +07:00
|
|
|
static void check_data_close(void)
|
|
|
|
{
|
|
|
|
bool cache_fd = may_cache_fd();
|
|
|
|
|
|
|
|
if (!cache_fd)
|
|
|
|
close_first_dso();
|
|
|
|
}
|
|
|
|
|
2014-05-08 02:09:59 +07:00
|
|
|
/**
|
|
|
|
* dso__data_close - Close DSO data file
|
|
|
|
* @dso: dso object
|
|
|
|
*
|
|
|
|
* External interface to close @dso's data file descriptor.
|
|
|
|
*/
|
2014-04-30 20:00:59 +07:00
|
|
|
void dso__data_close(struct dso *dso)
|
|
|
|
{
|
2015-05-18 07:30:42 +07:00
|
|
|
pthread_mutex_lock(&dso__data_open_lock);
|
2014-04-30 20:00:59 +07:00
|
|
|
close_dso(dso);
|
2015-05-18 07:30:42 +07:00
|
|
|
pthread_mutex_unlock(&dso__data_open_lock);
|
2014-04-30 20:00:59 +07:00
|
|
|
}
|
|
|
|
|
2015-05-20 23:03:39 +07:00
|
|
|
static void try_to_open_dso(struct dso *dso, struct machine *machine)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
2013-12-17 02:57:43 +07:00
|
|
|
enum dso_binary_type binary_type_data[] = {
|
2012-10-28 04:18:32 +07:00
|
|
|
DSO_BINARY_TYPE__BUILD_ID_CACHE,
|
|
|
|
DSO_BINARY_TYPE__SYSTEM_PATH_DSO,
|
|
|
|
DSO_BINARY_TYPE__NOT_FOUND,
|
|
|
|
};
|
|
|
|
int i = 0;
|
|
|
|
|
2014-04-28 21:43:43 +07:00
|
|
|
if (dso->data.fd >= 0)
|
2015-05-20 23:03:39 +07:00
|
|
|
return;
|
2014-04-28 21:43:43 +07:00
|
|
|
|
|
|
|
if (dso->binary_type != DSO_BINARY_TYPE__NOT_FOUND) {
|
|
|
|
dso->data.fd = open_dso(dso, machine);
|
2014-07-22 20:17:18 +07:00
|
|
|
goto out;
|
2014-04-28 21:43:43 +07:00
|
|
|
}
|
2012-10-28 04:18:32 +07:00
|
|
|
|
|
|
|
do {
|
2013-12-18 02:14:07 +07:00
|
|
|
dso->binary_type = binary_type_data[i++];
|
2012-10-28 04:18:32 +07:00
|
|
|
|
2014-07-22 20:17:18 +07:00
|
|
|
dso->data.fd = open_dso(dso, machine);
|
|
|
|
if (dso->data.fd >= 0)
|
|
|
|
goto out;
|
2012-10-28 04:18:32 +07:00
|
|
|
|
2013-12-18 02:14:07 +07:00
|
|
|
} while (dso->binary_type != DSO_BINARY_TYPE__NOT_FOUND);
|
2014-07-22 20:17:18 +07:00
|
|
|
out:
|
|
|
|
if (dso->data.fd >= 0)
|
|
|
|
dso->data.status = DSO_DATA_STATUS_OK;
|
|
|
|
else
|
|
|
|
dso->data.status = DSO_DATA_STATUS_ERROR;
|
2015-05-20 23:03:39 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
2015-05-20 23:03:41 +07:00
|
|
|
* dso__data_get_fd - Get dso's data file descriptor
|
2015-05-20 23:03:39 +07:00
|
|
|
* @dso: dso object
|
|
|
|
* @machine: machine object
|
|
|
|
*
|
|
|
|
* External interface to find dso's file, open it and
|
2015-05-20 23:03:41 +07:00
|
|
|
* returns file descriptor. It should be paired with
|
|
|
|
* dso__data_put_fd() if it returns non-negative value.
|
2015-05-20 23:03:39 +07:00
|
|
|
*/
|
2015-05-20 23:03:41 +07:00
|
|
|
int dso__data_get_fd(struct dso *dso, struct machine *machine)
|
2015-05-20 23:03:39 +07:00
|
|
|
{
|
|
|
|
if (dso->data.status == DSO_DATA_STATUS_ERROR)
|
|
|
|
return -1;
|
2012-10-28 04:18:32 +07:00
|
|
|
|
2015-05-20 23:03:41 +07:00
|
|
|
if (pthread_mutex_lock(&dso__data_open_lock) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2015-05-20 23:03:39 +07:00
|
|
|
try_to_open_dso(dso, machine);
|
2015-05-20 23:03:41 +07:00
|
|
|
|
|
|
|
if (dso->data.fd < 0)
|
|
|
|
pthread_mutex_unlock(&dso__data_open_lock);
|
2015-05-20 23:03:39 +07:00
|
|
|
|
2014-07-22 20:17:18 +07:00
|
|
|
return dso->data.fd;
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
2015-05-20 23:03:41 +07:00
|
|
|
void dso__data_put_fd(struct dso *dso __maybe_unused)
|
|
|
|
{
|
|
|
|
pthread_mutex_unlock(&dso__data_open_lock);
|
|
|
|
}
|
|
|
|
|
2014-07-22 20:17:19 +07:00
|
|
|
bool dso__data_status_seen(struct dso *dso, enum dso_data_status_seen by)
|
|
|
|
{
|
|
|
|
u32 flag = 1 << by;
|
|
|
|
|
|
|
|
if (dso->data.status_seen & flag)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
dso->data.status_seen |= flag;
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2012-10-28 04:18:32 +07:00
|
|
|
static void
|
2015-05-18 07:30:41 +07:00
|
|
|
dso_cache__free(struct dso *dso)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
2015-05-18 07:30:41 +07:00
|
|
|
struct rb_root *root = &dso->data.cache;
|
2012-10-28 04:18:32 +07:00
|
|
|
struct rb_node *next = rb_first(root);
|
|
|
|
|
2015-05-18 07:30:41 +07:00
|
|
|
pthread_mutex_lock(&dso->lock);
|
2012-10-28 04:18:32 +07:00
|
|
|
while (next) {
|
|
|
|
struct dso_cache *cache;
|
|
|
|
|
|
|
|
cache = rb_entry(next, struct dso_cache, rb_node);
|
|
|
|
next = rb_next(&cache->rb_node);
|
|
|
|
rb_erase(&cache->rb_node, root);
|
|
|
|
free(cache);
|
|
|
|
}
|
2015-05-18 07:30:41 +07:00
|
|
|
pthread_mutex_unlock(&dso->lock);
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
2015-05-18 07:30:41 +07:00
|
|
|
static struct dso_cache *dso_cache__find(struct dso *dso, u64 offset)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
2015-05-18 07:30:41 +07:00
|
|
|
const struct rb_root *root = &dso->data.cache;
|
2013-12-11 01:46:29 +07:00
|
|
|
struct rb_node * const *p = &root->rb_node;
|
|
|
|
const struct rb_node *parent = NULL;
|
2012-10-28 04:18:32 +07:00
|
|
|
struct dso_cache *cache;
|
|
|
|
|
|
|
|
while (*p != NULL) {
|
|
|
|
u64 end;
|
|
|
|
|
|
|
|
parent = *p;
|
|
|
|
cache = rb_entry(parent, struct dso_cache, rb_node);
|
|
|
|
end = cache->offset + DSO__DATA_CACHE_SIZE;
|
|
|
|
|
|
|
|
if (offset < cache->offset)
|
|
|
|
p = &(*p)->rb_left;
|
|
|
|
else if (offset >= end)
|
|
|
|
p = &(*p)->rb_right;
|
|
|
|
else
|
|
|
|
return cache;
|
|
|
|
}
|
2015-05-18 07:30:41 +07:00
|
|
|
|
2012-10-28 04:18:32 +07:00
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2015-05-18 07:30:41 +07:00
|
|
|
static struct dso_cache *
|
|
|
|
dso_cache__insert(struct dso *dso, struct dso_cache *new)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
2015-05-18 07:30:41 +07:00
|
|
|
struct rb_root *root = &dso->data.cache;
|
2012-10-28 04:18:32 +07:00
|
|
|
struct rb_node **p = &root->rb_node;
|
|
|
|
struct rb_node *parent = NULL;
|
|
|
|
struct dso_cache *cache;
|
|
|
|
u64 offset = new->offset;
|
|
|
|
|
2015-05-18 07:30:41 +07:00
|
|
|
pthread_mutex_lock(&dso->lock);
|
2012-10-28 04:18:32 +07:00
|
|
|
while (*p != NULL) {
|
|
|
|
u64 end;
|
|
|
|
|
|
|
|
parent = *p;
|
|
|
|
cache = rb_entry(parent, struct dso_cache, rb_node);
|
|
|
|
end = cache->offset + DSO__DATA_CACHE_SIZE;
|
|
|
|
|
|
|
|
if (offset < cache->offset)
|
|
|
|
p = &(*p)->rb_left;
|
|
|
|
else if (offset >= end)
|
|
|
|
p = &(*p)->rb_right;
|
2015-05-18 07:30:41 +07:00
|
|
|
else
|
|
|
|
goto out;
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
rb_link_node(&new->rb_node, parent, p);
|
|
|
|
rb_insert_color(&new->rb_node, root);
|
2015-05-18 07:30:41 +07:00
|
|
|
|
|
|
|
cache = NULL;
|
|
|
|
out:
|
|
|
|
pthread_mutex_unlock(&dso->lock);
|
|
|
|
return cache;
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
dso_cache__memcpy(struct dso_cache *cache, u64 offset,
|
|
|
|
u8 *data, u64 size)
|
|
|
|
{
|
|
|
|
u64 cache_offset = offset - cache->offset;
|
|
|
|
u64 cache_size = min(cache->size - cache_offset, size);
|
|
|
|
|
|
|
|
memcpy(data, cache->data + cache_offset, cache_size);
|
|
|
|
return cache_size;
|
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
2015-05-18 07:30:42 +07:00
|
|
|
dso_cache__read(struct dso *dso, struct machine *machine,
|
|
|
|
u64 offset, u8 *data, ssize_t size)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
|
|
|
struct dso_cache *cache;
|
2015-05-18 07:30:41 +07:00
|
|
|
struct dso_cache *old;
|
2012-10-28 04:18:32 +07:00
|
|
|
ssize_t ret;
|
|
|
|
|
|
|
|
do {
|
|
|
|
u64 cache_offset;
|
|
|
|
|
|
|
|
cache = zalloc(sizeof(*cache) + DSO__DATA_CACHE_SIZE);
|
|
|
|
if (!cache)
|
2015-05-18 07:30:42 +07:00
|
|
|
return -ENOMEM;
|
|
|
|
|
|
|
|
pthread_mutex_lock(&dso__data_open_lock);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* dso->data.fd might be closed if other thread opened another
|
|
|
|
* file (dso) due to open file limit (RLIMIT_NOFILE).
|
|
|
|
*/
|
2015-05-20 23:03:39 +07:00
|
|
|
try_to_open_dso(dso, machine);
|
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
if (dso->data.fd < 0) {
|
2015-05-20 23:03:39 +07:00
|
|
|
ret = -errno;
|
|
|
|
dso->data.status = DSO_DATA_STATUS_ERROR;
|
|
|
|
break;
|
2015-05-18 07:30:42 +07:00
|
|
|
}
|
2012-10-28 04:18:32 +07:00
|
|
|
|
|
|
|
cache_offset = offset & DSO__DATA_CACHE_MASK;
|
|
|
|
|
2015-01-30 03:02:01 +07:00
|
|
|
ret = pread(dso->data.fd, cache->data, DSO__DATA_CACHE_SIZE, cache_offset);
|
2012-10-28 04:18:32 +07:00
|
|
|
if (ret <= 0)
|
|
|
|
break;
|
|
|
|
|
|
|
|
cache->offset = cache_offset;
|
|
|
|
cache->size = ret;
|
2015-05-18 07:30:42 +07:00
|
|
|
} while (0);
|
|
|
|
|
|
|
|
pthread_mutex_unlock(&dso__data_open_lock);
|
|
|
|
|
|
|
|
if (ret > 0) {
|
2015-05-18 07:30:41 +07:00
|
|
|
old = dso_cache__insert(dso, cache);
|
|
|
|
if (old) {
|
|
|
|
/* we lose the race */
|
|
|
|
free(cache);
|
|
|
|
cache = old;
|
|
|
|
}
|
2012-10-28 04:18:32 +07:00
|
|
|
|
|
|
|
ret = dso_cache__memcpy(cache, offset, data, size);
|
2015-05-18 07:30:42 +07:00
|
|
|
}
|
2012-10-28 04:18:32 +07:00
|
|
|
|
|
|
|
if (ret <= 0)
|
|
|
|
free(cache);
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
static ssize_t dso_cache_read(struct dso *dso, struct machine *machine,
|
|
|
|
u64 offset, u8 *data, ssize_t size)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
|
|
|
struct dso_cache *cache;
|
|
|
|
|
2015-05-18 07:30:41 +07:00
|
|
|
cache = dso_cache__find(dso, offset);
|
2012-10-28 04:18:32 +07:00
|
|
|
if (cache)
|
|
|
|
return dso_cache__memcpy(cache, offset, data, size);
|
|
|
|
else
|
2015-05-18 07:30:42 +07:00
|
|
|
return dso_cache__read(dso, machine, offset, data, size);
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
2014-05-08 02:09:59 +07:00
|
|
|
/*
|
|
|
|
* Reads and caches dso data DSO__DATA_CACHE_SIZE size chunks
|
|
|
|
* in the rb_tree. Any read to already cached data is served
|
|
|
|
* by cached data.
|
|
|
|
*/
|
2015-05-18 07:30:42 +07:00
|
|
|
static ssize_t cached_read(struct dso *dso, struct machine *machine,
|
|
|
|
u64 offset, u8 *data, ssize_t size)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
|
|
|
ssize_t r = 0;
|
|
|
|
u8 *p = data;
|
|
|
|
|
|
|
|
do {
|
|
|
|
ssize_t ret;
|
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
ret = dso_cache_read(dso, machine, offset, p, size);
|
2012-10-28 04:18:32 +07:00
|
|
|
if (ret < 0)
|
|
|
|
return ret;
|
|
|
|
|
|
|
|
/* Reached EOF, return what we have. */
|
|
|
|
if (!ret)
|
|
|
|
break;
|
|
|
|
|
|
|
|
BUG_ON(ret > size);
|
|
|
|
|
|
|
|
r += ret;
|
|
|
|
p += ret;
|
|
|
|
offset += ret;
|
|
|
|
size -= ret;
|
|
|
|
|
|
|
|
} while (size);
|
|
|
|
|
|
|
|
return r;
|
|
|
|
}
|
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
static int data_file_size(struct dso *dso, struct machine *machine)
|
2014-05-07 23:51:41 +07:00
|
|
|
{
|
2015-05-18 07:30:42 +07:00
|
|
|
int ret = 0;
|
2014-05-07 23:51:41 +07:00
|
|
|
struct stat st;
|
2014-08-14 09:22:36 +07:00
|
|
|
char sbuf[STRERR_BUFSIZE];
|
2014-05-07 23:51:41 +07:00
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
if (dso->data.file_size)
|
|
|
|
return 0;
|
|
|
|
|
2015-05-20 23:03:39 +07:00
|
|
|
if (dso->data.status == DSO_DATA_STATUS_ERROR)
|
|
|
|
return -1;
|
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
pthread_mutex_lock(&dso__data_open_lock);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* dso->data.fd might be closed if other thread opened another
|
|
|
|
* file (dso) due to open file limit (RLIMIT_NOFILE).
|
|
|
|
*/
|
2015-05-20 23:03:39 +07:00
|
|
|
try_to_open_dso(dso, machine);
|
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
if (dso->data.fd < 0) {
|
2015-05-20 23:03:39 +07:00
|
|
|
ret = -errno;
|
|
|
|
dso->data.status = DSO_DATA_STATUS_ERROR;
|
|
|
|
goto out;
|
2014-05-07 23:51:41 +07:00
|
|
|
}
|
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
if (fstat(dso->data.fd, &st) < 0) {
|
|
|
|
ret = -errno;
|
|
|
|
pr_err("dso cache fstat failed: %s\n",
|
|
|
|
strerror_r(errno, sbuf, sizeof(sbuf)));
|
|
|
|
dso->data.status = DSO_DATA_STATUS_ERROR;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
dso->data.file_size = st.st_size;
|
|
|
|
|
|
|
|
out:
|
|
|
|
pthread_mutex_unlock(&dso__data_open_lock);
|
|
|
|
return ret;
|
2014-05-07 23:51:41 +07:00
|
|
|
}
|
|
|
|
|
2014-07-22 20:17:35 +07:00
|
|
|
/**
|
|
|
|
* dso__data_size - Return dso data size
|
|
|
|
* @dso: dso object
|
|
|
|
* @machine: machine object
|
|
|
|
*
|
|
|
|
* Return: dso data size
|
|
|
|
*/
|
|
|
|
off_t dso__data_size(struct dso *dso, struct machine *machine)
|
|
|
|
{
|
2015-05-18 07:30:42 +07:00
|
|
|
if (data_file_size(dso, machine))
|
2014-07-22 20:17:35 +07:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
/* For now just estimate dso data size is close to file size */
|
|
|
|
return dso->data.file_size;
|
|
|
|
}
|
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
static ssize_t data_read_offset(struct dso *dso, struct machine *machine,
|
|
|
|
u64 offset, u8 *data, ssize_t size)
|
2014-05-07 23:51:41 +07:00
|
|
|
{
|
2015-05-18 07:30:42 +07:00
|
|
|
if (data_file_size(dso, machine))
|
2014-05-07 23:51:41 +07:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
/* Check the offset sanity. */
|
|
|
|
if (offset > dso->data.file_size)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (offset + size < offset)
|
|
|
|
return -1;
|
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
return cached_read(dso, machine, offset, data, size);
|
2014-05-07 23:51:41 +07:00
|
|
|
}
|
|
|
|
|
2014-05-08 02:09:59 +07:00
|
|
|
/**
|
|
|
|
* dso__data_read_offset - Read data from dso file offset
|
|
|
|
* @dso: dso object
|
|
|
|
* @machine: machine object
|
|
|
|
* @offset: file offset
|
|
|
|
* @data: buffer to store data
|
|
|
|
* @size: size of the @data buffer
|
|
|
|
*
|
|
|
|
* External interface to read data from dso file offset. Open
|
|
|
|
* dso data file and use cached_read to get the data.
|
|
|
|
*/
|
2014-05-07 23:51:41 +07:00
|
|
|
ssize_t dso__data_read_offset(struct dso *dso, struct machine *machine,
|
|
|
|
u64 offset, u8 *data, ssize_t size)
|
|
|
|
{
|
2015-05-18 07:30:42 +07:00
|
|
|
if (dso->data.status == DSO_DATA_STATUS_ERROR)
|
2014-05-07 23:51:41 +07:00
|
|
|
return -1;
|
|
|
|
|
2015-05-18 07:30:42 +07:00
|
|
|
return data_read_offset(dso, machine, offset, data, size);
|
2014-05-07 23:51:41 +07:00
|
|
|
}
|
|
|
|
|
2014-05-08 02:09:59 +07:00
|
|
|
/**
|
|
|
|
* dso__data_read_addr - Read data from dso address
|
|
|
|
* @dso: dso object
|
|
|
|
* @machine: machine object
|
|
|
|
* @add: virtual memory address
|
|
|
|
* @data: buffer to store data
|
|
|
|
* @size: size of the @data buffer
|
|
|
|
*
|
|
|
|
* External interface to read data from dso address.
|
|
|
|
*/
|
2012-10-28 04:18:32 +07:00
|
|
|
ssize_t dso__data_read_addr(struct dso *dso, struct map *map,
|
|
|
|
struct machine *machine, u64 addr,
|
|
|
|
u8 *data, ssize_t size)
|
|
|
|
{
|
|
|
|
u64 offset = map->map_ip(map, addr);
|
|
|
|
return dso__data_read_offset(dso, machine, offset, data, size);
|
|
|
|
}
|
|
|
|
|
|
|
|
struct map *dso__new_map(const char *name)
|
|
|
|
{
|
|
|
|
struct map *map = NULL;
|
|
|
|
struct dso *dso = dso__new(name);
|
|
|
|
|
|
|
|
if (dso)
|
|
|
|
map = map__new2(0, dso, MAP__FUNCTION);
|
|
|
|
|
|
|
|
return map;
|
|
|
|
}
|
|
|
|
|
2015-05-28 22:40:55 +07:00
|
|
|
struct dso *machine__findnew_kernel(struct machine *machine, const char *name,
|
|
|
|
const char *short_name, int dso_type)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
|
|
|
/*
|
|
|
|
* The kernel dso could be created by build_id processing.
|
|
|
|
*/
|
2015-05-29 21:31:12 +07:00
|
|
|
struct dso *dso = machine__findnew_dso(machine, name);
|
2012-10-28 04:18:32 +07:00
|
|
|
|
|
|
|
/*
|
|
|
|
* We need to run this in all cases, since during the build_id
|
|
|
|
* processing we had no idea this was the kernel dso.
|
|
|
|
*/
|
|
|
|
if (dso != NULL) {
|
2013-12-10 21:11:46 +07:00
|
|
|
dso__set_short_name(dso, short_name, false);
|
2012-10-28 04:18:32 +07:00
|
|
|
dso->kernel = dso_type;
|
|
|
|
}
|
|
|
|
|
|
|
|
return dso;
|
|
|
|
}
|
|
|
|
|
2014-10-01 00:36:15 +07:00
|
|
|
/*
|
|
|
|
* Find a matching entry and/or link current entry to RB tree.
|
|
|
|
* Either one of the dso or name parameter must be non-NULL or the
|
|
|
|
* function will not work.
|
|
|
|
*/
|
2015-06-02 01:40:01 +07:00
|
|
|
static struct dso *__dso__findlink_by_longname(struct rb_root *root,
|
|
|
|
struct dso *dso, const char *name)
|
2014-10-01 00:36:15 +07:00
|
|
|
{
|
|
|
|
struct rb_node **p = &root->rb_node;
|
|
|
|
struct rb_node *parent = NULL;
|
|
|
|
|
|
|
|
if (!name)
|
|
|
|
name = dso->long_name;
|
|
|
|
/*
|
|
|
|
* Find node with the matching name
|
|
|
|
*/
|
|
|
|
while (*p) {
|
|
|
|
struct dso *this = rb_entry(*p, struct dso, rb_node);
|
|
|
|
int rc = strcmp(name, this->long_name);
|
|
|
|
|
|
|
|
parent = *p;
|
|
|
|
if (rc == 0) {
|
|
|
|
/*
|
|
|
|
* In case the new DSO is a duplicate of an existing
|
|
|
|
* one, print an one-time warning & put the new entry
|
|
|
|
* at the end of the list of duplicates.
|
|
|
|
*/
|
|
|
|
if (!dso || (dso == this))
|
|
|
|
return this; /* Find matching dso */
|
|
|
|
/*
|
|
|
|
* The core kernel DSOs may have duplicated long name.
|
|
|
|
* In this case, the short name should be different.
|
|
|
|
* Comparing the short names to differentiate the DSOs.
|
|
|
|
*/
|
|
|
|
rc = strcmp(dso->short_name, this->short_name);
|
|
|
|
if (rc == 0) {
|
|
|
|
pr_err("Duplicated dso name: %s\n", name);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (rc < 0)
|
|
|
|
p = &parent->rb_left;
|
|
|
|
else
|
|
|
|
p = &parent->rb_right;
|
|
|
|
}
|
|
|
|
if (dso) {
|
|
|
|
/* Add new node and rebalance tree */
|
|
|
|
rb_link_node(&dso->rb_node, parent, p);
|
|
|
|
rb_insert_color(&dso->rb_node, root);
|
2015-11-13 16:48:30 +07:00
|
|
|
dso->root = root;
|
2014-10-01 00:36:15 +07:00
|
|
|
}
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2015-06-02 01:40:01 +07:00
|
|
|
static inline struct dso *__dso__find_by_longname(struct rb_root *root,
|
|
|
|
const char *name)
|
2014-10-01 00:36:15 +07:00
|
|
|
{
|
2015-06-02 01:40:01 +07:00
|
|
|
return __dso__findlink_by_longname(root, NULL, name);
|
2014-10-01 00:36:15 +07:00
|
|
|
}
|
|
|
|
|
2013-12-11 01:19:23 +07:00
|
|
|
void dso__set_long_name(struct dso *dso, const char *name, bool name_allocated)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
2015-11-13 16:48:30 +07:00
|
|
|
struct rb_root *root = dso->root;
|
|
|
|
|
2012-10-28 04:18:32 +07:00
|
|
|
if (name == NULL)
|
|
|
|
return;
|
2013-12-11 01:08:44 +07:00
|
|
|
|
|
|
|
if (dso->long_name_allocated)
|
2013-12-11 01:19:23 +07:00
|
|
|
free((char *)dso->long_name);
|
2013-12-11 01:08:44 +07:00
|
|
|
|
2015-11-13 16:48:30 +07:00
|
|
|
if (root) {
|
|
|
|
rb_erase(&dso->rb_node, root);
|
|
|
|
/*
|
|
|
|
* __dso__findlink_by_longname() isn't guaranteed to add it
|
|
|
|
* back, so a clean removal is required here.
|
|
|
|
*/
|
|
|
|
RB_CLEAR_NODE(&dso->rb_node);
|
|
|
|
dso->root = NULL;
|
|
|
|
}
|
|
|
|
|
2013-12-11 01:08:44 +07:00
|
|
|
dso->long_name = name;
|
|
|
|
dso->long_name_len = strlen(name);
|
|
|
|
dso->long_name_allocated = name_allocated;
|
2015-11-13 16:48:30 +07:00
|
|
|
|
|
|
|
if (root)
|
|
|
|
__dso__findlink_by_longname(root, dso, NULL);
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
2013-12-10 21:11:46 +07:00
|
|
|
void dso__set_short_name(struct dso *dso, const char *name, bool name_allocated)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
|
|
|
if (name == NULL)
|
|
|
|
return;
|
2013-12-10 21:11:46 +07:00
|
|
|
|
|
|
|
if (dso->short_name_allocated)
|
|
|
|
free((char *)dso->short_name);
|
|
|
|
|
|
|
|
dso->short_name = name;
|
|
|
|
dso->short_name_len = strlen(name);
|
|
|
|
dso->short_name_allocated = name_allocated;
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void dso__set_basename(struct dso *dso)
|
|
|
|
{
|
2013-12-06 01:26:42 +07:00
|
|
|
/*
|
|
|
|
* basename() may modify path buffer, so we must pass
|
|
|
|
* a copy.
|
|
|
|
*/
|
|
|
|
char *base, *lname = strdup(dso->long_name);
|
|
|
|
|
|
|
|
if (!lname)
|
|
|
|
return;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* basename() may return a pointer to internal
|
|
|
|
* storage which is reused in subsequent calls
|
|
|
|
* so copy the result.
|
|
|
|
*/
|
|
|
|
base = strdup(basename(lname));
|
|
|
|
|
|
|
|
free(lname);
|
|
|
|
|
|
|
|
if (!base)
|
|
|
|
return;
|
|
|
|
|
|
|
|
dso__set_short_name(dso, base, true);
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
int dso__name_len(const struct dso *dso)
|
|
|
|
{
|
|
|
|
if (!dso)
|
|
|
|
return strlen("[unknown]");
|
|
|
|
if (verbose)
|
|
|
|
return dso->long_name_len;
|
|
|
|
|
|
|
|
return dso->short_name_len;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool dso__loaded(const struct dso *dso, enum map_type type)
|
|
|
|
{
|
|
|
|
return dso->loaded & (1 << type);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool dso__sorted_by_name(const struct dso *dso, enum map_type type)
|
|
|
|
{
|
|
|
|
return dso->sorted_by_name & (1 << type);
|
|
|
|
}
|
|
|
|
|
|
|
|
void dso__set_sorted_by_name(struct dso *dso, enum map_type type)
|
|
|
|
{
|
|
|
|
dso->sorted_by_name |= (1 << type);
|
|
|
|
}
|
|
|
|
|
|
|
|
struct dso *dso__new(const char *name)
|
|
|
|
{
|
|
|
|
struct dso *dso = calloc(1, sizeof(*dso) + strlen(name) + 1);
|
|
|
|
|
|
|
|
if (dso != NULL) {
|
|
|
|
int i;
|
|
|
|
strcpy(dso->name, name);
|
2013-12-11 01:08:44 +07:00
|
|
|
dso__set_long_name(dso, dso->name, false);
|
2013-12-10 21:11:46 +07:00
|
|
|
dso__set_short_name(dso, dso->name, false);
|
2012-10-28 04:18:32 +07:00
|
|
|
for (i = 0; i < MAP__NR_TYPES; ++i)
|
|
|
|
dso->symbols[i] = dso->symbol_names[i] = RB_ROOT;
|
2014-05-07 23:30:45 +07:00
|
|
|
dso->data.cache = RB_ROOT;
|
2014-04-28 21:43:43 +07:00
|
|
|
dso->data.fd = -1;
|
2014-07-22 20:17:18 +07:00
|
|
|
dso->data.status = DSO_DATA_STATUS_UNKNOWN;
|
2012-10-28 04:18:32 +07:00
|
|
|
dso->symtab_type = DSO_BINARY_TYPE__NOT_FOUND;
|
2013-12-18 02:14:07 +07:00
|
|
|
dso->binary_type = DSO_BINARY_TYPE__NOT_FOUND;
|
2014-07-14 17:02:41 +07:00
|
|
|
dso->is_64_bit = (sizeof(void *) == 8);
|
2012-10-28 04:18:32 +07:00
|
|
|
dso->loaded = 0;
|
2013-08-07 18:38:50 +07:00
|
|
|
dso->rel = 0;
|
2012-10-28 04:18:32 +07:00
|
|
|
dso->sorted_by_name = 0;
|
|
|
|
dso->has_build_id = 0;
|
2013-09-11 12:09:31 +07:00
|
|
|
dso->has_srcline = 1;
|
2013-12-03 14:23:10 +07:00
|
|
|
dso->a2l_fails = 1;
|
2012-10-28 04:18:32 +07:00
|
|
|
dso->kernel = DSO_TYPE_USER;
|
|
|
|
dso->needs_swap = DSO_SWAP__UNSET;
|
2014-10-01 00:36:15 +07:00
|
|
|
RB_CLEAR_NODE(&dso->rb_node);
|
2015-11-13 16:48:30 +07:00
|
|
|
dso->root = NULL;
|
2012-10-28 04:18:32 +07:00
|
|
|
INIT_LIST_HEAD(&dso->node);
|
2014-04-30 20:00:59 +07:00
|
|
|
INIT_LIST_HEAD(&dso->data.open_entry);
|
2015-05-18 07:30:40 +07:00
|
|
|
pthread_mutex_init(&dso->lock, NULL);
|
2015-06-02 21:53:26 +07:00
|
|
|
atomic_set(&dso->refcnt, 1);
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
return dso;
|
|
|
|
}
|
|
|
|
|
|
|
|
void dso__delete(struct dso *dso)
|
|
|
|
{
|
|
|
|
int i;
|
2014-10-01 00:36:15 +07:00
|
|
|
|
|
|
|
if (!RB_EMPTY_NODE(&dso->rb_node))
|
|
|
|
pr_err("DSO %s is still in rbtree when being deleted!\n",
|
|
|
|
dso->long_name);
|
2012-10-28 04:18:32 +07:00
|
|
|
for (i = 0; i < MAP__NR_TYPES; ++i)
|
|
|
|
symbols__delete(&dso->symbols[i]);
|
2013-12-11 01:26:55 +07:00
|
|
|
|
|
|
|
if (dso->short_name_allocated) {
|
2013-12-27 03:41:15 +07:00
|
|
|
zfree((char **)&dso->short_name);
|
2013-12-11 01:26:55 +07:00
|
|
|
dso->short_name_allocated = false;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (dso->long_name_allocated) {
|
2013-12-27 03:41:15 +07:00
|
|
|
zfree((char **)&dso->long_name);
|
2013-12-11 01:26:55 +07:00
|
|
|
dso->long_name_allocated = false;
|
|
|
|
}
|
|
|
|
|
2014-04-28 21:43:43 +07:00
|
|
|
dso__data_close(dso);
|
2015-04-09 22:53:55 +07:00
|
|
|
auxtrace_cache__free(dso->auxtrace_cache);
|
2015-05-18 07:30:41 +07:00
|
|
|
dso_cache__free(dso);
|
2013-12-03 14:23:07 +07:00
|
|
|
dso__free_a2l(dso);
|
2013-12-27 03:41:15 +07:00
|
|
|
zfree(&dso->symsrc_filename);
|
2015-05-18 07:30:40 +07:00
|
|
|
pthread_mutex_destroy(&dso->lock);
|
2012-10-28 04:18:32 +07:00
|
|
|
free(dso);
|
|
|
|
}
|
|
|
|
|
2015-06-02 21:53:26 +07:00
|
|
|
struct dso *dso__get(struct dso *dso)
|
|
|
|
{
|
|
|
|
if (dso)
|
|
|
|
atomic_inc(&dso->refcnt);
|
|
|
|
return dso;
|
|
|
|
}
|
|
|
|
|
|
|
|
void dso__put(struct dso *dso)
|
|
|
|
{
|
|
|
|
if (dso && atomic_dec_and_test(&dso->refcnt))
|
|
|
|
dso__delete(dso);
|
|
|
|
}
|
|
|
|
|
2012-10-28 04:18:32 +07:00
|
|
|
void dso__set_build_id(struct dso *dso, void *build_id)
|
|
|
|
{
|
|
|
|
memcpy(dso->build_id, build_id, sizeof(dso->build_id));
|
|
|
|
dso->has_build_id = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool dso__build_id_equal(const struct dso *dso, u8 *build_id)
|
|
|
|
{
|
|
|
|
return memcmp(dso->build_id, build_id, sizeof(dso->build_id)) == 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
void dso__read_running_kernel_build_id(struct dso *dso, struct machine *machine)
|
|
|
|
{
|
|
|
|
char path[PATH_MAX];
|
|
|
|
|
|
|
|
if (machine__is_default_guest(machine))
|
|
|
|
return;
|
|
|
|
sprintf(path, "%s/sys/kernel/notes", machine->root_dir);
|
|
|
|
if (sysfs__read_build_id(path, dso->build_id,
|
|
|
|
sizeof(dso->build_id)) == 0)
|
|
|
|
dso->has_build_id = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
int dso__kernel_module_get_build_id(struct dso *dso,
|
|
|
|
const char *root_dir)
|
|
|
|
{
|
|
|
|
char filename[PATH_MAX];
|
|
|
|
/*
|
|
|
|
* kernel module short names are of the form "[module]" and
|
|
|
|
* we need just "module" here.
|
|
|
|
*/
|
|
|
|
const char *name = dso->short_name + 1;
|
|
|
|
|
|
|
|
snprintf(filename, sizeof(filename),
|
|
|
|
"%s/sys/module/%.*s/notes/.note.gnu.build-id",
|
|
|
|
root_dir, (int)strlen(name) - 1, name);
|
|
|
|
|
|
|
|
if (sysfs__read_build_id(filename, dso->build_id,
|
|
|
|
sizeof(dso->build_id)) == 0)
|
|
|
|
dso->has_build_id = true;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool __dsos__read_build_ids(struct list_head *head, bool with_hits)
|
|
|
|
{
|
|
|
|
bool have_build_id = false;
|
|
|
|
struct dso *pos;
|
|
|
|
|
|
|
|
list_for_each_entry(pos, head, node) {
|
|
|
|
if (with_hits && !pos->hit)
|
|
|
|
continue;
|
|
|
|
if (pos->has_build_id) {
|
|
|
|
have_build_id = true;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
if (filename__read_build_id(pos->long_name, pos->build_id,
|
|
|
|
sizeof(pos->build_id)) > 0) {
|
|
|
|
have_build_id = true;
|
|
|
|
pos->has_build_id = true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return have_build_id;
|
|
|
|
}
|
|
|
|
|
2015-06-02 01:40:01 +07:00
|
|
|
void __dsos__add(struct dsos *dsos, struct dso *dso)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
2014-09-30 03:07:28 +07:00
|
|
|
list_add_tail(&dso->node, &dsos->head);
|
2015-06-02 01:40:01 +07:00
|
|
|
__dso__findlink_by_longname(&dsos->root, dso, NULL);
|
2015-06-02 21:53:26 +07:00
|
|
|
/*
|
|
|
|
* It is now in the linked list, grab a reference, then garbage collect
|
|
|
|
* this when needing memory, by looking at LRU dso instances in the
|
|
|
|
* list with atomic_read(&dso->refcnt) == 1, i.e. no references
|
|
|
|
* anywhere besides the one for the list, do, under a lock for the
|
|
|
|
* list: remove it from the list, then a dso__put(), that probably will
|
|
|
|
* be the last and will then call dso__delete(), end of life.
|
|
|
|
*
|
|
|
|
* That, or at the end of the 'struct machine' lifetime, when all
|
|
|
|
* 'struct dso' instances will be removed from the list, in
|
|
|
|
* dsos__exit(), if they have no other reference from some other data
|
|
|
|
* structure.
|
|
|
|
*
|
|
|
|
* E.g.: after processing a 'perf.data' file and storing references
|
|
|
|
* to objects instantiated while processing events, we will have
|
|
|
|
* references to the 'thread', 'map', 'dso' structs all from 'struct
|
|
|
|
* hist_entry' instances, but we may not need anything not referenced,
|
|
|
|
* so we might as well call machines__exit()/machines__delete() and
|
|
|
|
* garbage collect it.
|
|
|
|
*/
|
|
|
|
dso__get(dso);
|
2015-06-02 01:40:01 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
void dsos__add(struct dsos *dsos, struct dso *dso)
|
|
|
|
{
|
|
|
|
pthread_rwlock_wrlock(&dsos->lock);
|
|
|
|
__dsos__add(dsos, dso);
|
|
|
|
pthread_rwlock_unlock(&dsos->lock);
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
2015-06-02 01:40:01 +07:00
|
|
|
struct dso *__dsos__find(struct dsos *dsos, const char *name, bool cmp_short)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
|
|
|
struct dso *pos;
|
|
|
|
|
perf symbols: Fix vdso list searching
When "perf record" was used on a large machine with a lot of CPUs, the
perf post-processing time (the time after the workload was done until
the perf command itself exited) could take a lot of minutes and even
hours depending on how large the resulting perf.data file was.
While running AIM7 1500-user high_systime workload on a 80-core x86-64
system with a 3.9 kernel (with only the -s -a options used), the
workload itself took about 2 minutes to run and the perf.data file had a
size of 1108.746 MB. However, the post-processing step took more than 10
minutes.
With a gprof-profiled perf binary, the time spent by perf was as
follows:
% cumulative self self total
time seconds seconds calls s/call s/call name
96.90 822.10 822.10 192156 0.00 0.00 dsos__find
0.81 828.96 6.86 172089958 0.00 0.00 rb_next
0.41 832.44 3.48 48539289 0.00 0.00 rb_erase
So 97% (822 seconds) of the time was spent in a single dsos_find()
function. After analyzing the call-graph data below:
-----------------------------------------------
0.00 822.12 192156/192156 map__new [6]
[7] 96.9 0.00 822.12 192156 vdso__dso_findnew [7]
822.10 0.00 192156/192156 dsos__find [8]
0.01 0.00 192156/192156 dsos__add [62]
0.01 0.00 192156/192366 dso__new [61]
0.00 0.00 1/45282525 memdup [31]
0.00 0.00 192156/192230 dso__set_long_name [91]
-----------------------------------------------
822.10 0.00 192156/192156 vdso__dso_findnew [7]
[8] 96.9 822.10 0.00 192156 dsos__find [8]
-----------------------------------------------
It was found that the vdso__dso_findnew() function failed to locate
VDSO__MAP_NAME ("[vdso]") in the dso list and have to insert a new
entry at the end for 192156 times. This problem is due to the fact that
there are 2 types of name in the dso entry - short name and long name.
The initial dso__new() adds "[vdso]" to both the short and long names.
After that, vdso__dso_findnew() modifies the long name to something
like /tmp/perf-vdso.so-NoXkDj. The dsos__find() function only compares
the long name. As a result, the same vdso entry is duplicated many
time in the dso list. This bug increases memory consumption as well
as slows the symbol processing time to a crawl.
To resolve this problem, the dsos__find() function interface was
modified to enable searching either the long name or the short
name. The vdso__dso_findnew() will now search only the short name
while the other call sites search for the long name as before.
With this change, the cpu time of perf was reduced from 848.38s to
15.77s and dsos__find() only accounted for 0.06% of the total time.
0.06 15.73 0.01 192151 0.00 0.00 dsos__find
Signed-off-by: Waiman Long <Waiman.Long@hp.com>
Acked-by: Ingo Molnar <mingo@kernel.org>
Cc: "Chandramouleeswaran, Aswin" <aswin@hp.com>
Cc: "Norton, Scott J" <scott.norton@hp.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Stephane Eranian <eranian@google.com>
Link: http://lkml.kernel.org/r/1368110568-64714-1-git-send-email-Waiman.Long@hp.com
[ replaced TRUE/FALSE with stdbool.h equivalents, fixing builds where
those macros are not present (NO_LIBPYTHON=1 NO_LIBPERL=1), fix from Jiri Olsa ]
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-05-09 21:42:48 +07:00
|
|
|
if (cmp_short) {
|
2014-09-30 03:07:28 +07:00
|
|
|
list_for_each_entry(pos, &dsos->head, node)
|
perf symbols: Fix vdso list searching
When "perf record" was used on a large machine with a lot of CPUs, the
perf post-processing time (the time after the workload was done until
the perf command itself exited) could take a lot of minutes and even
hours depending on how large the resulting perf.data file was.
While running AIM7 1500-user high_systime workload on a 80-core x86-64
system with a 3.9 kernel (with only the -s -a options used), the
workload itself took about 2 minutes to run and the perf.data file had a
size of 1108.746 MB. However, the post-processing step took more than 10
minutes.
With a gprof-profiled perf binary, the time spent by perf was as
follows:
% cumulative self self total
time seconds seconds calls s/call s/call name
96.90 822.10 822.10 192156 0.00 0.00 dsos__find
0.81 828.96 6.86 172089958 0.00 0.00 rb_next
0.41 832.44 3.48 48539289 0.00 0.00 rb_erase
So 97% (822 seconds) of the time was spent in a single dsos_find()
function. After analyzing the call-graph data below:
-----------------------------------------------
0.00 822.12 192156/192156 map__new [6]
[7] 96.9 0.00 822.12 192156 vdso__dso_findnew [7]
822.10 0.00 192156/192156 dsos__find [8]
0.01 0.00 192156/192156 dsos__add [62]
0.01 0.00 192156/192366 dso__new [61]
0.00 0.00 1/45282525 memdup [31]
0.00 0.00 192156/192230 dso__set_long_name [91]
-----------------------------------------------
822.10 0.00 192156/192156 vdso__dso_findnew [7]
[8] 96.9 822.10 0.00 192156 dsos__find [8]
-----------------------------------------------
It was found that the vdso__dso_findnew() function failed to locate
VDSO__MAP_NAME ("[vdso]") in the dso list and have to insert a new
entry at the end for 192156 times. This problem is due to the fact that
there are 2 types of name in the dso entry - short name and long name.
The initial dso__new() adds "[vdso]" to both the short and long names.
After that, vdso__dso_findnew() modifies the long name to something
like /tmp/perf-vdso.so-NoXkDj. The dsos__find() function only compares
the long name. As a result, the same vdso entry is duplicated many
time in the dso list. This bug increases memory consumption as well
as slows the symbol processing time to a crawl.
To resolve this problem, the dsos__find() function interface was
modified to enable searching either the long name or the short
name. The vdso__dso_findnew() will now search only the short name
while the other call sites search for the long name as before.
With this change, the cpu time of perf was reduced from 848.38s to
15.77s and dsos__find() only accounted for 0.06% of the total time.
0.06 15.73 0.01 192151 0.00 0.00 dsos__find
Signed-off-by: Waiman Long <Waiman.Long@hp.com>
Acked-by: Ingo Molnar <mingo@kernel.org>
Cc: "Chandramouleeswaran, Aswin" <aswin@hp.com>
Cc: "Norton, Scott J" <scott.norton@hp.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Stephane Eranian <eranian@google.com>
Link: http://lkml.kernel.org/r/1368110568-64714-1-git-send-email-Waiman.Long@hp.com
[ replaced TRUE/FALSE with stdbool.h equivalents, fixing builds where
those macros are not present (NO_LIBPYTHON=1 NO_LIBPERL=1), fix from Jiri Olsa ]
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-05-09 21:42:48 +07:00
|
|
|
if (strcmp(pos->short_name, name) == 0)
|
|
|
|
return pos;
|
|
|
|
return NULL;
|
|
|
|
}
|
2015-06-02 01:40:01 +07:00
|
|
|
return __dso__find_by_longname(&dsos->root, name);
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
|
2015-06-02 01:40:01 +07:00
|
|
|
struct dso *dsos__find(struct dsos *dsos, const char *name, bool cmp_short)
|
|
|
|
{
|
|
|
|
struct dso *dso;
|
|
|
|
pthread_rwlock_rdlock(&dsos->lock);
|
|
|
|
dso = __dsos__find(dsos, name, cmp_short);
|
|
|
|
pthread_rwlock_unlock(&dsos->lock);
|
|
|
|
return dso;
|
|
|
|
}
|
|
|
|
|
|
|
|
struct dso *__dsos__addnew(struct dsos *dsos, const char *name)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
2015-02-13 04:06:09 +07:00
|
|
|
struct dso *dso = dso__new(name);
|
2012-10-28 04:18:32 +07:00
|
|
|
|
2015-02-13 04:06:09 +07:00
|
|
|
if (dso != NULL) {
|
2015-06-02 01:40:01 +07:00
|
|
|
__dsos__add(dsos, dso);
|
2015-02-13 04:06:09 +07:00
|
|
|
dso__set_basename(dso);
|
2015-11-18 13:40:31 +07:00
|
|
|
/* Put dso here because __dsos_add already got it */
|
|
|
|
dso__put(dso);
|
2012-10-28 04:18:32 +07:00
|
|
|
}
|
|
|
|
return dso;
|
|
|
|
}
|
|
|
|
|
2015-02-13 04:06:09 +07:00
|
|
|
struct dso *__dsos__findnew(struct dsos *dsos, const char *name)
|
|
|
|
{
|
2015-06-02 01:40:01 +07:00
|
|
|
struct dso *dso = __dsos__find(dsos, name, false);
|
|
|
|
|
|
|
|
return dso ? dso : __dsos__addnew(dsos, name);
|
|
|
|
}
|
2015-02-13 04:06:09 +07:00
|
|
|
|
2015-06-02 01:40:01 +07:00
|
|
|
struct dso *dsos__findnew(struct dsos *dsos, const char *name)
|
|
|
|
{
|
|
|
|
struct dso *dso;
|
|
|
|
pthread_rwlock_wrlock(&dsos->lock);
|
2015-06-02 21:53:26 +07:00
|
|
|
dso = dso__get(__dsos__findnew(dsos, name));
|
2015-06-02 01:40:01 +07:00
|
|
|
pthread_rwlock_unlock(&dsos->lock);
|
|
|
|
return dso;
|
2015-02-13 04:06:09 +07:00
|
|
|
}
|
|
|
|
|
2012-10-28 04:18:32 +07:00
|
|
|
size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp,
|
2012-12-07 19:53:58 +07:00
|
|
|
bool (skip)(struct dso *dso, int parm), int parm)
|
2012-10-28 04:18:32 +07:00
|
|
|
{
|
|
|
|
struct dso *pos;
|
|
|
|
size_t ret = 0;
|
|
|
|
|
|
|
|
list_for_each_entry(pos, head, node) {
|
2012-12-07 19:53:58 +07:00
|
|
|
if (skip && skip(pos, parm))
|
2012-10-28 04:18:32 +07:00
|
|
|
continue;
|
|
|
|
ret += dso__fprintf_buildid(pos, fp);
|
|
|
|
ret += fprintf(fp, " %s\n", pos->long_name);
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
size_t __dsos__fprintf(struct list_head *head, FILE *fp)
|
|
|
|
{
|
|
|
|
struct dso *pos;
|
|
|
|
size_t ret = 0;
|
|
|
|
|
|
|
|
list_for_each_entry(pos, head, node) {
|
|
|
|
int i;
|
|
|
|
for (i = 0; i < MAP__NR_TYPES; ++i)
|
|
|
|
ret += dso__fprintf(pos, i, fp);
|
|
|
|
}
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
size_t dso__fprintf_buildid(struct dso *dso, FILE *fp)
|
|
|
|
{
|
|
|
|
char sbuild_id[BUILD_ID_SIZE * 2 + 1];
|
|
|
|
|
|
|
|
build_id__sprintf(dso->build_id, sizeof(dso->build_id), sbuild_id);
|
|
|
|
return fprintf(fp, "%s", sbuild_id);
|
|
|
|
}
|
|
|
|
|
|
|
|
size_t dso__fprintf(struct dso *dso, enum map_type type, FILE *fp)
|
|
|
|
{
|
|
|
|
struct rb_node *nd;
|
|
|
|
size_t ret = fprintf(fp, "dso: %s (", dso->short_name);
|
|
|
|
|
|
|
|
if (dso->short_name != dso->long_name)
|
|
|
|
ret += fprintf(fp, "%s, ", dso->long_name);
|
|
|
|
ret += fprintf(fp, "%s, %sloaded, ", map_type__name[type],
|
2012-11-20 16:51:02 +07:00
|
|
|
dso__loaded(dso, type) ? "" : "NOT ");
|
2012-10-28 04:18:32 +07:00
|
|
|
ret += dso__fprintf_buildid(dso, fp);
|
|
|
|
ret += fprintf(fp, ")\n");
|
|
|
|
for (nd = rb_first(&dso->symbols[type]); nd; nd = rb_next(nd)) {
|
|
|
|
struct symbol *pos = rb_entry(nd, struct symbol, rb_node);
|
|
|
|
ret += symbol__fprintf(pos, fp);
|
|
|
|
}
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
2014-07-22 20:17:59 +07:00
|
|
|
|
|
|
|
enum dso_type dso__type(struct dso *dso, struct machine *machine)
|
|
|
|
{
|
|
|
|
int fd;
|
2015-05-20 23:03:41 +07:00
|
|
|
enum dso_type type = DSO__TYPE_UNKNOWN;
|
2014-07-22 20:17:59 +07:00
|
|
|
|
2015-05-20 23:03:41 +07:00
|
|
|
fd = dso__data_get_fd(dso, machine);
|
|
|
|
if (fd >= 0) {
|
|
|
|
type = dso__type_fd(fd);
|
|
|
|
dso__data_put_fd(dso);
|
|
|
|
}
|
2014-07-22 20:17:59 +07:00
|
|
|
|
2015-05-20 23:03:41 +07:00
|
|
|
return type;
|
2014-07-22 20:17:59 +07:00
|
|
|
}
|
2015-03-24 21:49:02 +07:00
|
|
|
|
|
|
|
int dso__strerror_load(struct dso *dso, char *buf, size_t buflen)
|
|
|
|
{
|
|
|
|
int idx, errnum = dso->load_errno;
|
|
|
|
/*
|
|
|
|
* This must have a same ordering as the enum dso_load_errno.
|
|
|
|
*/
|
|
|
|
static const char *dso_load__error_str[] = {
|
|
|
|
"Internal tools/perf/ library error",
|
|
|
|
"Invalid ELF file",
|
|
|
|
"Can not read build id",
|
|
|
|
"Mismatching build id",
|
|
|
|
"Decompression failure",
|
|
|
|
};
|
|
|
|
|
|
|
|
BUG_ON(buflen == 0);
|
|
|
|
|
|
|
|
if (errnum >= 0) {
|
|
|
|
const char *err = strerror_r(errnum, buf, buflen);
|
|
|
|
|
|
|
|
if (err != buf)
|
|
|
|
scnprintf(buf, buflen, "%s", err);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (errnum < __DSO_LOAD_ERRNO__START || errnum >= __DSO_LOAD_ERRNO__END)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
idx = errnum - __DSO_LOAD_ERRNO__START;
|
|
|
|
scnprintf(buf, buflen, "%s", dso_load__error_str[idx]);
|
|
|
|
return 0;
|
|
|
|
}
|