mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2025-01-15 07:06:28 +07:00
61f63e3837
New features: - Add 'brstackinsn' field in 'perf script' to reuse the x86 instruction decoder used in the Intel PT code to study hot paths to samples (Andi Kleen) Kernel: - Default UPROBES_EVENTS to Y (Alexei Starovoitov) - Fix check for kretprobe offset within function entry (Naveen N. Rao) Infrastructure: - Introduce util func is_sdt_event() (Ravi Bangoria) - Make perf_event__synthesize_mmap_events() scale on older kernels where reading /proc/pid/maps is way slower than reading /proc/pid/task/pid/maps (Stephane Eranian) Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com> -----BEGIN PGP SIGNATURE----- Version: GnuPG v2 iQIcBAABCAAGBQJYyrdSAAoJENZQFvNTUqpAe+4P/3c4ilBSOxLCCxGO7jDYo9oq /KqlvsCIg7+vo5eqrOUJAb4qXFnvpYxwjMMkL5rx7gdsBCRfRXIINGWUMrq5mNyk MgxuqYnp+yRuxLYml2wn+tdwLzcHWSN2EO9mqQ14N4I+HvgdLmVPQ44ACQXs6KfL dk/Ix8YtnFWl2sDZjvyr7ZBqwCPzzklZgHM6erxNUr/WJspzUiixAWqUmewodOUl P3PitlHXkITOK3AxSqOjJ4g1k933215nGih7hr0XdjEm4pIYaYksShQ6k9DASCrv dn2o1pF1LTu7KCtAo70aaSB7GXydwoA//o2gRbDkSwJJ25DIImZxJXQz9PAYDOo1 vXSIhmlQ72c4/Yv/XzVOrIoMMMpmWKS3lGZxMVGR/Ie9Gw4kbotkaoEqEpNQsaDZ iIaU5v/EcvvToT7T7VHrGg0+vmHgYxm5gSlyASi2IrO2/wJAs0v2pYfuL6gYhXGp mhv/pHUv4l9OW+Ubm+zJEEcg337c2RQU5wT/bk4PihxY6nQyEH2Pn5VzdNbZLuMR eWnqTH/md+8/bkhmuZJp71wm60oPHoPvbDjvtfVmXAa52AzO+NWSc9Veke3C/QRm XgNkrXlzeKopEso3j4gw2iAolqw9t8FHFLGgbTkS+6UCKjAM7vNLiIV02LQqhM50 qCnKEusMDCRgzeOXxYt+ =Bg5M -----END PGP SIGNATURE----- Merge tag 'perf-core-for-mingo-4.12-20170316' of git://git.kernel.org/pub/scm/linux/kernel/git/acme/linux into perf/core Pull perf/core improvements and fixes from Arnaldo Carvalho de Melo: New features: - Add 'brstackinsn' field in 'perf script' to reuse the x86 instruction decoder used in the Intel PT code to study hot paths to samples (Andi Kleen) Kernel changes: - Default UPROBES_EVENTS to Y (Alexei Starovoitov) - Fix check for kretprobe offset within function entry (Naveen N. 
Rao) Infrastructure changes: - Introduce util func is_sdt_event() (Ravi Bangoria) - Make perf_event__synthesize_mmap_events() scale on older kernels where reading /proc/pid/maps is way slower than reading /proc/pid/task/pid/maps (Stephane Eranian) Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com> Signed-off-by: Ingo Molnar <mingo@kernel.org>
275 lines
6.6 KiB
C
275 lines
6.6 KiB
C
/*
|
|
* intel_pt_insn_decoder.c: Intel Processor Trace support
|
|
* Copyright (c) 2013-2014, Intel Corporation.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify it
|
|
* under the terms and conditions of the GNU General Public License,
|
|
* version 2, as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
* more details.
|
|
*
|
|
*/
|
|
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#include <endian.h>
|
|
#include <byteswap.h>
|
|
|
|
#include "event.h"
|
|
|
|
#include "insn.h"
|
|
|
|
#include "inat.c"
|
|
#include "insn.c"
|
|
|
|
#include "intel-pt-insn-decoder.h"
|
|
#include "dump-insn.h"
|
|
|
|
/*
 * Build-time sanity checks on the instruction buffer size:
 * INTEL_PT_INSN_BUF_SZ must not be smaller than MAX_INSN_SIZE and must not
 * be larger than MAX_INSN. The two conditions are checked separately so
 * that the diagnostic names the bound that was actually violated.
 */
#if INTEL_PT_INSN_BUF_SZ < MAX_INSN_SIZE
#error Instruction buffer size too small
#endif
#if INTEL_PT_INSN_BUF_SZ > MAX_INSN
#error Instruction buffer size too large
#endif
|
|
|
|
/* Based on branch_type() from arch/x86/events/intel/lbr.c */
|
|
static void intel_pt_insn_decoder(struct insn *insn,
|
|
struct intel_pt_insn *intel_pt_insn)
|
|
{
|
|
enum intel_pt_insn_op op = INTEL_PT_OP_OTHER;
|
|
enum intel_pt_insn_branch branch = INTEL_PT_BR_NO_BRANCH;
|
|
int ext;
|
|
|
|
intel_pt_insn->rel = 0;
|
|
|
|
if (insn_is_avx(insn)) {
|
|
intel_pt_insn->op = INTEL_PT_OP_OTHER;
|
|
intel_pt_insn->branch = INTEL_PT_BR_NO_BRANCH;
|
|
intel_pt_insn->length = insn->length;
|
|
return;
|
|
}
|
|
|
|
switch (insn->opcode.bytes[0]) {
|
|
case 0xf:
|
|
switch (insn->opcode.bytes[1]) {
|
|
case 0x05: /* syscall */
|
|
case 0x34: /* sysenter */
|
|
op = INTEL_PT_OP_SYSCALL;
|
|
branch = INTEL_PT_BR_INDIRECT;
|
|
break;
|
|
case 0x07: /* sysret */
|
|
case 0x35: /* sysexit */
|
|
op = INTEL_PT_OP_SYSRET;
|
|
branch = INTEL_PT_BR_INDIRECT;
|
|
break;
|
|
case 0x80 ... 0x8f: /* jcc */
|
|
op = INTEL_PT_OP_JCC;
|
|
branch = INTEL_PT_BR_CONDITIONAL;
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
break;
|
|
case 0x70 ... 0x7f: /* jcc */
|
|
op = INTEL_PT_OP_JCC;
|
|
branch = INTEL_PT_BR_CONDITIONAL;
|
|
break;
|
|
case 0xc2: /* near ret */
|
|
case 0xc3: /* near ret */
|
|
case 0xca: /* far ret */
|
|
case 0xcb: /* far ret */
|
|
op = INTEL_PT_OP_RET;
|
|
branch = INTEL_PT_BR_INDIRECT;
|
|
break;
|
|
case 0xcf: /* iret */
|
|
op = INTEL_PT_OP_IRET;
|
|
branch = INTEL_PT_BR_INDIRECT;
|
|
break;
|
|
case 0xcc ... 0xce: /* int */
|
|
op = INTEL_PT_OP_INT;
|
|
branch = INTEL_PT_BR_INDIRECT;
|
|
break;
|
|
case 0xe8: /* call near rel */
|
|
op = INTEL_PT_OP_CALL;
|
|
branch = INTEL_PT_BR_UNCONDITIONAL;
|
|
break;
|
|
case 0x9a: /* call far absolute */
|
|
op = INTEL_PT_OP_CALL;
|
|
branch = INTEL_PT_BR_INDIRECT;
|
|
break;
|
|
case 0xe0 ... 0xe2: /* loop */
|
|
op = INTEL_PT_OP_LOOP;
|
|
branch = INTEL_PT_BR_CONDITIONAL;
|
|
break;
|
|
case 0xe3: /* jcc */
|
|
op = INTEL_PT_OP_JCC;
|
|
branch = INTEL_PT_BR_CONDITIONAL;
|
|
break;
|
|
case 0xe9: /* jmp */
|
|
case 0xeb: /* jmp */
|
|
op = INTEL_PT_OP_JMP;
|
|
branch = INTEL_PT_BR_UNCONDITIONAL;
|
|
break;
|
|
case 0xea: /* far jmp */
|
|
op = INTEL_PT_OP_JMP;
|
|
branch = INTEL_PT_BR_INDIRECT;
|
|
break;
|
|
case 0xff: /* call near absolute, call far absolute ind */
|
|
ext = (insn->modrm.bytes[0] >> 3) & 0x7;
|
|
switch (ext) {
|
|
case 2: /* near ind call */
|
|
case 3: /* far ind call */
|
|
op = INTEL_PT_OP_CALL;
|
|
branch = INTEL_PT_BR_INDIRECT;
|
|
break;
|
|
case 4:
|
|
case 5:
|
|
op = INTEL_PT_OP_JMP;
|
|
branch = INTEL_PT_BR_INDIRECT;
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
intel_pt_insn->op = op;
|
|
intel_pt_insn->branch = branch;
|
|
intel_pt_insn->length = insn->length;
|
|
|
|
if (branch == INTEL_PT_BR_CONDITIONAL ||
|
|
branch == INTEL_PT_BR_UNCONDITIONAL) {
|
|
#if __BYTE_ORDER == __BIG_ENDIAN
|
|
switch (insn->immediate.nbytes) {
|
|
case 1:
|
|
intel_pt_insn->rel = insn->immediate.value;
|
|
break;
|
|
case 2:
|
|
intel_pt_insn->rel =
|
|
bswap_16((short)insn->immediate.value);
|
|
break;
|
|
case 4:
|
|
intel_pt_insn->rel = bswap_32(insn->immediate.value);
|
|
break;
|
|
default:
|
|
intel_pt_insn->rel = 0;
|
|
break;
|
|
}
|
|
#else
|
|
intel_pt_insn->rel = insn->immediate.value;
|
|
#endif
|
|
}
|
|
}
|
|
|
|
int intel_pt_get_insn(const unsigned char *buf, size_t len, int x86_64,
|
|
struct intel_pt_insn *intel_pt_insn)
|
|
{
|
|
struct insn insn;
|
|
|
|
insn_init(&insn, buf, len, x86_64);
|
|
insn_get_length(&insn);
|
|
if (!insn_complete(&insn) || insn.length > len)
|
|
return -1;
|
|
intel_pt_insn_decoder(&insn, intel_pt_insn);
|
|
if (insn.length < INTEL_PT_INSN_BUF_SZ)
|
|
memcpy(intel_pt_insn->buf, buf, insn.length);
|
|
else
|
|
memcpy(intel_pt_insn->buf, buf, INTEL_PT_INSN_BUF_SZ);
|
|
return 0;
|
|
}
|
|
|
|
/*
 * Format the raw bytes of one instruction as hexadecimal text.
 *
 * @x:     supplies the decode mode (x->is64bit) and the output buffer
 *         (x->out)
 * @ip:    unused
 * @inbuf: bytes to decode
 * @inlen: number of bytes available at @inbuf
 * @lenp:  if not NULL, receives the decoded instruction length on success;
 *         it is left untouched on failure
 *
 * Returns x->out containing "insn: " followed by every instruction byte as
 * two hex digits and a space, or the literal "<bad>" when the bytes do not
 * decode to a complete instruction that fits within @inlen.
 */
const char *dump_insn(struct perf_insn *x, uint64_t ip __maybe_unused,
		      u8 *inbuf, int inlen, int *lenp)
{
	struct insn insn;
	const size_t size = sizeof(x->out);
	size_t pos;
	int n, i;

	insn_init(&insn, inbuf, inlen, x->is64bit);
	insn_get_length(&insn);
	if (!insn_complete(&insn) || insn.length > inlen)
		return "<bad>";
	if (lenp)
		*lenp = insn.length;

	n = snprintf(x->out, size, "insn: ");
	pos = n > 0 ? (size_t)n : 0;

	/*
	 * Track the write position and always hand snprintf() the space that
	 * is really left. Subtracting a running total from the remaining
	 * size on every iteration would shrink it far too quickly and
	 * eventually turn it negative, i.e. into a huge unsigned bound.
	 * Stop as soon as the buffer is full (snprintf() reports the length
	 * it would have written, so pos can reach or pass size on
	 * truncation).
	 */
	for (i = 0; i < insn.length && pos < size; i++) {
		n = snprintf(x->out + pos, size - pos, "%02x ", inbuf[i]);
		if (n < 0)
			break;
		pos += (size_t)n;
	}
	return x->out;
}
|
|
|
|
const char *branch_name[] = {
|
|
[INTEL_PT_OP_OTHER] = "Other",
|
|
[INTEL_PT_OP_CALL] = "Call",
|
|
[INTEL_PT_OP_RET] = "Ret",
|
|
[INTEL_PT_OP_JCC] = "Jcc",
|
|
[INTEL_PT_OP_JMP] = "Jmp",
|
|
[INTEL_PT_OP_LOOP] = "Loop",
|
|
[INTEL_PT_OP_IRET] = "IRet",
|
|
[INTEL_PT_OP_INT] = "Int",
|
|
[INTEL_PT_OP_SYSCALL] = "Syscall",
|
|
[INTEL_PT_OP_SYSRET] = "Sysret",
|
|
};
|
|
|
|
const char *intel_pt_insn_name(enum intel_pt_insn_op op)
|
|
{
|
|
return branch_name[op];
|
|
}
|
|
|
|
int intel_pt_insn_desc(const struct intel_pt_insn *intel_pt_insn, char *buf,
|
|
size_t buf_len)
|
|
{
|
|
switch (intel_pt_insn->branch) {
|
|
case INTEL_PT_BR_CONDITIONAL:
|
|
case INTEL_PT_BR_UNCONDITIONAL:
|
|
return snprintf(buf, buf_len, "%s %s%d",
|
|
intel_pt_insn_name(intel_pt_insn->op),
|
|
intel_pt_insn->rel > 0 ? "+" : "",
|
|
intel_pt_insn->rel);
|
|
case INTEL_PT_BR_NO_BRANCH:
|
|
case INTEL_PT_BR_INDIRECT:
|
|
return snprintf(buf, buf_len, "%s",
|
|
intel_pt_insn_name(intel_pt_insn->op));
|
|
default:
|
|
break;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
int intel_pt_insn_type(enum intel_pt_insn_op op)
|
|
{
|
|
switch (op) {
|
|
case INTEL_PT_OP_OTHER:
|
|
return 0;
|
|
case INTEL_PT_OP_CALL:
|
|
return PERF_IP_FLAG_BRANCH | PERF_IP_FLAG_CALL;
|
|
case INTEL_PT_OP_RET:
|
|
return PERF_IP_FLAG_BRANCH | PERF_IP_FLAG_RETURN;
|
|
case INTEL_PT_OP_JCC:
|
|
return PERF_IP_FLAG_BRANCH | PERF_IP_FLAG_CONDITIONAL;
|
|
case INTEL_PT_OP_JMP:
|
|
return PERF_IP_FLAG_BRANCH;
|
|
case INTEL_PT_OP_LOOP:
|
|
return PERF_IP_FLAG_BRANCH | PERF_IP_FLAG_CONDITIONAL;
|
|
case INTEL_PT_OP_IRET:
|
|
return PERF_IP_FLAG_BRANCH | PERF_IP_FLAG_RETURN |
|
|
PERF_IP_FLAG_INTERRUPT;
|
|
case INTEL_PT_OP_INT:
|
|
return PERF_IP_FLAG_BRANCH | PERF_IP_FLAG_CALL |
|
|
PERF_IP_FLAG_INTERRUPT;
|
|
case INTEL_PT_OP_SYSCALL:
|
|
return PERF_IP_FLAG_BRANCH | PERF_IP_FLAG_CALL |
|
|
PERF_IP_FLAG_SYSCALLRET;
|
|
case INTEL_PT_OP_SYSRET:
|
|
return PERF_IP_FLAG_BRANCH | PERF_IP_FLAG_RETURN |
|
|
PERF_IP_FLAG_SYSCALLRET;
|
|
default:
|
|
return 0;
|
|
}
|
|
}
|