b843e9c3a2
In order to make libtraceevent into a proper library, variables, data structures and functions require a unique prefix to prevent name space conflicts. That prefix will be "tep_" and not "pevent_". This changes APIs: pevent_register_print_function, pevent_unregister_print_function, pevent_register_event_handler, pevent_unregister_event_handler, pevent_register_function, pevent_register_trace_clock Signed-off-by: Steven Rostedt <rostedt@goodmis.org> Cc: Andrew Morton <akpm@linux-foundation.org> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Yordan Karadzhov (VMware) <y.karadz@gmail.com> Cc: linux-trace-devel@vger.kernel.org Link: http://lkml.kernel.org/r/20180808180702.524813185@goodmis.org Signed-off-by: Tzvetomir Stoyanov (VMware) <tz.stoyanov@gmail.com> Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
522 lines
14 KiB
C
522 lines
14 KiB
C
/*
|
|
* Copyright (C) 2009 Red Hat Inc, Steven Rostedt <srostedt@redhat.com>
|
|
*
|
|
* ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
* This program is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation;
|
|
* version 2.1 of the License (not later!)
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with this program; if not, see <http://www.gnu.org/licenses>
|
|
*
|
|
* ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
*/
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <stdint.h>
|
|
|
|
#include "event-parse.h"
|
|
|
|
#ifdef HAVE_UDIS86
|
|
|
|
#include <udis86.h>
|
|
|
|
static ud_t ud;
|
|
|
|
static void init_disassembler(void)
|
|
{
|
|
ud_init(&ud);
|
|
ud_set_syntax(&ud, UD_SYN_ATT);
|
|
}
|
|
|
|
static const char *disassemble(unsigned char *insn, int len, uint64_t rip,
|
|
int cr0_pe, int eflags_vm,
|
|
int cs_d, int cs_l)
|
|
{
|
|
int mode;
|
|
|
|
if (!cr0_pe)
|
|
mode = 16;
|
|
else if (eflags_vm)
|
|
mode = 16;
|
|
else if (cs_l)
|
|
mode = 64;
|
|
else if (cs_d)
|
|
mode = 32;
|
|
else
|
|
mode = 16;
|
|
|
|
ud_set_pc(&ud, rip);
|
|
ud_set_mode(&ud, mode);
|
|
ud_set_input_buffer(&ud, insn, len);
|
|
ud_disassemble(&ud);
|
|
return ud_insn_asm(&ud);
|
|
}
|
|
|
|
#else
|
|
|
|
static void init_disassembler(void)
|
|
{
|
|
}
|
|
|
|
static const char *disassemble(unsigned char *insn, int len, uint64_t rip,
|
|
int cr0_pe, int eflags_vm,
|
|
int cs_d, int cs_l)
|
|
{
|
|
static char out[15*3+1];
|
|
int i;
|
|
|
|
for (i = 0; i < len; ++i)
|
|
sprintf(out + i * 3, "%02x ", insn[i]);
|
|
out[len*3-1] = '\0';
|
|
return out;
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
#define VMX_EXIT_REASONS \
|
|
_ER(EXCEPTION_NMI, 0) \
|
|
_ER(EXTERNAL_INTERRUPT, 1) \
|
|
_ER(TRIPLE_FAULT, 2) \
|
|
_ER(PENDING_INTERRUPT, 7) \
|
|
_ER(NMI_WINDOW, 8) \
|
|
_ER(TASK_SWITCH, 9) \
|
|
_ER(CPUID, 10) \
|
|
_ER(HLT, 12) \
|
|
_ER(INVD, 13) \
|
|
_ER(INVLPG, 14) \
|
|
_ER(RDPMC, 15) \
|
|
_ER(RDTSC, 16) \
|
|
_ER(VMCALL, 18) \
|
|
_ER(VMCLEAR, 19) \
|
|
_ER(VMLAUNCH, 20) \
|
|
_ER(VMPTRLD, 21) \
|
|
_ER(VMPTRST, 22) \
|
|
_ER(VMREAD, 23) \
|
|
_ER(VMRESUME, 24) \
|
|
_ER(VMWRITE, 25) \
|
|
_ER(VMOFF, 26) \
|
|
_ER(VMON, 27) \
|
|
_ER(CR_ACCESS, 28) \
|
|
_ER(DR_ACCESS, 29) \
|
|
_ER(IO_INSTRUCTION, 30) \
|
|
_ER(MSR_READ, 31) \
|
|
_ER(MSR_WRITE, 32) \
|
|
_ER(MWAIT_INSTRUCTION, 36) \
|
|
_ER(MONITOR_INSTRUCTION, 39) \
|
|
_ER(PAUSE_INSTRUCTION, 40) \
|
|
_ER(MCE_DURING_VMENTRY, 41) \
|
|
_ER(TPR_BELOW_THRESHOLD, 43) \
|
|
_ER(APIC_ACCESS, 44) \
|
|
_ER(EOI_INDUCED, 45) \
|
|
_ER(EPT_VIOLATION, 48) \
|
|
_ER(EPT_MISCONFIG, 49) \
|
|
_ER(INVEPT, 50) \
|
|
_ER(PREEMPTION_TIMER, 52) \
|
|
_ER(WBINVD, 54) \
|
|
_ER(XSETBV, 55) \
|
|
_ER(APIC_WRITE, 56) \
|
|
_ER(INVPCID, 58) \
|
|
_ER(PML_FULL, 62) \
|
|
_ER(XSAVES, 63) \
|
|
_ER(XRSTORS, 64)
|
|
|
|
#define SVM_EXIT_REASONS \
|
|
_ER(EXIT_READ_CR0, 0x000) \
|
|
_ER(EXIT_READ_CR3, 0x003) \
|
|
_ER(EXIT_READ_CR4, 0x004) \
|
|
_ER(EXIT_READ_CR8, 0x008) \
|
|
_ER(EXIT_WRITE_CR0, 0x010) \
|
|
_ER(EXIT_WRITE_CR3, 0x013) \
|
|
_ER(EXIT_WRITE_CR4, 0x014) \
|
|
_ER(EXIT_WRITE_CR8, 0x018) \
|
|
_ER(EXIT_READ_DR0, 0x020) \
|
|
_ER(EXIT_READ_DR1, 0x021) \
|
|
_ER(EXIT_READ_DR2, 0x022) \
|
|
_ER(EXIT_READ_DR3, 0x023) \
|
|
_ER(EXIT_READ_DR4, 0x024) \
|
|
_ER(EXIT_READ_DR5, 0x025) \
|
|
_ER(EXIT_READ_DR6, 0x026) \
|
|
_ER(EXIT_READ_DR7, 0x027) \
|
|
_ER(EXIT_WRITE_DR0, 0x030) \
|
|
_ER(EXIT_WRITE_DR1, 0x031) \
|
|
_ER(EXIT_WRITE_DR2, 0x032) \
|
|
_ER(EXIT_WRITE_DR3, 0x033) \
|
|
_ER(EXIT_WRITE_DR4, 0x034) \
|
|
_ER(EXIT_WRITE_DR5, 0x035) \
|
|
_ER(EXIT_WRITE_DR6, 0x036) \
|
|
_ER(EXIT_WRITE_DR7, 0x037) \
|
|
_ER(EXIT_EXCP_BASE, 0x040) \
|
|
_ER(EXIT_INTR, 0x060) \
|
|
_ER(EXIT_NMI, 0x061) \
|
|
_ER(EXIT_SMI, 0x062) \
|
|
_ER(EXIT_INIT, 0x063) \
|
|
_ER(EXIT_VINTR, 0x064) \
|
|
_ER(EXIT_CR0_SEL_WRITE, 0x065) \
|
|
_ER(EXIT_IDTR_READ, 0x066) \
|
|
_ER(EXIT_GDTR_READ, 0x067) \
|
|
_ER(EXIT_LDTR_READ, 0x068) \
|
|
_ER(EXIT_TR_READ, 0x069) \
|
|
_ER(EXIT_IDTR_WRITE, 0x06a) \
|
|
_ER(EXIT_GDTR_WRITE, 0x06b) \
|
|
_ER(EXIT_LDTR_WRITE, 0x06c) \
|
|
_ER(EXIT_TR_WRITE, 0x06d) \
|
|
_ER(EXIT_RDTSC, 0x06e) \
|
|
_ER(EXIT_RDPMC, 0x06f) \
|
|
_ER(EXIT_PUSHF, 0x070) \
|
|
_ER(EXIT_POPF, 0x071) \
|
|
_ER(EXIT_CPUID, 0x072) \
|
|
_ER(EXIT_RSM, 0x073) \
|
|
_ER(EXIT_IRET, 0x074) \
|
|
_ER(EXIT_SWINT, 0x075) \
|
|
_ER(EXIT_INVD, 0x076) \
|
|
_ER(EXIT_PAUSE, 0x077) \
|
|
_ER(EXIT_HLT, 0x078) \
|
|
_ER(EXIT_INVLPG, 0x079) \
|
|
_ER(EXIT_INVLPGA, 0x07a) \
|
|
_ER(EXIT_IOIO, 0x07b) \
|
|
_ER(EXIT_MSR, 0x07c) \
|
|
_ER(EXIT_TASK_SWITCH, 0x07d) \
|
|
_ER(EXIT_FERR_FREEZE, 0x07e) \
|
|
_ER(EXIT_SHUTDOWN, 0x07f) \
|
|
_ER(EXIT_VMRUN, 0x080) \
|
|
_ER(EXIT_VMMCALL, 0x081) \
|
|
_ER(EXIT_VMLOAD, 0x082) \
|
|
_ER(EXIT_VMSAVE, 0x083) \
|
|
_ER(EXIT_STGI, 0x084) \
|
|
_ER(EXIT_CLGI, 0x085) \
|
|
_ER(EXIT_SKINIT, 0x086) \
|
|
_ER(EXIT_RDTSCP, 0x087) \
|
|
_ER(EXIT_ICEBP, 0x088) \
|
|
_ER(EXIT_WBINVD, 0x089) \
|
|
_ER(EXIT_MONITOR, 0x08a) \
|
|
_ER(EXIT_MWAIT, 0x08b) \
|
|
_ER(EXIT_MWAIT_COND, 0x08c) \
|
|
_ER(EXIT_NPF, 0x400) \
|
|
_ER(EXIT_ERR, -1)
|
|
|
|
#define _ER(reason, val) { #reason, val },
|
|
struct str_values {
|
|
const char *str;
|
|
int val;
|
|
};
|
|
|
|
static struct str_values vmx_exit_reasons[] = {
|
|
VMX_EXIT_REASONS
|
|
{ NULL, -1}
|
|
};
|
|
|
|
static struct str_values svm_exit_reasons[] = {
|
|
SVM_EXIT_REASONS
|
|
{ NULL, -1}
|
|
};
|
|
|
|
static struct isa_exit_reasons {
|
|
unsigned isa;
|
|
struct str_values *strings;
|
|
} isa_exit_reasons[] = {
|
|
{ .isa = 1, .strings = vmx_exit_reasons },
|
|
{ .isa = 2, .strings = svm_exit_reasons },
|
|
{ }
|
|
};
|
|
|
|
static const char *find_exit_reason(unsigned isa, int val)
|
|
{
|
|
struct str_values *strings = NULL;
|
|
int i;
|
|
|
|
for (i = 0; isa_exit_reasons[i].strings; ++i)
|
|
if (isa_exit_reasons[i].isa == isa) {
|
|
strings = isa_exit_reasons[i].strings;
|
|
break;
|
|
}
|
|
if (!strings)
|
|
return "UNKNOWN-ISA";
|
|
for (i = 0; strings[i].val >= 0; i++)
|
|
if (strings[i].val == val)
|
|
break;
|
|
|
|
return strings[i].str;
|
|
}
|
|
|
|
static int print_exit_reason(struct trace_seq *s, struct tep_record *record,
|
|
struct event_format *event, const char *field)
|
|
{
|
|
unsigned long long isa;
|
|
unsigned long long val;
|
|
const char *reason;
|
|
|
|
if (pevent_get_field_val(s, event, field, record, &val, 1) < 0)
|
|
return -1;
|
|
|
|
if (pevent_get_field_val(s, event, "isa", record, &isa, 0) < 0)
|
|
isa = 1;
|
|
|
|
reason = find_exit_reason(isa, val);
|
|
if (reason)
|
|
trace_seq_printf(s, "reason %s", reason);
|
|
else
|
|
trace_seq_printf(s, "reason UNKNOWN (%llu)", val);
|
|
return 0;
|
|
}
|
|
|
|
static int kvm_exit_handler(struct trace_seq *s, struct tep_record *record,
|
|
struct event_format *event, void *context)
|
|
{
|
|
unsigned long long info1 = 0, info2 = 0;
|
|
|
|
if (print_exit_reason(s, record, event, "exit_reason") < 0)
|
|
return -1;
|
|
|
|
tep_print_num_field(s, " rip 0x%lx", event, "guest_rip", record, 1);
|
|
|
|
if (pevent_get_field_val(s, event, "info1", record, &info1, 0) >= 0
|
|
&& pevent_get_field_val(s, event, "info2", record, &info2, 0) >= 0)
|
|
trace_seq_printf(s, " info %llx %llx", info1, info2);
|
|
|
|
return 0;
|
|
}
|
|
|
|
#define KVM_EMUL_INSN_F_CR0_PE (1 << 0)
|
|
#define KVM_EMUL_INSN_F_EFL_VM (1 << 1)
|
|
#define KVM_EMUL_INSN_F_CS_D (1 << 2)
|
|
#define KVM_EMUL_INSN_F_CS_L (1 << 3)
|
|
|
|
static int kvm_emulate_insn_handler(struct trace_seq *s,
|
|
struct tep_record *record,
|
|
struct event_format *event, void *context)
|
|
{
|
|
unsigned long long rip, csbase, len, flags, failed;
|
|
int llen;
|
|
uint8_t *insn;
|
|
const char *disasm;
|
|
|
|
if (pevent_get_field_val(s, event, "rip", record, &rip, 1) < 0)
|
|
return -1;
|
|
|
|
if (pevent_get_field_val(s, event, "csbase", record, &csbase, 1) < 0)
|
|
return -1;
|
|
|
|
if (pevent_get_field_val(s, event, "len", record, &len, 1) < 0)
|
|
return -1;
|
|
|
|
if (pevent_get_field_val(s, event, "flags", record, &flags, 1) < 0)
|
|
return -1;
|
|
|
|
if (pevent_get_field_val(s, event, "failed", record, &failed, 1) < 0)
|
|
return -1;
|
|
|
|
insn = pevent_get_field_raw(s, event, "insn", record, &llen, 1);
|
|
if (!insn)
|
|
return -1;
|
|
|
|
disasm = disassemble(insn, len, rip,
|
|
flags & KVM_EMUL_INSN_F_CR0_PE,
|
|
flags & KVM_EMUL_INSN_F_EFL_VM,
|
|
flags & KVM_EMUL_INSN_F_CS_D,
|
|
flags & KVM_EMUL_INSN_F_CS_L);
|
|
|
|
trace_seq_printf(s, "%llx:%llx: %s%s", csbase, rip, disasm,
|
|
failed ? " FAIL" : "");
|
|
return 0;
|
|
}
|
|
|
|
|
|
static int kvm_nested_vmexit_inject_handler(struct trace_seq *s, struct tep_record *record,
|
|
struct event_format *event, void *context)
|
|
{
|
|
if (print_exit_reason(s, record, event, "exit_code") < 0)
|
|
return -1;
|
|
|
|
tep_print_num_field(s, " info1 %llx", event, "exit_info1", record, 1);
|
|
tep_print_num_field(s, " info2 %llx", event, "exit_info2", record, 1);
|
|
tep_print_num_field(s, " int_info %llx", event, "exit_int_info", record, 1);
|
|
tep_print_num_field(s, " int_info_err %llx", event, "exit_int_info_err", record, 1);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int kvm_nested_vmexit_handler(struct trace_seq *s, struct tep_record *record,
|
|
struct event_format *event, void *context)
|
|
{
|
|
tep_print_num_field(s, "rip %llx ", event, "rip", record, 1);
|
|
|
|
return kvm_nested_vmexit_inject_handler(s, record, event, context);
|
|
}
|
|
|
|
union kvm_mmu_page_role {
|
|
unsigned word;
|
|
struct {
|
|
unsigned level:4;
|
|
unsigned cr4_pae:1;
|
|
unsigned quadrant:2;
|
|
unsigned direct:1;
|
|
unsigned access:3;
|
|
unsigned invalid:1;
|
|
unsigned nxe:1;
|
|
unsigned cr0_wp:1;
|
|
unsigned smep_and_not_wp:1;
|
|
unsigned smap_and_not_wp:1;
|
|
unsigned pad_for_nice_hex_output:8;
|
|
unsigned smm:8;
|
|
};
|
|
};
|
|
|
|
static int kvm_mmu_print_role(struct trace_seq *s, struct tep_record *record,
|
|
struct event_format *event, void *context)
|
|
{
|
|
unsigned long long val;
|
|
static const char *access_str[] = {
|
|
"---", "--x", "w--", "w-x", "-u-", "-ux", "wu-", "wux"
|
|
};
|
|
union kvm_mmu_page_role role;
|
|
|
|
if (pevent_get_field_val(s, event, "role", record, &val, 1) < 0)
|
|
return -1;
|
|
|
|
role.word = (int)val;
|
|
|
|
/*
|
|
* We can only use the structure if file is of the same
|
|
* endianess.
|
|
*/
|
|
if (pevent_is_file_bigendian(event->pevent) ==
|
|
pevent_is_host_bigendian(event->pevent)) {
|
|
|
|
trace_seq_printf(s, "%u q%u%s %s%s %spae %snxe %swp%s%s%s",
|
|
role.level,
|
|
role.quadrant,
|
|
role.direct ? " direct" : "",
|
|
access_str[role.access],
|
|
role.invalid ? " invalid" : "",
|
|
role.cr4_pae ? "" : "!",
|
|
role.nxe ? "" : "!",
|
|
role.cr0_wp ? "" : "!",
|
|
role.smep_and_not_wp ? " smep" : "",
|
|
role.smap_and_not_wp ? " smap" : "",
|
|
role.smm ? " smm" : "");
|
|
} else
|
|
trace_seq_printf(s, "WORD: %08x", role.word);
|
|
|
|
tep_print_num_field(s, " root %u ", event,
|
|
"root_count", record, 1);
|
|
|
|
if (pevent_get_field_val(s, event, "unsync", record, &val, 1) < 0)
|
|
return -1;
|
|
|
|
trace_seq_printf(s, "%s%c", val ? "unsync" : "sync", 0);
|
|
return 0;
|
|
}
|
|
|
|
static int kvm_mmu_get_page_handler(struct trace_seq *s,
|
|
struct tep_record *record,
|
|
struct event_format *event, void *context)
|
|
{
|
|
unsigned long long val;
|
|
|
|
if (pevent_get_field_val(s, event, "created", record, &val, 1) < 0)
|
|
return -1;
|
|
|
|
trace_seq_printf(s, "%s ", val ? "new" : "existing");
|
|
|
|
if (pevent_get_field_val(s, event, "gfn", record, &val, 1) < 0)
|
|
return -1;
|
|
|
|
trace_seq_printf(s, "sp gfn %llx ", val);
|
|
return kvm_mmu_print_role(s, record, event, context);
|
|
}
|
|
|
|
#define PT_WRITABLE_SHIFT 1
|
|
#define PT_WRITABLE_MASK (1ULL << PT_WRITABLE_SHIFT)
|
|
|
|
static unsigned long long
|
|
process_is_writable_pte(struct trace_seq *s, unsigned long long *args)
|
|
{
|
|
unsigned long pte = args[0];
|
|
return pte & PT_WRITABLE_MASK;
|
|
}
|
|
|
|
int TEP_PLUGIN_LOADER(struct tep_handle *pevent)
|
|
{
|
|
init_disassembler();
|
|
|
|
tep_register_event_handler(pevent, -1, "kvm", "kvm_exit",
|
|
kvm_exit_handler, NULL);
|
|
|
|
tep_register_event_handler(pevent, -1, "kvm", "kvm_emulate_insn",
|
|
kvm_emulate_insn_handler, NULL);
|
|
|
|
tep_register_event_handler(pevent, -1, "kvm", "kvm_nested_vmexit",
|
|
kvm_nested_vmexit_handler, NULL);
|
|
|
|
tep_register_event_handler(pevent, -1, "kvm", "kvm_nested_vmexit_inject",
|
|
kvm_nested_vmexit_inject_handler, NULL);
|
|
|
|
tep_register_event_handler(pevent, -1, "kvmmmu", "kvm_mmu_get_page",
|
|
kvm_mmu_get_page_handler, NULL);
|
|
|
|
tep_register_event_handler(pevent, -1, "kvmmmu", "kvm_mmu_sync_page",
|
|
kvm_mmu_print_role, NULL);
|
|
|
|
tep_register_event_handler(pevent, -1,
|
|
"kvmmmu", "kvm_mmu_unsync_page",
|
|
kvm_mmu_print_role, NULL);
|
|
|
|
tep_register_event_handler(pevent, -1, "kvmmmu", "kvm_mmu_zap_page",
|
|
kvm_mmu_print_role, NULL);
|
|
|
|
tep_register_event_handler(pevent, -1, "kvmmmu",
|
|
"kvm_mmu_prepare_zap_page", kvm_mmu_print_role,
|
|
NULL);
|
|
|
|
tep_register_print_function(pevent,
|
|
process_is_writable_pte,
|
|
TEP_FUNC_ARG_INT,
|
|
"is_writable_pte",
|
|
TEP_FUNC_ARG_LONG,
|
|
TEP_FUNC_ARG_VOID);
|
|
return 0;
|
|
}
|
|
|
|
void TEP_PLUGIN_UNLOADER(struct tep_handle *pevent)
|
|
{
|
|
tep_unregister_event_handler(pevent, -1, "kvm", "kvm_exit",
|
|
kvm_exit_handler, NULL);
|
|
|
|
tep_unregister_event_handler(pevent, -1, "kvm", "kvm_emulate_insn",
|
|
kvm_emulate_insn_handler, NULL);
|
|
|
|
tep_unregister_event_handler(pevent, -1, "kvm", "kvm_nested_vmexit",
|
|
kvm_nested_vmexit_handler, NULL);
|
|
|
|
tep_unregister_event_handler(pevent, -1, "kvm", "kvm_nested_vmexit_inject",
|
|
kvm_nested_vmexit_inject_handler, NULL);
|
|
|
|
tep_unregister_event_handler(pevent, -1, "kvmmmu", "kvm_mmu_get_page",
|
|
kvm_mmu_get_page_handler, NULL);
|
|
|
|
tep_unregister_event_handler(pevent, -1, "kvmmmu", "kvm_mmu_sync_page",
|
|
kvm_mmu_print_role, NULL);
|
|
|
|
tep_unregister_event_handler(pevent, -1,
|
|
"kvmmmu", "kvm_mmu_unsync_page",
|
|
kvm_mmu_print_role, NULL);
|
|
|
|
tep_unregister_event_handler(pevent, -1, "kvmmmu", "kvm_mmu_zap_page",
|
|
kvm_mmu_print_role, NULL);
|
|
|
|
tep_unregister_event_handler(pevent, -1, "kvmmmu",
|
|
"kvm_mmu_prepare_zap_page", kvm_mmu_print_role,
|
|
NULL);
|
|
|
|
tep_unregister_print_function(pevent, process_is_writable_pte,
|
|
"is_writable_pte");
|
|
}
|