torvalds/linux

View on GitHub
tools/perf/scripts/python/intel-pt-events.py

Summary

Maintainability
F
5 days
Test Coverage
# SPDX-License-Identifier: GPL-2.0
# intel-pt-events.py: Print Intel PT Events including Power Events and PTWRITE
# Copyright (c) 2017-2021, Intel Corporation.
#
# This program is free software; you can redistribute it and/or modify it
# under the terms and conditions of the GNU General Public License,
# version 2, as published by the Free Software Foundation.
#
# This program is distributed in the hope it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
# more details.

from __future__ import division, print_function

import io
import os
import sys
import struct
import argparse
import contextlib

from libxed import LibXED
from ctypes import create_string_buffer, addressof

sys.path.append(os.environ['PERF_EXEC_PATH'] + \
    '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')

from perf_trace_context import perf_set_itrace_options, \
    perf_sample_insn, perf_sample_srccode

try:
    broken_pipe_exception = BrokenPipeError
except:
    broken_pipe_exception = IOError

glb_switch_str        = {}
glb_insn        = False
glb_disassembler    = None
glb_src            = False
glb_source_file_name    = None
glb_line_number        = None
glb_dso            = None
glb_stash_dict        = {}
glb_output        = None
glb_output_pos        = 0
glb_cpu            = -1
glb_time        = 0

def get_optional_null(perf_dict, field):
    if field in perf_dict:
        return perf_dict[field]
    return ""

def get_optional_zero(perf_dict, field):
    if field in perf_dict:
        return perf_dict[field]
    return 0

def get_optional_bytes(perf_dict, field):
    if field in perf_dict:
        return perf_dict[field]
    return bytes()

def get_optional(perf_dict, field):
    if field in perf_dict:
        return perf_dict[field]
    return "[unknown]"

def get_offset(perf_dict, field):
    if field in perf_dict:
        return "+%#x" % perf_dict[field]
    return ""

def trace_begin():
    ap = argparse.ArgumentParser(usage = "", add_help = False)
    ap.add_argument("--insn-trace", action='store_true')
    ap.add_argument("--src-trace", action='store_true')
    ap.add_argument("--all-switch-events", action='store_true')
    ap.add_argument("--interleave", type=int, nargs='?', const=4, default=0)
    global glb_args
    global glb_insn
    global glb_src
    glb_args = ap.parse_args()
    if glb_args.insn_trace:
        print("Intel PT Instruction Trace")
        itrace = "i0nsepwxI"
        glb_insn = True
    elif glb_args.src_trace:
        print("Intel PT Source Trace")
        itrace = "i0nsepwxI"
        glb_insn = True
        glb_src = True
    else:
        print("Intel PT Branch Trace, Power Events, Event Trace and PTWRITE")
        itrace = "bepwxI"
    global glb_disassembler
    try:
        glb_disassembler = LibXED()
    except:
        glb_disassembler = None
    perf_set_itrace_options(perf_script_context, itrace)

def trace_end():
    if glb_args.interleave:
        flush_stashed_output()
    print("End")

def trace_unhandled(event_name, context, event_fields_dict):
        print(' '.join(['%s=%s'%(k,str(v))for k,v in sorted(event_fields_dict.items())]))

def stash_output():
    global glb_stash_dict
    global glb_output_pos
    output_str = glb_output.getvalue()[glb_output_pos:]
    n = len(output_str)
    if n:
        glb_output_pos += n
        if glb_cpu not in glb_stash_dict:
            glb_stash_dict[glb_cpu] = []
        glb_stash_dict[glb_cpu].append(output_str)

def flush_stashed_output():
    global glb_stash_dict
    while glb_stash_dict:
        cpus = list(glb_stash_dict.keys())
        # Output at most glb_args.interleave output strings per cpu
        for cpu in cpus:
            items = glb_stash_dict[cpu]
            countdown = glb_args.interleave
            while len(items) and countdown:
                sys.stdout.write(items[0])
                del items[0]
                countdown -= 1
            if not items:
                del glb_stash_dict[cpu]

def print_ptwrite(raw_buf):
    data = struct.unpack_from("<IQ", raw_buf)
    flags = data[0]
    payload = data[1]
    exact_ip = flags & 1
    try:
        s = payload.to_bytes(8, "little").decode("ascii").rstrip("\x00")
        if not s.isprintable():
            s = ""
    except:
        s = ""
    print("IP: %u payload: %#x" % (exact_ip, payload), s, end=' ')

def print_cbr(raw_buf):
    data = struct.unpack_from("<BBBBII", raw_buf)
    cbr = data[0]
    f = (data[4] + 500) / 1000
    p = ((cbr * 1000 / data[2]) + 5) / 10
    print("%3u  freq: %4u MHz  (%3u%%)" % (cbr, f, p), end=' ')

def print_mwait(raw_buf):
    data = struct.unpack_from("<IQ", raw_buf)
    payload = data[1]
    hints = payload & 0xff
    extensions = (payload >> 32) & 0x3
    print("hints: %#x extensions: %#x" % (hints, extensions), end=' ')

def print_pwre(raw_buf):
    data = struct.unpack_from("<IQ", raw_buf)
    payload = data[1]
    hw = (payload >> 7) & 1
    cstate = (payload >> 12) & 0xf
    subcstate = (payload >> 8) & 0xf
    print("hw: %u cstate: %u sub-cstate: %u" % (hw, cstate, subcstate),
        end=' ')

def print_exstop(raw_buf):
    data = struct.unpack_from("<I", raw_buf)
    flags = data[0]
    exact_ip = flags & 1
    print("IP: %u" % (exact_ip), end=' ')

def print_pwrx(raw_buf):
    data = struct.unpack_from("<IQ", raw_buf)
    payload = data[1]
    deepest_cstate = payload & 0xf
    last_cstate = (payload >> 4) & 0xf
    wake_reason = (payload >> 8) & 0xf
    print("deepest cstate: %u last cstate: %u wake reason: %#x" %
        (deepest_cstate, last_cstate, wake_reason), end=' ')

def print_psb(raw_buf):
    data = struct.unpack_from("<IQ", raw_buf)
    offset = data[1]
    print("offset: %#x" % (offset), end=' ')

glb_cfe = ["", "INTR", "IRET", "SMI", "RSM", "SIPI", "INIT", "VMENTRY", "VMEXIT",
        "VMEXIT_INTR", "SHUTDOWN", "", "UINT", "UIRET"] + [""] * 18
glb_evd = ["", "PFA", "VMXQ", "VMXR"] + [""] * 60

def print_evt(raw_buf):
    data = struct.unpack_from("<BBH", raw_buf)
    typ = data[0] & 0x1f
    ip_flag = (data[0] & 0x80) >> 7
    vector = data[1]
    evd_cnt = data[2]
    s = glb_cfe[typ]
    if s:
        print(" cfe: %s IP: %u vector: %u" % (s, ip_flag, vector), end=' ')
    else:
        print(" cfe: %u IP: %u vector: %u" % (typ, ip_flag, vector), end=' ')
    pos = 4
    for i in range(evd_cnt):
        data = struct.unpack_from("<QQ", raw_buf)
        et = data[0] & 0x3f
        s = glb_evd[et]
        if s:
            print("%s: %#x" % (s, data[1]), end=' ')
        else:
            print("EVD_%u: %#x" % (et, data[1]), end=' ')

def print_iflag(raw_buf):
    data = struct.unpack_from("<IQ", raw_buf)
    iflag = data[0] & 1
    old_iflag = iflag ^ 1
    via_branch = data[0] & 2
    branch_ip = data[1]
    if via_branch:
        s = "via"
    else:
        s = "non"
    print("IFLAG: %u->%u %s branch" % (old_iflag, iflag, s), end=' ')

def common_start_str(comm, sample):
    ts = sample["time"]
    cpu = sample["cpu"]
    pid = sample["pid"]
    tid = sample["tid"]
    if "machine_pid" in sample:
        machine_pid = sample["machine_pid"]
        vcpu = sample["vcpu"]
        return "VM:%5d VCPU:%03d %16s %5u/%-5u [%03u] %9u.%09u  " % (machine_pid, vcpu, comm, pid, tid, cpu, ts / 1000000000, ts %1000000000)
    else:
        return "%16s %5u/%-5u [%03u] %9u.%09u  " % (comm, pid, tid, cpu, ts / 1000000000, ts %1000000000)

def print_common_start(comm, sample, name):
    flags_disp = get_optional_null(sample, "flags_disp")
    # Unused fields:
    # period      = sample["period"]
    # phys_addr   = sample["phys_addr"]
    # weight      = sample["weight"]
    # transaction = sample["transaction"]
    # cpumode     = get_optional_zero(sample, "cpumode")
    print(common_start_str(comm, sample) + "%8s  %21s" % (name, flags_disp), end=' ')

def print_instructions_start(comm, sample):
    if "x" in get_optional_null(sample, "flags"):
        print(common_start_str(comm, sample) + "x", end=' ')
    else:
        print(common_start_str(comm, sample), end='  ')

def disassem(insn, ip):
    inst = glb_disassembler.Instruction()
    glb_disassembler.SetMode(inst, 0) # Assume 64-bit
    buf = create_string_buffer(64)
    buf.value = insn
    return glb_disassembler.DisassembleOne(inst, addressof(buf), len(insn), ip)

def print_common_ip(param_dict, sample, symbol, dso):
    ip   = sample["ip"]
    offs = get_offset(param_dict, "symoff")
    if "cyc_cnt" in sample:
        cyc_cnt = sample["cyc_cnt"]
        insn_cnt = get_optional_zero(sample, "insn_cnt")
        ipc_str = "  IPC: %#.2f (%u/%u)" % (insn_cnt / cyc_cnt, insn_cnt, cyc_cnt)
    else:
        ipc_str = ""
    if glb_insn and glb_disassembler is not None:
        insn = perf_sample_insn(perf_script_context)
        if insn and len(insn):
            cnt, text = disassem(insn, ip)
            byte_str = ("%x" % ip).rjust(16)
            if sys.version_info.major >= 3:
                for k in range(cnt):
                    byte_str += " %02x" % insn[k]
            else:
                for k in xrange(cnt):
                    byte_str += " %02x" % ord(insn[k])
            print("%-40s  %-30s" % (byte_str, text), end=' ')
        print("%s%s (%s)" % (symbol, offs, dso), end=' ')
    else:
        print("%16x %s%s (%s)" % (ip, symbol, offs, dso), end=' ')
    if "addr_correlates_sym" in sample:
        addr   = sample["addr"]
        dso    = get_optional(sample, "addr_dso")
        symbol = get_optional(sample, "addr_symbol")
        offs   = get_offset(sample, "addr_symoff")
        print("=> %x %s%s (%s)%s" % (addr, symbol, offs, dso, ipc_str))
    else:
        print(ipc_str)

def print_srccode(comm, param_dict, sample, symbol, dso, with_insn):
    ip = sample["ip"]
    if symbol == "[unknown]":
        start_str = common_start_str(comm, sample) + ("%x" % ip).rjust(16).ljust(40)
    else:
        offs = get_offset(param_dict, "symoff")
        start_str = common_start_str(comm, sample) + (symbol + offs).ljust(40)

    if with_insn and glb_insn and glb_disassembler is not None:
        insn = perf_sample_insn(perf_script_context)
        if insn and len(insn):
            cnt, text = disassem(insn, ip)
        start_str += text.ljust(30)

    global glb_source_file_name
    global glb_line_number
    global glb_dso

    source_file_name, line_number, source_line = perf_sample_srccode(perf_script_context)
    if source_file_name:
        if glb_line_number == line_number and glb_source_file_name == source_file_name:
            src_str = ""
        else:
            if len(source_file_name) > 40:
                src_file = ("..." + source_file_name[-37:]) + " "
            else:
                src_file = source_file_name.ljust(41)
            if source_line is None:
                src_str = src_file + str(line_number).rjust(4) + " <source not found>"
            else:
                src_str = src_file + str(line_number).rjust(4) + " " + source_line
        glb_dso = None
    elif dso == glb_dso:
        src_str = ""
    else:
        src_str = dso
        glb_dso = dso

    glb_line_number = line_number
    glb_source_file_name = source_file_name

    print(start_str, src_str)

def do_process_event(param_dict):
    sample       = param_dict["sample"]
    raw_buf       = param_dict["raw_buf"]
    comm       = param_dict["comm"]
    name       = param_dict["ev_name"]
    # Unused fields:
    # callchain  = param_dict["callchain"]
    # brstack    = param_dict["brstack"]
    # brstacksym = param_dict["brstacksym"]
    # event_attr = param_dict["attr"]

    # Symbol and dso info are not always resolved
    dso    = get_optional(param_dict, "dso")
    symbol = get_optional(param_dict, "symbol")

    cpu = sample["cpu"]
    if cpu in glb_switch_str:
        print(glb_switch_str[cpu])
        del glb_switch_str[cpu]

    if name.startswith("instructions"):
        if glb_src:
            print_srccode(comm, param_dict, sample, symbol, dso, True)
        else:
            print_instructions_start(comm, sample)
            print_common_ip(param_dict, sample, symbol, dso)
    elif name.startswith("branches"):
        if glb_src:
            print_srccode(comm, param_dict, sample, symbol, dso, False)
        else:
            print_common_start(comm, sample, name)
            print_common_ip(param_dict, sample, symbol, dso)
    elif name == "ptwrite":
        print_common_start(comm, sample, name)
        print_ptwrite(raw_buf)
        print_common_ip(param_dict, sample, symbol, dso)
    elif name == "cbr":
        print_common_start(comm, sample, name)
        print_cbr(raw_buf)
        print_common_ip(param_dict, sample, symbol, dso)
    elif name == "mwait":
        print_common_start(comm, sample, name)
        print_mwait(raw_buf)
        print_common_ip(param_dict, sample, symbol, dso)
    elif name == "pwre":
        print_common_start(comm, sample, name)
        print_pwre(raw_buf)
        print_common_ip(param_dict, sample, symbol, dso)
    elif name == "exstop":
        print_common_start(comm, sample, name)
        print_exstop(raw_buf)
        print_common_ip(param_dict, sample, symbol, dso)
    elif name == "pwrx":
        print_common_start(comm, sample, name)
        print_pwrx(raw_buf)
        print_common_ip(param_dict, sample, symbol, dso)
    elif name == "psb":
        print_common_start(comm, sample, name)
        print_psb(raw_buf)
        print_common_ip(param_dict, sample, symbol, dso)
    elif name == "evt":
        print_common_start(comm, sample, name)
        print_evt(raw_buf)
        print_common_ip(param_dict, sample, symbol, dso)
    elif name == "iflag":
        print_common_start(comm, sample, name)
        print_iflag(raw_buf)
        print_common_ip(param_dict, sample, symbol, dso)
    else:
        print_common_start(comm, sample, name)
        print_common_ip(param_dict, sample, symbol, dso)

def interleave_events(param_dict):
    global glb_cpu
    global glb_time
    global glb_output
    global glb_output_pos

    sample  = param_dict["sample"]
    glb_cpu = sample["cpu"]
    ts      = sample["time"]

    if glb_time != ts:
        glb_time = ts
        flush_stashed_output()

    glb_output_pos = 0
    with contextlib.redirect_stdout(io.StringIO()) as glb_output:
        do_process_event(param_dict)

    stash_output()

def process_event(param_dict):
    try:
        if glb_args.interleave:
            interleave_events(param_dict)
        else:
            do_process_event(param_dict)
    except broken_pipe_exception:
        # Stop python printing broken pipe errors and traceback
        sys.stdout = open(os.devnull, 'w')
        sys.exit(1)

def auxtrace_error(typ, code, cpu, pid, tid, ip, ts, msg, cpumode, *x):
    if glb_args.interleave:
        flush_stashed_output()
    if len(x) >= 2 and x[0]:
        machine_pid = x[0]
        vcpu = x[1]
    else:
        machine_pid = 0
        vcpu = -1
    try:
        if machine_pid:
            print("VM:%5d VCPU:%03d %16s %5u/%-5u [%03u] %9u.%09u  error type %u code %u: %s ip 0x%16x" %
                (machine_pid, vcpu, "Trace error", pid, tid, cpu, ts / 1000000000, ts %1000000000, typ, code, msg, ip))
        else:
            print("%16s %5u/%-5u [%03u] %9u.%09u  error type %u code %u: %s ip 0x%16x" %
                ("Trace error", pid, tid, cpu, ts / 1000000000, ts %1000000000, typ, code, msg, ip))
    except broken_pipe_exception:
        # Stop python printing broken pipe errors and traceback
        sys.stdout = open(os.devnull, 'w')
        sys.exit(1)

def context_switch(ts, cpu, pid, tid, np_pid, np_tid, machine_pid, out, out_preempt, *x):
    if glb_args.interleave:
        flush_stashed_output()
    if out:
        out_str = "Switch out "
    else:
        out_str = "Switch In  "
    if out_preempt:
        preempt_str = "preempt"
    else:
        preempt_str = ""
    if len(x) >= 2 and x[0]:
        machine_pid = x[0]
        vcpu = x[1]
    else:
        vcpu = None;
    if machine_pid == -1:
        machine_str = ""
    elif vcpu is None:
        machine_str = "machine PID %d" % machine_pid
    else:
        machine_str = "machine PID %d VCPU %d" % (machine_pid, vcpu)
    switch_str = "%16s %5d/%-5d [%03u] %9u.%09u %5d/%-5d %s %s" % \
        (out_str, pid, tid, cpu, ts / 1000000000, ts %1000000000, np_pid, np_tid, machine_str, preempt_str)
    if glb_args.all_switch_events:
        print(switch_str)
    else:
        global glb_switch_str
        glb_switch_str[cpu] = switch_str