diff options
Diffstat (limited to 'tools/perf/scripts/python')
| -rw-r--r-- | tools/perf/scripts/python/Perf-Trace-Util/Build | 2 | ||||
| -rwxr-xr-x | tools/perf/scripts/python/bin/task-analyzer-record | 2 | ||||
| -rwxr-xr-x | tools/perf/scripts/python/bin/task-analyzer-report | 3 | ||||
| -rw-r--r-- | tools/perf/scripts/python/intel-pt-events.py | 65 | ||||
| -rwxr-xr-x | tools/perf/scripts/python/task-analyzer.py | 934 | 
5 files changed, 1004 insertions, 2 deletions
| diff --git a/tools/perf/scripts/python/Perf-Trace-Util/Build b/tools/perf/scripts/python/Perf-Trace-Util/Build index 7d0e33ce6aba..d5fed4e42617 100644 --- a/tools/perf/scripts/python/Perf-Trace-Util/Build +++ b/tools/perf/scripts/python/Perf-Trace-Util/Build @@ -1,3 +1,3 @@ -perf-y += Context.o +perf-$(CONFIG_LIBTRACEEVENT) += Context.o  CFLAGS_Context.o += $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs diff --git a/tools/perf/scripts/python/bin/task-analyzer-record b/tools/perf/scripts/python/bin/task-analyzer-record new file mode 100755 index 000000000000..0f6b51bb2767 --- /dev/null +++ b/tools/perf/scripts/python/bin/task-analyzer-record @@ -0,0 +1,2 @@ +#!/bin/bash +perf record -e sched:sched_switch -e sched:sched_migrate_task "$@" diff --git a/tools/perf/scripts/python/bin/task-analyzer-report b/tools/perf/scripts/python/bin/task-analyzer-report new file mode 100755 index 000000000000..4b16a8cc40a0 --- /dev/null +++ b/tools/perf/scripts/python/bin/task-analyzer-report @@ -0,0 +1,3 @@ +#!/bin/bash +# description: analyze timings of tasks +perf script -s "$PERF_EXEC_PATH"/scripts/python/task-analyzer.py -- "$@" diff --git a/tools/perf/scripts/python/intel-pt-events.py b/tools/perf/scripts/python/intel-pt-events.py index 6be7fd8fd615..08862a2582f4 100644 --- a/tools/perf/scripts/python/intel-pt-events.py +++ b/tools/perf/scripts/python/intel-pt-events.py @@ -13,10 +13,12 @@  from __future__ import print_function +import io  import os  import sys  import struct  import argparse +import contextlib  from libxed import LibXED  from ctypes import create_string_buffer, addressof @@ -39,6 +41,11 @@ glb_src			= False  glb_source_file_name	= None  glb_line_number		= None  glb_dso			= None +glb_stash_dict		= {} +glb_output		= None +glb_output_pos		= 0 +glb_cpu			= -1 +glb_time		= 0  def get_optional_null(perf_dict, field):  	if field in perf_dict: @@ -70,6 +77,7 @@ def trace_begin():  	ap.add_argument("--insn-trace", action='store_true')  	ap.add_argument("--src-trace", action='store_true')  	ap.add_argument("--all-switch-events", action='store_true') +	ap.add_argument("--interleave", type=int, nargs='?', const=4, default=0)  	global glb_args  	global glb_insn  	global glb_src @@ -94,11 +102,39 @@ def trace_begin():  	perf_set_itrace_options(perf_script_context, itrace)  def trace_end(): +	if glb_args.interleave: +		flush_stashed_output()  	print("End")  def trace_unhandled(event_name, context, event_fields_dict):  		print(' '.join(['%s=%s'%(k,str(v))for k,v in sorted(event_fields_dict.items())])) +def stash_output(): +	global glb_stash_dict +	global glb_output_pos +	output_str = glb_output.getvalue()[glb_output_pos:] +	n = len(output_str) +	if n: +		glb_output_pos += n +		if glb_cpu not in glb_stash_dict: +			glb_stash_dict[glb_cpu] = [] +		glb_stash_dict[glb_cpu].append(output_str) + +def flush_stashed_output(): +	global glb_stash_dict +	while glb_stash_dict: +		cpus = list(glb_stash_dict.keys()) +		# Output at most glb_args.interleave output strings per cpu +		for cpu in cpus: +			items = glb_stash_dict[cpu] +			countdown = glb_args.interleave +			while len(items) and countdown: +				sys.stdout.write(items[0]) +				del items[0] +				countdown -= 1 +			if not items: +				del glb_stash_dict[cpu] +  def print_ptwrite(raw_buf):  	data = struct.unpack_from("<IQ", raw_buf)  	flags = data[0] @@ -375,15 +411,40 @@ def do_process_event(param_dict):  		print_common_start(comm, sample, name)  		print_common_ip(param_dict, sample, symbol, dso) +def interleave_events(param_dict): +	global glb_cpu +	global glb_time +	global glb_output +	global glb_output_pos + +	sample  = param_dict["sample"] +	glb_cpu = sample["cpu"] +	ts      = sample["time"] + +	if glb_time != ts: +		glb_time = ts +		flush_stashed_output() + +	glb_output_pos = 0 +	with contextlib.redirect_stdout(io.StringIO()) as glb_output: +		do_process_event(param_dict) + +	stash_output() +  def process_event(param_dict):  	try: -		do_process_event(param_dict) +		if glb_args.interleave: +			interleave_events(param_dict) +		else: +			do_process_event(param_dict)  	except broken_pipe_exception:  		# Stop python printing broken pipe errors and traceback  		sys.stdout = open(os.devnull, 'w')  		sys.exit(1)  def auxtrace_error(typ, code, cpu, pid, tid, ip, ts, msg, cpumode, *x): +	if glb_args.interleave: +		flush_stashed_output()  	if len(x) >= 2 and x[0]:  		machine_pid = x[0]  		vcpu = x[1] @@ -403,6 +464,8 @@ def auxtrace_error(typ, code, cpu, pid, tid, ip, ts, msg, cpumode, *x):  		sys.exit(1)  def context_switch(ts, cpu, pid, tid, np_pid, np_tid, machine_pid, out, out_preempt, *x): +	if glb_args.interleave: +		flush_stashed_output()  	if out:  		out_str = "Switch out "  	else: diff --git a/tools/perf/scripts/python/task-analyzer.py b/tools/perf/scripts/python/task-analyzer.py new file mode 100755 index 000000000000..52e8dae9b1f0 --- /dev/null +++ b/tools/perf/scripts/python/task-analyzer.py @@ -0,0 +1,934 @@ +# task-analyzer.py - comprehensive perf tasks analysis +# SPDX-License-Identifier: GPL-2.0 +# Copyright (c) 2022, Hagen Paul Pfeifer <hagen@jauu.net> +# Licensed under the terms of the GNU GPL License version 2 +# +# Usage: +# +#     perf record -e sched:sched_switch -a -- sleep 10 +#     perf script report task-analyzer +# + +from __future__ import print_function +import sys +import os +import string +import argparse +import decimal + + +sys.path.append( +    os.environ["PERF_EXEC_PATH"] + "/scripts/python/Perf-Trace-Util/lib/Perf/Trace" +) +from perf_trace_context import * +from Core import * + +# Definition of possible ASCII color codes +_COLORS = { +    "grey": "\033[90m", +    "red": "\033[91m", +    "green": "\033[92m", +    "yellow": "\033[93m", +    "blue": "\033[94m", +    "violet": "\033[95m", +    "reset": "\033[0m", +} + +# Columns will have a static size to align everything properly +# Support of 116 days of active update with nano precision +LEN_SWITCHED_IN = len("9999999.999999999")  # 17 +LEN_SWITCHED_OUT = len("9999999.999999999")  # 17 +LEN_CPU = len("000") +LEN_PID = len("maxvalue")  # 8 +LEN_TID = len("maxvalue")  # 8 +LEN_COMM = len("max-comms-length")  # 16 +LEN_RUNTIME = len("999999.999")  # 10 +# Support of 3.45 hours of timespans +LEN_OUT_IN = len("99999999999.999")  # 15 +LEN_OUT_OUT = len("99999999999.999")  # 15 +LEN_IN_IN = len("99999999999.999")  # 15 +LEN_IN_OUT = len("99999999999.999")  # 15 + + +# py2/py3 compatibility layer, see PEP469 +try: +    dict.iteritems +except AttributeError: +    # py3 +    def itervalues(d): +        return iter(d.values()) + +    def iteritems(d): +        return iter(d.items()) + +else: +    # py2 +    def itervalues(d): +        return d.itervalues() + +    def iteritems(d): +        return d.iteritems() + + +def _check_color(): +    global _COLORS +    """user enforced no-color or if stdout is no tty we disable colors""" +    if sys.stdout.isatty() and args.stdio_color != "never": +        return +    _COLORS = { +        "grey": "", +        "red": "", +        "green": "", +        "yellow": "", +        "blue": "", +        "violet": "", +        "reset": "", +    } + + +def _parse_args(): +    global args +    parser = argparse.ArgumentParser(description="Analyze tasks behavior") +    parser.add_argument( +        "--time-limit", +        default=[], +        help= +            "print tasks only in time[s] window e.g" +        " --time-limit 123.111:789.222(print all between 123.111 and 789.222)" +        " --time-limit 123: (print all from 123)" +        " --time-limit :456 (print all until incl. 456)", +    ) +    parser.add_argument( +        "--summary", action="store_true", help="print addtional runtime information" +    ) +    parser.add_argument( +        "--summary-only", action="store_true", help="print only summary without traces" +    ) +    parser.add_argument( +        "--summary-extended", +        action="store_true", +        help="print the summary with additional information of max inter task times" +            " relative to the prev task", +    ) +    parser.add_argument( +        "--ns", action="store_true", help="show timestamps in nanoseconds" +    ) +    parser.add_argument( +        "--ms", action="store_true", help="show timestamps in miliseconds" +    ) +    parser.add_argument( +        "--extended-times", +        action="store_true", +        help="Show the elapsed times between schedule in/schedule out" +            " of this task and the schedule in/schedule out of previous occurrence" +            " of the same task", +    ) +    parser.add_argument( +        "--filter-tasks", +        default=[], +        help="filter out unneeded tasks by tid, pid or processname." +        " E.g --filter-task 1337,/sbin/init ", +    ) +    parser.add_argument( +        "--limit-to-tasks", +        default=[], +        help="limit output to selected task by tid, pid, processname." +        " E.g --limit-to-tasks 1337,/sbin/init", +    ) +    parser.add_argument( +        "--highlight-tasks", +        default="", +        help="colorize special tasks by their pid/tid/comm." +        " E.g. --highlight-tasks 1:red,mutt:yellow" +        " Colors available: red,grey,yellow,blue,violet,green", +    ) +    parser.add_argument( +        "--rename-comms-by-tids", +        default="", +        help="rename task names by using tid (<tid>:<newname>,<tid>:<newname>)" +            " This option is handy for inexpressive processnames like python interpreted" +            " process. E.g --rename 1337:my-python-app", +    ) +    parser.add_argument( +        "--stdio-color", +        default="auto", +        choices=["always", "never", "auto"], +        help="always, never or auto, allowing configuring color output" +            " via the command line", +    ) +    parser.add_argument( +        "--csv", +        default="", +        help="Write trace to file selected by user. Options, like --ns or --extended" +            "-times are used.", +    ) +    parser.add_argument( +        "--csv-summary", +        default="", +        help="Write summary to file selected by user. Options, like --ns or" +            " --summary-extended are used.", +    ) +    args = parser.parse_args() +    args.tid_renames = dict() + +    _argument_filter_sanity_check() +    _argument_prepare_check() + + +def time_uniter(unit): +    picker = { +        "s": 1, +        "ms": 1e3, +        "us": 1e6, +        "ns": 1e9, +    } +    return picker[unit] + + +def _init_db(): +    global db +    db = dict() +    db["running"] = dict() +    db["cpu"] = dict() +    db["tid"] = dict() +    db["global"] = [] +    if args.summary or args.summary_extended or args.summary_only: +        db["task_info"] = dict() +        db["runtime_info"] = dict() +        # min values for summary depending on the header +        db["task_info"]["pid"] = len("PID") +        db["task_info"]["tid"] = len("TID") +        db["task_info"]["comm"] = len("Comm") +        db["runtime_info"]["runs"] = len("Runs") +        db["runtime_info"]["acc"] = len("Accumulated") +        db["runtime_info"]["max"] = len("Max") +        db["runtime_info"]["max_at"] = len("Max At") +        db["runtime_info"]["min"] = len("Min") +        db["runtime_info"]["mean"] = len("Mean") +        db["runtime_info"]["median"] = len("Median") +        if args.summary_extended: +            db["inter_times"] = dict() +            db["inter_times"]["out_in"] = len("Out-In") +            db["inter_times"]["inter_at"] = len("At") +            db["inter_times"]["out_out"] = len("Out-Out") +            db["inter_times"]["in_in"] = len("In-In") +            db["inter_times"]["in_out"] = len("In-Out") + + +def _median(numbers): +    """phython3 hat statistics module - we have nothing""" +    n = len(numbers) +    index = n // 2 +    if n % 2: +        return sorted(numbers)[index] +    return sum(sorted(numbers)[index - 1 : index + 1]) / 2 + + +def _mean(numbers): +    return sum(numbers) / len(numbers) + + +class Timespans(object): +    """ +    The elapsed time between two occurrences of the same task is being tracked with the +    help of this class. There are 4 of those Timespans Out-Out, In-Out, Out-In and +    In-In. +    The first half of the name signals the first time point of the +    first task. The second half of the name represents the second +    timepoint of the second task. +    """ + +    def __init__(self): +        self._last_start = None +        self._last_finish = None +        self.out_out = -1 +        self.in_out = -1 +        self.out_in = -1 +        self.in_in = -1 +        if args.summary_extended: +            self._time_in = -1 +            self.max_out_in = -1 +            self.max_at = -1 +            self.max_in_out = -1 +            self.max_in_in = -1 +            self.max_out_out = -1 + +    def feed(self, task): +        """ +        Called for every recorded trace event to find process pair and calculate the +        task timespans. Chronological ordering, feed does not do reordering +        """ +        if not self._last_finish: +            self._last_start = task.time_in(time_unit) +            self._last_finish = task.time_out(time_unit) +            return +        self._time_in = task.time_in() +        time_in = task.time_in(time_unit) +        time_out = task.time_out(time_unit) +        self.in_in = time_in - self._last_start +        self.out_in = time_in - self._last_finish +        self.in_out = time_out - self._last_start +        self.out_out = time_out - self._last_finish +        if args.summary_extended: +            self._update_max_entries() +        self._last_finish = task.time_out(time_unit) +        self._last_start = task.time_in(time_unit) + +    def _update_max_entries(self): +        if self.in_in > self.max_in_in: +            self.max_in_in = self.in_in +        if self.out_out > self.max_out_out: +            self.max_out_out = self.out_out +        if self.in_out > self.max_in_out: +            self.max_in_out = self.in_out +        if self.out_in > self.max_out_in: +            self.max_out_in = self.out_in +            self.max_at = self._time_in + + + +class Summary(object): +    """ +    Primary instance for calculating the summary output. Processes the whole trace to +    find and memorize relevant data such as mean, max et cetera. This instance handles +    dynamic alignment aspects for summary output. +    """ + +    def __init__(self): +        self._body = [] + +    class AlignmentHelper: +        """ +        Used to calculated the alignment for the output of the summary. +        """ +        def __init__(self, pid, tid, comm, runs, acc, mean, +                    median, min, max, max_at): +            self.pid = pid +            self.tid = tid +            self.comm = comm +            self.runs = runs +            self.acc = acc +            self.mean = mean +            self.median = median +            self.min = min +            self.max = max +            self.max_at = max_at +            if args.summary_extended: +                self.out_in = None +                self.inter_at = None +                self.out_out = None +                self.in_in = None +                self.in_out = None + +    def _print_header(self): +        ''' +        Output is trimmed in _format_stats thus additional adjustment in the header +        is needed, depending on the choice of timeunit. The adjustment corresponds +        to the amount of column titles being adjusted in _column_titles. +        ''' +        decimal_precision = 6 if not args.ns else 9 +        fmt = " {{:^{}}}".format(sum(db["task_info"].values())) +        fmt += " {{:^{}}}".format( +            sum(db["runtime_info"].values()) - 2 * decimal_precision +            ) +        _header = ("Task Information", "Runtime Information") + +        if args.summary_extended: +            fmt += " {{:^{}}}".format( +                sum(db["inter_times"].values()) - 4 * decimal_precision +                ) +            _header += ("Max Inter Task Times",) +        fd_sum.write(fmt.format(*_header) +  "\n") + +    def _column_titles(self): +        """ +        Cells are being processed and displayed in different way so an alignment adjust +        is implemented depeding on the choice of the timeunit. The positions of the max +        values are being displayed in grey. Thus in their format two additional {}, +        are placed for color set and reset. +        """ +        separator, fix_csv_align = _prepare_fmt_sep() +        decimal_precision, time_precision = _prepare_fmt_precision() +        fmt = "{{:>{}}}".format(db["task_info"]["pid"] * fix_csv_align) +        fmt += "{}{{:>{}}}".format(separator, db["task_info"]["tid"] * fix_csv_align) +        fmt += "{}{{:>{}}}".format(separator, db["task_info"]["comm"] * fix_csv_align) +        fmt += "{}{{:>{}}}".format(separator, db["runtime_info"]["runs"] * fix_csv_align) +        fmt += "{}{{:>{}}}".format(separator, db["runtime_info"]["acc"] * fix_csv_align) +        fmt += "{}{{:>{}}}".format(separator, db["runtime_info"]["mean"] * fix_csv_align) +        fmt += "{}{{:>{}}}".format( +            separator, db["runtime_info"]["median"] * fix_csv_align +        ) +        fmt += "{}{{:>{}}}".format( +            separator, (db["runtime_info"]["min"] - decimal_precision) * fix_csv_align +        ) +        fmt += "{}{{:>{}}}".format( +            separator, (db["runtime_info"]["max"] - decimal_precision) * fix_csv_align +        ) +        fmt += "{}{{}}{{:>{}}}{{}}".format( +            separator, (db["runtime_info"]["max_at"] - time_precision) * fix_csv_align +        ) + +        column_titles = ("PID", "TID", "Comm") +        column_titles += ("Runs", "Accumulated", "Mean", "Median", "Min", "Max") +        column_titles += (_COLORS["grey"], "Max At", _COLORS["reset"]) + +        if args.summary_extended: +            fmt += "{}{{:>{}}}".format( +                separator, +                (db["inter_times"]["out_in"] - decimal_precision) * fix_csv_align +            ) +            fmt += "{}{{}}{{:>{}}}{{}}".format( +                separator, +                (db["inter_times"]["inter_at"] - time_precision) * fix_csv_align +            ) +            fmt += "{}{{:>{}}}".format( +                separator, +                (db["inter_times"]["out_out"] - decimal_precision) * fix_csv_align +            ) +            fmt += "{}{{:>{}}}".format( +                separator, +                (db["inter_times"]["in_in"] - decimal_precision) * fix_csv_align +            ) +            fmt += "{}{{:>{}}}".format( +                separator, +                (db["inter_times"]["in_out"] - decimal_precision) * fix_csv_align +            ) + +            column_titles += ("Out-In", _COLORS["grey"], "Max At", _COLORS["reset"], +                        "Out-Out", "In-In", "In-Out") + +        fd_sum.write(fmt.format(*column_titles) + "\n") + + +    def _task_stats(self): +        """calculates the stats of every task and constructs the printable summary""" +        for tid in sorted(db["tid"]): +            color_one_sample = _COLORS["grey"] +            color_reset = _COLORS["reset"] +            no_executed = 0 +            runtimes = [] +            time_in = [] +            timespans = Timespans() +            for task in db["tid"][tid]: +                pid = task.pid +                comm = task.comm +                no_executed += 1 +                runtimes.append(task.runtime(time_unit)) +                time_in.append(task.time_in()) +                timespans.feed(task) +            if len(runtimes) > 1: +                color_one_sample = "" +                color_reset = "" +            time_max = max(runtimes) +            time_min = min(runtimes) +            max_at = time_in[runtimes.index(max(runtimes))] + +            # The size of the decimal after sum,mean and median varies, thus we cut +            # the decimal number, by rounding it. It has no impact on the output, +            # because we have a precision of the decimal points at the output. +            time_sum = round(sum(runtimes), 3) +            time_mean = round(_mean(runtimes), 3) +            time_median = round(_median(runtimes), 3) + +            align_helper = self.AlignmentHelper(pid, tid, comm, no_executed, time_sum, +                                    time_mean, time_median, time_min, time_max, max_at) +            self._body.append([pid, tid, comm, no_executed, time_sum, color_one_sample, +                                time_mean, time_median, time_min, time_max, +                                _COLORS["grey"], max_at, _COLORS["reset"], color_reset]) +            if args.summary_extended: +                self._body[-1].extend([timespans.max_out_in, +                                _COLORS["grey"], timespans.max_at, +                                _COLORS["reset"], timespans.max_out_out, +                                timespans.max_in_in, +                                timespans.max_in_out]) +                align_helper.out_in = timespans.max_out_in +                align_helper.inter_at = timespans.max_at +                align_helper.out_out = timespans.max_out_out +                align_helper.in_in = timespans.max_in_in +                align_helper.in_out = timespans.max_in_out +            self._calc_alignments_summary(align_helper) + +    def _format_stats(self): +        separator, fix_csv_align = _prepare_fmt_sep() +        decimal_precision, time_precision = _prepare_fmt_precision() +        len_pid = db["task_info"]["pid"] * fix_csv_align +        len_tid = db["task_info"]["tid"] * fix_csv_align +        len_comm = db["task_info"]["comm"] * fix_csv_align +        len_runs = db["runtime_info"]["runs"] * fix_csv_align +        len_acc = db["runtime_info"]["acc"] * fix_csv_align +        len_mean = db["runtime_info"]["mean"] * fix_csv_align +        len_median = db["runtime_info"]["median"] * fix_csv_align +        len_min = (db["runtime_info"]["min"] - decimal_precision) * fix_csv_align +        len_max = (db["runtime_info"]["max"] - decimal_precision) * fix_csv_align +        len_max_at = (db["runtime_info"]["max_at"] - time_precision) * fix_csv_align +        if args.summary_extended: +            len_out_in = ( +                db["inter_times"]["out_in"] - decimal_precision +            ) * fix_csv_align +            len_inter_at = ( +                db["inter_times"]["inter_at"] - time_precision +            ) * fix_csv_align +            len_out_out = ( +                db["inter_times"]["out_out"] - decimal_precision +            ) * fix_csv_align +            len_in_in = (db["inter_times"]["in_in"] - decimal_precision) * fix_csv_align +            len_in_out = ( +                db["inter_times"]["in_out"] - decimal_precision +            ) * fix_csv_align + +        fmt = "{{:{}d}}".format(len_pid) +        fmt += "{}{{:{}d}}".format(separator, len_tid) +        fmt += "{}{{:>{}}}".format(separator, len_comm) +        fmt += "{}{{:{}d}}".format(separator, len_runs) +        fmt += "{}{{:{}.{}f}}".format(separator, len_acc, time_precision) +        fmt += "{}{{}}{{:{}.{}f}}".format(separator, len_mean, time_precision) +        fmt += "{}{{:{}.{}f}}".format(separator, len_median, time_precision) +        fmt += "{}{{:{}.{}f}}".format(separator, len_min, time_precision) +        fmt += "{}{{:{}.{}f}}".format(separator, len_max, time_precision) +        fmt += "{}{{}}{{:{}.{}f}}{{}}{{}}".format( +            separator, len_max_at, decimal_precision +        ) +        if args.summary_extended: +            fmt += "{}{{:{}.{}f}}".format(separator, len_out_in, time_precision) +            fmt += "{}{{}}{{:{}.{}f}}{{}}".format( +                separator, len_inter_at, decimal_precision +            ) +            fmt += "{}{{:{}.{}f}}".format(separator, len_out_out, time_precision) +            fmt += "{}{{:{}.{}f}}".format(separator, len_in_in, time_precision) +            fmt += "{}{{:{}.{}f}}".format(separator, len_in_out, time_precision) +        return fmt + + +    def _calc_alignments_summary(self, align_helper): +        # Length is being cut in 3 groups so that further addition is easier to handle. +        # The length of every argument from the alignment helper is being checked if it +        # is longer than the longest until now. In that case the length is being saved. +        for key in db["task_info"]: +            if len(str(getattr(align_helper, key))) > db["task_info"][key]: +                db["task_info"][key] = len(str(getattr(align_helper, key))) +        for key in db["runtime_info"]: +            if len(str(getattr(align_helper, key))) > db["runtime_info"][key]: +                db["runtime_info"][key] = len(str(getattr(align_helper, key))) +        if args.summary_extended: +            for key in db["inter_times"]: +                if len(str(getattr(align_helper, key))) > db["inter_times"][key]: +                    db["inter_times"][key] = len(str(getattr(align_helper, key))) + + +    def print(self): +        self._task_stats() +        fmt = self._format_stats() + +        if not args.csv_summary: +            print("\nSummary") +            self._print_header() +        self._column_titles() +        for i in range(len(self._body)): +            fd_sum.write(fmt.format(*tuple(self._body[i])) + "\n") + + + +class Task(object): +    """ The class is used to handle the information of a given task.""" + +    def __init__(self, id, tid, cpu, comm): +        self.id = id +        self.tid = tid +        self.cpu = cpu +        self.comm = comm +        self.pid = None +        self._time_in = None +        self._time_out = None + +    def schedule_in_at(self, time): +        """set the time where the task was scheduled in""" +        self._time_in = time + +    def schedule_out_at(self, time): +        """set the time where the task was scheduled out""" +        self._time_out = time + +    def time_out(self, unit="s"): +        """return time where a given task was scheduled out""" +        factor = time_uniter(unit) +        return self._time_out * decimal.Decimal(factor) + +    def time_in(self, unit="s"): +        """return time where a given task was scheduled in""" +        factor = time_uniter(unit) +        return self._time_in * decimal.Decimal(factor) + +    def runtime(self, unit="us"): +        factor = time_uniter(unit) +        return (self._time_out - self._time_in) * decimal.Decimal(factor) + +    def update_pid(self, pid): +        self.pid = pid + + +def _task_id(pid, cpu): +    """returns a "unique-enough" identifier, please do not change""" +    return "{}-{}".format(pid, cpu) + + +def _filter_non_printable(unfiltered): +    """comm names may contain loony chars like '\x00000'""" +    filtered = "" +    for char in unfiltered: +        if char not in string.printable: +            continue +        filtered += char +    return filtered + + +def _fmt_header(): +    separator, fix_csv_align = _prepare_fmt_sep() +    fmt = "{{:>{}}}".format(LEN_SWITCHED_IN*fix_csv_align) +    fmt += "{}{{:>{}}}".format(separator, LEN_SWITCHED_OUT*fix_csv_align) +    fmt += "{}{{:>{}}}".format(separator, LEN_CPU*fix_csv_align) +    fmt += "{}{{:>{}}}".format(separator, LEN_PID*fix_csv_align) +    fmt += "{}{{:>{}}}".format(separator, LEN_TID*fix_csv_align) +    fmt += "{}{{:>{}}}".format(separator, LEN_COMM*fix_csv_align) +    fmt += "{}{{:>{}}}".format(separator, LEN_RUNTIME*fix_csv_align) +    fmt += "{}{{:>{}}}".format(separator, LEN_OUT_IN*fix_csv_align) +    if args.extended_times: +        fmt += "{}{{:>{}}}".format(separator, LEN_OUT_OUT*fix_csv_align) +        fmt += "{}{{:>{}}}".format(separator, LEN_IN_IN*fix_csv_align) +        fmt += "{}{{:>{}}}".format(separator, LEN_IN_OUT*fix_csv_align) +    return fmt + + +def _fmt_body(): +    separator, fix_csv_align = _prepare_fmt_sep() +    decimal_precision, time_precision = _prepare_fmt_precision() +    fmt = "{{}}{{:{}.{}f}}".format(LEN_SWITCHED_IN*fix_csv_align, decimal_precision) +    fmt += "{}{{:{}.{}f}}".format( +        separator, LEN_SWITCHED_OUT*fix_csv_align, decimal_precision +    ) +    fmt += "{}{{:{}d}}".format(separator, LEN_CPU*fix_csv_align) +    fmt += "{}{{:{}d}}".format(separator, LEN_PID*fix_csv_align) +    fmt += "{}{{}}{{:{}d}}{{}}".format(separator, LEN_TID*fix_csv_align) +    fmt += "{}{{}}{{:>{}}}".format(separator, LEN_COMM*fix_csv_align) +    fmt += "{}{{:{}.{}f}}".format(separator, LEN_RUNTIME*fix_csv_align, time_precision) +    if args.extended_times: +        fmt += "{}{{:{}.{}f}}".format(separator, LEN_OUT_IN*fix_csv_align, time_precision) +        fmt += "{}{{:{}.{}f}}".format(separator, LEN_OUT_OUT*fix_csv_align, time_precision) +        fmt += "{}{{:{}.{}f}}".format(separator, LEN_IN_IN*fix_csv_align, time_precision) +        fmt += "{}{{:{}.{}f}}{{}}".format( +            separator, LEN_IN_OUT*fix_csv_align, time_precision +        ) +    else: +        fmt += "{}{{:{}.{}f}}{{}}".format( +            separator, LEN_OUT_IN*fix_csv_align, time_precision +        ) +    return fmt + + +def _print_header(): +    fmt = _fmt_header() +    header = ("Switched-In", "Switched-Out", "CPU", "PID", "TID", "Comm", "Runtime", +            "Time Out-In") +    if args.extended_times: +        header += ("Time Out-Out", "Time In-In", "Time In-Out") +    fd_task.write(fmt.format(*header) + "\n") + + + +def _print_task_finish(task): +    """calculating every entry of a row and printing it immediately""" +    c_row_set = "" +    c_row_reset = "" +    out_in = -1 +    out_out = -1 +    in_in = -1 +    in_out = -1 +    fmt = _fmt_body() +    # depending on user provided highlight option we change the color +    # for particular tasks +    if str(task.tid) in args.highlight_tasks_map: +        c_row_set = _COLORS[args.highlight_tasks_map[str(task.tid)]] +        c_row_reset = _COLORS["reset"] +    if task.comm in args.highlight_tasks_map: +        c_row_set = _COLORS[args.highlight_tasks_map[task.comm]] +        c_row_reset = _COLORS["reset"] +    # grey-out entries if PID == TID, they +    # are identical, no threaded model so the +    # thread id (tid) do not matter +    c_tid_set = "" +    c_tid_reset = "" +    if task.pid == task.tid: +        c_tid_set = _COLORS["grey"] +        c_tid_reset = _COLORS["reset"] +    if task.tid in db["tid"]: +        # get last task of tid +        last_tid_task = db["tid"][task.tid][-1] +        # feed the timespan calculate, last in tid db +        # and second the current one +        timespan_gap_tid = Timespans() +        timespan_gap_tid.feed(last_tid_task) +        timespan_gap_tid.feed(task) +        out_in = timespan_gap_tid.out_in +        out_out = timespan_gap_tid.out_out +        in_in = timespan_gap_tid.in_in +        in_out = timespan_gap_tid.in_out + + +    if args.extended_times: +        line_out = fmt.format(c_row_set, task.time_in(), task.time_out(), task.cpu, +                        task.pid, c_tid_set, task.tid, c_tid_reset, c_row_set, task.comm, +                        task.runtime(time_unit), out_in, out_out, in_in, in_out, +                        c_row_reset) + "\n" +    else: +        line_out = fmt.format(c_row_set, task.time_in(), task.time_out(), task.cpu, +                        task.pid, c_tid_set, task.tid, c_tid_reset, c_row_set, task.comm, +                        task.runtime(time_unit), out_in, c_row_reset) + "\n" +    try: +        fd_task.write(line_out) +    except(IOError): +        # don't mangle the output if user SIGINT this script +        sys.exit() + +def _record_cleanup(_list): +    """ +    no need to store more then one element if --summarize +    is not enabled +    """ +    if not args.summary and len(_list) > 1: +        _list = _list[len(_list) - 1 :] + + +def _record_by_tid(task): +    tid = task.tid +    if tid not in db["tid"]: +        db["tid"][tid] = [] +    db["tid"][tid].append(task) +    _record_cleanup(db["tid"][tid]) + + +def _record_by_cpu(task): +    cpu = task.cpu +    if cpu not in db["cpu"]: +        db["cpu"][cpu] = [] +    db["cpu"][cpu].append(task) +    _record_cleanup(db["cpu"][cpu]) + + +def _record_global(task): +    """record all executed task, ordered by finish chronological""" +    db["global"].append(task) +    _record_cleanup(db["global"]) + + +def _handle_task_finish(tid, cpu, time, perf_sample_dict): +    if tid == 0: +        return +    _id = _task_id(tid, cpu) +    if _id not in db["running"]: +        # may happen, if we missed the switch to +        # event. Seen in combination with --exclude-perf +        # where the start is filtered out, but not the +        # switched in. Probably a bug in exclude-perf +        # option. +        return +    task = db["running"][_id] +    task.schedule_out_at(time) + +    # record tid, during schedule in the tid +    # is not available, update now +    pid = int(perf_sample_dict["sample"]["pid"]) + +    task.update_pid(pid) +    del db["running"][_id] + +    # print only tasks which are not being filtered and no print of trace +    # for summary only, but record every task. +    if not _limit_filtered(tid, pid, task.comm) and not args.summary_only: +        _print_task_finish(task) +    _record_by_tid(task) +    _record_by_cpu(task) +    _record_global(task) + + +def _handle_task_start(tid, cpu, comm, time): +    if tid == 0: +        return +    if tid in args.tid_renames: +        comm = args.tid_renames[tid] +    _id = _task_id(tid, cpu) +    if _id in db["running"]: +        # handle corner cases where already running tasks +        # are switched-to again - saw this via --exclude-perf +        # recorded traces. We simple ignore this "second start" +        # event. +        return +    assert _id not in db["running"] +    task = Task(_id, tid, cpu, comm) +    task.schedule_in_at(time) +    db["running"][_id] = task + + +def _time_to_internal(time_ns): +    """ +    To prevent float rounding errors we use Decimal internally +    """ +    return decimal.Decimal(time_ns) / decimal.Decimal(1e9) + + +def _limit_filtered(tid, pid, comm): +    if args.filter_tasks: +        if str(tid) in args.filter_tasks or comm in args.filter_tasks: +            return True +        else: +            return False +    if args.limit_to_tasks: +        if str(tid) in args.limit_to_tasks or comm in args.limit_to_tasks: +            return False +        else: +            return True + + +def _argument_filter_sanity_check(): +    if args.limit_to_tasks and args.filter_tasks: +        sys.exit("Error: Filter and Limit at the same time active.") +    if args.extended_times and args.summary_only: +        sys.exit("Error: Summary only and extended times active.") +    if args.time_limit and ":" not in args.time_limit: +        sys.exit( +            "Error: No bound set for time limit. Please set bound by ':' e.g :123." +        ) +    if args.time_limit and (args.summary or args.summary_only or args.summary_extended): +        sys.exit("Error: Cannot set time limit and print summary") +    if args.csv_summary: +        args.summary = True +        if args.csv == args.csv_summary: +            sys.exit("Error: Chosen files for csv and csv summary are the same") +    if args.csv and (args.summary_extended or args.summary) and not args.csv_summary: +        sys.exit("Error: No file chosen to write summary to. Choose with --csv-summary " +        "<file>") +    if args.csv and args.summary_only: +        sys.exit("Error: --csv chosen and --summary-only. Standard task would not be" +            "written to csv file.") + +def _argument_prepare_check(): +    global time_unit, fd_task, fd_sum +    if args.filter_tasks: +        args.filter_tasks = args.filter_tasks.split(",") +    if args.limit_to_tasks: +        args.limit_to_tasks = args.limit_to_tasks.split(",") +    if args.time_limit: +        args.time_limit = args.time_limit.split(":") +    for rename_tuple in args.rename_comms_by_tids.split(","): +        tid_name = rename_tuple.split(":") +        if len(tid_name) != 2: +            continue +        args.tid_renames[int(tid_name[0])] = tid_name[1] +    args.highlight_tasks_map = dict() +    for highlight_tasks_tuple in args.highlight_tasks.split(","): +        tasks_color_map = highlight_tasks_tuple.split(":") +        # default highlight color to red if no color set by user +        if len(tasks_color_map) == 1: +            tasks_color_map.append("red") +        if args.highlight_tasks and tasks_color_map[1].lower() not in _COLORS: +            sys.exit( +                "Error: Color not defined, please choose from grey,red,green,yellow,blue," +                "violet" +            ) +        if len(tasks_color_map) != 2: +            continue +        args.highlight_tasks_map[tasks_color_map[0]] = tasks_color_map[1] +    time_unit = "us" +    if args.ns: +        time_unit = "ns" +    elif args.ms: +        time_unit = "ms" + + +    fd_task = sys.stdout +    if args.csv: +        args.stdio_color = "never" +        fd_task = open(args.csv, "w") +        print("generating csv at",args.csv,) + +    fd_sum = sys.stdout +    if args.csv_summary: +        args.stdio_color = "never" +        fd_sum = open(args.csv_summary, "w") +        print("generating csv summary at",args.csv_summary) +        if not args.csv: +            args.summary_only = True + + +def _is_within_timelimit(time): +    """ +    Check if a time limit was given by parameter, if so ignore the rest. If not, +    process the recorded trace in its entirety. +    """ +    if not args.time_limit: +        return True +    lower_time_limit = args.time_limit[0] +    upper_time_limit = args.time_limit[1] +    # check for upper limit +    if upper_time_limit == "": +        if time >= decimal.Decimal(lower_time_limit): +            return True +    # check for lower limit +    if lower_time_limit == "": +        if time <= decimal.Decimal(upper_time_limit): +            return True +        # quit if time exceeds upper limit. Good for big datasets +        else: +            quit() +    if lower_time_limit != "" and upper_time_limit != "": +        if (time >= decimal.Decimal(lower_time_limit) and +            time <= decimal.Decimal(upper_time_limit)): +            return True +        # quit if time exceeds upper limit. Good for big datasets +        elif time > decimal.Decimal(upper_time_limit): +            quit() + +def _prepare_fmt_precision(): +    decimal_precision = 6 +    time_precision = 3 +    if args.ns: +     decimal_precision = 9 +     time_precision = 0 +    return decimal_precision, time_precision + +def _prepare_fmt_sep(): +    separator = " " +    fix_csv_align = 1 +    if args.csv or args.csv_summary: +        separator = ";" +        fix_csv_align = 0 +    return separator, fix_csv_align + +def trace_unhandled(event_name, context, event_fields_dict, perf_sample_dict): +    pass + + +def trace_begin(): +    _parse_args() +    _check_color() +    _init_db() +    if not args.summary_only: +        _print_header() + +def trace_end(): +    if args.summary or args.summary_extended or args.summary_only: +        Summary().print() + +def sched__sched_switch(event_name, context, common_cpu, common_secs, common_nsecs, +                        common_pid, common_comm, common_callchain, prev_comm, +                        prev_pid, prev_prio, prev_state, next_comm, next_pid, +                        next_prio, perf_sample_dict): +    # ignore common_secs & common_nsecs cause we need +    # high res timestamp anyway, using the raw value is +    # faster +    time = _time_to_internal(perf_sample_dict["sample"]["time"]) +    if not _is_within_timelimit(time): +        # user specific --time-limit a:b set +        return + +    next_comm = _filter_non_printable(next_comm) +    _handle_task_finish(prev_pid, common_cpu, time, perf_sample_dict) +    _handle_task_start(next_pid, common_cpu, next_comm, time) | 
