From 9b53ab71fc73e452691efe931afdbb5073fa6312 Mon Sep 17 00:00:00 2001
From: Joel Fernandes
Date: Wed, 21 Jun 2017 20:16:05 -0700
Subject: [PATCH] Add trace analysis scripts

runnable: measure task runnable times
runtime: calculate runtime of tasks as percent of CPU.
---
 tools/analysis/runnable.py | 165 +++++++++++++++++++++++++++++++++++++
 tools/analysis/runtime.py  | 159 +++++++++++++++++++++++++++++++++++
 2 files changed, 324 insertions(+)
 create mode 100755 tools/analysis/runnable.py
 create mode 100755 tools/analysis/runtime.py

diff --git a/tools/analysis/runnable.py b/tools/analysis/runnable.py
new file mode 100755
index 000000000..1da3bfbee
--- /dev/null
+++ b/tools/analysis/runnable.py
@@ -0,0 +1,165 @@
+#!/usr/bin/env python
+# SPDX-License-Identifier: Apache-2.0
+#
+# Copyright (C) 2017, ARM Limited, Google, and contributors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License"); you may
+# not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
+# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+from collections import namedtuple
+import trappy
+import argparse
+
+EventData = namedtuple('EventData', ['time', 'event', 'data'])
+LatData = namedtuple('LatData', ['pid', 'switch_data', 'wake_data', 'last_wake_data', 'running', 'wake_pend', 'latency', 'lat_total'])
+
+parser = argparse.ArgumentParser(description='Analyze runnable times')
+
+parser.add_argument('--trace', dest='trace_file', action='store', required=True,
+                    help='trace file')
+
+parser.add_argument('--rt', dest='rt', action='store_true', default=False,
+                    help='only consider RT tasks')
+
+parser.add_argument('--normalize', dest='normalize', action='store_true', default=False,
+                    help='normalize time')
+
+parser.add_argument('--rows', dest='nrows', action='store', default=20, type=int,
+                    help='number of rows to print')
+
+parser.add_argument('--total', dest='lat_total', action='store_true', default=False,
+                    help='sort by total runnable time')
+
+parser.add_argument('--start-time', dest='start_time', action='store', default=0, type=float,
+                    help='trace window start time')
+
+parser.add_argument('--end-time', dest='end_time', action='store', default=None, type=float,
+                    help='trace window end time')
+
+args = parser.parse_args()
+
+path_to_html = args.trace_file
+rtonly = args.rt
+nrows = args.nrows
+
+# Hash table of pid -> LatData named tuple
+latpids = {}
+
+def switch_cb(data):
+    event = "switch"
+    prevpid = data['prev_pid']
+    nextpid = data['next_pid']
+    time = data['Index']
+
+    e = EventData(time, event, data)
+
+    # prev pid processing (switch out)
+    if latpids.has_key(prevpid):
+        if latpids[prevpid].running == 1:
+            latpids[prevpid] = latpids[prevpid]._replace(running=0)
+        if latpids[prevpid].wake_pend == 1:
+            print "Impossible: switch out during wake_pend " + str(e)
+            latpids[prevpid] = latpids[prevpid]._replace(wake_pend=0)
+            return
+
+    if not latpids.has_key(nextpid):
+        return
+
+    # nextpid processing (switch in)
+    pid = nextpid
+    if latpids[pid].running == 1:
+        print "INFO: previous pid switch-out not seen for an event, ignoring\n" + str(e)
+        return
+    latpids[pid] = latpids[pid]._replace(running=1)
+
+    # Ignore latency calc for next-switch events for which wake never seen
+    # They are still valid in this scenario because of preemption
+    if latpids[pid].wake_pend == 0:
+        return
+
+    # Measure latency
+    lat = time - latpids[pid].last_wake_data.time
+    total = latpids[pid].lat_total + lat
+    latpids[pid] = latpids[pid]._replace(lat_total=total)
+
+    if lat > latpids[pid].latency:
+        latpids[pid] = LatData(pid, switch_data = e,
+                               wake_data = latpids[pid].last_wake_data,
+                               last_wake_data=None, latency=lat, lat_total=latpids[pid].lat_total, running=1, wake_pend=0)
+        return
+    latpids[pid] = latpids[pid]._replace(running=1, wake_pend=0)
+
+def wake_cb(data):
+    event = "wake"
+    pid = data['pid']
+    time = data['Index']
+
+    e = EventData(time, event, data)
+
+    if rtonly and data["prio"] > 99:
+        return
+
+    if not latpids.has_key(pid):
+        latpids[pid] = LatData(pid, switch_data=None, wake_data=None,
+                               last_wake_data = e, running=0, latency=-1, lat_total=0, wake_pend=1)
+        return
+
+    if latpids[pid].running == 1 or latpids[pid].wake_pend == 1:
+        # Task already running or a wakeup->switch pending, ignore
+        return
+
+    latpids[pid] = latpids[pid]._replace(last_wake_data = e, wake_pend=1)
+
+
+if args.normalize:
+    kwargs = { 'window': (args.start_time, args.end_time) }
+else:
+    kwargs = { 'abs_window': (args.start_time, args.end_time) }
+
+systrace_obj = trappy.SysTrace(name="systrace", path=path_to_html, \
+        scope="sched", events=["sched_switch", "sched_wakeup", "sched_waking"], normalize_time=args.normalize, **kwargs)
+
+systrace_obj.apply_callbacks({ "sched_switch": switch_cb, "sched_wakeup": wake_cb, \
+        "sched_waking": wake_cb })
+
+# Print the results: PID, latency, start, end, sort
+if args.lat_total:
+    result = sorted(latpids.items(), key=lambda x: x[1].lat_total, reverse=True)
+else:
+    result = sorted(latpids.items(), key=lambda x: x[1].latency, reverse=True)
+
+print "\t".join([
+    "PID".ljust(10),
+    "name".ljust(20),
+    "latency (secs)".ljust(20),
+    "start time".ljust(20),
+    "end time".ljust(20),
+    "total (secs)".ljust(20)
+])
+
+for r in result[:nrows]:
+    l = r[1] # LatData named tuple
+    if l.pid != r[0]:
+        raise RuntimeError("BUG: pid inconsistency found") # Sanity check
+    wake_time = l.wake_data.time
+    switch_time = l.switch_data.time
+    total = l.lat_total
+
+    print "\t".join([
+        str(r[0]).ljust(10),
+        str(l.wake_data.data['comm']).ljust(20),
+        str(l.latency).ljust(20)[:20],
+        str(wake_time).ljust(20)[:20],
+        str(switch_time).ljust(20)[:20],
+        str(total).ljust(20)[:20]
+    ])
diff --git a/tools/analysis/runtime.py b/tools/analysis/runtime.py
new file mode 100755
index 000000000..d59abfeb0
--- /dev/null
+++ b/tools/analysis/runtime.py
@@ -0,0 +1,159 @@
+#!/usr/bin/env python
+# SPDX-License-Identifier: Apache-2.0
+#
+# Copyright (C) 2017, ARM Limited, Google, and contributors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License"); you may
+# not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
+# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import trappy
+import numpy as np
+import argparse
+
+class RunData:
+    def __init__(self, pid, comm, time):
+        self.pid = pid
+        self.comm = comm
+        self.last_start_time = time
+        self.total_time = np.float64(0.0)
+        self.start_time = -1
+        self.end_time = -1
+        self.running = 1
+        self.maxrun = -1
+
+parser = argparse.ArgumentParser(description='Analyze runtimes')
+
+parser.add_argument('--trace', dest='trace_file', action='store', required=True,
+                    help='trace file')
+
+parser.add_argument('--normalize', dest='normalize', action='store_true', default=False,
+                    help='normalize time')
+
+parser.add_argument('--rows', dest='nrows', action='store', default=20, type=int,
+                    help='number of rows to print')
+
+parser.add_argument('--start-time', dest='start_time', action='store', default=0, type=float,
+                    help='trace window start time')
+
+parser.add_argument('--end-time', dest='end_time', action='store', default=None, type=float,
+                    help='trace window end time')
+
+args = parser.parse_args()
+
+path_to_html = args.trace_file
+nrows = args.nrows
+
+# Hash table for runtimes
+runpids = {}
+
+starttime = None
+endtime = None
+
+def switch_cb(data):
+    global starttime, endtime
+
+    prevpid = data['prev_pid']
+    nextpid = data['next_pid']
+    time = data['Index']
+
+    if not starttime:
+        starttime = time
+    endtime = time
+
+    if prevpid != 0:
+        # prev pid processing (switch out)
+        if runpids.has_key(prevpid):
+            rp = runpids[prevpid]
+            if rp.running == 1:
+                rp.running = 0
+                runtime = time - rp.last_start_time
+                if runtime > rp.maxrun:
+                    rp.maxrun = runtime
+                    rp.start_time = rp.last_start_time
+                    rp.end_time = time
+                rp.total_time += runtime
+
+            else:
+                print 'switch out seen while no switch in {}'.format(prevpid)
+        else:
+            print 'switch out seen while no switch in {}'.format(prevpid)
+
+    if nextpid == 0:
+        return
+
+    # nextpid processing (switch in)
+    if not runpids.has_key(nextpid):
+        # print 'creating data for nextpid {}'.format(nextpid)
+        rp = RunData(nextpid, data['next_comm'], time)
+        runpids[nextpid] = rp
+        return
+
+    rp = runpids[nextpid]
+    if rp.running == 1:
+        print 'switch in seen for already running task {}'.format(nextpid)
+        return
+
+    rp.running = 1
+    rp.last_start_time = time
+
+
+if args.normalize:
+    kwargs = { 'window': (args.start_time, args.end_time) }
+else:
+    kwargs = { 'abs_window': (args.start_time, args.end_time) }
+
+systrace_obj = trappy.SysTrace(name="systrace", path=path_to_html, \
+        scope="sched", events=["sched_switch"], normalize_time=args.normalize, **kwargs)
+
+ncpus = systrace_obj.sched_switch.data_frame["__cpu"].max() + 1
+print 'cpus found: {}\n'.format(ncpus)
+
+systrace_obj.apply_callbacks({ "sched_switch": switch_cb })
+
+## Print results
+testtime = (endtime - starttime) * ncpus  # scale trace duration by the number of CPUs
+print "total test time (scaled by number of CPUs): {} secs".format(testtime)
+
+# Print the results: PID, max run, start, end, total runtime, percent cpu (sorted by total runtime)
+result = sorted(runpids.items(), key=lambda x: x[1].total_time, reverse=True)
+print "\t".join([
+    "PID".ljust(10),
+    "name".ljust(15),
+    "max run (secs)".ljust(15),
+    "start time".ljust(15),
+    "end time".ljust(15),
+    "total runtime".ljust(15),
+    "percent cpu".ljust(15),
+    "totalpc"
+])
+
+totalpc = np.float64(0.0)
+for r in result[:nrows]:
+    rd = r[1] # RunData object
+    if rd.pid != r[0]:
+        raise RuntimeError("BUG: pid inconsistency found") # Sanity check
+    start = rd.start_time
+    end = rd.end_time
+    cpupc = (rd.total_time / testtime) * 100
+    totalpc += cpupc
+
+    print "\t".join([
+        str(r[0]).ljust(10),
+        str(rd.comm).ljust(15),
+        str(rd.maxrun).ljust(15)[:15],
+        str(start).ljust(15)[:15],
+        str(end).ljust(15)[:15],
+        str(rd.total_time).ljust(15),
+        str(cpupc),
+        str(totalpc)
+    ])
--
GitLab
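
For reference, a couple of example invocations (a sketch only: "trace.html" is a placeholder trace file name, and the flags correspond to the argparse options defined in the scripts above):

    ./runnable.py --trace trace.html --rt --total --rows 10
    ./runtime.py --trace trace.html --start-time 1.0 --end-time 5.0

Both scripts expect a trace that trappy.SysTrace can parse, and they are Python 2 scripts (print statements, dict.has_key), so run them with a Python 2 interpreter that has trappy and numpy installed. runnable.py prints the top --rows tasks sorted by worst-case wakeup-to-switch latency (or by total runnable time with --total); runtime.py prints the top --rows tasks sorted by total runtime, with each task's runtime also shown as a percentage of the available CPU time (trace duration times CPU count).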