123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139 |
- #!/usr/bin/env python3
- # coding=utf-8
- #
- # StarPU --- Runtime system for heterogeneous multicore architectures.
- #
- # Copyright (C) 2019-2021 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
- #
- # StarPU is free software; you can redistribute it and/or modify
- # it under the terms of the GNU Lesser General Public License as published by
- # the Free Software Foundation; either version 2.1 of the License, or (at
- # your option) any later version.
- #
- # StarPU is distributed in the hope that it will be useful, but
- # WITHOUT ANY WARRANTY; without even the implied warranty of
- # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- #
- # See the GNU Lesser General Public License in COPYING.LGPL for more details.
- #
- import sys
- PROGNAME = sys.argv[0]
- def usage():
- print("Offline tool to draw graph showing elapsed time between sent or received data and their use by tasks")
- print("")
- print("Usage: %s <folder containing comms.rec and tasks.rec files>" % PROGNAME)
- if len(sys.argv) != 2:
- usage()
- sys.exit(1)
- import re
- import numpy as np
- import matplotlib.pyplot as plt
- from matplotlib.gridspec import GridSpec
- import os
- def convert_rec_file(filename):
- lines = []
- item = dict()
- with open(filename, "r") as f:
- for l in f.readlines():
- if l == "\n":
- lines.append(item)
- item = dict()
- else:
- ls = l.split(":")
- key = ls[0].lower()
- value = ls[1].strip()
- if key in item:
- print("Warning: duplicated key '" + key + "'")
- else:
- if re.match('^\d+$', value) != None:
- item[key] = int(value)
- elif re.match("^\d+\.\d+$", value) != None:
- item[key] = float(value)
- else:
- item[key] = value
- return lines
- working_directory = sys.argv[1]
- comms = convert_rec_file(os.path.join(working_directory, "comms.rec"))
- tasks = [t for t in convert_rec_file(os.path.join(working_directory, "tasks.rec")) if "control" not in t and "starttime" in t]
- if len(tasks) == 0:
- print("There is no task using data after communication.")
- sys.exit(0)
- def plot_graph(comm_time_key, match, filename, title, xlabel):
- delays = []
- workers = dict()
- nb = 0
- durations = []
- min_time = 0.
- max_time = 0.
- for c in comms:
- t_matched = None
- for t in tasks:
- if match(t, c):
- t_matched = t
- break
- if t_matched is not None:
- worker = str(t_matched['mpirank']) + "-" + str(t_matched['workerid'])
- if worker not in workers:
- workers[worker] = []
- eps = t["starttime"] - c[comm_time_key]
- assert eps > 0
- durations.append(eps)
- workers[worker].append((c[comm_time_key], eps))
- if min_time == 0 or c[comm_time_key] < min_time:
- min_time = c[comm_time_key]
- if max_time == 0 or c[comm_time_key] > max_time:
- max_time = c[comm_time_key]
- nb += 1
- fig = plt.figure(constrained_layout=True)
- gs = GridSpec(2, 2, figure=fig)
- axs = [fig.add_subplot(gs[0, :-1]), fig.add_subplot(gs[1, :-1]), fig.add_subplot(gs[0:, -1])]
- i = 0
- for y, x in workers.items():
- # print(y, x)
- axs[0].broken_barh(x, [i*10, 8], facecolors=(0.1, 0.2, 0.5, 0.2))
- i += 1
- i = 0
- for y, x in workers.items():
- for xx in x:
- axs[1].broken_barh([xx], [i, 1])
- i += 1
- axs[0].set_yticks([i*10+4 for i in range(len(workers))])
- axs[0].set_yticklabels(list(workers))
- axs[0].set(xlabel="Time (ms) - Duration: " + str(max_time - min_time) + "ms", ylabel="Worker [mpi]-[*pu]", title=title)
- if len(durations) != 0:
- axs[2].hist(durations, bins=np.logspace(np.log10(1), np.log10(max(durations)), 50), rwidth=0.8)
- axs[2].set_xscale("log")
- axs[2].set(xlabel=xlabel, ylabel="Number of occurences", title="Histogramm")
- fig.set_size_inches(15, 9)
- plt.savefig(os.path.join(working_directory, filename), dpi=100)
- plt.show()
- plot_graph("recvtime", lambda t, c: (t["mpirank"] == c["dst"] and t["starttime"] >= c["recvtime"] and str(c["recvhandle"]) in t["handles"]), "recv_use.png", "Elapsed time between recv and use (ms)", "Time between data reception and its use by a task")
- plot_graph("sendtime", lambda t, c: (t["mpirank"] == c["src"] and t["starttime"] >= c["sendtime"] and str(c["sendhandle"]) in t["handles"]), "send_use.png", "Elapsed time between send and use (ms)", "Time between data sending and its use by a task")
|