You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

362 lines
10 KiB

#!/usr/bin/env python3
#
# (c) 2019-2020 Antmicro <www.antmicro.com>
# License: Apache
#
import signal
import os
import subprocess
import sys
import time
from datetime import datetime, timedelta
from select import select
from fcntl import fcntl, F_GETFL, F_SETFL
from socket import gethostname
from parse import search
# Minimum gnuplot version accepted by the start-up check below.
GNUPLOT_VERSION_EXPECTED = 5.0

# Termination flag: kill_handler() and the gathering loop set it to 1, and
# the gathering loop stops once it is non-zero.
# (The `gnuplot` process handle is another module-level name; it is assigned
# later, when the plotting process is spawned.)
die = 0
def kill_handler(a, b):
    """Signal handler that raises the module-level `die` flag.

    Both arguments (supplied by the `signal` module when the handler is
    invoked) are ignored.
    """
    global die
    die = 1
def merge_dicts(x, y):
    """Return a new dict holding the items of `x` overlaid with those of `y`.

    On duplicate keys the value from `y` wins.  Neither input is modified.
    """
    return {**x, **y}
def rename_key(d, old, new):
    """Move the value stored under `old` to the key `new`, in place.

    Raises KeyError if `old` is not present in `d`.
    """
    value = d.pop(old)
    d[new] = value
# Check if a process is running
def pid_running(pid):
    """Return True if an entry for `pid` exists under /proc."""
    proc_entry = "/proc/%d" % pid
    return os.path.exists(proc_entry)
# Run process, return subprocess object on success, exit script on fail
def run_process(*argv, **kwargs):
    """Spawn `argv` as a child process.

    The positional arguments form the command line; keyword arguments are
    forwarded unchanged to subprocess.Popen.

    Returns the Popen object.  If the program cannot be launched (missing
    executable, no permission, ...) an error is printed and the script
    exits with status 1.
    """
    try:
        return subprocess.Popen(argv, **kwargs)
    except OSError:
        # Only launch failures are reported as a missing tool.  Programming
        # errors (e.g. an invalid keyword argument) and KeyboardInterrupt
        # propagate instead of being mislabelled as "tool not found".
        print("Error: '%s' tool not found" % argv[0])
        sys.exit(1)
# Read a single table from sar output
def read_table(f):
    """Parse one whitespace-separated table from a binary stream.

    Leading blank lines are skipped.  The first non-blank line is the
    header; every following line up to the next blank line (or the end of
    the stream) is a data row.  The first header cell is replaced by
    'time'.

    Returns a dict mapping each column title to the list of its cell
    values (strings), in row order.

    Raises EOFError if the stream ends before a header line is found.
    """
    # Find the header
    while True:
        line = f.readline()
        if not line:
            # readline() returns b"" only at end of stream; without this
            # check the loop would spin forever once the producer exits.
            raise EOFError("stream ended before a table header was found")
        header = line.decode().split()
        if header:
            break

    # The first column is always just time
    header[0] = 'time'
    table = {title: [] for title in header}

    # Read rows
    while True:
        row = f.readline().decode().split()
        if not row:
            break
        # zip() stops at the shorter sequence, so a row with more cells
        # than the header has its surplus cells ignored instead of raising
        # IndexError.
        for title, value in zip(header, row):
            table[title].append(value)
    return table
# Run a command in a running gnuplot process
def g(command):
    """Send one command line to the gnuplot subprocess.

    `command` may be str or bytes and must not include the trailing
    newline.  It is echoed to stdout with a "gnuplot> " prefix, written to
    the stdin of the module-level `gnuplot` process and flushed.  After a
    "quit" command the call blocks until gnuplot has exited.

    If gnuplot is no longer running, an error is printed and nothing is
    sent.
    """
    if gnuplot.poll() is not None:
        print("Error: gnuplot not running!")
        return
    print ("gnuplot> %s" % command)
    payload = command if isinstance(command, bytes) else command.encode()
    # Exactly one newline terminates the command.
    gnuplot.stdin.write(payload + b"\n")
    gnuplot.stdin.flush()
    if payload == b"quit":
        # Give gnuplot time to finish writing its output before returning.
        while gnuplot.poll() is None:
            time.sleep(0.25)
# Check if the available gnuplot has a required version
p = run_process("gnuplot", "--version", stdout=subprocess.PIPE)
version = search("gnuplot {:f}", p.stdout.readline().decode())
# Drain whatever is left in the pipe and reap the child.
p.communicate()
if version is None:
    # search() returns None when the banner does not match the expected
    # pattern; report it instead of failing on `version[0]`.
    print("Error: 'gnuplot' tool returned unknown output!")
    sys.exit(1)
if version[0] < GNUPLOT_VERSION_EXPECTED:
    print("Error: Gnuplot version too low. Need at least %g found %g" % (GNUPLOT_VERSION_EXPECTED, version[0]))
    sys.exit(1)
# Plot output format: PNG through the pngcairo terminal by default, SVG when
# the SARGRAPH_OUTPUT_TYPE environment variable is set to "svg".
if os.environ.get("SARGRAPH_OUTPUT_TYPE") == "svg":
    OUTPUT_TYPE = "svg"
    OUTPUT_EXT = "svg"
else:
    OUTPUT_TYPE = "pngcairo"
    OUTPUT_EXT = "png"
# Make sure `sar` can be started; run_process() exits the script otherwise.
p = run_process("sar", "-V", stdout=subprocess.PIPE)

# If the script was run with parameters, handle them:
#   <script> <session> start          launch this script inside `screen`
#   <script> <session> stop           tell the session to finish and wait
#   <script> <session> label <text>   add a label to the running session
if len(sys.argv) > 1:
    # Check if screen provides expected output
    p = run_process("screen", "-v", stdout=subprocess.PIPE)
    version = search("Screen version {major:d}", p.stdout.readline().decode())
    if version is None:
        print("Error: 'screen' tool returned unknown output!")
        sys.exit(1)

    # Check if a command was provided
    if len(sys.argv) < 3:
        print("Error: command not provided.")
        sys.exit(1)

    # Get session name and command name
    sid = sys.argv[1]
    cmd = sys.argv[2]

    if cmd == "start":
        print("Starting sargraph session '%s'" % sid)
        # Re-run this very script, without arguments, inside a screen
        # session named after `sid`.
        p = subprocess.Popen(["screen", "-dmSL", sid, os.path.realpath(__file__)])
        p.wait()
        time.sleep(1)
        print("Session '%s' started" % sid)
    elif cmd == "stop":
        print("Terminating sargraph session '%s'" % sid)
        # Find the pid of the session in the `screen -ls` listing, whose
        # entries start with "<pid>.<session name>".  The listing is parsed
        # here rather than through a shell pipeline, so the session name is
        # never interpreted by a shell and is matched exactly.
        listing = subprocess.Popen(["screen", "-ls"], stdout=subprocess.PIPE).communicate()[0].decode()
        pids = []
        for line in listing.splitlines():
            fields = line.split()
            if not fields:
                continue
            pid, dot, name = fields[0].partition(".")
            if dot and name == sid and pid.isdigit():
                pids.append(int(pid))
        if len(pids) == 1:
            gpid = pids[0]
        else:
            # No match, or an ambiguous one: fall back to a fixed wait.
            print("Warning: cannot find pid.")
            gpid = -1
        # Typing "q" into the session makes the gathering loop finish.
        p = subprocess.Popen(["screen", "-S", sid, "-X", "stuff", "q\n"])
        p.wait()
        if gpid == -1:
            print("Waiting 3 seconds.")
            time.sleep(3)
        else:
            # Block until the session process has gone away.
            while pid_running(gpid):
                time.sleep(0.25)
    elif cmd == "label":
        # Check if the label name was provided
        if len(sys.argv) < 4:
            print("Error: label command requires an additional parameter")
            sys.exit(1)
        label = sys.argv[3]
        print("Adding label '%s' to sargraph session '%s'." % (label, sid))
        # The label text is typed into the session's stdin.  Note that the
        # gathering loop treats a line consisting of just "q" as the stop
        # request, not as a label.
        p = subprocess.Popen(["screen", "-S", sid, "-X", "stuff", "%s\n" % label])
        p.wait()
    else:
        print("Error: Unknown parameter '%s'" % cmd)
        sys.exit(1)
    sys.exit(0)
# If the script runs in a screen session, initialize the plot and gather data
gnuplot = run_process("gnuplot", stdin=subprocess.PIPE, stdout=subprocess.PIPE)

# Ask sar for ISO timestamps; the sample times are later parsed as %H:%M:%S.
my_env = os.environ
my_env["S_TIME_FORMAT"] = "ISO"

# Total RAM in GB.  It stays 0 when MemTotal cannot be parsed, in which case
# the gathering loop derives it from the first sar sample.
TOTAL_RAM = 0
with open("/proc/meminfo") as f:
    meminfo = search("MemTotal:{:s}{mem:d}", f.read())
if meminfo is not None:
    # Keep the fractional part: the value is reported with two decimals, so
    # truncating it to whole GB would under-report the installed memory.
    TOTAL_RAM = meminfo["mem"] / 1024.0 / 1024.0

# One CPU-utilisation table and one memory table every second.
p = run_process("sar", "-u","-r", "1", stdout=subprocess.PIPE, env=my_env)

print("%d" % os.getpid())

# The first line printed by sar describes the machine: the first two words
# are kept as `uname`, and the CPU count is read from the "(N CPU)" part.
machine = p.stdout.readline().decode()
uname = machine.split(" ")[0:2]
uname = "%s %s" % (uname[0], uname[1])
cpus = int(machine.split(" CPU)")[0].split("(")[-1])

# CPU model name, taken from the first "model name" entry in /proc/cpuinfo.
cpu_name = "unknown"
with open("/proc/cpuinfo") as f:
    for line in f:
        if "model name" in line:
            cpu_name = line.replace("\n", "").split(": ")[1]
            break

# Start a fresh data file with a header comment.
with open("data.txt", "w") as f:
    f.write("# pid: %d, machine: %s, cpu count: %d\n" % (os.getpid(), uname, cpus))

# Discard the line that follows the machine description (presumably blank).
p.stdout.readline()
# Static gnuplot configuration, sent in this exact order before any data is
# plotted.  `timefmt` and `key` are each set twice; the order is preserved.
setup_commands = (
    "set ylabel 'cpu % load (user)'",
    "set ylabel tc rgb 'white' font 'Courier-New,8'",
    "set datafile commentschars '#'",
    "set timefmt '%s'",
    "set xdata time",
    "set border lc rgb 'white'",
    "set key tc rgb 'white'",
    "set timefmt '%Y-%m-%d-%H:%M:%S'",
    "set xtics format '%H:%M:%S'",
    "set xtics font 'Courier-New,8' tc rgb 'white'",
    "set ytics font 'Courier-New,8' tc rgb 'white'",
    "set grid xtics ytics ls 12 lc rgb '#444444'",
    "set style fill solid",
    "set palette defined ( 0.2 '#00ff00', 0.8 '#ff0000' )",
    "set cbrange [0:100]",
    "unset colorbox",
    "unset key",
    "set rmargin 6",
    # The terminal type depends on the selected output format.
    "set terminal %s size 1200,800 background '#222222' font 'Courier-New,8'" % OUTPUT_TYPE,
)
for setup_command in setup_commands:
    g(setup_command)
# SIGTERM only raises the `die` flag, so the gathering loop can finish the
# current sample and the plot still gets written.
signal.signal(signal.SIGTERM, kill_handler)

# Running state of the gathering loop
i = 0                # number of samples read so far
AVERAGE_LOAD = 0.0   # sum of %user values; divided by `i` after the loop
MAX_USED_RAM = 0     # highest kbmemused value seen
START_DATE = ""      # "<date> <time>" of the first sample
END_DATE = ""        # "<date> <time>" of the latest sample
labels = []          # [timestamp, text] pairs read from stdin

# Switch stdin to non-blocking mode
flags = fcntl(sys.stdin, F_GETFL)
fcntl(sys.stdin, F_SETFL, flags | os.O_NONBLOCK)
# Gather data from sar output
# Streams polled on every round; stdin is removed once it reaches EOF.
watched = [p.stdout, sys.stdin]
while 1:
    rlist, _, _ = select(watched, [], [], 0.25)
    now = datetime.now()

    if sys.stdin in rlist:
        raw_line = sys.stdin.readline()
        if raw_line == "":
            # End of input.  A stream at EOF is reported as readable on
            # every select() call, so keeping it in the list would append
            # an empty label on each round, without end.
            watched.remove(sys.stdin)
        else:
            label_line = raw_line.replace("\n", "")
            # A lone "q" is the request to stop gathering.
            if label_line == "q":
                die = 1
                break
            # Any other line is a label, stamped with the current time.
            stamp = now.strftime("%Y-%m-%d-%H:%M:%S")
            labels.append([stamp, label_line])
            with open("data.txt", "a") as f:
                f.write("# %s label: %s\n" % (stamp, label_line))

    if p.stdout not in rlist:
        continue

    # sar rows carry only the time of day; the date comes from the clock.
    today = now.strftime("%Y-%m-%d")

    # Each sample is a CPU table followed by a memory table.
    cpu_data = read_table(p.stdout)
    if START_DATE == "":
        START_DATE = "%s %s" % (today, cpu_data['time'][0])
    cpu_data['time'][0] = today + "-" + cpu_data['time'][0]
    AVERAGE_LOAD += float(cpu_data["%user"][0])
    i = i + 1

    ram_data = read_table(p.stdout)
    END_DATE = today + " " + ram_data['time'][0]
    ram_data['time'][0] = today + "-" + ram_data['time'][0]

    # On the shared 'time' key the CPU table's value wins.
    values = merge_dicts(ram_data, cpu_data)

    # Fallback when the total could not be determined up front.
    if TOTAL_RAM == 0:
        TOTAL_RAM = (int(values['kbmemused'][0]) + int(values['kbmemfree'][0])) / 1024.0 / 1024.0

    used_kb = int(values['kbmemused'][0])
    if MAX_USED_RAM < used_kb:
        MAX_USED_RAM = used_kb

    with open("data.txt", "a") as f:
        f.write("%s %s %s\n" % (values["time"][0], values["%user"][0], values["%memused"][0]))

    if die:
        break
# Nothing was sampled: shut gnuplot down and leave without writing a plot.
if i == 0:
    g("quit")
    time.sleep(1)
    sys.exit(0)

g("set output 'plot.%s'" % OUTPUT_EXT)
g("set multiplot layout 2,1 title \"%s\"" % "\\n\\n\\n")

# Turn the running sums into the reported figures.
AVERAGE_LOAD = AVERAGE_LOAD / float(i)
MAX_USED_RAM = MAX_USED_RAM / 1024.0 / 1024.0

sdt = datetime.strptime(START_DATE, '%Y-%m-%d %H:%M:%S')
edt = datetime.strptime(END_DATE, '%Y-%m-%d %H:%M:%S')
delta_t = ((edt - sdt).total_seconds()) / 60.0

with open("data.txt", "a") as f:
    f.write("# total ram: %.2f GB, max ram used: %.2f GB, avarage load: %.2f %%, duration: %.2f minutes\n" % (TOTAL_RAM, MAX_USED_RAM, AVERAGE_LOAD, delta_t))

g("set title 'cpu load (avarage = %.2f %%)'" % AVERAGE_LOAD)
g("set title tc rgb 'white' font 'Courier-New,8'")

# Pad the x range by 1 % of the duration on each side; durations below 100
# seconds are treated as 100 seconds, so the padding is at least 1 second.
seconds_between = (edt - sdt).total_seconds()
if seconds_between < 100:
    seconds_between = 100
nsdt = sdt - timedelta(seconds = (seconds_between * 0.01))
nedt = edt + timedelta(seconds = (seconds_between * 0.01))
g("set xrange ['%s':'%s']" % (nsdt.strftime("%Y-%m-%d-%H:%M:%S"), nedt.strftime("%Y-%m-%d-%H:%M:%S")))

# Header lines.  The backslash before '@' is written as "\\@" so that gnuplot
# still receives "\@" without relying on an invalid Python escape sequence.
g("set label 101 at screen 0.02, screen 0.95 'Running on {/:Bold %s} \\@ {/:Bold %s}, {/:Bold %d} threads x {/:Bold %s}, total ram is {/:Bold %.2f GB}' tc rgb 'white'" % (gethostname(), uname, cpus, cpu_name, TOTAL_RAM))
g("set label 102 at screen 0.02, screen 0.93 'duration: {/:Bold %s} .. {/:Bold %s} (%.2f minutes)' tc rgb 'white'" % (START_DATE, END_DATE, delta_t))

# One numbered marker per label: a dashed vertical line, a numbered box near
# the top, a small square on the x axis and the label text (first 20 chars).
for number, label in enumerate(labels, 1):
    stamp = label[0]
    # Inside a single-quoted gnuplot string a quote is written by doubling
    # it; without this a label containing ' would break the command.
    caption = label[1][0:20].replace("'", "''")
    g("set arrow nohead from '%s', graph 0.01 to '%s', graph 0.87 front lc rgb 'red' dt 2" % (stamp, stamp))
    g("set object rect at '%s', graph 0.90 size char %d, char 1.5 fc rgb 'red'" % (stamp, len("%d" % number)+1))
    g("set object rect at '%s', graph 0.0 size char 0.5, char 0.5 front fc rgb 'red'" % stamp)
    g("set label at '%s', graph 0.90 '%d' center tc rgb 'black' font 'Courier-New,7'" % (stamp, number))
    g("set label at '%s', graph 0.95 '%s' center tc rgb 'white' font 'Courier-New,7'" % (stamp, caption))

# With labels present the y range is extended past 100 (presumably to leave
# room for the markers above the data).
if labels:
    g("set yrange [0:119]")
else:
    g("set yrange [0:100]")

g("set object rectangle from graph 0, graph 0 to graph 1, graph 1 behind fillcolor rgb '#111111' fillstyle solid noborder")
g("set object rectangle from '%s', 0 to '%s', 100 behind fillcolor rgb '#000000' fillstyle solid noborder" % (START_DATE.replace(" ", "-"), END_DATE.replace(" ", "-")))

# Upper plot: cpu load (data column 2); lower plot: ram usage (column 3).
g("plot 'data.txt' using 1:2:2 title 'cpu' with boxes palette")
g("set ylabel 'ram % usage'")
g("set title 'ram usage (max = %.2f GB)'" % MAX_USED_RAM)
g("plot 'data.txt' using 1:3:3 title 'ram' with boxes palette")
g("unset multiplot")
g("unset output")
g("quit")