Compare commits

..

No commits in common. "master" and "r3.01.08" have entirely different histories.

20 changed files with 121 additions and 645 deletions

90
app.py
View File

@ -5,9 +5,7 @@ import logging
import logging.config import logging.config
import os import os
from collections import defaultdict from flask import (Flask, request, jsonify, abort, render_template)
from flask import (Flask, request, jsonify, abort, render_template, url_for)
from ltsdb_json import LTS from ltsdb_json import LTS
from dashboard import Dashboard from dashboard import Dashboard
@ -99,9 +97,8 @@ def verify_node(d):
if "/" in node: if "/" in node:
raise ValueError("invalid node name %s", node) raise ValueError("invalid node name %s", node)
try: try:
fn = "config/" + node log.info("getting client config from %s", "config/" + node)
log.info("getting client config from %s", fn) with open("config/" + node) as fh:
with open(fn) as fh:
node_conf = json.load(fh) node_conf = json.load(fh)
except Exception as e: except Exception as e:
log.warning("got %s opening %s", e, "config/" + node) log.warning("got %s opening %s", e, "config/" + node)
@ -115,19 +112,8 @@ def verify_node(d):
if timestamp > node_conf["last"]: if timestamp > node_conf["last"]:
node_conf["last"] = timestamp node_conf["last"] = timestamp
os.replace("config/" + node, "config/" + node + ".old") os.replace("config/" + node, "config/" + node + ".old")
tmpfn = fn + "." + str(os.getpid()) with open("config/" + node, "w") as fh:
oldfn = fn + ".old"
with open(tmpfn, "w") as fh:
json.dump(node_conf, fh) # XXX json.dump(node_conf, fh) # XXX
try:
os.unlink(oldfn)
except FileNotFoundError:
pass
try:
os.link(fn, oldfn)
except FileNotFoundError:
pass
os.rename(tmpfn, fn)
return node return node
else: else:
abort(409, "timestamp out of sync") abort(409, "timestamp out of sync")
@ -154,71 +140,3 @@ def dashboard_index():
def dashboard_file(dashboard): def dashboard_file(dashboard):
d = Dashboard("dashboards/" + dashboard + ".json") d = Dashboard("dashboards/" + dashboard + ".json")
return d.as_html() return d.as_html()
@app.get("/nav")
def nav():
# Start with a list of all dimensions, the number of matching time series
# and a truncated list of series.
# If a dimension is chosen, display a choice of members
# choosing one or more members goes back to the list of
# (remaining) dimensions
with open("data/.index") as fh:
fcntl.flock(fh, fcntl.LOCK_SH)
index = json.load(fh)
timeseries = None
for k, v in request.args.lists():
if k[0] == ".":
continue
log.debug("search: %s -> %s", k, v)
if timeseries is None:
timeseries = set()
log.debug("search: %s: %s", k, index[k])
for m in v:
timeseries |= set(index[k][m])
else:
filter = set()
for m in v:
filter |= set(index[k][m])
timeseries &= filter
if timeseries is None:
timeseries = set()
for mc in index.values():
for tsl in mc.values():
timeseries |= set(tsl)
if d := request.args.get(".m"):
members = []
for m, tsl in index[d].items():
if set(tsl) & timeseries:
members.append(m)
return render_template("nav_member_select.html", dimension=d, members=members)
else:
params = request.args.to_dict(flat=False)
matching_dimensions = defaultdict(int)
for d, mc in index.items():
if d in params:
continue
for m, tsl in mc.items():
mtsl = set(tsl) & timeseries
if mtsl:
matching_dimensions[d] += len(mtsl)
matching_dimensions_list = []
for d in matching_dimensions:
params[".m"] = d
url = url_for("nav", **params)
app.logger.debug(f"{d=} {url=}")
matching_dimensions_list.append(
{"name": d, "count": matching_dimensions[d], "url": url}
)
total_timeseries = len(timeseries)
timeseries = [LTS(id=ts) for ts in list(timeseries)[:100]]
return render_template(
"nav_dimension_list.html",
matching_dimensions=matching_dimensions_list,
timeseries=timeseries, total_timeseries=total_timeseries)
#

View File

@ -1,44 +0,0 @@
#!/usr/bin/python3
import re
import subprocess
import time
import ltsdb_record
p = subprocess.run(["/usr/bin/lsb_release", "-ir"],
stdout=subprocess.PIPE, universal_newlines=True)
for ln in p.stdout.split("\n")[:-1]:
m = re.match(r"(.*?)\s*:\s+(.*)", ln)
if m:
if m.group(1) == "Distributor ID":
distributor = m.group(2).lower()
elif m.group(1) == "Release":
release = m.group(2)
if distributor == "ubuntu":
# special rule for ubuntu. The format is year.month, so we convert the
# months into fractional years
m = re.match(r"(\d+)\.(\d+)", release)
release = int(m.group(1)) + (int(m.group(2)) - 1) / 12
else:
# for everybody else we assume its a fp number
release = float(release)
report0 = []
report0.append({ "measure": "os_version_" + distributor, "unit": "version", "value": release})
now = time.time()
report = [
{
"description": {
"hostname": ltsdb_record.node,
"measure": r["measure"],
"unit": r["unit"]
},
"data": [
[now, r["value"]]
]
}
for r in report0
]
success = ltsdb_record.record_observations(report)
exit(1 - success)

View File

@ -1,60 +0,0 @@
#!/usr/bin/python3
import time
import re
import psycopg2
import psycopg2.extras
import ltsdb_record
db = psycopg2.connect() # We only get useful results if we are postgres, but for testing we can be any user
csr = db.cursor(cursor_factory=psycopg2.extras.NamedTupleCursor)
csr.execute(
"""
select datname, count(*)
from pg_stat_activity
where backend_type = 'client backend' group by datname order by datname
""")
total = 0
now = time.time()
report0 = []
for r in csr:
report0.append(
{
"measure": "connections",
"database": r.datname,
"unit": "connections",
"value": r.count
}
)
total += r.count
report0.append(
{
"measure": "connections",
"database": "ALL",
"unit": "connections",
"value": total
}
)
report = [
{
"description": {
"hostname": ltsdb_record.node,
"measure": r["measure"],
"database": r["database"],
"unit": r["unit"]
},
"data": [
[now, r["value"]]
]
}
for r in report0
]
success = ltsdb_record.record_observations(report)
exit(1 - success)

View File

@ -1,36 +0,0 @@
#!/usr/bin/python3
import re
import subprocess
import time
import ltsdb_record
p = subprocess.run(["psql", "-c", "select version()", "-A", "-t", "-X", "-q",],
stdout=subprocess.PIPE, universal_newlines=True)
# This works only for PostgreSQL 10.x and above. I don't expect to encounter
# older versions any more.
m = re.match(r"^PostgreSQL (\d+).(\d+) ", p.stdout)
if m:
version = int(m.group(1)) + int(m.group(2)) / 100
report0 = []
report0.append({ "measure": "postgresql_version", "unit": "version", "value":
version})
now = time.time()
report = [
{
"description": {
"hostname": ltsdb_record.node,
"measure": r["measure"],
"unit": r["unit"]
},
"data": [
[now, r["value"]]
]
}
for r in report0
]
success = ltsdb_record.record_observations(report)
exit(1 - success)

View File

@ -1,43 +0,0 @@
#!/usr/bin/python3
import time
import glob
import os.path
import ltsdb_record
now = time.time()
with open("/proc/uptime") as fh:
ln = fh.readline()
uptime = float(ln.split()[0])
last_reboot = now - uptime
last_mtime = 0
for p in glob.glob("/boot/**/*", recursive=True):
mtime = os.path.getmtime(p)
if mtime > last_mtime:
last_mtime = mtime
if last_mtime > last_reboot:
overdue = now - last_mtime
else:
overdue = 0
report0 = []
report0.append({ "measure": "reboot_overdue", "unit": "s", "value": overdue})
report = [
{
"description": {
"hostname": ltsdb_record.node,
"measure": r["measure"],
"unit": r["unit"]
},
"data": [
[now, r["value"]]
]
}
for r in report0
]
success = ltsdb_record.record_observations(report)
exit(1 - success)

View File

@ -1,78 +0,0 @@
#!/usr/bin/python3
import argparse
import re
import subprocess
import time
import ltsdb_record
ap = argparse.ArgumentParser()
ap.add_argument("device")
args = ap.parse_args()
p = subprocess.run(["/usr/sbin/smartctl", "-A", args.device],
stdout=subprocess.PIPE, universal_newlines=True)
report0 = []
state = 0
for ln in p.stdout.splitlines():
if state == 0 and ln.startswith("ID# ATTRIBUTE_NAME"):
state = 1
elif state == 1 and ln == "":
state = 2
elif state == 1:
(id, attribute_name, flag, value, worst, thresh, type, updated, when_failed, raw_value) = ln.split(None, 9)
if attribute_name == "Command_Timeout":
# This is a tuple of three values and I don't know what they mean
# so I just skip them.
# I guess I could just record them as smart_command_timeout_1,
# smart_command_timeout_2 and smart_command_timeout_3 ...
continue
if "_Ct" in attribute_name or "_Count" in attribute_name or "_Cnt" in attribute_name:
unit = "count"
elif "_Hours" in attribute_name:
unit = "hours"
elif "Total_LBAs_Written" in attribute_name:
unit = "blocks"
elif "Temperature_Cel" in attribute_name:
unit = "°C"
else:
unit = "unknown"
if unit == "°C":
# Sometimes there is extra information included - just ignore that.
value = int(raw_value.split()[0])
elif unit == "hours":
if m := re.match(r"([0-9]+)h\+([0-9]+)m\+([0-9.]+)s", raw_value):
# e.g. 60633h+54m+11.557s
value = (int(m.group(1)) * 3600 + int(m.group(2)) * 60 + float(m.group(2))) / 3600
else:
value = int(raw_value)
else:
value = int(raw_value)
report0.append(
{
"measure": "smart_" + attribute_name.lower(),
"unit": unit,
"value": value,
})
now = time.time()
report = [
{
"description": {
"hostname": ltsdb_record.node,
"device": args.device,
"measure": r["measure"],
"unit": r["unit"],
},
"data": [
[now, r["value"]]
]
}
for r in report0
]
success = ltsdb_record.record_observations(report)
exit(1 - success)

View File

@ -1,11 +1,14 @@
#!/usr/bin/python3 #!/usr/bin/python3
import argparse import argparse
import hmac
import json
import os
import socket import socket
import ssl import ssl
import time import time
import ltsdb_record import requests
ap = argparse.ArgumentParser() ap = argparse.ArgumentParser()
ap.add_argument("--verbose", action="store_true") ap.add_argument("--verbose", action="store_true")
@ -13,20 +16,23 @@ ap.add_argument("hostname")
ap.add_argument("port", type=int, default=443, nargs="?") ap.add_argument("port", type=int, default=443, nargs="?")
args = ap.parse_args() args = ap.parse_args()
# It's a bit weird that this works.
myhostname = socket.gethostbyaddr(socket.gethostname())[0]
now = time.time() now = time.time()
report0 = [] report0 = []
try: with socket.create_connection((args.hostname, args.port)) as sock:
with socket.create_connection((args.hostname, args.port)) as sock:
context = ssl.create_default_context() context = ssl.create_default_context()
try:
with context.wrap_socket(sock, server_hostname=args.hostname) as ssock: with context.wrap_socket(sock, server_hostname=args.hostname) as ssock:
cert = ssock.getpeercert() cert = ssock.getpeercert()
not_after = ssl.cert_time_to_seconds(cert["notAfter"]) not_after = ssl.cert_time_to_seconds(cert["notAfter"])
delta = not_after - now delta = not_after - now
except (ssl.SSLCertVerificationError, ConnectionRefusedError) as e: except ssl.SSLCertVerificationError as e:
print("got error %s; setting delta to 0" % e) print("got error %s; setting delta to 0", e)
delta = 0 delta = 0
report0.append({ "measure": "tls_cert_ttl", "unit": "s", "value": delta }) report0.append({ "measure": "tls_cert_ttl", "unit": "s", "value": delta })
report = [ report = [
{ {
@ -43,5 +49,32 @@ report = [
for r in report0 for r in report0
] ]
success = ltsdb_record.record_observations(report) for dir in (".", os.environ["HOME"] + "/.config/ltsdb", "/etc/ltsdb"):
exit(1 - success) try:
with open(dir + "/config.json") as fh:
client_config = json.load(fh)
baseurl = client_config["server"]
break
except FileNotFoundError:
pass
while True:
for r in report:
node = myhostname
timestamp = time.time()
msg = (node + " " + str(timestamp)).encode("UTF-8")
digest = hmac.new(client_config["key"].encode("UTF-8"), msg, "SHA256").hexdigest()
r["auth"] = {
"node": node,
"timestamp": timestamp,
"hmac": digest,
}
#pprint.pp(report)
r = requests.post(baseurl + "report", json=report)
print(r)
if r.status_code == 200:
exit(0)
elif r.status_code == 409:
time.sleep(0.5 + random.random())
continue
else:
exit(1)

View File

@ -27,15 +27,11 @@ class Dashboard:
if w.get("multi"): if w.get("multi"):
ts_list = LTS.find(w["data"][0]) ts_list = LTS.find(w["data"][0])
for ts in ts_list: for ts in ts_list:
try:
tso = LTS(id=ts) tso = LTS(id=ts)
except json.decoder.JSONDecodeError as e:
log.error("%s contains bad data: %s: Skipping", ts, e)
continue
if not tso.data: if not tso.data:
log.warning("%s has no data: Skipping", tso.id) log.warning("%s has no data: Skipping", tso.id)
continue continue
if tso.data[-1][0] < time.time() - 7 * 86400: if tso.data[-1][0] < time.time() - 86400:
log.info("%s too old; Skipping", tso.id) log.info("%s too old; Skipping", tso.id)
continue continue
w1 = {**w, "data": [ts]} w1 = {**w, "data": [ts]}
@ -60,10 +56,6 @@ class Dashboard:
else: else:
self.widgets.append(Widget(w)) self.widgets.append(Widget(w))
# Sort widgets by ascending healthscore to get the most critical at the
# top.
self.widgets.sort(key=lambda w: w.healthscore())
def as_html(self): def as_html(self):
return render_template("dashboard.html", dashboard=self) return render_template("dashboard.html", dashboard=self)
@ -78,40 +70,65 @@ class Widget:
self.extra = {} self.extra = {}
log.debug("data = %s", d["data"]) log.debug("data = %s", d["data"])
self.lts = LTS(id=d["data"][0]) # by default we handle only one data source self.lts = LTS(id=d["data"][0]) # by default we handle only one data source
self.lastvalue = self.lts.data[-1][1] pass
def as_html(self): def as_html(self):
log.debug("") log.debug("")
self.lastvalue = self.lts.data[-1][1]
return Markup(render_template("widget.html", widget=self)) return Markup(render_template("widget.html", widget=self))
def healthscore(self, value=None): def criticalcolor(self, value=None):
"""
Return a score between 0 (unhealthy) and 100 (healthy)
"""
if value == None: if value == None:
value = self.lastvalue value = self.lastvalue
log.debug("stops = %s", self.stops) log.debug("stops = %s", self.stops)
stops = self.stops
if stops[-1] < stops[0]:
value = -value
stops = [-v for v in stops]
if value <= stops[0]:
log.debug("ok")
return 100
if value >= stops[-1]:
log.debug("fail")
return 0
for i in range(0, len(stops) - 1):
if stops[i] <= value < stops[i+1]:
log.debug("at stop %d", i)
return 100 - ((value - stops[i]) / (stops[i+1] - stops[i]) + i) * 100 / (len(stops) - 1)
def criticalcolor(self, value=None):
healthscore = self.healthscore(value)
hue = round(healthscore * 120 / 100)
brightness = 30 brightness = 30
if self.stops[0] < self.stops[2]:
if value < self.stops[0]:
log.debug("definitely ok")
return f"hsl(120, 100%, {brightness}%)"
elif value < self.stops[1]:
log.debug("mostly ok")
hue = 120 - round(
(value - self.stops[0])
/ (self.stops[1] - self.stops[0])
* 60
)
return f"hsl({hue}, 100%, {brightness}%)" return f"hsl({hue}, 100%, {brightness}%)"
elif value < self.stops[2]:
log.debug("maybe fail")
hue = 60 - round(
(value - self.stops[1])
/ (self.stops[2] - self.stops[1])
* 60
)
return f"hsl({hue}, 100%, {brightness}%)"
else:
log.debug("definitely fail")
return f"hsl(0, 100%, {brightness}%)"
else:
log.debug("the other side")
if value > self.stops[0]:
log.debug("definitely ok")
return f"hsl(120, 100%, {brightness}%)"
elif value > self.stops[1]:
log.debug("mostly ok")
hue = 120 - round(
(value - self.stops[0])
/ (self.stops[1] - self.stops[0])
* 60
)
return f"hsl({hue}, 100%, {brightness}%)"
elif value > self.stops[2]:
log.debug("maybe fail")
hue = 60 - round(
(value - self.stops[1])
/ (self.stops[2] - self.stops[1])
* 60
)
return f"hsl({hue}, 100%, {brightness}%)"
else:
log.debug("definitely fail")
return f"hsl(0, 100%, {brightness}%)"
@property @property
def description_formatted(self): def description_formatted(self):
@ -143,13 +160,9 @@ class TimeSeries(Widget):
def v2y(v): def v2y(v):
if self.yscale == "log": if self.yscale == "log":
try: return (1 - math.log(v / min_value)
return (1 - math.log(max(v, min_value) / min_value)
/ math.log(max_value / min_value) / math.log(max_value / min_value)
) * 200 ) * 200
except ValueError:
log.error(f"ValueError: v = {v}, min_value = {min_value}, max_value = {max_value}")
return 0
elif self.yscale == "linear": elif self.yscale == "linear":
return (1 - v/max_value) * 200 return (1 - v/max_value) * 200
else: else:
@ -166,12 +179,11 @@ class TimeSeries(Widget):
min_step = 25 min_step = 25
steps = ("s", "m", "h", "D", "10D", "M", "Y") steps = ("s", "m", "h", "D", "10D", "M", "Y")
step_i = 0 step_i = 0
while step_i < len(steps): while True:
t0 = tickmarks[-1]["t"] t0 = tickmarks[-1]["t"]
x0 = tickmarks[-1]["x"] x0 = tickmarks[-1]["x"]
d0 = datetime.datetime.fromtimestamp(t0) d0 = datetime.datetime.fromtimestamp(t0)
log.debug("step_i = %s", step_i)
if steps[step_i] == "s": if steps[step_i] == "s":
d1 = datetime.datetime(d0.year, d0.month, d0.day, d0.hour, d0.minute, d0.second) d1 = datetime.datetime(d0.year, d0.month, d0.day, d0.hour, d0.minute, d0.second)
t1 = d1.timestamp() t1 = d1.timestamp()
@ -283,7 +295,6 @@ class TimeSeries(Widget):
t1 = d1.timestamp() t1 = d1.timestamp()
x1 = t2x(t1) x1 = t2x(t1)
if x0 - x1 < min_step: if x0 - x1 < min_step:
log.debug("t0 = %s, x0 = %s, t1 = %s, x1 = %s", t0, x0, t1, x1)
step_i += 1 step_i += 1
continue continue
if x1 < 0: if x1 < 0:
@ -304,11 +315,7 @@ class TimeSeries(Widget):
if self.yscale == "linear": if self.yscale == "linear":
log.debug("") log.debug("")
if unit == "s" and max_value > 3600: if unit == "s" and max_value > 3600:
if max_value >= 16 * 7 * 86400: if max_value >= 4 * 7 * 86400:
step = 4 * 7 * 86400
step_d = 4
unit = "w"
elif max_value >= 4 * 7 * 86400:
step = 7 * 86400 step = 7 * 86400
step_d = 1 step_d = 1
unit = "w" unit = "w"
@ -380,7 +387,7 @@ class TimeSeries(Widget):
log.debug("") log.debug("")
log.debug("in graph for %s", self.lts.id) log.debug("in graph")
data = self.lts.data data = self.lts.data
n = len(data) n = len(data)
t_last = data[-1][0] t_last = data[-1][0]
@ -388,17 +395,12 @@ class TimeSeries(Widget):
return "(not enough data)" return "(not enough data)"
dt = (t_last - data[-5][0]) / 4 dt = (t_last - data[-5][0]) / 4
k = math.log((t_last - data[0][0]) / dt / n + 1) k = math.log((t_last - data[0][0]) / dt / n + 1)
log.debug("times = [%s ... %s ... %s]", data[0][0], data[-5][0], data[-1][0])
max_value = max([d[3] if len(d) >= 4 else d[1] for d in self.lts.data]) max_value = max([d[1] for d in self.lts.data])
max_value = max(max_value, 0.001) # ensure positive max_value = max(max_value, 0.001) # ensure positive
unit = self.lts.description["unit"]
if self.yscale == "log": if self.yscale == "log":
try: try:
min_value = min(d[1] for d in self.lts.data if d[1] > 0) min_value = min(d[1] for d in self.lts.data if d[1] > 0)
if unit == "s":
self.extra["min"] = "%g" % min_value + " (" + self.format_time(min_value) + ")"
else:
self.extra["min"] = "%g" % min_value self.extra["min"] = "%g" % min_value
except ValueError: except ValueError:
# no non-negative values # no non-negative values
@ -413,10 +415,6 @@ class TimeSeries(Widget):
# Make sure min_value is less than max_value # Make sure min_value is less than max_value
min_value /= 2 min_value /= 2
log.debug("min_value = %s, max_value = %s", min_value, max_value) log.debug("min_value = %s, max_value = %s", min_value, max_value)
if unit == "s":
self.extra["max"] = "%g" % max_value + " (" + self.format_time(max_value) + ")"
self.extra["last"] = "%g" % data[-1][1] + " (" + self.format_time(data[-1][1]) + ")"
else:
self.extra["max"] = "%g" % max_value self.extra["max"] = "%g" % max_value
self.extra["last"] = "%g" % data[-1][1] self.extra["last"] = "%g" % data[-1][1]
log.debug("collecting data") log.debug("collecting data")
@ -424,17 +422,9 @@ class TimeSeries(Widget):
for i in range(n): for i in range(n):
t = data[i][0] t = data[i][0]
v = data[i][1] v = data[i][1]
if len(data[i]) >= 4:
v_min = data[i][2]
v_max = data[i][3]
else:
v_min = data[i][1]
v_max = data[i][1]
x = t2x(t) x = t2x(t)
t_h = time.strftime("%Y-%m-%d %H:%M:%S", time.localtime(t)) t_h = time.strftime("%Y-%m-%d %H:%M:%S", time.localtime(t))
y = v2y(v) y = v2y(v)
y_min = v2y(v_min)
y_max = v2y(v_max)
#print(t, t_h, x) #print(t, t_h, x)
v_data.append( v_data.append(
{ {
@ -442,8 +432,6 @@ class TimeSeries(Widget):
"v": v, "v": v,
"x": x, "x": x,
"y": y, "y": y,
"y_min": y_min,
"y_max": y_max,
"color": self.criticalcolor(v), "color": self.criticalcolor(v),
}) })
@ -462,8 +450,7 @@ class TimeSeries(Widget):
html += f"<line x1=0 y1={tm['y']} x2=1000 y2={tm['y']} stroke='#CCC' />" html += f"<line x1=0 y1={tm['y']} x2=1000 y2={tm['y']} stroke='#CCC' />"
html += f"<text x=1005 y={tm['y']} fill='#888'>{tm['v_h']}</text>" html += f"<text x=1005 y={tm['y']} fill='#888'>{tm['v_h']}</text>"
for v in v_data: for v in v_data:
html += f"<line x1={v['x']-3} x2={v['x']+3} y1={v['y']} y2={v['y']} stroke='{v['color']}' />" html += f"<circle cx={v['x']} cy={v['y']} r=3 fill='{v['color']}' />"
html += f"<line x1={v['x']} x2={v['x']} y1={v['y_min']} y2={v['y_max']} stroke='{v['color']}' />"
html += "</svg>" html += "</svg>"
log.debug("len(html) = %s", len(html)) log.debug("len(html) = %s", len(html))
return Markup(html) return Markup(html)
@ -472,29 +459,6 @@ class TimeSeries(Widget):
log.debug("in as_html") log.debug("in as_html")
return Markup(render_template("timeseries.html", widget=self)) return Markup(render_template("timeseries.html", widget=self))
def format_time(self, seconds):
value = seconds
unit = "s"
if value >= 365.25 * 86400:
value /= 365.25 * 86400
unit = "years"
elif value >= 86400:
value /= 86400
unit = "days"
elif value >= 3600:
value /= 3600
unit = "h"
elif value >= 60:
value /= 60
unit = "m"
elif value >= 1:
pass
elif value >= 0.001:
value *= 1000
unit = "ms"
return f"{value:.2f} {unit}"
class Gauge(Widget): class Gauge(Widget):
def __init__(self, d): def __init__(self, d):
super().__init__(d) super().__init__(d)
@ -536,4 +500,3 @@ class Gauge(Widget):
self.lastvalue_formatted = Markup(f"<span class='value'>{value:.2f}</span><span class='unit'>{unit}</unit>") self.lastvalue_formatted = Markup(f"<span class='value'>{value:.2f}</span><span class='unit'>{unit}</unit>")
return Markup(render_template("gauge.html", widget=self)) return Markup(render_template("gauge.html", widget=self))
# vim: sw=4

View File

@ -41,11 +41,7 @@ class LTS:
with open(self.filename, "x+") as fh: with open(self.filename, "x+") as fh:
fcntl.flock(fh, fcntl.LOCK_EX) fcntl.flock(fh, fcntl.LOCK_EX)
json.dump({"description": self.description, "data": self.data}, fh) json.dump({"description": self.description, "data": self.data}, fh)
log.info(f"Created {self.filename}")
self.rebuild_index() self.rebuild_index()
except json.decoder.JSONDecodeError as e:
log.exception(f"Cannot decode JSON in {self.filename}: {e}")
raise
def pop(self, i): def pop(self, i):
# Pop the element at index i and adjust the min/max values of the # Pop the element at index i and adjust the min/max values of the
@ -131,11 +127,7 @@ class LTS:
(_, _, hash) = fn.rpartition("/") (_, _, hash) = fn.rpartition("/")
with open(fn, "r") as fh: with open(fn, "r") as fh:
fcntl.flock(fh, fcntl.LOCK_SH) fcntl.flock(fh, fcntl.LOCK_SH)
try:
d = json.load(fh) d = json.load(fh)
except json.decoder.JSONDecodeError as e:
log.exception(f"Cannot decode JSON in {fn}: {e}")
raise
for k, v in d["description"].items(): for k, v in d["description"].items():
d1 = index.setdefault(k, {}) d1 = index.setdefault(k, {})
d2 = d1.setdefault(v, []) d2 = d1.setdefault(v, [])

View File

@ -1,22 +1,20 @@
#!/usr/bin/python3 #!/usr/bin/python3
import time
import random
from ltsdb_json import LTS from ltsdb_json import LTS
ts1 = LTS({"hostname": "rorschach.hjp.at", "measure": "uptime"}) ts1 = LTS({"hostname": "rorschach.hjp.at", "measure": "uptime"})
ts1.add(time.time(), 4 + random.random()) ts1.add(1661026122, 4)
ts1.save() ts1.save()
ts1 = LTS({"hostname": "rorschach.hjp.at", "website": "i12e.hjp.at", "measure": "rtt"}) ts1 = LTS({"hostname": "rorschach.hjp.at", "website": "i12e.hjp.at", "measure": "rtt"})
ts1.add(time.time(), 0.06) ts1.add(1661026122, 0.06)
ts1.save() ts1.save()
ts1 = LTS({"hostname": "rorschach.hjp.at", "measure": "uptime"}) ts1 = LTS({"hostname": "rorschach.hjp.at", "measure": "uptime"})
ts1.add(time.time() + 240, 5 + random.random()) ts1.add(1661026361, 5)
ts1.save() ts1.save()
ts1 = LTS({"hostname": "charly.wsr.ac.at", "website": "www.wifo.ac.at", "measure": "rtt"}) ts1 = LTS({"hostname": "charly.wsr.ac.at", "website": "www.wifo.ac.at", "measure": "rtt"})
ts1.add(time.time(), 0.347) ts1.add(1661026122, 0.347)
ts1.save() ts1.save()

View File

@ -2,10 +2,8 @@
import logging import logging
import logging.config import logging.config
import math
import os import os
import socket import socket
import statistics
import time import time
from ltsdb_json import LTS from ltsdb_json import LTS
@ -46,37 +44,13 @@ class DiskFullPredictor:
current_used_bytes = lts.data[-1][1] current_used_bytes = lts.data[-1][1]
current_usable_bytes = usable_lts.data[-1][1] current_usable_bytes = usable_lts.data[-1][1]
tuf = 1E9 tuf = 1E9
for i in reversed(range(len(lts.data))): for d in reversed(lts.data):
m = statistics.mean(x[1] for x in lts.data[max(0, i - 2) : min(len(lts.data), i + 3)]) if d[1] < current_usable_bytes * 0.1:
if m < current_usable_bytes * 0.1:
continue # for sanity continue # for sanity
if current_used_bytes ** 2 / m > current_usable_bytes: if current_used_bytes ** 2 / d[1] > current_usable_bytes:
log.info("d = %s, current_used_bytes = %s, current_usable_bytes = %s", m, current_used_bytes, current_usable_bytes) log.info("d = %s, current_used_bytes = %s, current_usable_bytes = %s", d, current_used_bytes, current_usable_bytes)
tuf = now - lts.data[i][0] tuf = now - d[0]
break break
else:
# Try always use the minimum of a range.
# We prefer the first datapoint
first_used_bytes = lts.data[0][2] if len(lts.data[0]) >= 4 else lts.data[0][1]
# But if that's not useable we search the whole timeseries for the
# minimum
if first_used_bytes >= current_used_bytes:
first_used_bytes = current_used_bytes
first_i = None
for i in range(len(lts.data)):
used_bytes = lts.data[i][2] if len(lts.data[i]) >= 4 else lts.data[i][1]
if used_bytes < first_used_bytes:
first_used_bytes = used_bytes
first_i = i
else:
first_i = 0
if first_i is not None:
historic_growth = current_used_bytes / first_used_bytes
future_growth = current_usable_bytes / current_used_bytes
tuf = math.log(future_growth) / math.log(historic_growth) * (now - lts.data[first_i][0])
tuf = max(tuf, now - lts.data[first_i][0])
tuf = min(tuf, 1E9)
desc = {**lts.description, desc = {**lts.description,
"measure": "time_until_disk_full", "measure": "time_until_disk_full",
"node": node, "node": node,

View File

@ -1,3 +0,0 @@
[tool.pytest.ini_options]
pythonpath = "."

View File

@ -8,9 +8,8 @@
body { body {
font-family: sans-serif; font-family: sans-serif;
} }
th, td { th {
text-align: left; text-align: left;
vertical-align: baseline;
} }
main { main {
display: flex; display: flex;

View File

@ -1,26 +0,0 @@
<!DOCTYPE html>
<html>
<head>
<meta name="viewport" content="width=device-width; initial-scale=1">
<meta charset="utf-8">
<style>
</style>
</head>
<body>
<ul>
{% for d in matching_dimensions %}
<li><a href="{{d['url']}}">{{d.name}}</a> ({{d.count}})</li>
{% endfor %}
</ul>
{{timeseries|length}}/{{total_timeseries}} timeseries:
<ul>
{% for ts in timeseries %}
<li>
<a href="/v?ts={{ts.id}}">{{ts.description}}</a>
</li>
{% endfor %}
</ul>
</body>
</html>

View File

@ -1,27 +0,0 @@
<!DOCTYPE html>
<html>
<head>
<meta name="viewport" content="width=device-width; initial-scale=1">
<meta charset="utf-8">
<style>
</style>
</head>
<body>
<form>
{% for dimension, members in request.args.lists() %}
{% for member in members %}
{% if dimension[0] != "." %}
<input name="{{dimension}}" value="{{member}}" type="hidden">
{% endif %}
{% endfor %}
{% endfor %}
<select name="{{dimension}}" multiple size={{members|length}}>
{% for member in members %}
<option>{{member}}</option>
{% endfor %}
</select>
<input type="submit">
</form>
</body>
</html>

View File

@ -1,11 +0,0 @@
{"description": {"fstype": "tmpfs", "hostname": "ehoiai.int.wsr.at", "measure": "time_until_disk_full", "mountpoint": "/run/user/1054", "node": "rorschach.hjp.at", "remote_addr": "", "unit": "s"},
"data": [
[1674806402.1014915, 1000000000.0],
[1674814201.3452954, 1000000000.0],
[1675164602.4004557, 1000000000.0],
[1675165201.6291275, 1000000000.0],
[1675165802.2402072, 1000000000.0],
[1675166401.542857, 1000000000.0],
[1675167002.2809808, 1000000000.0],
[1675167601.2632012, 1000000000.0],
[1675168201.8321788, 1000000000.0]]}

View File

View File

@ -1,56 +0,0 @@
import pytest
from dashboard import Widget
def test_healthscore_1_asc():
w = Widget(
{
"type": "gauge",
"stops": [1, 5],
"data": [ "605da6f41f58b122f41283823a99faa36286961a106ac901bb2b2d730fddc778" ] # required by API, not used for tests
}
)
# stops are ordered from best to worst
assert w.healthscore(0) == 100
assert w.healthscore(1) == 100
assert w.healthscore(2) == 75
assert w.healthscore(3) == 50
assert w.healthscore(4) == 25
assert w.healthscore(5) == 0
assert w.healthscore(6) == 0
def test_healthscore_2_asc():
w = Widget(
{
"type": "gauge",
"stops": [1, 10, 100],
"data": [ "605da6f41f58b122f41283823a99faa36286961a106ac901bb2b2d730fddc778" ] # required by API, not used for tests
}
)
# stops are ordered from best to worst
assert w.healthscore(0) == 100
assert w.healthscore(1) == 100
assert w.healthscore(5.5) == 75
assert w.healthscore(10) == 50
assert w.healthscore(55) == 25
assert w.healthscore(100) == 0
assert w.healthscore(1000) == 0
def test_healthscore_2_desc():
w = Widget(
{
"type": "gauge",
"stops": [100, 10, 1],
"data": [ "605da6f41f58b122f41283823a99faa36286961a106ac901bb2b2d730fddc778" ] # required by API, not used for tests
}
)
# stops are ordered from best to worst
assert w.healthscore(0) == 0
assert w.healthscore(1) == 0
assert w.healthscore(5.5) == 25
assert w.healthscore(10) == 50
assert w.healthscore(55) == 75
assert w.healthscore(100) == 100
assert w.healthscore(1000) == 100

View File

@ -1,17 +0,0 @@
import pytest
from dashboard import TimeSeries
def test_timeseries_1():
config = {
"type": "timeseries",
"multi": True,
"stops": [ 2592000, 604800, 86400 ],
"data": [
"605da6f41f58b122f41283823a99faa36286961a106ac901bb2b2d730fddc778"
],
"yscale": "log",
}
ts = TimeSeries(config)
graph = ts.graph
assert graph