l 2 monitoring server: add ram & deadman alarm

This commit is contained in:
lassulus 2017-02-05 00:25:39 +01:00
parent 2c484daf3c
commit 0ea991ffe9

View File

@ -1,9 +1,7 @@
{pkgs, config, ...}: {pkgs, config, ...}:
with import <stockholm/lib>; with import <stockholm/lib>;
{ {
services.influxdb = { services.influxdb.enable = true;
enable = true;
};
services.influxdb.extraConfig = { services.influxdb.extraConfig = {
meta.hostname = config.krebs.build.host.name; meta.hostname = config.krebs.build.host.name;
@ -29,24 +27,39 @@ with import <stockholm/lib>;
data="$(${pkgs.jq}/bin/jq -r .message)" data="$(${pkgs.jq}/bin/jq -r .message)"
export LOGNAME=prism-alarm export LOGNAME=prism-alarm
${pkgs.irc-announce}/bin/irc-announce \ ${pkgs.irc-announce}/bin/irc-announce \
irc.freenode.org 6667 prism-alarm \#krebs-bots "$data" >/dev/null ni.r 6667 prism-alarm \#retiolum "$data" >/dev/null
''; '';
in { in {
enable = true; enable = true;
check_db = "telegraf_db";
alarms = { alarms = {
test2 = '' cpu = ''
batch var data = batch
|query(${"'''"} |query(${"'''"}
SELECT mean("usage_user") AS mean SELECT mean("usage_user") AS mean
FROM "${config.lass.kapacitor.check_db}"."default"."cpu" FROM "${config.lass.kapacitor.check_db}"."default"."cpu"
${"'''"}) ${"'''"})
.every(3m) .period(10m)
.period(1m) .every(1m)
.groupBy('host') .groupBy('host')
|alert() data |alert()
.crit(lambda: "mean" > 90) .crit(lambda: "mean" > 90)
// Whenever we get an alert write it to a file. .exec('${echoToIrc}')
.log('/tmp/alerts.log') data |deadman(1.0,5m)
.stateChangesOnly()
.exec('${echoToIrc}')
'';
ram = ''
var data = batch
|query(${"'''"}
SELECT mean("used_percent") AS mean
FROM "${config.lass.kapacitor.check_db}"."default"."mem"
${"'''"})
.period(10m)
.every(1m)
.groupBy('host')
data |alert()
.crit(lambda: "mean" > 90)
.exec('${echoToIrc}') .exec('${echoToIrc}')
''; '';
}; };