2017-01-09 16:02:02 +01:00
|
|
|
{pkgs, config, ...}:
|
|
|
|
|
|
|
|
with import <stockholm/lib>;
|
|
|
|
let
|
2017-01-09 16:03:36 +01:00
|
|
|
collectd-port = 25826;
|
|
|
|
influx-port = 8086;
|
2017-01-09 16:02:02 +01:00
|
|
|
grafana-port = 3000; # TODO nginx forward
|
2017-03-01 15:46:23 +01:00
|
|
|
db = "collectd_db";
|
|
|
|
logging-interface = config.makefu.server.primary-itf;
|
2017-01-09 16:02:02 +01:00
|
|
|
in {
|
2017-01-09 16:03:36 +01:00
|
|
|
services.grafana.enable = true;
|
2017-01-09 16:02:02 +01:00
|
|
|
services.grafana.addr = "0.0.0.0";
|
|
|
|
|
|
|
|
services.influxdb.enable = true;
|
|
|
|
|
|
|
|
# forward these via nginx
|
|
|
|
services.influxdb.extraConfig = {
|
|
|
|
meta.hostname = config.krebs.build.host.name;
|
|
|
|
# meta.logging-enabled = true;
|
|
|
|
http.bind-address = ":${toString influx-port}";
|
|
|
|
admin.bind-address = ":8083";
|
|
|
|
monitoring = {
|
|
|
|
enabled = false;
|
|
|
|
# write-interval = "24h";
|
|
|
|
};
|
2017-01-09 16:03:36 +01:00
|
|
|
collectd = [{
|
2017-01-09 16:02:02 +01:00
|
|
|
enabled = true;
|
|
|
|
typesdb = "${pkgs.collectd}/share/collectd/types.db";
|
2017-03-01 15:46:23 +01:00
|
|
|
database = db;
|
2017-01-09 16:02:02 +01:00
|
|
|
port = collectd-port;
|
|
|
|
}];
|
|
|
|
};
|
2017-03-01 15:46:23 +01:00
|
|
|
krebs.kapacitor =
|
2017-02-03 20:45:27 +01:00
|
|
|
let
|
|
|
|
echoToIrc = pkgs.writeDash "echo_irc" ''
|
|
|
|
set -euf
|
|
|
|
data="$(${pkgs.jq}/bin/jq -r .message)"
|
|
|
|
export LOGNAME=malarm
|
|
|
|
${pkgs.irc-announce}/bin/irc-announce \
|
|
|
|
irc.freenode.org 6667 malarm \#krebs-bots "$data" >/dev/null
|
|
|
|
'';
|
|
|
|
in {
|
|
|
|
enable = true;
|
|
|
|
alarms = {
|
2017-03-01 15:46:23 +01:00
|
|
|
cpu_deadman.database = db;
|
|
|
|
cpu_deadman.text = ''
|
2017-02-03 20:45:27 +01:00
|
|
|
var data = batch
|
2017-02-05 22:34:16 +01:00
|
|
|
|query(${"'''"}
|
2017-02-03 20:45:27 +01:00
|
|
|
SELECT mean("value") AS mean
|
|
|
|
FROM "collectd_db"."default"."cpu_value"
|
|
|
|
WHERE "type_instance" = 'idle' AND "type" = 'percent' fill(0)
|
2017-02-05 22:34:16 +01:00
|
|
|
${"'''"})
|
2017-02-03 20:45:27 +01:00
|
|
|
.period(10m)
|
|
|
|
.every(1m)
|
|
|
|
.groupBy('host')
|
|
|
|
data |alert()
|
|
|
|
.crit(lambda: "mean" < 50)
|
|
|
|
.stateChangesOnly()
|
|
|
|
.exec('${echoToIrc}')
|
|
|
|
data |deadman(1.0,5m)
|
|
|
|
.stateChangesOnly()
|
|
|
|
.exec('${echoToIrc}')
|
|
|
|
'';
|
|
|
|
};
|
|
|
|
|
|
|
|
};
|
2017-01-09 16:02:02 +01:00
|
|
|
networking.firewall.extraCommands = ''
|
|
|
|
iptables -A INPUT -i retiolum -p udp --dport ${toString collectd-port} -j ACCEPT
|
|
|
|
iptables -A INPUT -i retiolum -p tcp --dport ${toString influx-port} -j ACCEPT
|
|
|
|
iptables -A INPUT -i retiolum -p tcp --dport ${toString grafana-port} -j ACCEPT
|
2017-03-01 15:46:23 +01:00
|
|
|
iptables -A INPUT -i ${logging-interface} -p udp --dport ${toString collectd-port} -j ACCEPT
|
|
|
|
iptables -A INPUT -i ${logging-interface} -p tcp --dport ${toString influx-port} -j ACCEPT
|
|
|
|
iptables -A INPUT -i ${logging-interface} -p tcp --dport ${toString grafana-port} -j ACCEPT
|
2017-04-19 10:05:39 +02:00
|
|
|
|
|
|
|
ip6tables -A INPUT -i retiolum -p udp --dport ${toString collectd-port} -j ACCEPT
|
|
|
|
ip6tables -A INPUT -i retiolum -p tcp --dport ${toString influx-port} -j ACCEPT
|
|
|
|
ip6tables -A INPUT -i retiolum -p tcp --dport ${toString grafana-port} -j ACCEPT
|
|
|
|
ip6tables -A INPUT -i ${logging-interface} -p udp --dport ${toString collectd-port} -j ACCEPT
|
|
|
|
ip6tables -A INPUT -i ${logging-interface} -p tcp --dport ${toString influx-port} -j ACCEPT
|
|
|
|
ip6tables -A INPUT -i ${logging-interface} -p tcp --dport ${toString grafana-port} -j ACCEPT
|
2017-01-09 16:02:02 +01:00
|
|
|
'';
|
|
|
|
}
|