monitoring: improve ntfy template

This commit is contained in:
xinyangli 2025-02-05 11:52:23 +08:00
parent a78e9164e9
commit 1462c96284
Signed by: xin
SSH key fingerprint: SHA256:UU5pRTl7NiLFJbWJZa+snLylZSXIz5rgHmwjzv8v4oE
2 changed files with 10 additions and 7 deletions

View file

@ -120,11 +120,11 @@ in
webhook_configs = [
{
url = "${ntfyUrl}/prometheus-alerts?tpl=yes&m=${lib.escapeURL ''
{{range .alerts}}[{{ if eq .status "resolved" }} RESOLVED{{ else }}{{ if eq .status "firing" }}🔥 FIRING{{end}}{{end}}]{{range $k,$v := .labels}}
{{$k}}={{$v}}{{end}}
{{range .alerts}}{{ if eq .status "resolved" }}{{ else }}{{ if eq .status "firing" }}🔥{{end}}{{end}}{{.labels.alertname}}
{{.annotations.summary}}
{{end}}''}";
send_resolved = true;
max_alerts = 5;
}
];
}

View file

@ -1,6 +1,9 @@
let
mkFunction = f: (targets: (map f targets));
mkPort = port: if isNull port then "" else ":${toString port}";
# get text before "." in the url
subdomain = url: builtins.elemAt (builtins.elemAt (builtins.split "([a-zA-Z0-9]+)\..*" url) 1) 0;
in
{
mkScrapes = mkFunction (
@ -228,7 +231,7 @@ in
...
}:
{
job_name = "blackbox(${hostAddress})";
job_name = "blackbox(${subdomain hostAddress})";
scrape_interval = "1m";
metrics_path = "/probe";
params = {
@ -268,14 +271,14 @@ in
inherit name;
rules = [
{
alert = "ProbeError";
expr = "probe_success != 1";
alert = "ProbeToError";
expr = "sum by(instance) (probe_success != 1) > 0";
for = "3m";
labels = {
severity = "critical";
};
annotations = {
summary = "Probing {{ $labels.instance }} from {{ $labels.from }} failed";
summary = "Probing {{ $labels.instance }} failed";
};
}
{