Skip to content

Commit cde5661

Browse files
committed
add alert for nomad-follower ACL issues
1 parent e961ade commit cde5661

File tree

2 files changed

+23
-0
lines changed

2 files changed

+23
-0
lines changed

nix/cloud/alerts.nix

Lines changed: 22 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,28 @@
1818
];
1919
};
2020

21+
# Alert rule group evaluated against the "loki" datasource. It watches log
# streams labelled syslog_identifier="nomad-follower" for lines containing
# `ACL token not found` and reports the affected host.
ci-world-nomad-follower = {
22+
datasource = "loki";
23+
rules = [
24+
{
25+
alert = "NomadFollowerACLTokenNotFound";
26+
# LogQL: per-host sum of the 5m rate of matching log lines; the condition
# is true whenever that rate is non-zero.
expr = ''sum(rate({syslog_identifier="nomad-follower"}[5m] |= `ACL token not found`)) by (host) > 0'';
27+
# NOTE(review): presumably the usual Prometheus-style `for` semantics (the
# condition must hold this long before firing) — confirm against the ruler.
for = "1m";
28+
labels.severity = "critical";
29+
# Both annotations interpolate the `host` label produced by the
# `by (host)` grouping in `expr`.
annotations = {
30+
description = ''
31+
Detected nomad-follower ACL issue on {{ $labels.host }}
32+
This may be due to a vault-agent issue and can usually be resolved
33+
by restarting both services.
34+
Without proper ACL, nomad-follower cannot send logs from Nomad jobs
35+
to Loki, and Cicero will not be able to display logs for actions.
36+
'';
37+
summary = "nomad-follower ACL issue on {{ $labels.host }}";
38+
};
39+
}
40+
];
41+
};
42+
2143
# inherit (inputs.bitte-cells.bitte.alerts)
2244
# ;
2345
}

nix/cloud/hydrationProfile.nix

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -205,6 +205,7 @@ in {
205205
inherit
206206
(cell.alerts)
207207
ci-world-spongix
208+
ci-world-nomad-follower
208209
# Upstream alerts which may have downstream deps can be imported here
209210

210211
;

0 commit comments

Comments
 (0)