Add alert rules for `systemd` services.
This commit is contained in:
parent
9aca3252b6
commit
e509c531ae
|
@@ -20,7 +20,7 @@ encrypted_remote_file '/etc/prometheus.d/alertmanager.yml' do
|
||||||
end
|
end
|
||||||
|
|
||||||
# Deploy alert setting file:
|
# Deploy alert setting file:
|
||||||
%w(node_exporter prometheus filestat).each do |conf|
|
%w(node_exporter prometheus filestat services snmp).each do |conf|
|
||||||
remote_file "/etc/prometheus.d/alerts/#{conf}.yml" do
|
remote_file "/etc/prometheus.d/alerts/#{conf}.yml" do
|
||||||
owner 'root'
|
owner 'root'
|
||||||
group 'root'
|
group 'root'
|
||||||
|
|
|
@@ -0,0 +1,12 @@
|
||||||
|
groups:
|
||||||
|
- name: services
|
||||||
|
rules:
|
||||||
|
- alert: Digdag
|
||||||
|
expr: node_systemd_unit_state{name="digdag.service", state="active"} != 1
|
||||||
|
for: 5m
|
||||||
|
labels:
|
||||||
|
severity: error
|
||||||
|
annotations:
|
||||||
|
summary: "Digdag is not running: {{ $labels.instance }}."
|
||||||
|
description: "Digdag is not running: {{ $labels.instance }}."
|
||||||
|
|
Loading…
Reference in New Issue