itamae/cookbooks/prometheus/files/etc/prometheus.d/alerts/services.yml

93 lines
3.3 KiB
YAML

groups:
- name: services
rules:
- alert: Digdag
expr: node_systemd_unit_state{name="digdag.service", state="active"} != 1
for: 5m
labels:
severity: error
annotations:
summary: "Digdag is not running: {{ $labels.instance }}."
description: "Digdag is not running: {{ $labels.instance }}."
- alert: node_exporter
expr: node_systemd_unit_state{name="node_exporter.service", state="active"} != 1
for: 5m
labels:
severity: error
annotations:
summary: "node_exporter is not running: {{ $labels.instance }}."
description: "node_exporter is not running: {{ $labels.instance }}."
- alert: vector-node_exporter
expr: node_systemd_unit_state{name="vector-node_exporter.service", state="active"} != 1
for: 5m
labels:
severity: error
annotations:
summary: "vector-node_exporter is not running: {{ $labels.instance }}."
description: "vector-node_exporter is not running: {{ $labels.instance }}."
- alert: snmp_exporter
expr: node_systemd_unit_state{name="snmp_exporter.service", state="active"} != 1
for: 5m
labels:
severity: error
annotations:
summary: "snmp_exporter is not running: {{ $labels.instance }}."
description: "snmp_exporter is not running: {{ $labels.instance }}."
- alert: vector-snmp_exporter
expr: node_systemd_unit_state{name="vector-snmp_exporter.service", state="active"} != 1
for: 5m
labels:
severity: error
annotations:
summary: "vector-snmp_exporter is not running: {{ $labels.instance }}."
description: "vector-snmp_exporter is not running: {{ $labels.instance }}."
- alert: filestat_exporter
expr: node_systemd_unit_state{name="filestat_exporter.service", state="active"} != 1
for: 5m
labels:
severity: error
annotations:
summary: "filestat_exporter is not running: {{ $labels.instance }}."
description: "filestat_exporter is not running: {{ $labels.instance }}."
- alert: vector-filestat_exporter
expr: node_systemd_unit_state{name="vector-filestat_exporter.service", state="active"} != 1
for: 5m
labels:
severity: error
annotations:
summary: "vector-filestat_exporter is not running: {{ $labels.instance }}."
description: "vector-filestat_exporter is not running: {{ $labels.instance }}."
- alert: exporter_proxy
expr: node_systemd_unit_state{name="exporter_proxy.service", state="active"} != 1
for: 5m
labels:
severity: error
annotations:
summary: "exporter_proxy is not running: {{ $labels.instance }}."
description: "exporter_proxy is not running: {{ $labels.instance }}."
- alert: prometheus
expr: node_systemd_unit_state{name="prometheus.service", state="active"} != 1
for: 5m
labels:
severity: error
annotations:
summary: "prometheus is not running: {{ $labels.instance }}."
description: "prometheus is not running: {{ $labels.instance }}."
- alert: vector-prometheus
expr: node_systemd_unit_state{name="vector-prometheus.service", state="active"} != 1
for: 5m
labels:
severity: error
annotations:
summary: "vector-prometheus is not running: {{ $labels.instance }}."
description: "vector-prometheus is not running: {{ $labels.instance }}."