2023-02-05 04:40:53 +00:00
|
|
|
groups:
|
|
|
|
- name: services
|
|
|
|
rules:
|
|
|
|
- alert: Digdag
|
|
|
|
expr: node_systemd_unit_state{name="digdag.service", state="active"} != 1
|
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
|
|
|
summary: "Digdag is not running: {{ $labels.instance }}."
|
|
|
|
description: "Digdag is not running: {{ $labels.instance }}."
|
|
|
|
|
2023-02-05 10:02:38 +00:00
|
|
|
- alert: node_exporter
|
|
|
|
expr: node_systemd_unit_state{name="node_exporter.service", state="active"} != 1
|
2023-02-05 05:25:05 +00:00
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
2023-02-05 10:02:38 +00:00
|
|
|
summary: "node_exporter is not running: {{ $labels.instance }}."
|
|
|
|
description: "node_exporter is not running: {{ $labels.instance }}."
|
2023-02-05 05:25:05 +00:00
|
|
|
|
2023-02-05 10:49:14 +00:00
|
|
|
- alert: vector-node_exporter
|
|
|
|
expr: node_systemd_unit_state{name="vector-node_exporter.service", state="active"} != 1
|
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
|
|
|
summary: "vector-node_exporter is not running: {{ $labels.instance }}."
|
|
|
|
description: "vector-node_exporter is not running: {{ $labels.instance }}."
|
2023-02-07 13:29:00 +00:00
|
|
|
|
|
|
|
- alert: snmp_exporter
|
|
|
|
expr: node_systemd_unit_state{name="snmp_exporter.service", state="active"} != 1
|
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
|
|
|
summary: "snmp_exporter is not running: {{ $labels.instance }}."
|
|
|
|
description: "snmp_exporter is not running: {{ $labels.instance }}."
|
|
|
|
|
|
|
|
- alert: vector-snmp_exporter
|
|
|
|
expr: node_systemd_unit_state{name="vector-snmp_exporter.service", state="active"} != 1
|
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
|
|
|
summary: "vector-snmp_exporter is not running: {{ $labels.instance }}."
|
|
|
|
description: "vector-snmp_exporter is not running: {{ $labels.instance }}."
|
2023-02-07 14:47:20 +00:00
|
|
|
|
|
|
|
- alert: filestat_exporter
|
|
|
|
expr: node_systemd_unit_state{name="filestat_exporter.service", state="active"} != 1
|
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
|
|
|
summary: "filestat_exporter is not running: {{ $labels.instance }}."
|
|
|
|
description: "filestat_exporter is not running: {{ $labels.instance }}."
|
|
|
|
|
|
|
|
- alert: vector-filestat_exporter
|
|
|
|
expr: node_systemd_unit_state{name="vector-filestat_exporter.service", state="active"} != 1
|
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
|
|
|
summary: "vector-filestat_exporter is not running: {{ $labels.instance }}."
|
|
|
|
description: "vector-filestat_exporter is not running: {{ $labels.instance }}."
|
2023-02-10 12:52:36 +00:00
|
|
|
|
|
|
|
- alert: exporter_proxy
|
|
|
|
expr: node_systemd_unit_state{name="exporter_proxy.service", state="active"} != 1
|
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
|
|
|
summary: "exporter_proxy is not running: {{ $labels.instance }}."
|
|
|
|
description: "exporter_proxy is not running: {{ $labels.instance }}."
|
2023-02-12 10:22:29 +00:00
|
|
|
|
|
|
|
- alert: prometheus
|
|
|
|
expr: node_systemd_unit_state{name="prometheus.service", state="active"} != 1
|
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
|
|
|
summary: "prometheus is not running: {{ $labels.instance }}."
|
|
|
|
description: "prometheus is not running: {{ $labels.instance }}."
|
|
|
|
|
|
|
|
- alert: vector-prometheus
|
|
|
|
expr: node_systemd_unit_state{name="vector-prometheus.service", state="active"} != 1
|
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
|
|
|
summary: "vector-prometheus is not running: {{ $labels.instance }}."
|
|
|
|
description: "vector-prometheus is not running: {{ $labels.instance }}."
|
2023-05-13 06:11:55 +00:00
|
|
|
|
|
|
|
- alert: vault
|
|
|
|
expr: node_systemd_unit_state{name="vault.service", state="active"} != 1
|
|
|
|
for: 5m
|
|
|
|
labels:
|
|
|
|
severity: error
|
|
|
|
annotations:
|
|
|
|
summary: "vault is not running: {{ $labels.instance }}."
|
|
|
|
description: "vault is not running: {{ $labels.instance }}."
|