Commit b5d18084 authored by ale

Add a HostUnreachable alert (for icmp failures)

parent 4902451a
Pipeline #2335 failed with stage
in 22 minutes and 5 seconds
......@@ -29,3 +29,11 @@ groups:
}}.
SUMMARY: High rate of packet drops on {{ $labels.instance }} device {{ $labels.device
}}
# Page when the ICMP probe of a host has kept failing for five minutes.
- alert: HostUnreachable
  # Any probe_success sample below 1 from the blackbox_ping job counts as
  # a failed probe.
  expr: 'probe_success{job="blackbox_ping"} < 1'
  # The condition must hold continuously for this long before firing.
  for: 5m
  labels:
    severity: page
  annotations:
    DESCRIPTION: 'Host {{ $labels.instance }} is unreachable (icmp).'
    SUMMARY: 'Host {{ $labels.instance }} is unreachable'
......@@ -13,16 +13,24 @@ route:
receiver: default
# Each rule mutes the alerts matched by target_match while an alert matched
# by source_match is firing with identical values for the labels in 'equal'.
inhibit_rules:
  # A severity=page alert inhibits the severity=warning alert that shares
  # its alertname and service.
  - source_match:
      severity: page
    target_match:
      severity: warning
    equal:
      - alertname
      - service
  # A scope=global alert inhibits the scope=host alert that shares its
  # alertname and service.
  - source_match:
      scope: global
    target_match:
      scope: host
    equal:
      - alertname
      - service
  # While HostUnreachable is firing, inhibit severity=page alerts that
  # carry the same 'host' label value.
  # NOTE(review): this rule was described as covering "all host-level
  # alerts", but the target matcher selects severity=page, not scope=host;
  # confirm which is intended.
  # NOTE(review): Alertmanager treats a label absent from both alerts as
  # equal, so confirm HostUnreachable actually carries a 'host' label;
  # otherwise this would also mute page alerts that have no 'host' label.
  - source_match:
      alertname: HostUnreachable
    target_match:
      severity: page
    equal:
      - host
receivers:
- name: default
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment