Skip to content

Commit 0097868

Browse files
committed
Change alert grouping to send alerts with "severity: critical" to Slack immediately
1 parent db2280e commit 0097868

File tree

1 file changed

+4
-9
lines changed

1 file changed

+4
-9
lines changed

charts/prometheus-stack/values.yaml

Lines changed: 4 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -92,14 +92,6 @@ prometheusStack:
9292
summary: '{{ $labels.instance }} not reachable'
9393
expr: >
9494
sum by (instance) (sum_over_time(probe_success{}[90s])) < 1
95-
labels:
96-
severity: high
97-
- alert: ServiceIsDown
98-
annotations:
99-
description: 'Uptime of {{ $labels.instance }} is reporting down for 5 consecutive checks.'
100-
summary: '{{ $labels.instance }} not reachable'
101-
expr: >
102-
sum by (instance) (sum_over_time(probe_success{}[150s])) < 1
10395
labels:
10496
severity: critical
10597

@@ -148,7 +140,10 @@ prometheusStack:
148140
match:
149141
alertname: Watchdog
150142
- receiver: 'slack'
151-
continue: true
143+
group_by: [ '...' ]
144+
matchers:
145+
- severity: critical
146+
- receiver: 'slack'
152147
receivers:
153148
- name: 'null'
154149
- name: 'slack'

0 commit comments

Comments
 (0)