Raise RabbitMQ alert severities (down: critical, log errors: major)
Change-Id: Ifb803105f5a2e53cf42c6d7c3ba67001008e7577
Closes-Bug: PROD-29227
diff --git a/rabbitmq/meta/prometheus.yml b/rabbitmq/meta/prometheus.yml
index 7b6773f..f005409 100644
--- a/rabbitmq/meta/prometheus.yml
+++ b/rabbitmq/meta/prometheus.yml
@@ -12,7 +12,7 @@
rabbitmq_up == 0
for: 1m
labels:
- severity: minor
+ severity: critical
service: rabbitmq
annotations:
summary: "RabbitMQ service is down"
@@ -86,7 +86,7 @@
if: >-
sum(rate(log_messages{service="rabbitmq",level=~"(?i:(error|emergency|fatal))"}[5m])) without (level) > 0.2
labels:
- severity: warning
+ severity: major
service: rabbitmq
annotations:
summary: "Too many errors in RabbitMQ logs"