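Rationalize current Keepalived alerts

Raise the Keepalived process-down alert from warning to major, rename
KeepalivedStateFailed to KeepalivedFailedState and lower it from warning
to minor, and reword the summaries and descriptions of both alerts.
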
Change-Id: Ibb0acfa4ef43307fa9c021c492d4b89d8514a365
Closes-Bug: PROD-19537
diff --git a/keepalived/meta/prometheus.yml b/keepalived/meta/prometheus.yml
index 3c3b969..8003c65 100644
--- a/keepalived/meta/prometheus.yml
+++ b/keepalived/meta/prometheus.yml
@@ -7,21 +7,21 @@
procstat_running{process_name="keepalived"} == 0
{% raw %}
labels:
- severity: warning
+ severity: major
service: keepalived
annotations:
- summary: 'Keepalived service is down'
- description: 'Keepalived service is down on node {{ $labels.host }}'
+ summary: 'Keepalived process is down'
+ description: 'Keepalived process is down on node {{ $labels.host }}'
{% endraw %}
- KeepalivedStateFailed:
+ KeepalivedFailedState:
if: >-
keepalived_state == 0
{% raw %}
labels:
- severity: warning
+ severity: minor
service: keepalived
annotations:
- summary: 'Keepalived is in the Failed state'
- description: 'Keepalived service is in Failed state on node {{ $labels.host }}'
+ summary: 'Keepalived entered the FAILED state'
+ description: 'Keepalived is in the FAILED state on node {{ $labels.host }}'
{% endraw %}
{%- endif %}