Use only needed metrics for Grafana Ceph monitoring
Each OSD process generates hundreds of metrics, so on clusters with more
than 2000 OSDs we need to enable only the metrics that are shown in
Grafana.
This is a re-work of CR https://gerrit.mcp.mirantis.net/15205
Change-Id: I38d905451e3f33dc805903203b4eda4ccab568c5
diff --git a/ceph/meta/telegraf.yml b/ceph/meta/telegraf.yml
index 606960d..0fbb00a 100644
--- a/ceph/meta/telegraf.yml
+++ b/ceph/meta/telegraf.yml
@@ -5,7 +5,6 @@
input:
ceph:
template: ceph/files/telegraf.conf
- fielddrop: [ "get", "get_or_fail_fail", "get_or_fail_success", "get_sum", "max", "put", "put_sum", "take", "take_sum", "val", "wait_avgcount", "wait_sum"]
{%- if monitoring.cluster_stats is defined %}
ceph_user: client.{{ monitoring.cluster_stats.ceph_user|default('admin') }}
gather_admin_socket_stats: {{ monitoring.cluster_stats.gather_admin_socket_stats|default('false') }}
@@ -36,7 +35,6 @@
input:
ceph:
template: ceph/files/telegraf.conf
- fielddrop: [ "get", "get_or_fail_fail", "get_or_fail_success", "get_sum", "max", "put", "put_sum", "take", "take_sum", "val", "wait_avgcount", "wait_sum"]
{%- if monitoring.cluster_stats is defined %}
ceph_user: client.{{ monitoring.cluster_stats.ceph_user|default('admin') }}
gather_admin_socket_stats: {{ monitoring.cluster_stats.gather_admin_socket_stats|default('true') }}
@@ -79,7 +77,7 @@
input:
ceph:
template: ceph/files/telegraf.conf
- fielddrop: [ "get", "get_or_fail_fail", "get_or_fail_success", "get_sum", "max", "put", "put_sum", "take", "take_sum", "val", "wait_avgcount", "wait_sum"]
+ fieldpass: [ "apply_latency*", "commitcycle_latency*", "op_latency*", "osdop_append", "osdop_delete", "osdop_read", "osdop_write", "recovery_ops" ]
{%- if monitoring.node_stats is defined %}
gather_admin_socket_stats: {{ monitoring.node_stats.gather_admin_socket_stats|default('true') }}
gather_cluster_stats: {{ monitoring.node_stats.gather_cluster_stats|default('false') }}