Oleksii Zhurba | 020fab4 | 2017-11-01 20:13:28 +0000 | [diff] [blame] | 1 | import json |
| 2 | import requests |
Oleksii Zhurba | 84ce7fe | 2018-01-16 21:34:01 +0000 | [diff] [blame] | 3 | import datetime |
Oleksii Zhurba | 468e6c7 | 2018-01-16 17:43:15 +0000 | [diff] [blame] | 4 | from cvp_checks import utils |
Oleksii Zhurba | 020fab4 | 2017-11-01 20:13:28 +0000 | [diff] [blame] | 5 | |
| 6 | |
| 7 | def test_elasticsearch_cluster(local_salt_client): |
Oleksii Zhurba | e37cdab | 2017-11-02 20:00:03 +0000 | [diff] [blame] | 8 | salt_output = local_salt_client.cmd( |
Oleksii Zhurba | bc51288 | 2018-01-29 16:47:20 -0600 | [diff] [blame] | 9 | 'kibana:server', |
Oleksii Zhurba | e37cdab | 2017-11-02 20:00:03 +0000 | [diff] [blame] | 10 | 'pillar.get', |
| 11 | ['_param:haproxy_elasticsearch_bind_host'], |
| 12 | expr_form='pillar') |
Oleksii Zhurba | e592ed1 | 2018-06-21 18:01:09 -0500 | [diff] [blame^] | 13 | proxies = {"http": None, "https": None} |
Oleksii Zhurba | 88bc047 | 2017-11-09 21:04:09 +0000 | [diff] [blame] | 14 | for node in salt_output.keys(): |
| 15 | IP = salt_output[node] |
Oleksii Zhurba | e592ed1 | 2018-06-21 18:01:09 -0500 | [diff] [blame^] | 16 | assert requests.get('http://{}:9200/'.format(IP), |
| 17 | proxies=proxies).status_code == 200, \ |
Oleksii Zhurba | 88bc047 | 2017-11-09 21:04:09 +0000 | [diff] [blame] | 18 | 'Cannot check elasticsearch url on {}.'.format(IP) |
Oleksii Zhurba | e592ed1 | 2018-06-21 18:01:09 -0500 | [diff] [blame^] | 19 | resp = requests.get('http://{}:9200/_cat/health'.format(IP), |
| 20 | proxies=proxies).content |
Oleksii Zhurba | 88bc047 | 2017-11-09 21:04:09 +0000 | [diff] [blame] | 21 | assert resp.split()[3] == 'green', \ |
| 22 | 'elasticsearch status is not good {}'.format( |
Oleksii Zhurba | 0c039ee | 2018-01-16 19:44:53 +0000 | [diff] [blame] | 23 | json.dumps(resp, indent=4)) |
Oleksii Zhurba | 88bc047 | 2017-11-09 21:04:09 +0000 | [diff] [blame] | 24 | assert resp.split()[4] == '3', \ |
| 25 | 'elasticsearch status is not good {}'.format( |
Oleksii Zhurba | 0c039ee | 2018-01-16 19:44:53 +0000 | [diff] [blame] | 26 | json.dumps(resp, indent=4)) |
Oleksii Zhurba | 88bc047 | 2017-11-09 21:04:09 +0000 | [diff] [blame] | 27 | assert resp.split()[5] == '3', \ |
| 28 | 'elasticsearch status is not good {}'.format( |
Oleksii Zhurba | 0c039ee | 2018-01-16 19:44:53 +0000 | [diff] [blame] | 29 | json.dumps(resp, indent=4)) |
Oleksii Zhurba | 88bc047 | 2017-11-09 21:04:09 +0000 | [diff] [blame] | 30 | assert resp.split()[10] == '0', \ |
| 31 | 'elasticsearch status is not good {}'.format( |
Oleksii Zhurba | 0c039ee | 2018-01-16 19:44:53 +0000 | [diff] [blame] | 32 | json.dumps(resp, indent=4)) |
Oleksii Zhurba | b31323f | 2017-11-20 15:35:19 -0600 | [diff] [blame] | 33 | assert resp.split()[13] == '100.0%', \ |
Oleksii Zhurba | 88bc047 | 2017-11-09 21:04:09 +0000 | [diff] [blame] | 34 | 'elasticsearch status is not good {}'.format( |
Oleksii Zhurba | 0c039ee | 2018-01-16 19:44:53 +0000 | [diff] [blame] | 35 | json.dumps(resp, indent=4)) |
Oleksii Zhurba | 020fab4 | 2017-11-01 20:13:28 +0000 | [diff] [blame] | 36 | |
| 37 | |
Oleksii Zhurba | 84ce7fe | 2018-01-16 21:34:01 +0000 | [diff] [blame] | 38 | def test_elasticsearch_node_count(local_salt_client): |
| 39 | now = datetime.datetime.now() |
| 40 | today = now.strftime("%Y.%m.%d") |
| 41 | active_nodes = utils.get_active_nodes() |
| 42 | salt_output = local_salt_client.cmd( |
Oleksii Zhurba | bc51288 | 2018-01-29 16:47:20 -0600 | [diff] [blame] | 43 | 'kibana:server', |
Oleksii Zhurba | 84ce7fe | 2018-01-16 21:34:01 +0000 | [diff] [blame] | 44 | 'pillar.get', |
| 45 | ['_param:haproxy_elasticsearch_bind_host'], |
| 46 | expr_form='pillar') |
| 47 | IP = salt_output.values()[0] |
Oleksii Zhurba | e592ed1 | 2018-06-21 18:01:09 -0500 | [diff] [blame^] | 48 | proxies = {"http": None, "https": None} |
Oleksii Zhurba | d2847dc | 2018-02-16 15:13:09 -0600 | [diff] [blame] | 49 | resp = json.loads(requests.post('http://{0}:9200/log-{1}/_search?pretty'. |
| 50 | format(IP, today), |
Oleksii Zhurba | e592ed1 | 2018-06-21 18:01:09 -0500 | [diff] [blame^] | 51 | proxies=proxies, |
Oleksii Zhurba | 7f46341 | 2018-03-21 16:32:44 -0500 | [diff] [blame] | 52 | data='{"size": 0, "aggs": ' |
| 53 | '{"uniq_hostname": ' |
Oleksii Zhurba | d2847dc | 2018-02-16 15:13:09 -0600 | [diff] [blame] | 54 | '{"terms": {"size": 500, ' |
Oleksii Zhurba | 7f46341 | 2018-03-21 16:32:44 -0500 | [diff] [blame] | 55 | '"field": "Hostname.keyword"}}}}').text) |
Oleksii Zhurba | d2847dc | 2018-02-16 15:13:09 -0600 | [diff] [blame] | 56 | cluster_domain = local_salt_client.cmd('salt:control', |
| 57 | 'pillar.get', |
| 58 | ['_param:cluster_domain'], |
| 59 | expr_form='pillar').values()[0] |
| 60 | monitored_nodes = [] |
Oleksii Zhurba | 7f46341 | 2018-03-21 16:32:44 -0500 | [diff] [blame] | 61 | for item_ in resp['aggregations']['uniq_hostname']['buckets']: |
Oleksii Zhurba | d2847dc | 2018-02-16 15:13:09 -0600 | [diff] [blame] | 62 | node_name = item_['key'] |
| 63 | monitored_nodes.append(node_name + '.' + cluster_domain) |
| 64 | missing_nodes = [] |
| 65 | for node in active_nodes.keys(): |
| 66 | if node not in monitored_nodes: |
| 67 | missing_nodes.append(node) |
| 68 | assert len(missing_nodes) == 0, \ |
Oleksii Zhurba | 84ce7fe | 2018-01-16 21:34:01 +0000 | [diff] [blame] | 69 | 'Not all nodes are in Elasticsearch. Found {0} keys, ' \ |
Oleksii Zhurba | d2847dc | 2018-02-16 15:13:09 -0600 | [diff] [blame] | 70 | 'expected {1}. Missing nodes: \n{2}'. \ |
| 71 | format(len(monitored_nodes), len(active_nodes), missing_nodes) |
Oleksii Zhurba | 84ce7fe | 2018-01-16 21:34:01 +0000 | [diff] [blame] | 72 | |
| 73 | |
Oleksii Zhurba | 020fab4 | 2017-11-01 20:13:28 +0000 | [diff] [blame] | 74 | def test_stacklight_services_replicas(local_salt_client): |
| 75 | salt_output = local_salt_client.cmd( |
| 76 | 'docker:client:stack:monitoring', |
| 77 | 'cmd.run', |
| 78 | ['docker service ls'], |
| 79 | expr_form='pillar') |
| 80 | wrong_items = [] |
| 81 | for line in salt_output[salt_output.keys()[0]].split('\n'): |
| 82 | if line[line.find('/') - 1] != line[line.find('/') + 1] \ |
| 83 | and 'replicated' in line: |
| 84 | wrong_items.append(line) |
| 85 | assert len(wrong_items) == 0, \ |
| 86 | '''Some monitoring services doesn't have expected number of replicas: |
| 87 | {}'''.format(json.dumps(wrong_items, indent=4)) |
| 88 | |
| 89 | |
Oleksii Zhurba | 468e6c7 | 2018-01-16 17:43:15 +0000 | [diff] [blame] | 90 | def test_prometheus_alert_count(local_salt_client): |
| 91 | IP = utils.get_monitoring_ip('cluster_public_host') |
| 92 | # keystone:server can return 3 nodes instead of 1 |
| 93 | # this will be fixed later |
| 94 | # TODO |
Oleksii Zhurba | 0c039ee | 2018-01-16 19:44:53 +0000 | [diff] [blame] | 95 | nodes_info = local_salt_client.cmd( |
Oleksii Zhurba | 468e6c7 | 2018-01-16 17:43:15 +0000 | [diff] [blame] | 96 | 'keystone:server', |
| 97 | 'cmd.run', |
Oleksii Zhurba | 0c039ee | 2018-01-16 19:44:53 +0000 | [diff] [blame] | 98 | ['curl -s http://{}:15010/alerts | grep icon-chevron-down | ' |
| 99 | 'grep -v "0 active"'.format(IP)], |
Oleksii Zhurba | 468e6c7 | 2018-01-16 17:43:15 +0000 | [diff] [blame] | 100 | expr_form='pillar') |
Oleksii Zhurba | 0c039ee | 2018-01-16 19:44:53 +0000 | [diff] [blame] | 101 | result = nodes_info[nodes_info.keys()[0]].replace('</td>', '').replace( |
| 102 | '<td><i class="icon-chevron-down"></i> <b>', '').replace('</b>', '') |
| 103 | assert result == '', 'AlertManager page has some alerts! {}'.format( |
| 104 | json.dumps(result), indent=4) |
Oleksii Zhurba | 468e6c7 | 2018-01-16 17:43:15 +0000 | [diff] [blame] | 105 | |
| 106 | |
Oleksii Zhurba | 020fab4 | 2017-11-01 20:13:28 +0000 | [diff] [blame] | 107 | def test_stacklight_containers_status(local_salt_client): |
| 108 | salt_output = local_salt_client.cmd( |
| 109 | 'docker:swarm:role:master', |
| 110 | 'cmd.run', |
| 111 | ['docker service ps $(docker stack services -q monitoring)'], |
| 112 | expr_form='pillar') |
| 113 | result = {} |
Oleksii Zhurba | 468e6c7 | 2018-01-16 17:43:15 +0000 | [diff] [blame] | 114 | # for old reclass models, docker:swarm:role:master can return |
| 115 | # 2 nodes instead of one. Here is temporary fix. |
| 116 | # TODO |
| 117 | if len(salt_output.keys()) > 1: |
| 118 | if 'CURRENT STATE' not in salt_output[salt_output.keys()[0]]: |
| 119 | del salt_output[salt_output.keys()[0]] |
Oleksii Zhurba | f2af637 | 2017-11-01 22:53:03 +0000 | [diff] [blame] | 120 | for line in salt_output[salt_output.keys()[0]].split('\n')[1:]: |
Oleksii Zhurba | 020fab4 | 2017-11-01 20:13:28 +0000 | [diff] [blame] | 121 | shift = 0 |
Oleksii Zhurba | 020fab4 | 2017-11-01 20:13:28 +0000 | [diff] [blame] | 122 | if line.split()[1] == '\\_': |
| 123 | shift = 1 |
| 124 | if line.split()[1 + shift] not in result.keys(): |
| 125 | result[line.split()[1]] = 'NOT OK' |
| 126 | if line.split()[4 + shift] == 'Running' \ |
| 127 | or line.split()[4 + shift] == 'Ready': |
| 128 | result[line.split()[1 + shift]] = 'OK' |
| 129 | assert 'NOT OK' not in result.values(), \ |
| 130 | '''Some containers are in incorrect state: |
| 131 | {}'''.format(json.dumps(result, indent=4)) |
Oleksii Zhurba | e592ed1 | 2018-06-21 18:01:09 -0500 | [diff] [blame^] | 132 | |
| 133 | |
| 134 | def test_running_telegraf_services(local_salt_client): |
| 135 | salt_output = local_salt_client.cmd('telegraf:agent', |
| 136 | 'service.status', |
| 137 | 'telegraf', |
| 138 | expr_form='pillar') |
| 139 | result = [{node: status} for node, status |
| 140 | in salt_output.items() |
| 141 | if status is False] |
| 142 | assert result == [], 'Telegraf service is not running ' \ |
| 143 | 'on following nodes:'.format(result) |