koder aka kdanilov | cff7b2e | 2015-04-18 20:48:15 +0300 | [diff] [blame^] | 1 | from __future__ import print_function |
| 2 | |
gstepanov | 023c1e4 | 2015-04-08 15:50:19 +0300 | [diff] [blame] | 3 | import os |
koder aka kdanilov | 7acd6bd | 2015-02-12 14:28:30 -0800 | [diff] [blame] | 4 | import sys |
koder aka kdanilov | 12ae063 | 2015-04-15 01:13:43 +0300 | [diff] [blame] | 5 | import time |
koder aka kdanilov | 2c47309 | 2015-03-29 17:12:13 +0300 | [diff] [blame] | 6 | import Queue |
koder aka kdanilov | 7acd6bd | 2015-02-12 14:28:30 -0800 | [diff] [blame] | 7 | import pprint |
koder aka kdanilov | e21d747 | 2015-02-14 19:02:04 -0800 | [diff] [blame] | 8 | import logging |
koder aka kdanilov | 7acd6bd | 2015-02-12 14:28:30 -0800 | [diff] [blame] | 9 | import argparse |
koder aka kdanilov | 2c47309 | 2015-03-29 17:12:13 +0300 | [diff] [blame] | 10 | import threading |
| 11 | import collections |
koder aka kdanilov | 7acd6bd | 2015-02-12 14:28:30 -0800 | [diff] [blame] | 12 | |
koder aka kdanilov | 66839a9 | 2015-04-11 13:22:31 +0300 | [diff] [blame] | 13 | import yaml |
koder aka kdanilov | 2c47309 | 2015-03-29 17:12:13 +0300 | [diff] [blame] | 14 | from concurrent.futures import ThreadPoolExecutor |
koder aka kdanilov | 6c49106 | 2015-04-09 22:33:13 +0300 | [diff] [blame] | 15 | |
koder aka kdanilov | cff7b2e | 2015-04-18 20:48:15 +0300 | [diff] [blame^] | 16 | from wally import pretty_yaml |
| 17 | from wally.discover import discover, Node, undiscover |
| 18 | from wally import utils, report, ssh_utils, start_vms |
| 19 | from wally.suits.itest import IOPerfTest, PgBenchTest |
| 20 | from wally.config import cfg_dict, load_config, setup_loggers |
| 21 | from wally.sensors.api import (start_monitoring, |
| 22 | deploy_and_start_sensors, |
| 23 | SensorConfig) |
koder aka kdanilov | 2c47309 | 2015-03-29 17:12:13 +0300 | [diff] [blame] | 24 | |
| 25 | |
# Module-wide logger; every stage in this file logs through it.
logger = logging.getLogger("wally")
koder aka kdanilov | cee4334 | 2015-04-14 22:52:53 +0300 | [diff] [blame] | 27 | |
koder aka kdanilov | 7acd6bd | 2015-02-12 14:28:30 -0800 | [diff] [blame] | 28 | |
def format_result(res, formatter):
    """Render a test result as a text block.

    The block contains the pretty-printed raw ``res`` framed by two
    80-character ``=`` rulers, followed by ``formatter(res)`` and a
    closing ruler.
    """
    ruler = "=" * 80
    raw_dump = "\n" + ruler + "\n" + pprint.pformat(res) + "\n" + ruler + "\n"
    layout = "{0}\n\n====> {1}\n\n{2}\n\n"
    return layout.format(raw_dump, formatter(res), ruler)
koder aka kdanilov | e21d747 | 2015-02-14 19:02:04 -0800 | [diff] [blame] | 35 | |
| 36 | |
class Context(object):
    """Mutable state shared by the stages of a single run."""

    def __init__(self):
        # nodes taking part in the run and ids of VMs started for it
        self.nodes = []
        self.openstack_nodes_ids = []
        self.keep_vm = False

        # build description, filled from the command line in main()
        self.build_meta = {}

        # cleanup stages; main() calls them in reverse order at the end
        self.clear_calls_stack = []

        # sensors machinery, stays None until sensors are deployed
        self.sensor_cm = None
        self.sensors_control_queue = None
        self.sensor_listen_thread = None
koder aka kdanilov | 1c2b511 | 2015-04-10 16:53:51 +0300 | [diff] [blame] | 47 | |
| 48 | |
def connect_one(node):
    """Open a connection to ``node`` and store it in ``node.connection``.

    Only ``ssh://`` urls are supported; any other ``node.conn_url``
    raises ValueError. Every failure is logged with a traceback and
    re-raised to the caller.
    """
    scheme = "ssh://"
    try:
        if not node.conn_url.startswith(scheme):
            raise ValueError("Unknown url type {0}".format(node.conn_url))

        target = node.conn_url[len(scheme):]
        logger.debug("Try connect to " + target)
        node.connection = ssh_utils.connect(target)
    except Exception:
        logger.exception("During connect to {0}".format(node))
        raise
koder aka kdanilov | 5d589b4 | 2015-03-26 12:25:51 +0200 | [diff] [blame] | 61 | |
| 62 | |
def connect_all(nodes):
    """Connect to every node in ``nodes`` using a pool of 32 threads.

    The first connection error raised by ``connect_one`` propagates to
    the caller.
    """
    logger.info("Connecting to nodes")
    with ThreadPoolExecutor(32) as executor:
        # draining the result iterator is what surfaces worker exceptions
        for _ in executor.map(connect_one, nodes):
            pass
    logger.info("All nodes connected successfully")
koder aka kdanilov | 2c47309 | 2015-03-29 17:12:13 +0300 | [diff] [blame] | 68 | |
| 69 | |
def save_sensors_data(q, mon_q, fd):
    """Thread body: drain sensor records from ``q`` into ``fd``.

    Each record taken from ``q`` is an ``(addr, data)`` pair; ``None``
    stops the loop. The first time an address is seen it is also put
    into ``mon_q``. Errors are logged and end the loop, they are not
    propagated.
    """
    logger.info("Start receiving sensors data")
    fd.write("\n")

    seen_addrs = set()

    try:
        record = q.get()
        while record is not None:
            addr, _ = record

            # announce every source address exactly once
            if addr not in seen_addrs:
                mon_q.put(addr)
                seen_addrs.add(addr)

            line = "{0!s} : {1!r}\n".format(time.time(), repr(record))
            fd.write(line)
            record = q.get()
    except Exception:
        logger.exception("Error in sensors thread")
    logger.info("Sensors thread exits")
| 91 | |
| 92 | |
def test_thread(test, node, barrier, res_q):
    """Thread body: prepare, run and clean up ``test`` on ``node``.

    An exception raised by ``test.pre_run`` or ``test.run`` is logged and
    the exception object is put into ``res_q`` so the waiting side can
    detect the failure. ``test.cleanup`` is always attempted afterwards;
    its errors are only logged.
    """
    try:
        logger.debug("Run preparation for {0}".format(node.conn_url))
        test.pre_run(node.connection)
        logger.debug("Run test for {0}".format(node.conn_url))
        test.run(node.connection, barrier)
    except Exception as exc:
        logger.exception("In test {0} for node {1}".format(test, node))
        res_q.put(exc)

    try:
        test.cleanup(node.connection)
    except Exception:
        # best effort: a failed cleanup must not mask the test outcome
        msg = "During cleanup - in test {0} for node {1}"
        logger.exception(msg.format(test, node))
| 108 | |
koder aka kdanilov | 2c47309 | 2015-03-29 17:12:13 +0300 | [diff] [blame] | 109 | |
def run_tests(test_block, nodes):
    """Run every test of ``test_block`` on all nodes with 'testnode' role.

    Generator. ``test_block`` maps a tool name ("io" or "pgbench") to its
    parameters. For each entry one thread per test node is started, all
    values the tests put into the result queue are collected, and
    ``(name, merged_results)`` is yielded.

    Raises:
        ValueError: no node has the 'testnode' role, or a test thread
            reported an exception.
        KeyError: ``name`` is not a known tool type.
    """
    tool_type_mapper = {
        "io": IOPerfTest,
        "pgbench": PgBenchTest,
    }

    test_nodes = [node for node in nodes if 'testnode' in node.roles]
    test_number_per_type = {}
    res_q = Queue.Queue()

    def gather_results(results):
        # Move everything queued so far into results; an exception object
        # in the queue means some test thread has failed.
        while not res_q.empty():
            val = res_q.get()

            if isinstance(val, Exception):
                msg = "Exception during test execution: {0}"
                raise ValueError(msg.format(val))

            results.append(val)

    for name, params in test_block.items():
        logger.info("Starting {0} tests".format(name))

        if not test_nodes:
            # without nodes no test object exists to merge results with
            msg = "No nodes with 'testnode' role found to run {0} tests"
            raise ValueError(msg.format(name))

        test_num = test_number_per_type.get(name, 0)
        test_number_per_type[name] = test_num + 1
        threads = []
        barrier = utils.Barrier(len(test_nodes))

        for node in test_nodes:
            msg = "Starting {0} test on {1} node"
            logger.debug(msg.format(name, node.conn_url))

            dr = os.path.join(
                cfg_dict['test_log_directory'],
                "{0}_{1}_{2}".format(name, test_num, node.get_ip())
            )

            if not os.path.exists(dr):
                os.makedirs(dr)

            test = tool_type_mapper[name](params, res_q.put, dr,
                                          node=node.get_ip())
            th = threading.Thread(None, test_thread, None,
                                  (test, node, barrier, res_q))
            threads.append(th)
            th.daemon = True
            th.start()

        results = []

        # poll with a timeout so a failure reported by one thread is
        # noticed while the others are still running
        while True:
            for th in threads:
                th.join(1)
                gather_results(results)

            if all(not th.is_alive() for th in threads):
                break

        gather_results(results)

        # the test object created for the last node merges all results
        yield name, test.merge_results(results)
koder aka kdanilov | 2c47309 | 2015-03-29 17:12:13 +0300 | [diff] [blame] | 170 | |
| 171 | |
def log_nodes_statistic(_, ctx):
    """Stage: log the total node count and the node count per role."""
    all_nodes = ctx.nodes
    logger.info("Found {0} nodes total".format(len(all_nodes)))

    role_counts = collections.Counter(
        role for node in all_nodes for role in node.roles)

    for role in sorted(role_counts):
        msg = "Found {0} nodes with role {1}"
        logger.debug(msg.format(role_counts[role], role))
| 182 | |
| 183 | |
def connect_stage(cfg, ctx):
    """Stage: connect to all nodes known to ``ctx``.

    ``disconnect_stage`` is registered as a cleanup call before the
    connections are attempted.
    """
    cleanup_calls = ctx.clear_calls_stack
    cleanup_calls.append(disconnect_stage)
    connect_all(ctx.nodes)
| 187 | |
| 188 | |
def make_undiscover_stage(clean_data):
    """Build a cleanup stage that passes ``clean_data`` to ``undiscover``."""

    def undiscover_stage(cfg, ctx):
        """Cleanup stage: call ``undiscover`` with the captured data."""
        undiscover(clean_data)

    return undiscover_stage
| 193 | |
| 194 | |
def discover_stage(cfg, ctx):
    """Stage: fill ``ctx.nodes`` with discovered and explicit nodes.

    When ``cfg['discover']`` is set it is treated as a comma separated
    list handed to ``discover``; the matching undiscover call is
    registered for cleanup. Every ``url -> roles`` entry of
    ``cfg['explicit_nodes']`` (roles being a comma separated string) is
    added as a ``Node``.
    """
    if cfg.get('discover') is not None:
        discover_objs = [i.strip() for i in cfg['discover'].strip().split(",")]

        nodes, clean_data = discover(ctx, discover_objs,
                                     cfg['clouds'], cfg['var_dir'])
        ctx.clear_calls_stack.append(make_undiscover_stage(clean_data))
        ctx.nodes.extend(nodes)

    for url, roles in cfg.get('explicit_nodes', {}).items():
        # strip each role, as done for the discover list above, so that
        # "a, b" does not produce the unmatched role " b"
        node_roles = [role.strip() for role in roles.split(",")]
        ctx.nodes.append(Node(url, node_roles))
| 206 | |
| 207 | |
def _wait_for_sensors_data(mon_q, nodes_ips, max_wait):
    """Wait until every ip from ``nodes_ips`` showed up in ``mon_q``.

    ``mon_q`` delivers ``(ip, port)`` pairs. Raises RuntimeError when
    some node has not reported within ``max_wait`` seconds in total.
    """
    pending = set(nodes_ips)
    etime = time.time() + max_wait

    msg = "Waiting at most {0}s till all {1} nodes starts report sensors data"
    logger.debug(msg.format(max_wait, len(pending)))

    while pending:
        # Queue.get() rejects a negative timeout with ValueError, so an
        # expired deadline is clamped to a non-blocking check
        tleft = max(etime - time.time(), 0)
        try:
            ip, _ = mon_q.get(True, tleft)
        except Queue.Empty:
            msg = "Node {0} not sending any sensor data in {1}s"
            msg = msg.format(", ".join(pending), max_wait)
            raise RuntimeError(msg)

        if ip in pending:
            pending.remove(ip)
        else:
            # data from a node nobody waits for is reported, not fatal
            logger.warning("Receive sensors from extra node: {0}".format(ip))


def deploy_sensors_stage(cfg_dict, ctx):
    """Stage: start sensors on nodes and a thread storing their data.

    Does nothing without a 'sensors' section in ``cfg_dict`` or when no
    node has a role listed in its ``roles_mapping``. Otherwise it starts
    monitoring, registers ``remove_sensors_stage`` for cleanup, starts a
    daemon thread writing received data to ``cfg_dict['sensor_storage']``
    and waits up to 10 seconds for every monitored node to report.

    Raises:
        ValueError: ``receiver_uri`` contains ``{ip}`` and a single ip
            for it can't be selected.
        RuntimeError: some node sent no sensor data in time.
    """
    if 'sensors' not in cfg_dict:
        return

    cfg = cfg_dict.get('sensors')

    sensors_configs = []
    monitored_nodes = []

    for role, sensors_str in cfg["roles_mapping"].items():
        sensors = [sens.strip() for sens in sensors_str.split(",")]

        collect_cfg = dict((sensor, {}) for sensor in sensors)

        for node in ctx.nodes:
            if role in node.roles:
                monitored_nodes.append(node)
                sens_cfg = SensorConfig(node.connection,
                                        node.get_ip(),
                                        collect_cfg)
                sensors_configs.append(sens_cfg)

    if not monitored_nodes:
        logger.info("Nothing to monitor, no sensors would be installed")
        return

    ctx.receiver_uri = cfg["receiver_uri"]
    nodes_ips = [node.get_ip() for node in monitored_nodes]
    if '{ip}' in ctx.receiver_uri:
        # presumably the local address used to reach each node -
        # verify against utils.get_ip_for_target
        ips = set(map(utils.get_ip_for_target, nodes_ips))

        if len(ips) > 1:
            raise ValueError("Can't select external ip for sensors server")

        if len(ips) == 0:
            raise ValueError("Can't find any external ip for sensors server")

        ext_ip = list(ips)[0]
        ctx.receiver_uri = ctx.receiver_uri.format(ip=ext_ip)

    # cleanup is registered first; remove_sensors_stage skips whatever
    # was not set up yet
    ctx.clear_calls_stack.append(remove_sensors_stage)
    ctx.sensor_cm = start_monitoring(ctx.receiver_uri, sensors_configs)

    ctx.sensors_control_queue = ctx.sensor_cm.__enter__()

    mon_q = Queue.Queue()

    fd = open(cfg_dict['sensor_storage'], "w")
    th = threading.Thread(None, save_sensors_data, None,
                          (ctx.sensors_control_queue, mon_q, fd))
    th.daemon = True
    th.start()
    ctx.sensor_listen_thread = th

    MAX_WAIT_FOR_SENSORS = 10

    # wait till all nodes start sending data
    _wait_for_sensors_data(mon_q, nodes_ips, MAX_WAIT_FOR_SENSORS)
| 284 | |
koder aka kdanilov | da45e88 | 2015-04-06 02:24:42 +0300 | [diff] [blame] | 285 | |
def remove_sensors_stage(cfg, ctx):
    """Cleanup stage: stop monitoring and the sensors listener thread.

    Each step is skipped when the matching ``ctx`` attribute is None:
    leave the monitoring context manager, put the ``None`` stop marker
    into the control queue, then join the listener thread.
    """
    monitoring = ctx.sensor_cm
    if monitoring is not None:
        monitoring.__exit__(None, None, None)

    control_queue = ctx.sensors_control_queue
    if control_queue is not None:
        control_queue.put(None)

    listener = ctx.sensor_listen_thread
    if listener is not None:
        listener.join()
koder aka kdanilov | da45e88 | 2015-04-06 02:24:42 +0300 | [diff] [blame] | 295 | |
| 296 | |
def get_os_credentials(cfg, ctx, creds_type):
    """Return openstack credentials selected by ``creds_type``.

    * ``'clouds'`` - take them from ``cfg['clouds']['openstack']`` or,
      when only a fuel section with 'openstack_env' is present, from
      ``ctx.fuel_openstack_creds``.
    * ``'ENV'`` - ask ``start_vms.ostack_get_creds()``.

    Returns a dict with 'name', 'passwd', 'tenant' and 'auth_url' keys
    (for the fuel case whatever ``ctx.fuel_openstack_creds`` holds).

    Raises:
        ValueError: unsupported ``creds_type`` or no usable section in
            ``cfg['clouds']``.
        NotImplementedError: ``creds_type`` is a path to an existing file.
    """
    if creds_type == 'clouds':
        clouds = cfg['clouds']

        if 'openstack' in clouds:
            os_cfg = clouds['openstack']

            tenant = os_cfg['OS_TENANT_NAME'].strip()
            user = os_cfg['OS_USERNAME'].strip()
            passwd = os_cfg['OS_PASSWORD'].strip()
            auth_url = os_cfg['OS_AUTH_URL'].strip()
        elif 'fuel' in clouds and 'openstack_env' in clouds['fuel']:
            return ctx.fuel_openstack_creds
        else:
            # previously this fell through to unbound local variables
            msg = "No openstack credentials found in 'clouds' config section"
            raise ValueError(msg)

    elif creds_type == 'ENV':
        user, passwd, tenant, auth_url = start_vms.ostack_get_creds()
    elif os.path.isfile(creds_type):
        # loading credentials from a file is not supported yet
        raise NotImplementedError()
    else:
        msg = "Creds {0!r} isn't supported".format(creds_type)
        raise ValueError(msg)

    return {'name': user,
            'passwd': passwd,
            'tenant': tenant,
            'auth_url': auth_url}
koder aka kdanilov | 4e9f3ed | 2015-04-14 11:26:12 +0300 | [diff] [blame] | 329 | |
koder aka kdanilov | 1c2b511 | 2015-04-10 16:53:51 +0300 | [diff] [blame] | 330 | |
def _run_tests_on_new_vms(cfg, ctx, config):
    """Start test VMs described by ``config``, run its tests, remove VMs.

    The VMs are removed afterwards unless ``ctx.keep_vm`` is set.
    """
    params = config['vm_params'].copy()

    os_creds_type = config['creds']
    os_creds = get_os_credentials(cfg, ctx, os_creds_type)

    start_vms.nova_connect(**os_creds)

    logger.info("Preparing openstack")
    start_vms.prepare_os_subpr(**os_creds)

    new_nodes = []
    os_nodes_ids = []

    # Publish the list before launching: if launching fails half way the
    # cleanup below still sees (and removes) the VMs already started.
    ctx.openstack_nodes_ids = os_nodes_ids

    try:
        params['group_name'] = cfg_dict['run_uuid']
        for new_node, node_id in start_vms.launch_vms(params):
            new_node.roles.append('testnode')
            ctx.nodes.append(new_node)
            os_nodes_ids.append(node_id)
            new_nodes.append(new_node)

        store_nodes_in_log(cfg, os_nodes_ids)

        connect_all(new_nodes)

        # deploy sensors on new nodes
        # unify this code
        if 'sensors' in cfg:
            sens_cfg = []
            sensors_str = cfg["sensors"]["roles_mapping"]['testnode']
            sensors = [sens.strip() for sens in sensors_str.split(",")]

            collect_cfg = dict((sensor, {}) for sensor in sensors)
            for node in new_nodes:
                sens_cfg.append((node.connection, collect_cfg))

            uri = cfg["sensors"]["receiver_uri"]
            logger.debug("Installing sensors on vm's")
            deploy_and_start_sensors(uri, None,
                                     connected_config=sens_cfg)

        for test_group in config.get('tests', []):
            ctx.results.extend(run_tests(test_group, ctx.nodes))

    finally:
        if not ctx.keep_vm:
            shut_down_vms_stage(cfg, ctx)


def run_tests_stage(cfg, ctx):
    """Stage: run all test groups from ``cfg['tests']``.

    Results are collected in ``ctx.results`` as ``(name, data)`` pairs.
    Every group is a one-item mapping: a 'start_test_nodes' group starts
    VMs and runs its nested tests on them, any other group is run on the
    already known nodes.
    """
    ctx.results = []

    if 'tests' not in cfg:
        return

    for group in cfg['tests']:
        group_items = list(group.items())
        assert len(group_items) == 1
        key, config = group_items[0]

        if 'start_test_nodes' == key:
            _run_tests_on_new_vms(cfg, ctx, config)
        else:
            ctx.results.extend(run_tests(group, ctx.nodes))
koder aka kdanilov | da45e88 | 2015-04-06 02:24:42 +0300 | [diff] [blame] | 393 | |
gstepanov | 023c1e4 | 2015-04-08 15:50:19 +0300 | [diff] [blame] | 394 | |
def shut_down_vms_stage(cfg, ctx):
    """Stage: remove the VMs started for the tests.

    Ids come from ``ctx.openstack_nodes_ids``; only when that is None are
    they read from the ids file ``cfg_dict['vm_ids_fname']``. The ids
    file is deleted afterwards.
    """
    vm_ids_fname = cfg_dict['vm_ids_fname']

    # NOTE(review): Context() initialises openstack_nodes_ids to [], so
    # the file is consulted only if a caller resets the attribute to None.
    if ctx.openstack_nodes_ids is None:
        if os.path.exists(vm_ids_fname):
            with open(vm_ids_fname) as fd:
                nodes_ids = fd.read().split()
        else:
            # nothing recorded, so nothing to remove
            nodes_ids = []
    else:
        nodes_ids = ctx.openstack_nodes_ids

    if len(nodes_ids) != 0:
        logger.info("Removing nodes")
        start_vms.clear_nodes(nodes_ids)
        logger.info("Nodes has been removed")

    if os.path.exists(vm_ids_fname):
        os.remove(vm_ids_fname)
gstepanov | 023c1e4 | 2015-04-08 15:50:19 +0300 | [diff] [blame] | 409 | |
koder aka kdanilov | 66839a9 | 2015-04-11 13:22:31 +0300 | [diff] [blame] | 410 | |
def store_nodes_in_log(cfg, nodes_ids):
    """Write ``nodes_ids``, one per line, to ``cfg['vm_ids_fname']``.

    An existing file is overwritten.
    """
    ids_path = cfg['vm_ids_fname']
    with open(ids_path, 'w') as ids_file:
        text = "\n".join(nodes_ids)
        ids_file.write(text)
gstepanov | 023c1e4 | 2015-04-08 15:50:19 +0300 | [diff] [blame] | 414 | |
| 415 | |
def clear_enviroment(cfg, ctx):
    """Stage: remove VMs left behind, if a VM ids file exists."""
    ids_file_present = os.path.exists(cfg_dict['vm_ids_fname'])
    if not ids_file_present:
        return

    shut_down_vms_stage(cfg, ctx)
gstepanov | 023c1e4 | 2015-04-08 15:50:19 +0300 | [diff] [blame] | 419 | |
| 420 | |
def disconnect_stage(cfg, ctx):
    """Cleanup stage: close all ssh sessions and node connections."""
    ssh_utils.close_all_sessions()

    # nodes that never got connected keep connection set to None
    live_connections = (node.connection for node in ctx.nodes
                        if node.connection is not None)
    for connection in live_connections:
        connection.close()
| 427 | |
| 428 | |
def yamable(data):
    """Return a copy of ``data`` built from plain, yaml-friendly types.

    Tuples and lists become lists, dicts are rebuilt with converted keys
    and values, unicode strings are converted with ``str()``. Anything
    else is returned unchanged.
    """
    if isinstance(data, (tuple, list)):
        return [yamable(item) for item in data]

    if isinstance(data, dict):
        return dict((yamable(key), yamable(val)) for key, val in data.items())

    try:
        text_type = unicode
    except NameError:
        # interpreter without a separate unicode type: nothing to convert
        return data

    if isinstance(data, text_type):
        try:
            return str(data)
        except UnicodeEncodeError:
            # non-ASCII text has no implicit byte-string form; keep it
            # as is instead of failing the whole conversion
            return data

    return data
| 443 | |
| 444 | |
def store_raw_results_stage(cfg, ctx):
    """Stage: append ``ctx.results`` to raw_results.yaml in the var dir.

    Results already stored in the file are kept; the file is rewritten
    with the old and the new results together.
    """
    raw_results = os.path.join(cfg_dict['var_dir'], 'raw_results.yaml')

    cont = []
    if os.path.exists(raw_results):
        # NOTE(review): yaml.load can construct arbitrary python objects;
        # acceptable only while this file is written by this tool alone.
        with open(raw_results) as fd:
            # an empty file is parsed to None - treat it as "no results"
            cont = yaml.load(fd.read()) or []

    cont.extend(yamable(ctx.results))
    raw_data = pretty_yaml.dumps(cont)

    with open(raw_results, "w") as fd:
        fd.write(raw_data)
| 459 | |
| 460 | |
def console_report_stage(cfg, ctx):
    """Stage: print the console report for every non-empty 'io' result."""
    for test_type, payload in ctx.results:
        if test_type != 'io' or payload is None:
            continue

        print(IOPerfTest.format_for_console(payload))
koder aka kdanilov | 66839a9 | 2015-04-11 13:22:31 +0300 | [diff] [blame] | 465 | |
| 466 | |
def report_stage(cfg, ctx):
    """Stage: write the html and the text reports for ``ctx.results``.

    The html report goes to ``cfg['html_report_file']``; the fuel url and
    credentials are passed to the report builder when present in
    ``cfg['clouds']['fuel']``, otherwise None. The text report
    (``cfg_dict['text_report_file']``) holds the console form of every
    non-empty 'io' result.
    """
    html_rep_fname = cfg['html_report_file']

    def fuel_setting(key):
        # any missing level of the config means "not configured"
        try:
            return cfg['clouds']['fuel'][key]
        except KeyError:
            return None

    fuel_url = fuel_setting('url')
    creds = fuel_setting('creds')

    report.make_io_report(ctx.results, html_rep_fname, fuel_url, creds=creds)

    logger.info("Html report were stored in " + html_rep_fname)

    text_rep_fname = cfg_dict['text_report_file']
    with open(text_rep_fname, "w") as text_report:
        for test_type, payload in ctx.results:
            if 'io' == test_type and payload is not None:
                text_report.write(IOPerfTest.format_for_console(payload))
                text_report.write("\n")
                text_report.flush()

    logger.info("Text report were stored in " + text_rep_fname)
koder aka kdanilov | da45e88 | 2015-04-06 02:24:42 +0300 | [diff] [blame] | 493 | |
| 494 | |
def complete_log_nodes_statistic(cfg, ctx):
    """Stage: log the string form of every node at debug level."""
    for known_node in ctx.nodes:
        description = str(known_node)
        logger.debug(description)
| 499 | |
| 500 | |
def load_data_from(var_dir):
    """Build a stage loading results of a previous run from ``var_dir``.

    The returned stage reads ``raw_results.yaml`` from ``var_dir`` and
    stores the parsed content in ``ctx.results``.
    """
    def load_data_from_file(cfg, ctx):
        raw_results = os.path.join(var_dir, 'raw_results.yaml')
        # NOTE(review): yaml.load can construct arbitrary python objects;
        # only point this at result files produced by this tool.
        with open(raw_results) as fd:
            ctx.results = yaml.load(fd.read())
    return load_data_from_file
gstepanov | cd256d6 | 2015-04-07 17:47:32 +0300 | [diff] [blame] | 506 | |
| 507 | |
def parse_args(argv):
    """Parse the command line.

    ``argv`` is the full argument vector; its first item (the program
    name) is skipped. Returns the ``argparse`` namespace with
    ``extra_logs``, ``build_description``, ``build_id``, ``build_type``,
    ``username``, ``post_process_only``, ``keep_vm`` and ``config_file``.
    """
    descr = "Disk io performance test suite"
    parser = argparse.ArgumentParser(prog='wally', description=descr)

    parser.add_argument("-l", dest='extra_logs',
                        action='store_true', default=False,
                        help="print some extra log info")
    parser.add_argument("-b", '--build_description',
                        type=str, default="Build info")
    parser.add_argument("-i", '--build_id', type=str, default="id")
    parser.add_argument("-t", '--build_type', type=str, default="GA")
    parser.add_argument("-u", '--username', type=str, default="admin")
    parser.add_argument("-p", '--post-process-only', metavar="VAR_DIR",
                        help="Only process data from previous run")
    parser.add_argument("-k", '--keep-vm', action='store_true',
                        help="Don't remove test vm's", default=False)
    parser.add_argument("config_file")

    return parser.parse_args(argv[1:])
| 527 | |
| 528 | |
def main(argv):
    """Entry point: run all stages selected by the command line.

    With ``--post-process-only`` only stored results are loaded and
    reported; otherwise the full discover / connect / sensors / tests /
    report pipeline runs. Cleanup calls registered in
    ``ctx.clear_calls_stack`` always run afterwards, in reverse order;
    their own failures are logged and do not stop the remaining cleanup.

    Returns 0 on success. An exception raised by a stage is logged and
    re-raised after the cleanup has finished.
    """
    opts = parse_args(argv)

    if opts.post_process_only is not None:
        stages = [
            load_data_from(opts.post_process_only),
            console_report_stage,
            report_stage
        ]
    else:
        stages = [
            discover_stage,
            log_nodes_statistic,
            connect_stage,
            deploy_sensors_stage,
            run_tests_stage,
            store_raw_results_stage,
            console_report_stage,
            report_stage
        ]

    load_config(opts.config_file, opts.post_process_only)

    if cfg_dict.get('logging', {}).get("extra_logs", False) or opts.extra_logs:
        level = logging.DEBUG
    else:
        level = logging.WARNING

    setup_loggers(level, cfg_dict['log_file'])

    logger.info("All info would be stored into {0}".format(
        cfg_dict['var_dir']))

    ctx = Context()
    ctx.build_meta['build_id'] = opts.build_id
    ctx.build_meta['build_descrption'] = opts.build_description
    ctx.build_meta['build_type'] = opts.build_type
    ctx.build_meta['username'] = opts.username
    ctx.keep_vm = opts.keep_vm

    try:
        try:
            for stage in stages:
                logger.info("Start {0.__name__} stage".format(stage))
                stage(cfg_dict, ctx)
        except Exception as exc:
            msg = "Exception during current stage: {0}".format(exc)
            logger.error(msg)
            # re-raise from inside the handler so the original traceback
            # survives; the cleanup below runs before it propagates
            raise
    finally:
        for stage in ctx.clear_calls_stack[::-1]:
            try:
                logger.info("Start {0.__name__} stage".format(stage))
                stage(cfg_dict, ctx)
            except Exception:
                # a broken cleanup stage must not prevent the others
                logger.exception("During {0.__name__} stage".format(stage))

    logger.info("All info stored into {0}".format(cfg_dict['var_dir']))
    return 0