blob: 53224323a59a284309e80e1e22243897c7f1d64f [file] [log] [blame]
koder aka kdanilovcff7b2e2015-04-18 20:48:15 +03001from __future__ import print_function
2
gstepanov023c1e42015-04-08 15:50:19 +03003import os
koder aka kdanilov7acd6bd2015-02-12 14:28:30 -08004import sys
koder aka kdanilov57ce4db2015-04-25 21:25:51 +03005import time
koder aka kdanilov2c473092015-03-29 17:12:13 +03006import Queue
koder aka kdanilov7acd6bd2015-02-12 14:28:30 -08007import pprint
koder aka kdanilov416b87a2015-05-12 00:26:04 +03008import signal
koder aka kdanilove21d7472015-02-14 19:02:04 -08009import logging
koder aka kdanilov7acd6bd2015-02-12 14:28:30 -080010import argparse
koder aka kdanilov168f6092015-04-19 02:33:38 +030011import functools
koder aka kdanilov2c473092015-03-29 17:12:13 +030012import threading
koder aka kdanilov7306c642015-04-23 15:29:45 +030013import subprocess
koder aka kdanilovd5ed4da2015-05-07 23:33:23 +030014import contextlib
koder aka kdanilov2c473092015-03-29 17:12:13 +030015import collections
koder aka kdanilov7acd6bd2015-02-12 14:28:30 -080016
koder aka kdanilov66839a92015-04-11 13:22:31 +030017import yaml
koder aka kdanilov416b87a2015-05-12 00:26:04 +030018import faulthandler
koder aka kdanilov2c473092015-03-29 17:12:13 +030019from concurrent.futures import ThreadPoolExecutor
koder aka kdanilov6c491062015-04-09 22:33:13 +030020
koder aka kdanilovcff7b2e2015-04-18 20:48:15 +030021from wally import pretty_yaml
koder aka kdanilovf86d7af2015-05-06 04:01:54 +030022from wally.hw_info import get_hw_info
23from wally.discover import discover, Node
koder aka kdanilov63ad2062015-04-27 13:11:40 +030024from wally.timeseries import SensorDatastore
koder aka kdanilovcff7b2e2015-04-18 20:48:15 +030025from wally import utils, report, ssh_utils, start_vms
koder aka kdanilovcff7b2e2015-04-18 20:48:15 +030026from wally.config import cfg_dict, load_config, setup_loggers
koder aka kdanilov416b87a2015-05-12 00:26:04 +030027from wally.suits.itest import IOPerfTest, PgBenchTest, MysqlTest
28from wally.sensors_utils import deploy_sensors_stage, gather_sensors_stage
koder aka kdanilov63ad2062015-04-27 13:11:40 +030029
koder aka kdanilov57ce4db2015-04-25 21:25:51 +030030
31try:
32 from wally import webui
33except ImportError:
34 webui = None
koder aka kdanilov2c473092015-03-29 17:12:13 +030035
36
koder aka kdanilovcff7b2e2015-04-18 20:48:15 +030037logger = logging.getLogger("wally")
koder aka kdanilovcee43342015-04-14 22:52:53 +030038
koder aka kdanilov7acd6bd2015-02-12 14:28:30 -080039
def format_result(res, formatter):
    """Render a result as a raw dump followed by its formatted summary.

    The raw dump is the pretty-printed ``res`` framed by two 80-character
    "=" rules; it is followed by a "====>" line carrying ``formatter(res)``
    and a closing rule.
    """
    rule = "=" * 80
    # Leading/trailing empty items produce the newlines around the frame.
    raw_dump = "\n".join(["", rule, pprint.pformat(res), rule, ""])
    summary = formatter(res)
    return "{0}\n\n====> {1}\n\n{2}\n\n".format(raw_dump, summary, rule)
koder aka kdanilove21d7472015-02-14 19:02:04 -080046
47
class Context(object):
    """Mutable state handed to every stage function as ``ctx``."""

    def __init__(self):
        # Nodes taking part in the run; stages append to and filter it.
        self.nodes = []
        # Per-node hardware info, filled by collect_hw_info_stage.
        self.hw_info = []
        # Ids of VMs spawned during the run.
        self.openstack_nodes_ids = []
        # Stage functions registered by other stages (e.g. connect_stage
        # registers disconnect_stage here).
        self.clear_calls_stack = []
        # Build description values taken from the command line.
        self.build_meta = {}
        self.sensors_mon_q = None
koder aka kdanilov1c2b5112015-04-10 16:53:51 +030056
57
def connect_one(node, vm=False):
    """Open a connection to ``node`` and store it in ``node.connection``.

    'local' urls are connected directly. "ssh://" urls are connected with
    a 240 second timeout when ``vm`` is true and 30 seconds otherwise.
    Any failure (including an unknown url scheme) is logged and leaves
    ``node.connection`` set to None instead of raising.
    """
    if node.conn_url == 'local':
        node.connection = ssh_utils.connect(node.conn_url)
        return

    scheme = "ssh://"
    try:
        if not node.conn_url.startswith(scheme):
            raise ValueError("Unknown url type {0}".format(node.conn_url))

        address = node.conn_url[len(scheme):]
        conn_timeout = 240 if vm else 30
        node.connection = ssh_utils.connect(address,
                                            conn_timeout=conn_timeout)
    except Exception as exc:
        # logger.exception("During connect to " + node.get_conn_id())
        logger.error("During connect to {0}: {1!s}".format(
            node.get_conn_id(), exc))
        node.connection = None
koder aka kdanilov5d589b42015-03-26 12:25:51 +020083
84
def connect_all(nodes, vm=False):
    """Connect to every node in ``nodes`` using a pool of 32 threads.

    ``vm`` is forwarded to connect_one for each node.
    """
    logger.info("Connecting to nodes")
    connector = functools.partial(connect_one, vm=vm)
    with ThreadPoolExecutor(32) as pool:
        # Drain the iterator so every connection attempt has finished
        # (and any worker exception has surfaced) before returning.
        for _ in pool.map(connector, nodes):
            pass
koder aka kdanilov2c473092015-03-29 17:12:13 +030090
91
def collect_hw_info_stage(cfg, ctx):
    """Collect hardware info from all nodes and write the hw report.

    Does nothing when the report file named by cfg['hwreport_fname']
    already exists. Otherwise get_hw_info is run for every node
    connection (32 worker threads), the results are appended to
    ctx.hw_info, a text report is written, and the raw data of each node
    with a known hostname is stored as "<hostname>_lshw.xml".
    """
    report_path = cfg['hwreport_fname']
    if os.path.exists(report_path):
        logger.info("{0} already exists. Skip hw info".format(report_path))
        return

    with ThreadPoolExecutor(32) as pool:
        ctx.hw_info.extend(
            pool.map(get_hw_info, (node.connection for node in ctx.nodes)))

    rule = "-" * 60
    with open(report_path, 'w') as report_fd:
        for node, hw in zip(ctx.nodes, ctx.hw_info):
            report_fd.write(rule + "\n")
            report_fd.write("Roles : " + ", ".join(node.roles) + "\n")
            report_fd.write(str(hw) + "\n")
            report_fd.write(rule + "\n\n")

            if hw.hostname is None:
                continue

            raw_path = os.path.join(cfg_dict['hwinfo_directory'],
                                    hw.hostname + "_lshw.xml")
            with open(raw_path, "w") as raw_fd:
                raw_fd.write(hw.raw)

    logger.info("Hardware report stored in " + report_path)
    logger.debug("Raw hardware info in " + cfg['hwinfo_directory'] + " folder")
118
119
def test_thread(test, node, barrier, res_q):
    """Thread body: prepare, run and clean up one test on one node.

    A failure of pre_run()/run() is converted to utils.StopTestError
    (unless it already is one) and put on ``res_q`` after cleanup() has
    been attempted. A StopTestError raised by cleanup() is reported only
    when the run itself did not fail; any other cleanup error is logged
    and otherwise ignored.
    """
    # The failure is kept in its own variable: the name bound by
    # "except ... as" must not be relied upon after the handler ends
    # (Python 3 deletes it).
    failure = None
    try:
        logger.debug("Run preparation for {0}".format(node.get_conn_id()))
        test.pre_run()
        logger.debug("Run test for {0}".format(node.get_conn_id()))
        test.run(barrier)
    except utils.StopTestError as exc:
        failure = exc
    except Exception as exc:
        msg = "In test {0} for node {1}"
        msg = msg.format(test, node.get_conn_id())
        logger.exception(msg)
        failure = utils.StopTestError(msg, exc)

    try:
        test.cleanup()
    except utils.StopTestError as exc:
        if failure is None:
            failure = exc
    except Exception:
        # Best effort: a broken cleanup must not hide the test outcome.
        msg = "Duringf cleanup - in test {0} for node {1}"
        logger.exception(msg.format(test, node))

    if failure is not None:
        res_q.put(failure)
koder aka kdanilov2c473092015-03-29 17:12:13 +0300146
koder aka kdanilov4d4771c2015-04-23 01:32:02 +0300147
def run_single_test(test_nodes, name, test_cls, params,
                    test_local_folder, run_uuid, counter=[0]):
    """Run one test type on all ``test_nodes`` in parallel.

    One test_cls instance and one daemon thread are created per node,
    plus one thread running test_cls.coordination_th. Values the tests
    report through their on_result_cb are collected and finally combined
    with test_cls.merge_results().

    ``counter`` is a deliberately shared mutable default: counter[0] is
    bumped for every node so each per-node log directory name is unique
    across calls.

    Raises utils.StopTestError when a test thread reports one, and
    ValueError when any other exception object arrives on the result
    queue.
    """
    logger.info("Starting {0} tests".format(name))
    res_q = Queue.Queue()
    threads = []
    coord_q = Queue.Queue()
    rem_folder = test_local_folder.format(name=name)

    barrier = utils.Barrier(len(test_nodes))
    for idx, node in enumerate(test_nodes):
        msg = "Starting {0} test on {1} node"
        logger.debug(msg.format(name, node.conn_url))

        dname = "{0}_{1}_{2}".format(name, counter[0], node.get_ip())
        counter[0] += 1
        dr = os.path.join(cfg_dict['test_log_directory'], dname)

        if not os.path.exists(dr):
            os.makedirs(dr)

        # Each test gets its own copy of the options.
        params = params.copy()
        params['testnodes_count'] = len(test_nodes)
        test = test_cls(options=params,
                        is_primary=(idx == 0),
                        on_result_cb=res_q.put,
                        test_uuid=run_uuid,
                        node=node,
                        remote_dir=rem_folder,
                        log_directory=dr,
                        coordination_queue=coord_q)
        th = threading.Thread(None, test_thread, None,
                              (test, node, barrier, res_q))
        threads.append(th)
        th.daemon = True
        th.start()

    th = threading.Thread(None, test_cls.coordination_th, None,
                          (coord_q, barrier, len(threads)))
    threads.append(th)
    th.daemon = True
    th.start()

    results = []
    coord_q.put(None)

    # Seconds to sleep between polls; without it this loop spins at full
    # speed and competes with the worker threads for CPU.
    poll_interval = 0.1

    while len(threads) != 0:
        still_running = []

        for th in threads:
            if th.is_alive():
                still_running.append(th)
            else:
                th.join()

        threads = still_running

        # Drain after the liveness check so that values queued by a
        # thread just before it exited are not lost.
        while not res_q.empty():
            val = res_q.get()

            if isinstance(val, utils.StopTestError):
                raise val

            if isinstance(val, Exception):
                msg = "Exception during test execution: {0!s}"
                raise ValueError(msg.format(val))

            results.append(val)

        if len(threads) != 0:
            time.sleep(poll_interval)

    results = test_cls.merge_results(results)
    return results
218
219
def run_tests(cfg, test_block, nodes):
    """Generator: run every test of ``test_block`` on the test nodes.

    For each (name, params) item the test is run once per entry of
    params['node_limit'] (a single number, a list, or absent meaning all
    test nodes; the value 'all' also selects all test nodes). Unless
    cfg['suspend_unused_vms'] is false, test nodes left out of the
    current run are paused for its duration. Yields (name, results)
    where results is the list of run_single_test return values.
    """
    tool_type_mapper = {
        "io": IOPerfTest,
        "pgbench": PgBenchTest,
        "mysql": MysqlTest,
    }

    test_nodes = [node for node in nodes if 'testnode' in node.roles]
    if not test_nodes:
        logger.error("No test nodes found")
        return

    for name, params in test_block.items():
        results = []

        limit = params.get('node_limit')
        if limit is None:
            vm_limits = [len(test_nodes)]
        elif isinstance(limit, (int, long)):
            vm_limits = [limit]
        else:
            vm_limits = limit

        for vm_count in vm_limits:
            if vm_count == 'all':
                curr_test_nodes, unused_nodes = test_nodes, []
            else:
                curr_test_nodes = test_nodes[:vm_count]
                unused_nodes = test_nodes[vm_count:]

            if not curr_test_nodes:
                continue

            if cfg.get('suspend_unused_vms', True):
                pausable_nodes_ids = [node.os_vm_id for node in unused_nodes
                                      if node.os_vm_id is not None]
                non_pausable = len(unused_nodes) - len(pausable_nodes_ids)

                if non_pausable != 0:
                    logger.warning(
                        "Can't pause {0} nodes".format(non_pausable))

                if pausable_nodes_ids:
                    logger.debug("Try to pause {0} unused nodes".format(
                        len(pausable_nodes_ids)))
                    start_vms.pause(pausable_nodes_ids)

            # Nodes about to be used may still be paused from an earlier
            # iteration.
            resumable_nodes_ids = [node.os_vm_id for node in curr_test_nodes
                                   if node.os_vm_id is not None]

            if resumable_nodes_ids:
                logger.debug("Check and unpause {0} nodes".format(
                    len(resumable_nodes_ids)))
                start_vms.unpause(resumable_nodes_ids)

            test_cls = tool_type_mapper[name]
            try:
                res = run_single_test(curr_test_nodes, name, test_cls,
                                      params,
                                      cfg['default_test_local_folder'],
                                      cfg['run_uuid'])
            finally:
                # Always bring paused nodes back, even if the test failed.
                if cfg.get('suspend_unused_vms', True):
                    if len(pausable_nodes_ids) != 0:
                        logger.debug("Unpausing {0} nodes".format(
                            len(pausable_nodes_ids)))
                        start_vms.unpause(pausable_nodes_ids)

            results.append(res)

        yield name, results
koder aka kdanilov2c473092015-03-29 17:12:13 +0300292
293
def log_nodes_statistic(_, ctx):
    """Log the total node count and the number of nodes per role."""
    nodes = ctx.nodes
    logger.info("Found {0} nodes total".format(len(nodes)))

    role_counts = collections.Counter(
        role for node in nodes for role in node.roles)

    for role, count in sorted(role_counts.items()):
        logger.debug("Found {0} nodes with role {1}".format(count, role))
304
305
def connect_stage(cfg, ctx):
    """Connect to all nodes and drop those that are unreachable.

    Registers disconnect_stage in ctx.clear_calls_stack first. An
    unreachable node with the 'testnode' role aborts the run with
    utils.StopTestError; other unreachable nodes are only warned about
    and removed from ctx.nodes.
    """
    ctx.clear_calls_stack.append(disconnect_stage)
    connect_all(ctx.nodes)

    excluded = 0
    for node in ctx.nodes:
        if node.connection is not None:
            continue

        if 'testnode' in node.roles:
            msg = "Can't connect to testnode {0}".format(node.get_conn_id())
            logger.error(msg)
            raise utils.StopTestError(msg)

        logger.warning("Node {0} would be excluded - can't connect".format(
            node.get_conn_id()))
        excluded += 1

    if excluded == 0:
        logger.info("All nodes connected successfully")

    ctx.nodes = [node for node in ctx.nodes if node.connection is not None]
koder aka kdanilovcff7b2e2015-04-18 20:48:15 +0300329
330
def discover_stage(cfg, ctx):
    """Fill ctx.nodes from discovery and from explicitly listed nodes.

    cfg['discover'], when present, is a comma separated list passed to
    discover(). cfg['explicit_nodes'], when present, maps a connection
    url to a comma separated role list.
    """
    discover_spec = cfg.get('discover')
    if discover_spec is not None:
        targets = [item.strip() for item in discover_spec.strip().split(",")]
        found = discover(ctx,
                         targets,
                         cfg['clouds'],
                         cfg['var_dir'],
                         not cfg['dont_discover_nodes'])
        ctx.nodes.extend(found)

    explicit_nodes = cfg.get('explicit_nodes', {})
    for url, roles in explicit_nodes.items():
        ctx.nodes.append(Node(url, roles.split(",")))
345
346
def save_nodes_stage(cfg, ctx):
    """Write a url -> roles mapping to cfg['nodes_report_file'].

    The 'testnode' role is left out; nodes with no other role are not
    listed at all.
    """
    cluster = {}
    for node in ctx.nodes:
        other_roles = node.roles[:]
        try:
            other_roles.remove('testnode')
        except ValueError:
            # Node is not a test node - nothing to strip.
            pass

        if other_roles:
            cluster[node.conn_url] = other_roles

    with open(cfg['nodes_report_file'], "w") as report_fd:
        report_fd.write(pretty_yaml.dumps(cluster))
359
360
def reuse_vms_stage(cfg, ctx):
    """Add already running openstack VMs to ctx.nodes as test nodes.

    Each entry of cfg['clouds']['openstack']['vms'] is a
    "name_pattern,connection_pattern" string; the connection pattern is
    formatted with the ip of every VM found for the name pattern.
    Lookup failures are re-raised as utils.StopTestError.
    """
    vm_specs = cfg.get('clouds', {}).get('openstack', {}).get('vms', [])

    for spec in vm_specs:
        vm_name_pattern, conn_pattern = spec.split(",")
        try:
            logger.debug(
                "Looking for vm with name like {0}".format(vm_name_pattern))

            # Credentials are only looked up for the first connection.
            if start_vms.is_connected():
                os_creds = {}
            else:
                os_creds = get_OS_credentials(cfg, ctx)

            conn = start_vms.nova_connect(**os_creds)
            for ip, vm_id in start_vms.find_vms(conn, vm_name_pattern):
                found = Node(conn_pattern.format(ip=ip), ['testnode'])
                found.os_vm_id = vm_id
                ctx.nodes.append(found)
        except utils.StopTestError:
            raise
        except Exception as exc:
            msg = "Vm like {0} lookup failed".format(vm_name_pattern)
            logger.exception(msg)
            raise utils.StopTestError(msg, exc)
388
koder aka kdanilov416b87a2015-05-12 00:26:04 +0300389
def get_creds_openrc(path):
    """Extract openstack credentials from an openrc shell file.

    The file content is fed to /bin/bash followed by an echo of
    "$OS_TENANT_NAME:$OS_USERNAME:$OS_PASSWORD@$OS_AUTH_URL", and the
    echoed line is parsed back.

    Returns a (user, passwd, tenant, auth_url) tuple.
    Raises utils.StopTestError if bash fails or the output can't be
    parsed.
    """
    with open(path) as openrc_fd:
        fc = openrc_fd.read()

    echo = 'echo "$OS_TENANT_NAME:$OS_USERNAME:$OS_PASSWORD@$OS_AUTH_URL"'

    try:
        data = utils.run_locally(['/bin/bash'],
                                 input_data=fc + "\n" + echo)
    except subprocess.CalledProcessError as exc:
        # No output is available on this path, so report the file name.
        msg = "Failed to get creads from openrc file: " + path
        logger.exception(msg)
        raise utils.StopTestError(msg, exc)

    try:
        data = data.strip()
        # Field order must match the echo above: tenant first, then user.
        tenant, user, passwd_auth_url = data.split(':', 2)
        # The url never contains "@", the password might - split from
        # the right.
        passwd, auth_url = passwd_auth_url.rsplit("@", 1)
        if not auth_url.startswith(("https://", "http://")):
            raise ValueError("Unexpected auth url " + auth_url)
    except Exception as exc:
        # NOTE(review): ``data`` contains the password, so it ends up in
        # the log - consider masking it.
        msg = "Failed to get creads from openrc file: " + data
        logger.exception(msg)
        raise utils.StopTestError(msg, exc)
    return user, passwd, tenant, auth_url
koder aka kdanilovf86d7af2015-05-06 04:01:54 +0300414
415
def get_OS_credentials(cfg, ctx):
    """Return openstack credentials as a dict.

    Sources, in order of precedence: the 'openstack' cloud block (an
    OPENRC file, the shell environment when 'ENV' is set, or the OS_*
    values written in the block), then ctx.fuel_openstack_creds when a
    fuel block with 'openstack_env' is configured.

    Raises utils.StopTestError when neither source is configured.
    """
    creds = None
    clouds = cfg['clouds']

    if 'openstack' in clouds:
        os_cfg = clouds['openstack']
        if 'OPENRC' in os_cfg:
            logger.info("Using OS credentials from " + os_cfg['OPENRC'])
            user, passwd, tenant, auth_url = \
                get_creds_openrc(os_cfg['OPENRC'])
        elif 'ENV' in os_cfg:
            logger.info("Using OS credentials from shell environment")
            user, passwd, tenant, auth_url = start_vms.ostack_get_creds()
        else:
            logger.info("Using predefined credentials")
            tenant, user, passwd, auth_url = [
                os_cfg[key].strip()
                for key in ('OS_TENANT_NAME', 'OS_USERNAME',
                            'OS_PASSWORD', 'OS_AUTH_URL')]
    elif 'fuel' in clouds and 'openstack_env' in clouds['fuel']:
        logger.info("Using fuel creds")
        creds = ctx.fuel_openstack_creds
    else:
        logger.error("Can't found OS credentials")
        raise utils.StopTestError("Can't found OS credentials", None)

    if creds is None:
        creds = dict(name=user,
                     passwd=passwd,
                     tenant=tenant,
                     auth_url=auth_url)

    # The password is intentionally not part of the logged line.
    logger.debug(
        "OS_CREDS: user={name} tenant={tenant} auth_url={auth_url}".format(
            **creds))
    return creds
koder aka kdanilov4e9f3ed2015-04-14 11:26:12 +0300451
koder aka kdanilov1c2b5112015-04-10 16:53:51 +0300452
@contextlib.contextmanager
def create_vms_ctx(ctx, cfg, config, already_has_count=0):
    """Context manager: spawn test VMs and remove them on exit.

    VM parameters are cfg['vm_configs'][config['cfg_name']] overridden
    by ``config``. Launched nodes get the 'testnode' role and are added
    to ctx.nodes; their ids are written to the ids file and stored in
    ctx.openstack_nodes_ids. The list of new nodes is yielded. On exit
    the VMs are shut down unless cfg['keep_vm'] is set.
    """
    params = cfg['vm_configs'][config['cfg_name']].copy()
    spawned_ids = []

    if start_vms.is_connected():
        os_creds = {}
    else:
        os_creds = get_OS_credentials(cfg, ctx)
    start_vms.nova_connect(**os_creds)

    params.update(config)
    params['keypair_file_private'] = params['keypair_name'] + ".pem"
    params['group_name'] = cfg_dict['run_uuid']

    if not config.get('skip_preparation', False):
        logger.info("Preparing openstack")
        start_vms.prepare_os_subpr(params=params, **os_creds)

    spawned_nodes = []
    try:
        launched = start_vms.launch_vms(params, already_has_count)
        for vm_node, vm_id in launched:
            vm_node.roles.append('testnode')
            ctx.nodes.append(vm_node)
            spawned_ids.append(vm_id)
            spawned_nodes.append(vm_node)

        store_nodes_in_log(cfg, spawned_ids)
        ctx.openstack_nodes_ids = spawned_ids

        yield spawned_nodes

    finally:
        if not cfg['keep_vm']:
            shut_down_vms_stage(cfg, ctx)
489
490
def run_tests_stage(cfg, ctx):
    """Run every test group of cfg['tests'], collecting ctx.results.

    Each group is a single-item mapping. A 'start_test_nodes' group
    spawns VMs from its 'openstack' block, connects to them, deploys
    sensors on them and runs the nested 'tests' while the VMs exist.
    Any other group is run directly on the current nodes.
    """
    ctx.results = []

    if 'tests' not in cfg:
        return

    for group in cfg['tests']:
        entries = list(group.items())
        assert len(entries) == 1
        key, config = entries[0]

        if key != 'start_test_nodes':
            ctx.results.extend(run_tests(cfg, group, ctx.nodes))
            continue

        if 'openstack' not in config:
            msg = "No openstack block in config - can't spawn vm's"
            logger.error(msg)
            raise utils.StopTestError(msg)

        num_test_nodes = sum(1 for node in ctx.nodes
                             if 'testnode' in node.roles)

        with create_vms_ctx(ctx, cfg, config['openstack'],
                            num_test_nodes) as new_nodes:
            if new_nodes:
                connect_all(new_nodes, True)

                for node in new_nodes:
                    if node.connection is None:
                        msg = "Failed to connect to vm {0}"
                        raise RuntimeError(msg.format(node.get_conn_id()))

                deploy_sensors_stage(cfg_dict,
                                     ctx,
                                     nodes=new_nodes,
                                     undeploy=False)

            for test_group in config.get('tests', []):
                ctx.results.extend(run_tests(cfg, test_group, ctx.nodes))
koder aka kdanilovda45e882015-04-06 02:24:42 +0300533
gstepanov023c1e42015-04-08 15:50:19 +0300534
def shut_down_vms_stage(cfg, ctx):
    """Remove the VMs spawned for the run and delete the ids file.

    The ids come from ctx.openstack_nodes_ids, or from the file named by
    cfg_dict['vm_ids_fname'] when that attribute is None.
    """
    vm_ids_fname = cfg_dict['vm_ids_fname']
    if ctx.openstack_nodes_ids is None:
        # Close the file deterministically instead of leaking the handle.
        with open(vm_ids_fname) as ids_fd:
            nodes_ids = ids_fd.read().split()
    else:
        nodes_ids = ctx.openstack_nodes_ids

    if len(nodes_ids) != 0:
        logger.info("Removing nodes")
        start_vms.clear_nodes(nodes_ids)
        logger.info("Nodes has been removed")

    if os.path.exists(vm_ids_fname):
        os.remove(vm_ids_fname)
gstepanov023c1e42015-04-08 15:50:19 +0300549
koder aka kdanilov66839a92015-04-11 13:22:31 +0300550
def store_nodes_in_log(cfg, nodes_ids):
    """Write ``nodes_ids``, one per line, to the cfg['vm_ids_fname'] file."""
    ids_path = cfg['vm_ids_fname']
    with open(ids_path, 'w') as ids_file:
        ids_file.write("\n".join(nodes_ids))
gstepanov023c1e42015-04-08 15:50:19 +0300554
555
def clear_enviroment(cfg, ctx):
    """Shut down VMs if an ids file (cfg_dict['vm_ids_fname']) exists."""
    if not os.path.exists(cfg_dict['vm_ids_fname']):
        return
    shut_down_vms_stage(cfg, ctx)
gstepanov023c1e42015-04-08 15:50:19 +0300559
560
def disconnect_stage(cfg, ctx):
    """Close all ssh sessions and every open node connection."""
    ssh_utils.close_all_sessions()

    connected = [node for node in ctx.nodes if node.connection is not None]
    for node in connected:
        node.connection.close()
567
568
def store_raw_results_stage(cfg, ctx):
    """Append ctx.results to <var_dir>/raw_results.yaml.

    Results already stored in the file are kept; the file is created
    when it does not exist.
    """
    raw_results = os.path.join(cfg_dict['var_dir'], 'raw_results.yaml')

    if os.path.exists(raw_results):
        with open(raw_results) as fd:
            # NOTE(review): yaml.load can build arbitrary objects; fine
            # for a file this tool wrote itself, but consider
            # yaml.safe_load if the var dir may hold untrusted data.
            cont = yaml.load(fd.read())
        # An empty file parses to None - treat it as "no results yet".
        if cont is None:
            cont = []
    else:
        cont = []

    cont.extend(utils.yamable(ctx.results))
    raw_data = pretty_yaml.dumps(cont)

    with open(raw_results, "w") as fd:
        fd.write(raw_data)
583
584
def console_report_stage(cfg, ctx):
    """Print console reports for the collected results.

    'io' results are also written to cfg['text_report_file']. 'mysql'
    and 'pgbench' results are both printed with
    MysqlTest.format_for_console. Entries without data are skipped.
    """
    for tp, data in ctx.results:
        if data is None:
            continue

        if tp == 'io':
            dinfo = report.process_disk_info(data)
            text_rep_fname = cfg['text_report_file']
            rep = IOPerfTest.format_for_console(data, dinfo)

            with open(text_rep_fname, "w") as report_fd:
                report_fd.write(rep)
                report_fd.write("\n")
                report_fd.flush()

            logger.info("Text report were stored in " + text_rep_fname)
            print("\n")
            print(IOPerfTest.format_for_console(data, dinfo))
            print("\n")

        if tp in ['mysql', 'pgbench']:
            print("\n")
            print(MysqlTest.format_for_console(data))
            print("\n")
koder aka kdanilov66839a92015-04-11 13:22:31 +0300606
607
def html_report_stage(cfg, ctx):
    """Build the html report for the first 'io' result block.

    Only one io block is supported: an error is logged for every
    further io block and it is skipped.
    """
    html_rep_fname = cfg['html_report_file']
    io_blocks = [data for tp, data in ctx.results
                 if 'io' == tp and data is not None]

    if not io_blocks:
        return

    first = io_blocks[0]
    dinfo = report.process_disk_info(first)
    report.make_io_report(dinfo, first, html_rep_fname,
                          cfg['charts_img_path'],
                          lab_info=ctx.hw_info)

    for _ in io_blocks[1:]:
        logger.error("Making reports for more than one "
                     "io block isn't supported! All "
                     "report, except first are skipped")
koder aka kdanilovcff7b2e2015-04-18 20:48:15 +0300623
koder aka kdanilovda45e882015-04-06 02:24:42 +0300624
def complete_log_nodes_statistic(cfg, ctx):
    """Log the string form of every node in ctx.nodes at debug level."""
    for description in (str(node) for node in ctx.nodes):
        logger.debug(description)
629
630
def load_data_from(var_dir):
    """Return a stage that loads results saved by a previous run.

    The returned stage function reads <var_dir>/raw_results.yaml into
    ctx.results.
    """
    def load_data_from_file(cfg, ctx):
        raw_results = os.path.join(var_dir, 'raw_results.yaml')
        # Close the file deterministically instead of leaking the handle.
        with open(raw_results) as fd:
            # NOTE(review): yaml.load can build arbitrary objects;
            # consider yaml.safe_load if var_dir may be untrusted.
            ctx.results = yaml.load(fd.read())
    return load_data_from_file
gstepanovcd256d62015-04-07 17:47:32 +0300636
637
def start_web_ui(cfg, ctx):
    """Start the web ui in a daemon thread and store it in ctx.web_thread.

    When the optional webui module is not available an error is logged
    and ctx.web_thread is set to None.
    """
    if webui is not None:
        web_thread = threading.Thread(target=webui.web_main_thread,
                                      name="webui",
                                      args=(None,))
        web_thread.daemon = True
        web_thread.start()
        ctx.web_thread = web_thread
        return

    logger.error("Can't start webui. Install cherrypy module")
    ctx.web_thread = None
647
648
def stop_web_ui(cfg, ctx):
    """Ask the web ui to stop and wait a second for it to do so.

    Does nothing when the optional webui module could not be imported,
    in which case the web ui was never started.
    """
    if webui is None:
        return

    webui.web_main_stop()
    time.sleep(1)
652
653
def parse_args(argv):
    """Parse the wally command line.

    ``argv`` is the full argument vector; its first item (the program
    name) is skipped. Returns the argparse namespace.
    """
    parser = argparse.ArgumentParser(
        prog='wally', description="Disk io performance test suite")

    add = parser.add_argument
    # Shorthands for the two repeated option shapes.
    add_flag = functools.partial(add, action='store_true', default=False)
    add_str = functools.partial(add, type=str)

    add_flag("-l", dest='extra_logs', help="print some extra log info")
    add_str("-b", '--build_description', default="Build info")
    add_str("-i", '--build_id', default="id")
    add_str("-t", '--build_type', default="GA")
    add_str("-u", '--username', default="admin")
    add_flag("-n", '--no-tests', help="Don't run tests")
    add("-p", '--post-process-only', metavar="VAR_DIR",
        help="Only process data from previour run")
    add_flag("-k", '--keep-vm', help="Don't remove test vm's")
    add_flag("-d", '--dont-discover-nodes',
             help="Don't connect/discover fuel nodes")
    add_flag("-r", '--no-html-report', help="Skip html report")
    add("--params", metavar="testname.paramname",
        help="Test params", default=[])
    add("config_file")

    return parser.parse_args(argv[1:])
682
683
koder aka kdanilov416b87a2015-05-12 00:26:04 +0300684# from plop.collector import Collector
685
686
def _stage_name(func):
    """Return a printable name for a stage or cleanup callable.

    Falls back to ``repr(func)`` for callables without ``__name__``
    (e.g. ``functools.partial`` objects), so that building a log message
    can never raise on its own.
    """
    return getattr(func, '__name__', repr(func))


def _log_stage_start(stage):
    """Log that ``stage`` is about to run.

    The word "stage" is appended only when the callable's name does not
    already end with it.
    """
    name = _stage_name(stage)
    if name.endswith("stage"):
        logger.info("Start {0}".format(name))
    else:
        logger.info("Start {0} stage".format(name))


def _run_guarded(func, args=(), kwargs=None):
    """Call ``func(*args, **kwargs)`` and log, rather than propagate, errors.

    ``utils.StopTestError`` is logged as a plain error message; any other
    ``Exception`` is logged together with its traceback. Exceptions that
    do not derive from ``Exception`` (e.g. ``KeyboardInterrupt``) are not
    intercepted.

    Returns True when the call completed without raising, False otherwise.
    """
    try:
        func(*args, **(kwargs or {}))
    except utils.StopTestError as exc:
        logger.error("Exception during {0}: {1!s}".format(
            _stage_name(func), exc))
        return False
    except Exception:
        logger.exception("During {0}".format(_stage_name(func)))
        return False
    return True


def main(argv):
    """Program entry point: run all stages, clean up, then build reports.

    Parameters:
        argv - full command line, including the program name at index 0
               (it is handed to ``parse_args`` unchanged).

    Returns:
        0 when every stage finished without an error, 1 otherwise.

    Stages run in order and the first failing stage aborts the remaining
    ones. Cleanup callbacks registered in ``ctx.clear_calls_stack`` and in
    ``utils.iter_clean_func()`` are always executed afterwards. Report
    stages run only when no stage failed.
    """
    # Disabled profiling hook, kept for manual debugging
    # (see the commented-out plop import above this function).
    # collector = Collector()
    # collector.start()

    # Dump tracebacks of all threads when the process receives SIGUSR1.
    faulthandler.register(signal.SIGUSR1, all_threads=True)
    opts = parse_args(argv)
    load_config(opts.config_file, opts.post_process_only)

    if opts.post_process_only is not None:
        stages = [
            load_data_from(opts.post_process_only)
        ]
    else:
        stages = [
            discover_stage
        ]

        stages.extend([
            reuse_vms_stage,
            log_nodes_statistic,
            save_nodes_stage,
            connect_stage])

        if cfg_dict.get('collect_info', True):
            stages.append(collect_hw_info_stage)

        stages.extend([
            deploy_sensors_stage,
            run_tests_stage,
            store_raw_results_stage,
            gather_sensors_stage
        ])

    report_stages = [
        console_report_stage,
    ]

    if not opts.no_html_report:
        report_stages.append(html_report_stage)

    if cfg_dict.get('logging', {}).get("extra_logs", False) or opts.extra_logs:
        level = logging.DEBUG
    else:
        level = logging.WARNING

    setup_loggers(level, cfg_dict['log_file'])

    logger.info("All info would be stored into {0}".format(
        cfg_dict['var_dir']))

    ctx = Context()
    ctx.build_meta['build_id'] = opts.build_id
    # NOTE: the misspelled key is kept as-is; other code may read it.
    ctx.build_meta['build_descrption'] = opts.build_description
    ctx.build_meta['build_type'] = opts.build_type
    ctx.build_meta['username'] = opts.username
    ctx.sensors_data = SensorDatastore()

    cfg_dict['keep_vm'] = opts.keep_vm
    cfg_dict['no_tests'] = opts.no_tests
    cfg_dict['dont_discover_nodes'] = opts.dont_discover_nodes

    if cfg_dict.get('run_web_ui', False):
        start_web_ui(cfg_dict, ctx)

    # Failure is tracked with an explicit flag instead of inspecting
    # sys.exc_info() inside ``finally``: that call reflects interpreter
    # exception state, which is not limited to errors raised by the stages.
    failed = False

    try:
        for stage in stages:
            _log_stage_start(stage)
            if not _run_guarded(stage, (cfg_dict, ctx)):
                # The first failing stage aborts the rest of the pipeline.
                failed = True
                break
    finally:
        # Run cleanup stages in reverse registration order. The slice
        # takes a snapshot, so callbacks registered during cleanup do not
        # affect this iteration.
        for cleanup_stage in ctx.clear_calls_stack[::-1]:
            _log_stage_start(cleanup_stage)
            _run_guarded(cleanup_stage, (cfg_dict, ctx))

        logger.debug("Start utils.cleanup")
        for clean_func, args, kwargs in utils.iter_clean_func():
            # Errors are reported against clean_func itself, not against
            # whichever stage happened to run last.
            _run_guarded(clean_func, args, kwargs)

    if not failed:
        for report_stage in report_stages:
            report_stage(cfg_dict, ctx)

    logger.info("All info stored in {0} folder".format(cfg_dict['var_dir']))

    if cfg_dict.get('run_web_ui', False):
        stop_web_ui(cfg_dict, ctx)

    # collector.stop()
    # open("plop.out", "w").write(repr(dict(collector.stack_counts)))

    if failed:
        logger.error("Tests are failed. See detailed error above")
        return 1

    logger.info("Tests finished successfully")
    return 0