kdanylov aka koder | 4518318 | 2017-04-30 23:55:40 +0300 | [diff] [blame] | 1 | import bz2 |
koder aka kdanilov | 962ee5f | 2016-12-19 02:40:08 +0200 | [diff] [blame] | 2 | import array |
| 3 | import logging |
| 4 | from typing import List, Dict, Tuple |
koder aka kdanilov | 39e449e | 2016-12-17 15:15:26 +0200 | [diff] [blame] | 5 | |
koder aka kdanilov | a732a60 | 2017-02-01 20:29:56 +0200 | [diff] [blame] | 6 | import numpy |
| 7 | |
kdanylov aka koder | cdfcdaf | 2017-04-29 10:03:39 +0300 | [diff] [blame] | 8 | from cephlib import sensors_rpc_plugin |
| 9 | |
koder aka kdanilov | 962ee5f | 2016-12-19 02:40:08 +0200 | [diff] [blame] | 10 | from . import utils |
koder aka kdanilov | 7022706 | 2016-11-26 23:23:21 +0200 | [diff] [blame] | 11 | from .test_run_class import TestRun |
koder aka kdanilov | a732a60 | 2017-02-01 20:29:56 +0200 | [diff] [blame] | 12 | from .result_classes import DataSource |
koder aka kdanilov | 39e449e | 2016-12-17 15:15:26 +0200 | [diff] [blame] | 13 | from .stage import Stage, StepOrder |
koder aka kdanilov | a732a60 | 2017-02-01 20:29:56 +0200 | [diff] [blame] | 14 | from .hlstorage import ResultStorage |
koder aka kdanilov | 7022706 | 2016-11-26 23:23:21 +0200 | [diff] [blame] | 15 | |
kdanylov aka koder | 150b219 | 2017-04-01 16:53:01 +0300 | [diff] [blame] | 16 | |
# Source code of the sensors RPC plugin; it is uploaded to every monitored node.
# The extension of the imported module's file is replaced with ".py"
# (presumably because ``__file__`` may point at a compiled file - TODO confirm).
plugin_fname = sensors_rpc_plugin.__file__.rsplit(".", 1)[0] + ".py"

# Read inside a context manager so the file handle is closed right away
# instead of being left for the garbage collector.
with open(plugin_fname, "rb") as _plugin_fd:
    SENSORS_PLUGIN_CODE = _plugin_fd.read()  # type: bytes


logger = logging.getLogger("wally")
koder aka kdanilov | 7022706 | 2016-11-26 23:23:21 +0200 | [diff] [blame] | 22 | |
koder aka kdanilov | 962ee5f | 2016-12-19 02:40:08 +0200 | [diff] [blame] | 23 | |
# Units table, grouped by sensor: (sensor name, ((metric name, unit), ...)).
# An empty unit string is used for metrics that have no unit in this table.
_units_by_sensor = (
    ("system-cpu", (
        ("idle", ""),
        ("nice", ""),
        ("user", ""),
        ("sys", ""),
        ("iowait", ""),
        ("irq", ""),
        ("sirq", ""),
        ("steal", ""),
        ("guest", ""),
        ("procs_blocked", ""),
        ("procs_queue_x10", ""),
    )),
    ("net-io", (
        ("recv_bytes", "B"),
        ("recv_packets", ""),
        ("send_bytes", "B"),
        ("send_packets", ""),
    )),
    ("block-io", (
        ("io_queue", ""),
        ("io_time", "ms"),
        ("reads_completed", ""),
        ("rtime", "ms"),
        ("sectors_read", "B"),
        ("sectors_written", "B"),
        ("writes_completed", ""),
        ("wtime", "ms"),
        ("weighted_io_time", "ms"),
    )),
)

# Maps "<sensor>.<metric>" to the units string stored along with the metric data.
sensor_units = {
    "{}.{}".format(sensor_name, metric_name): unit
    for sensor_name, metric_units in _units_by_sensor
    for metric_name, unit in metric_units
}
| 53 | |
| 54 | |
# TODO(koder): if a node has more than one role, its sensor settings might be incorrect
class StartSensorsStage(Stage):
    """Stage which uploads the sensors RPC plugin to nodes and starts monitoring.

    Sensor settings are read from ``ctx.config.sensors.roles_mapping`` and are
    selected for each node by the roles listed in ``node.info.roles``.
    """

    priority = StepOrder.START_SENSORS
    config_block = 'sensors'

    @staticmethod
    def _sensors_from_names(names):
        """Build a sensor -> settings mapping from an iterable of sensor names.

        Every sensor gets the ".*" setting, except 'ceph', which gets a fresh
        empty dict that is filled with per-node settings later.
        """
        return {name: ({} if name == 'ceph' else ".*") for name in names}

    def run(self, ctx: TestRun) -> None:
        """Start sensors on every node which has at least one sensor configured.

        Ids of the nodes where monitoring was started are added to
        ``ctx.sensors_run_on``.

        Raises:
            utils.StopTestError: if ``array.array('L')`` items are not 8 bytes
                in size on this platform.
        """
        item_size = array.array('L').itemsize
        if item_size != 8:
            message = "Python array.array('L') items should be 8 bytes in size, not {}." + \
                      " Can't provide sensors on this platform. Disable sensors in config and retry"
            logger.critical(message.format(item_size))
            raise utils.StopTestError()

        # TODO: need carefully fix this
        # sensors config is:
        #   role:
        #     sensor: [str]
        # or
        #  role:
        #     sensor:
        #        allowed: [str]
        #        dissallowed: [str]
        #        params: Any
        per_role_config = {}  # type: Dict[str, Dict[str, str]]

        for name, val in ctx.config.sensors.roles_mapping.raw().items():
            if isinstance(val, str):
                stripped = (vl.strip() for vl in val.split(","))
                # drop empty names produced by stray or trailing commas
                val = self._sensors_from_names(vl for vl in stripped if vl)
            elif isinstance(val, list):
                val = self._sensors_from_names(val)
            # any other value (e.g. a ready mapping) is used as is
            per_role_config[name] = val

        if 'all' in per_role_config:
            all_vl = per_role_config.pop('all')
            all_roles = set(per_role_config)

            for node in ctx.nodes:
                all_roles.update(node.info.roles)  # type: ignore

            # Apply the 'all' settings to every known role, including roles
            # which only appear on nodes and have no config entry of their own;
            # role-specific settings override the 'all' ones.
            for name in all_roles:
                new_vals = all_vl.copy()
                new_vals.update(per_role_config.get(name, {}))
                per_role_config[name] = new_vals

        for node in ctx.nodes:
            node_cfg = {}  # type: Dict[str, Dict[str, str]]
            for role in node.info.roles:
                node_cfg.update(per_role_config.get(role, {}))  # type: ignore

            nid = node.node_id
            if not node_cfg:
                logger.debug("Skip monitoring node %s, as no sensors selected", nid)
                continue

            # ceph requires additional settings
            if 'ceph' in node_cfg:
                # Work on a copy: the dict taken from per_role_config is shared
                # by all nodes with the same role, so updating it in place
                # would leak one node's settings into the other nodes' configs.
                ceph_cfg = dict(node_cfg['ceph'])
                ceph_cfg.update(node.info.params['ceph'])
                ceph_cfg['osds'] = [osd['id'] for osd in node.info.params['ceph-osds']]  # type: ignore
                node_cfg['ceph'] = ceph_cfg

            logger.debug("Setting up sensors RPC plugin for node %s", nid)
            node.upload_plugin("sensors", SENSORS_PLUGIN_CODE)
            ctx.sensors_run_on.add(nid)
            logger.debug("Start monitoring node %s", nid)
            node.conn.sensors.start(node_cfg)
| 117 | |
| 118 | |
def collect_sensors_data(ctx: TestRun, stop: bool = False) -> None:
    """Fetch sensors data from all monitored nodes and save it into the storage.

    Only nodes whose id is in ``ctx.sensors_run_on`` are queried.

    Args:
        ctx: test run context; ``ctx.storage``, ``ctx.nodes`` and
            ``ctx.sensors_run_on`` are used.
        stop: if true, data is obtained with the node's ``sensors.stop`` RPC
            call, otherwise with ``sensors.get_updates``.

    Raises:
        KeyError: if an array metric has no entry in ``sensor_units``.
        ValueError: if a sensor path has less than three dot-separated parts.
    """
    rstorage = ResultStorage(ctx.storage)
    for node in ctx.nodes:
        node_id = node.node_id
        if node_id not in ctx.sensors_run_on:
            continue

        func = node.conn.sensors.stop if stop else node.conn.sensors.get_updates

        # TODO: units should came along with data
        # TODO: process raw sensors data

        for path, value, is_array in sensors_rpc_plugin.unpack_rpc_updates(func()):
            if path == 'collected_at':
                ds = DataSource(node_id=node_id, metric='collected_at', tag='csv')
                rstorage.append_sensor(numpy.array(value), ds, 'us')
                continue

            # Path is "<sensor>.<dev>.<metric>". The device name itself may
            # contain dots (e.g. a VLAN interface like "eth0.100"), so take the
            # sensor from the left and the metric from the right instead of
            # requiring exactly three parts.
            sensor, dev_and_metric = path.split(".", 1)
            dev, metric = dev_and_metric.rsplit(".", 1)

            ds = DataSource(node_id=node_id, metric=metric, dev=dev, sensor=sensor, tag='csv')
            if is_array:
                units = sensor_units["{}.{}".format(sensor, metric)]
                rstorage.append_sensor(numpy.array(value), ds, units)
            elif metric == 'historic':
                # this raw blob is stored bz2-compressed under the 'bin' tag
                rstorage.put_sensor_raw(bz2.compress(value), ds(tag='bin'))
            else:
                assert metric in ('perf_dump', 'historic_js')
                rstorage.put_sensor_raw(value, ds(tag='js'))
kdanylov aka koder | cdfcdaf | 2017-04-29 10:03:39 +0300 | [diff] [blame] | 149 | |
koder aka kdanilov | 7022706 | 2016-11-26 23:23:21 +0200 | [diff] [blame] | 150 | |
| 151 | |
class CollectSensorsStage(Stage):
    """Stage which collects sensors data via ``collect_sensors_data``."""

    config_block = 'sensors'
    priority = StepOrder.COLLECT_SENSORS

    def run(self, ctx: TestRun) -> None:
        """Collect data from all monitored nodes, passing ``stop=True``."""
        collect_sensors_data(ctx, stop=True)
koder aka kdanilov | 7022706 | 2016-11-26 23:23:21 +0200 | [diff] [blame] | 158 | |
| 159 | |
| 160 | # def delta(func, only_upd=True): |
| 161 | # prev = {} |
| 162 | # while True: |
| 163 | # for dev_name, vals in func(): |
| 164 | # if dev_name not in prev: |
| 165 | # prev[dev_name] = {} |
| 166 | # for name, (val, _) in vals.items(): |
| 167 | # prev[dev_name][name] = val |
| 168 | # else: |
| 169 | # dev_prev = prev[dev_name] |
| 170 | # res = {} |
| 171 | # for stat_name, (val, accum_val) in vals.items(): |
| 172 | # if accum_val: |
| 173 | # if stat_name in dev_prev: |
| 174 | # delta = int(val) - int(dev_prev[stat_name]) |
| 175 | # if not only_upd or 0 != delta: |
| 176 | # res[stat_name] = str(delta) |
| 177 | # dev_prev[stat_name] = val |
| 178 | # elif not only_upd or '0' != val: |
| 179 | # res[stat_name] = val |
| 180 | # |
| 181 | # if only_upd and len(res) == 0: |
| 182 | # continue |
| 183 | # yield dev_name, res |
| 184 | # yield None, None |
| 185 | # |
| 186 | # |
| 187 | |
| 188 | |