koder aka kdanilov | 962ee5f | 2016-12-19 02:40:08 +0200 | [diff] [blame] | 1 | import array |
| 2 | import logging |
| 3 | from typing import List, Dict, Tuple |
koder aka kdanilov | 39e449e | 2016-12-17 15:15:26 +0200 | [diff] [blame] | 4 | |
koder aka kdanilov | a732a60 | 2017-02-01 20:29:56 +0200 | [diff] [blame] | 5 | import numpy |
| 6 | |
koder aka kdanilov | 962ee5f | 2016-12-19 02:40:08 +0200 | [diff] [blame] | 7 | from . import utils |
koder aka kdanilov | 7022706 | 2016-11-26 23:23:21 +0200 | [diff] [blame] | 8 | from .test_run_class import TestRun |
koder aka kdanilov | a732a60 | 2017-02-01 20:29:56 +0200 | [diff] [blame] | 9 | from .result_classes import DataSource |
koder aka kdanilov | 39e449e | 2016-12-17 15:15:26 +0200 | [diff] [blame] | 10 | from .stage import Stage, StepOrder |
koder aka kdanilov | a732a60 | 2017-02-01 20:29:56 +0200 | [diff] [blame] | 11 | from .hlstorage import ResultStorage |
koder aka kdanilov | 7022706 | 2016-11-26 23:23:21 +0200 | [diff] [blame] | 12 | |
kdanylov aka koder | 150b219 | 2017-04-01 16:53:01 +0300 | [diff] [blame^] | 13 | from cephlib import sensors_rpc_plugin |
| 14 | |
| 15 | |
# Path to the plugin's source file: whatever extension ``__file__`` carries
# is replaced with ".py".
plugin_fname = sensors_rpc_plugin.__file__.rsplit(".", 1)[0] + ".py"

# Read the plugin source as bytes; the ``with`` block guarantees the file
# handle is closed instead of leaving it to the garbage collector.
with open(plugin_fname, "rb") as _plugin_fd:
    SENSORS_PLUGIN_CODE = _plugin_fd.read()  # type: bytes


logger = logging.getLogger("wally")
koder aka kdanilov | 7022706 | 2016-11-26 23:23:21 +0200 | [diff] [blame] | 21 | |
koder aka kdanilov | 962ee5f | 2016-12-19 02:40:08 +0200 | [diff] [blame] | 22 | |
# Measurement units for every known "<sensor>.<metric>" pair.
# An empty string means the metric has no unit attached.
sensor_units = {
    # system-cpu
    "system-cpu.idle_time": "ms",
    "system-cpu.nice_processes": "",
    "system-cpu.procs_blocked": "",
    "system-cpu.procs_queue_x10": "",
    "system-cpu.system_processes": "",
    "system-cpu.user_processes": "",

    # net-io
    "net-io.recv_bytes": "B",
    "net-io.recv_packets": "",
    "net-io.send_bytes": "B",
    "net-io.send_packets": "",

    # block-io
    "block-io.io_queue": "",
    "block-io.io_time": "ms",
    "block-io.reads_completed": "",
    "block-io.rtime": "ms",
    "block-io.sectors_read": "B",
    "block-io.sectors_written": "B",
    "block-io.writes_completed": "",
    "block-io.wtime": "ms",
    "block-io.weighted_io_time": "ms",
}  # type: Dict[str, str]
| 44 | |
| 45 | |
# TODO(koder): if a node has more than one role, its sensor settings might be incorrect
class StartSensorsStage(Stage):
    """Upload the sensors RPC plugin to nodes and start monitoring on them.

    The per-role sensor configuration is read from
    ``ctx.config.sensors.roles_mapping``. For every node the settings of all
    its roles are merged; nodes that end up with a non-empty configuration
    get the plugin uploaded and sensors started, and their ids are recorded
    in ``ctx.sensors_run_on``.
    """

    priority = StepOrder.START_SENSORS
    config_block = 'sensors'

    def run(self, ctx: TestRun) -> None:
        """Start sensors on every node that has sensors configured.

        Raises:
            utils.StopTestError: if ``array.array('L')`` items are not
                8 bytes wide on this platform.
        """
        item_size = array.array('L').itemsize
        if item_size != 8:
            message = "Python array.array('L') items should be 8 bytes in size, not {}." + \
                      " Can't provide sensors on this platform. Disable sensors in config and retry"
            logger.critical(message.format(item_size))
            raise utils.StopTestError()

        # TODO: need carefully fix this
        # sensors config is:
        #   role:
        #     sensor: [str]
        # or
        #  role:
        #     sensor:
        #        allowed: [str]
        #        dissallowed: [str]
        #        params: Any
        per_role_config = {}  # type: Dict[str, Dict[str, str]]

        for name, val in ctx.config.sensors.roles_mapping.raw().items():
            # A comma-separated string or a list of sensor names is expanded
            # into a mapping "sensor name -> '.*'"; other values are kept as is.
            if isinstance(val, str):
                val = {vl.strip(): ".*" for vl in val.split(",")}
            elif isinstance(val, list):
                val = {vl: ".*" for vl in val}
            per_role_config[name] = val

        if 'all' in per_role_config:
            all_vl = per_role_config.pop('all')

            # 'all' must apply to every role: those listed in the config and
            # those that only appear on nodes.
            all_roles = set(per_role_config)
            for node in ctx.nodes:
                all_roles.update(node.info.roles)  # type: ignore

            # Role-specific settings override the 'all' defaults. Iterating
            # over all_roles (not just the configured ones) makes sure nodes
            # whose roles are absent from the config still get 'all' sensors.
            for role in all_roles:
                merged = all_vl.copy()
                merged.update(per_role_config.get(role, {}))
                per_role_config[role] = merged

        for node in ctx.nodes:
            node_cfg = {}  # type: Dict[str, Dict[str, str]]
            for role in node.info.roles:
                node_cfg.update(per_role_config.get(role, {}))  # type: ignore

            nid = node.node_id
            if not node_cfg:
                logger.debug("Skip monitoring node %s, as no sensors selected", nid)
                continue

            # ceph requires additional settings
            if 'ceph' in node_cfg:
                # Copy before adding node-specific values: the object stored
                # in node_cfg is shared with per_role_config, so mutating it
                # in place would leak this node's params into other nodes.
                ceph_cfg = node_cfg['ceph'].copy()
                ceph_cfg.update(node.info.params['ceph'])
                ceph_cfg['osds'] = [osd.id for osd in node.info.params['ceph-osds']]  # type: ignore
                node_cfg['ceph'] = ceph_cfg

            logger.debug("Setting up sensors RPC plugin for node %s", nid)
            node.upload_plugin("sensors", SENSORS_PLUGIN_CODE)
            ctx.sensors_run_on.add(nid)
            logger.debug("Start monitoring node %s", nid)
            node.conn.sensors.start(node_cfg)
| 108 | |
| 109 | |
def collect_sensors_data(ctx: TestRun, stop: bool = False):
    """Fetch sensor data from monitored nodes and append it to result storage.

    Only nodes whose id is in ``ctx.sensors_run_on`` are queried. With
    ``stop`` set, the node's ``sensors.stop`` RPC is called; otherwise
    ``sensors.get_updates`` is used. Entries that are not marked as parsed
    are skipped, with a single warning logged for the whole call.
    """
    storage = ResultStorage(ctx.storage)
    warned_about_raw = False

    for node in ctx.nodes:
        node_id = node.node_id
        if node_id not in ctx.sensors_run_on:
            continue

        fetch = node.conn.sensors.stop if stop else node.conn.sensors.get_updates

        # TODO: units should came along with data
        # TODO: process raw sensors data

        for path, value, is_parsed in sensors_rpc_plugin.unpack_rpc_updates(fetch()):
            if not is_parsed:
                if not warned_about_raw:
                    logger.warning("Raw sensors data at path %r and, maybe, others are skipped", path)
                    warned_about_raw = True
                continue

            if path == 'collected_at':
                # collection timestamps are stored as their own metric
                units = 'us'
                ds = DataSource(node_id=node_id, metric='collected_at')
            else:
                # any other path has the form "<sensor>.<dev>.<metric>"
                sensor, dev, metric = path.split(".")
                ds = DataSource(node_id=node_id, metric=metric, dev=dev, sensor=sensor)
                units = sensor_units["{}.{}".format(sensor, metric)]

            storage.append_sensor(numpy.array(value), ds, units)
koder aka kdanilov | 7022706 | 2016-11-26 23:23:21 +0200 | [diff] [blame] | 139 | |
| 140 | |
class CollectSensorsStage(Stage):
    """Stage that stops the sensors and stores the data they return."""

    config_block = 'sensors'
    priority = StepOrder.COLLECT_SENSORS

    def run(self, ctx: TestRun) -> None:
        """Call ``collect_sensors_data`` with ``stop`` enabled."""
        collect_sensors_data(ctx, stop=True)
koder aka kdanilov | 7022706 | 2016-11-26 23:23:21 +0200 | [diff] [blame] | 147 | |
| 148 | |
| 149 | # def delta(func, only_upd=True): |
| 150 | # prev = {} |
| 151 | # while True: |
| 152 | # for dev_name, vals in func(): |
| 153 | # if dev_name not in prev: |
| 154 | # prev[dev_name] = {} |
| 155 | # for name, (val, _) in vals.items(): |
| 156 | # prev[dev_name][name] = val |
| 157 | # else: |
| 158 | # dev_prev = prev[dev_name] |
| 159 | # res = {} |
| 160 | # for stat_name, (val, accum_val) in vals.items(): |
| 161 | # if accum_val: |
| 162 | # if stat_name in dev_prev: |
| 163 | # delta = int(val) - int(dev_prev[stat_name]) |
| 164 | # if not only_upd or 0 != delta: |
| 165 | # res[stat_name] = str(delta) |
| 166 | # dev_prev[stat_name] = val |
| 167 | # elif not only_upd or '0' != val: |
| 168 | # res[stat_name] = val |
| 169 | # |
| 170 | # if only_upd and len(res) == 0: |
| 171 | # continue |
| 172 | # yield dev_name, res |
| 173 | # yield None, None |
| 174 | # |
| 175 | # |
| 176 | |
| 177 | |