| Alex Savatieiev | d48994d | 2018-12-13 12:13:00 +0100 | [diff] [blame] | 1 | """Model Comparer: | 
 | 2 | - yaml parser | 
 | 3 | - class tree comparison | 
 | 4 | """ | 
 | 5 | import itertools | 
| Alex Savatieiev | d48994d | 2018-12-13 12:13:00 +0100 | [diff] [blame] | 6 | import os | 
 | 7 | import yaml | 
 | 8 |  | 
| Alex Savatieiev | c905571 | 2019-03-01 14:43:56 -0600 | [diff] [blame^] | 9 | from cfg_checker import reporter | 
| Alex Savatieiev | 5118de0 | 2019-02-20 15:50:42 -0600 | [diff] [blame] | 10 | from cfg_checker.common import logger, logger_cli | 
| Alex Savatieiev | d48994d | 2018-12-13 12:13:00 +0100 | [diff] [blame] | 11 |  | 
 | 12 |  | 
def get_element(element_path, input_data):
    """Return the value found by following a ':'-separated key path.

    Arguments:
        element_path {string} -- keys joined with ':', e.g. "classes:system"
        input_data {dict} -- nested mapping to descend into

    Each path segment is used as a key on the current level; a missing
    segment propagates the lookup error raised by the container.
    """
    node = input_data
    for segment in element_path.split(":"):
        node = node[segment]
    return node
 | 19 |  | 
 | 20 |  | 
 | 21 | def pop_element(element_path, input_data):      | 
 | 22 |     paths = element_path.split(":") | 
 | 23 |     data = input_data | 
 | 24 |     # Search for last dict | 
 | 25 |     for i in range(0, len(paths)-1): | 
 | 26 |         data = data[paths[i]] | 
 | 27 |     # pop the actual element | 
 | 28 |     return data.pop(paths[-1]) | 
 | 29 |  | 
 | 30 |  | 
class ModelComparer(object):
    """Collection of functions to compare model data.

    Two model trees are loaded from disk into ``models`` (keyed by model
    name), cut into the parts listed in ``_model_parts``, compared part by
    part and the result is handed to the HTML reporter.
    """
    # Report section -> ':'-separated path of that section in the loaded tree.
    # Key order is important: parts are popped out of the tree in sorted key
    # order, so "classes" must come after "classes:system" and
    # "classes:cluster" have already been removed from it.
    _model_parts = {
        "01_nodes": "nodes",
        "02_system": "classes:system",
        "03_cluster": "classes:cluster",
        "04_other": "classes"
    }

    # NOTE: class-level dict, shared by all instances unless an instance
    # rebinds the attribute.
    models = {}
    models_path = "/srv/salt/reclass"
    model_name_1 = "source"
    model_path_1 = os.path.join(models_path, model_name_1)
    model_name_2 = "target"
    # second model lives in its own folder (used to point at model_name_1)
    model_path_2 = os.path.join(models_path, model_name_2)

    @staticmethod
    def load_yaml_class(fname):
        """Loads a yaml from the file and forms a tree item

        Arguments:
            fname {string} -- full path to the yaml file

        Returns:
            Parsed document; {} for an empty file; None when the file
            could not be parsed as YAML (the error is logged).

        Raises:
            Exception -- when the file can not be opened or read
        """
        try:
            with open(fname, 'r') as f:
                # safe_load: plain-data loader. Bare yaml.load() can build
                # arbitrary objects and needs an explicit Loader on
                # PyYAML >= 6.
                _yaml = yaml.safe_load(f)
                _size = f.tell()
        except yaml.YAMLError as exc:
            # best effort: report and let the caller deal with the gap
            logger_cli.error(exc)
            return None
        except IOError as e:
            logger_cli.error(
                "Error loading file '{}': {}".format(fname, e)
            )
            raise Exception(
                "CRITICAL: Failed to load YAML data: {}".format(e)
            )
        # TODO: do smth with the data
        if not _yaml:
            logger_cli.warning("WARN: empty file '{}'".format(fname))
            return {}
        logger.debug("...loaded YAML '{}' ({}b)".format(fname, _size))
        return _yaml

    def load_model_tree(self, name, root_path="/srv/salt/reclass"):
        """Walks supplied path for the YAML files and loads the tree

        The result is stored in self.models[name]: one entry per key of
        _model_parts plus "all_diffs" holding whatever is left of the tree.

        Arguments:
            name {string} -- key to store the loaded model under
            root_path {string} -- Path to Model's root folder. Optional

        Returns:
            True
        """
        # reduce is a builtin only on python2; this import works on both
        from functools import reduce

        logger_cli.info("Loading reclass tree from '{}'".format(root_path))
        # prepare the file tree to walk
        raw_tree = {}
        # Credits to Andrew Clark@MIT. Original code is here:
        # http://code.activestate.com/recipes/577879-create-a-nested-dictionary-from-oswalk/
        root_path = root_path.rstrip(os.sep)
        start = root_path.rfind(os.sep) + 1
        # last path component; also valid when root_path has no separator
        root_key = root_path[start:]
        _exts = ('.yml', '.yaml')
        # Look Ma! I am walking the file tree with no recursion!
        for path, dirs, files in os.walk(root_path):
            # do not descend into hidden folders at all
            dirs[:] = [_dir for _dir in dirs if not _dir.startswith(".")]
            # cut absolute part of the path and split folder names
            folders = path[start:].split(os.sep)
            # if this is (or is inside of) a hidden folder, ignore it
            if any(item.startswith(".") for item in folders):
                continue
            subdir = {}
            for _file in files:
                # only YAML files that are not hidden
                if _file.startswith('.') or not _file.endswith(_exts):
                    continue
                # load all YAML class data into the tree,
                # file name (with extension) is the key
                _class = self.load_yaml_class(os.path.join(path, _file))
                subdir[_file] = _class
                try:
                    # Save original filepath, just in case
                    _class["_source"] = os.path.join(path[start:], _file)
                except TypeError:
                    # loaded document is not a mapping (or failed to parse)
                    logger.warning(
                        "Non-yaml file detected: {}".format(_file)
                    )
            # creating dict structure out of folder list. Pure python magic:
            # follow already created parent dicts down to the current folder
            parent = reduce(dict.get, folders[:-1], raw_tree)
            parent[folders[-1]] = subdir

        self.models[name] = {}
        # Break the tree up according to the paths, in sorted key order
        for _part in sorted(self._model_parts):
            self.models[name][_part] = pop_element(
                self._model_parts[_part],
                raw_tree[root_key]
            )

        # save the rest as a single data object
        self.models[name]["all_diffs"] = raw_tree[root_key]
        return True

    def _compare_subtrees(self, tree1, tree2, tree_path, value_path):
        """Diff dict tree1 against tree2, tolerating a non-dict tree2.

        A dict (or None) on the second side is compared key by key using
        tree_path as the prefix; any other type can not be walked and is
        reported as a single value difference under value_path.
        """
        if tree2 is None or isinstance(tree2, dict):
            return self.find_changes(tree1, tree2, tree_path)
        logger.info("{}: {}, {}".format(value_path, tree1, tree2))
        return {
            value_path: {
                "type": "value",
                "raw_values": [tree1, tree2],
                "str_values": [
                    "{}".format(tree1),
                    "{}".format(tree2)
                ]
            }
        }

    def find_changes(self, dict1, dict2, path=""):
        """Recursively collect differences of dict1 against dict2

        Only keys of dict1 are walked; "_source" keys are skipped.
        A dict1 key equal to model_name_1 is compared against the
        model_name_2 key of dict2 when dict2 has one.

        Arguments:
            dict1 {dict} -- data of the first model
            dict2 {dict} -- matching data of the second model, or None
            path {string} -- ':'-separated path of dict1 in the model

        Returns:
            dict -- path -> {"type": "value"|"list",
                             "raw_values": [...], "str_values": [...]}
        """
        _report = {}
        for k in dict1:
            # ignore _source key
            if k == "_source":
                continue
            # yamls might load keys as non-str types
            _key_str = k if isinstance(k, str) else str(k)
            _new_path = path + ":" + _key_str
            # nested dicts right under the root get no leading ':'
            _tree_path = _key_str if path == "" else _new_path

            # check if this is an env name cluster entry
            if isinstance(dict2, dict) and \
                    k == self.model_name_1 and \
                    self.model_name_2 in dict2:
                if isinstance(dict1[k], dict):
                    _report.update(self._compare_subtrees(
                        dict1[k],
                        dict2[self.model_name_2],
                        _tree_path,
                        _new_path
                    ))
                continue

            if dict2 is None or k not in dict2:
                # no key in dict2
                _report[_new_path] = {
                    "type": "value",
                    "raw_values": [dict1[k], "N/A"],
                    "str_values": [
                        "{}".format(dict1[k]),
                        "n/a"
                    ]
                }
                logger.info(
                    "{}: {}, {}".format(_new_path, dict1[k], "N/A")
                )
                continue

            val1 = dict1[k]
            val2 = dict2[k] if isinstance(dict2, dict) else dict2
            if isinstance(val1, dict):
                _report.update(self._compare_subtrees(
                    val1,
                    val2,
                    _tree_path,
                    _new_path
                ))
            elif isinstance(val1, list) and isinstance(val2, list):
                # membership test works for lists of dicts as well
                try:
                    _removed = [x for x in val1 if x not in val2]
                    _added = [x for x in val2 if x not in val1]
                except TypeError as e:
                    # debug routine,
                    # should not happen, due to list check above
                    logger.error(
                        "Caught lambda type mismatch: {}".format(e)
                    )
                    logger_cli.warning(
                        "Types mismatch for correct compare: "
                        "{}, {}".format(type(val1), type(val2))
                    )
                    continue
                if not (_removed or _added):
                    continue
                _original = ["= {}".format(item) for item in val1]
                _removed_str_lst = ["- {}".format(item)
                                    for item in _removed]
                _added_str_lst = ["+ {}".format(item)
                                  for item in _added]
                _report[_new_path] = {
                    "type": "list",
                    "raw_values": [
                        val1,
                        _removed_str_lst + _added_str_lst
                    ],
                    "str_values": [
                        "{}".format('\n'.join(_original)),
                        "{}\n{}".format(
                            '\n'.join(_removed_str_lst),
                            '\n'.join(_added_str_lst)
                        )
                    ]
                }
                logger.info(
                    "{}:\n"
                    "{} original items total".format(
                        _new_path,
                        len(val1)
                    )
                )
                if _removed:
                    logger.info(
                        "{}".format('\n'.join(_removed_str_lst))
                    )
                if _added:
                    logger.info(
                        "{}".format('\n'.join(_added_str_lst))
                    )
            else:
                # in case of type mismatch
                # considering it as not equal
                try:
                    match = val1 == val2
                except TypeError:
                    logger.warning(
                        "One of the values is not a dict: "
                        "{}, {}".format(
                            str(dict1),
                            str(dict2)
                        ))
                    match = False
                if not match:
                    _report[_new_path] = {
                        "type": "value",
                        "raw_values": [val1, val2],
                        "str_values": [
                            "{}".format(val1),
                            "{}".format(val2)
                        ]
                    }
                    logger.info("{}: {}, {}".format(
                        _new_path,
                        val1,
                        val2
                    ))
        return _report

    def generate_model_report_tree(self):
        """Use two loaded models to generate comparison table with
        values grouped by YAML files

        Returns:
            dict -- one entry per model part (key of _model_parts without
            its "NN_" prefix) holding {"path": ..., "diffs": ...} plus
            "diff_names" with the two model names
        """
        # We are to cut both models into logical pieces
        # nodes, will not be equal most of the time
        # system, must be pretty much the same or we in trouble
        # cluster, will be the most curious part for comparison
        # other, all of the rest

        _model_1 = self.models[self.model_name_1]
        _model_2 = self.models[self.model_name_2]
        _diff_report = {}
        for _key in sorted(self._model_parts):
            # tmp report for keys
            _tmp_diffs = self.find_changes(_model_1[_key], _model_2[_key])
            # prettify the report
            for key, _diff in _tmp_diffs.items():
                # break the key in two parts: class file and param path
                _ext = ".yaml" if ".yaml" in key else ".yml"
                # partition cuts at the first extension only, so the param
                # path stays whole even if it contains the extension text
                _file_path, _sep, _tail = key.partition(_ext)
                _diff.update({
                    "class_file": _file_path + _ext,
                    "param": _tail if _sep else "none",
                })
            # drop the "NN_" ordering prefix from the section name
            _diff_report[_key[3:]] = {
                "path": self._model_parts[_key],
                "diffs": _tmp_diffs
            }

        _diff_report["diff_names"] = [self.model_name_1, self.model_name_2]
        return _diff_report

    def compare_models(self):
        """Load both models, compare them and write the HTML report

        Model names and paths are taken from the class attributes; the
        report file is named "<model_name_1>-vs-<model_name_2>.html".
        """
        # Do actual compare using model names from the class
        self.load_model_tree(
            self.model_name_1,
            self.model_path_1
        )
        self.load_model_tree(
            self.model_name_2,
            self.model_path_2
        )
        # Models should have similar structure to be compared
        # classes/system
        # classes/cluster
        # nodes

        diffs = self.generate_model_report_tree()

        report_file = \
            self.model_name_1 + "-vs-" + self.model_name_2 + ".html"
        # HTML report class is post-callable
        report = reporter.ReportToFile(
            reporter.HTMLModelCompare(),
            report_file
        )
        logger_cli.info("...generating report to {}".format(report_file))
        # report will have tabs for each of the comparable entities in diffs
        report({
            "nodes": {},
            "all_diffs": diffs,
        })

        return