blob: c9cac603a8f23b5367d1f6e64bbcc03ee88960c9 [file] [log] [blame]
"""Model Comparer:
- yaml parser
- class tree comparison
"""
import itertools
import os
from functools import reduce
from cfg_checker.common import logger, logger_cli
import yaml
def get_element(element_path, input_data):
paths = element_path.split(":")
data = input_data
for i in range(0, len(paths)):
data = data[paths[i]]
return data
def pop_element(element_path, input_data):
paths = element_path.split(":")
data = input_data
# Search for last dict
for i in range(0, len(paths)-1):
data = data[paths[i]]
# pop the actual element
return data.pop(paths[-1])
class ModelComparer(object):
"""Collection of functions to compare model data.
"""
# key order is important
_model_parts = {
"01_nodes": "nodes",
"02_system": "classes:system",
"03_cluster": "classes:cluster",
"04_other": "classes"
}
models = {}
models_path = "/srv/salt/reclass"
model_name_1 = "source"
model_path_1 = os.path.join(models_path, model_name_1)
model_name_2 = "target"
model_path_2 = os.path.join(models_path, model_name_1)
@staticmethod
def load_yaml_class(fname):
"""Loads a yaml from the file and forms a tree item
Arguments:
fname {string} -- full path to the yaml file
"""
_yaml = {}
try:
_size = 0
with open(fname, 'r') as f:
_yaml = yaml.load(f, Loader=yaml.FullLoader)
_size = f.tell()
# TODO: do smth with the data
if not _yaml:
# logger.warning("WARN: empty file '{}'".format(fname))
_yaml = {}
else:
logger.debug("... loaded YAML '{}' ({}b)".format(fname, _size))
return _yaml
except yaml.YAMLError as exc:
logger_cli.error(exc)
except IOError as e:
logger_cli.error(
"Error loading file '{}': {}".format(fname, e.message)
)
raise Exception("CRITICAL: Failed to load YAML data: {}".format(
e.message + e.strerror
))
def load_model_tree(self, name, root_path="/srv/salt/reclass"):
"""Walks supplied path for the YAML filed and loads the tree
Arguments:
root_folder_path {string} -- Path to Model's root folder. Optional
"""
logger_cli.info("# Loading reclass tree from '{}'".format(root_path))
# prepare the file tree to walk
raw_tree = {}
# Credits to Andrew Clark@MIT. Original code is here:
# http://code.activestate.com/recipes/577879-create-a-nested-dictionary-from-oswalk/
root_path = root_path.rstrip(os.sep)
start = root_path.rfind(os.sep) + 1
root_key = root_path.rsplit(os.sep, 1)[1]
# Look Ma! I am walking the file tree with no recursion!
for path, dirs, files in os.walk(root_path):
# if this is a hidden folder, ignore it
_folders_list = path[start:].split(os.sep)
if any(item.startswith(".") for item in _folders_list):
continue
# cut absolute part of the path and split folder names
folders = path[start:].split(os.sep)
subdir = {}
# create generator of files that are not hidden
_exts = ('.yml', '.yaml')
_subfiles = (_fl for _fl in files
if _fl.endswith(_exts) and not _fl.startswith('.'))
for _file in _subfiles:
# cut file extension. All reclass files are '.yml'
_subnode = _file
# load all YAML class data into the tree
subdir[_subnode] = self.load_yaml_class(
os.path.join(path, _file)
)
try:
# Save original filepath, just in case
subdir[_subnode]["_source"] = os.path.join(
path[start:],
_file
)
except Exception:
logger.warning(
"Non-yaml file detected: {}".format(_file)
)
# creating dict structure out of folder list. Pure python magic
parent = reduce(dict.get, folders[:-1], raw_tree)
parent[folders[-1]] = subdir
self.models[name] = {}
# Brake in according to pathes
_parts = self._model_parts.keys()
_parts = sorted(_parts)
for ii in range(0, len(_parts)):
self.models[name][_parts[ii]] = pop_element(
self._model_parts[_parts[ii]],
raw_tree[root_key]
)
# save it as a single data object
self.models[name]["rc_diffs"] = raw_tree[root_key]
return True
def find_changes(self, dict1, dict2, path=""):
_report = {}
for k in dict1.keys():
# yamls might load values as non-str types
if not isinstance(k, str):
_new_path = path + ":" + str(k)
else:
_new_path = path + ":" + k
# ignore _source key
if k == "_source":
continue
# ignore secrets and other secure stuff
if isinstance(k, str) and k == "secrets.yml":
continue
if isinstance(k, str) and k.find("_password") > 0:
continue
if isinstance(k, str) and k.find("_key") > 0:
continue
if isinstance(k, str) and k.find("_token") > 0:
continue
# check if this is an env name cluster entry
if dict2 is not None and \
k == self.model_name_1 and \
self.model_name_2 in dict2.keys():
k1 = self.model_name_1
k2 = self.model_name_2
if type(dict1[k1]) is dict:
if path == "":
_new_path = k1
_child_report = self.find_changes(
dict1[k1],
dict2[k2],
_new_path
)
_report.update(_child_report)
elif dict2 is None or k not in dict2:
# no key in dict2
_report[_new_path] = {
"type": "value",
"raw_values": [dict1[k], "N/A"],
"str_values": [
"{}".format(dict1[k]),
"n/a"
]
}
logger.info(
"{}: {}, {}".format(_new_path, dict1[k], "N/A")
)
else:
if type(dict1[k]) is dict:
if path == "":
_new_path = k
_child_report = self.find_changes(
dict1[k],
dict2[k],
_new_path
)
_report.update(_child_report)
elif type(dict1[k]) is list and type(dict2[k]) is list:
# use ifilterfalse to compare lists of dicts
try:
_removed = list(
itertools.filterfalse(
lambda x: x in dict2[k],
dict1[k]
)
)
_added = list(
itertools.filterfalse(
lambda x: x in dict1[k],
dict2[k]
)
)
except TypeError as e:
# debug routine,
# should not happen, due to list check above
logger.error(
"Caught lambda type mismatch: {}".format(
e.message
)
)
logger_cli.warning(
"Types mismatch for correct compare: "
"{}, {}".format(
type(dict1[k]),
type(dict2[k])
)
)
_removed = None
_added = None
_original = ["= {}".format(item) for item in dict1[k]]
if _removed or _added:
_removed_str_lst = ["- {}".format(item)
for item in _removed]
_added_str_lst = ["+ {}".format(i) for i in _added]
_report[_new_path] = {
"type": "list",
"raw_values": [
dict1[k],
_removed_str_lst + _added_str_lst
],
"str_values": [
"{}".format('\n'.join(_original)),
"{}\n{}".format(
'\n'.join(_removed_str_lst),
'\n'.join(_added_str_lst)
)
]
}
logger.info(
"{}:\n"
"{} original items total".format(
_new_path,
len(dict1[k])
)
)
if _removed:
logger.info(
"{}".format('\n'.join(_removed_str_lst))
)
if _added:
logger.info(
"{}".format('\n'.join(_added_str_lst))
)
else:
# in case of type mismatch
# considering it as not equal
d1 = dict1
d2 = dict2
val1 = d1[k] if isinstance(d1, dict) else d1
val2 = d2[k] if isinstance(d2, dict) else d2
try:
match = val1 == val2
except TypeError as e:
logger.warning(
"One of the values is not a dict: "
"{}, {}; {}".format(
str(dict1),
str(dict2),
e.message
))
match = False
if not match:
_report[_new_path] = {
"type": "value",
"raw_values": [val1, val2],
"str_values": [
"{}".format(val1),
"{}".format(val2)
]
}
logger.info("{}: {}, {}".format(
_new_path,
val1,
val2
))
return _report
def generate_model_report_tree(self):
"""Use two loaded models to generate comparison table with
values are groupped by YAML files
"""
# We are to cut both models into logical pieces
# nodes, will not be equal most of the time
# system, must be pretty much the same or we in trouble
# cluster, will be the most curious part for comparison
# other, all of the rest
_diff_report = {}
for _key in self._model_parts.keys():
# tmp report for keys
_tmp_diffs = self.find_changes(
self.models[self.model_name_1][_key],
self.models[self.model_name_2][_key]
)
# prettify the report
for key in _tmp_diffs.keys():
# break the key in two parts
_ext = ".yml"
if ".yaml" in key:
_ext = ".yaml"
_split = key.split(_ext)
_file_path = _split[0]
_param_path = "none"
if len(_split) > 1:
_param_path = _split[1]
_tmp_diffs[key].update({
"class_file": _file_path + _ext,
"param": _param_path,
})
_diff_report[_key[3:]] = {
"path": self._model_parts[_key],
"diffs": _tmp_diffs
}
_diff_report["diff_names"] = [self.model_name_1, self.model_name_2]
return _diff_report