| import json |
| import os |
| import re |
| from copy import deepcopy |
| |
| from cfg_checker.common import logger, logger_cli, nested_set |
| from cfg_checker.common.const import _mainteiners_index_filename |
| from cfg_checker.common.const import _mirantis_versions_filename |
| from cfg_checker.common.const import _other_versions_filename |
| from cfg_checker.common.const import _pkg_desc_archive |
| from cfg_checker.common.const import _repos_index_filename |
| from cfg_checker.common.const import _repos_info_archive |
| from cfg_checker.common.const import _repos_versions_archive |
| from cfg_checker.common.const import ubuntu_releases |
| from cfg_checker.common.const import kaas_ubuntu_active |
| from cfg_checker.common.const import mcp_active_tags as active_tags |
| from cfg_checker.common.file_utils import ensure_folder_exists |
| from cfg_checker.common.file_utils import get_gzipped_file |
| from cfg_checker.common.settings import pkg_dir |
| from cfg_checker.helpers.console_utils import Progress |
| from cfg_checker.helpers.tgz import TGZFile |
| |
| import requests |
| from requests.exceptions import ConnectionError |
| |
| ext = ".json" |
| |
| |
| def get_tag_label(_tag, parsed=False): |
| # prettify the tag for printing |
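    # Illustrative output (tag value is a made-up example):
    #   "2019.2.8.update"               -> "  [updates] 2019.2.8"
    #   "2019.2.8.hotfix" (parsed=True) -> "+  [hotfix] 2019.2.8"
    #   "2019.2.8"                      -> "            2019.2.8"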
| if parsed: |
| _label = "+ " |
| else: |
| _label = " " |
| |
| if _tag.endswith(".update"): |
| _label += "[updates] " + _tag.rsplit('.', 1)[0] |
| elif _tag.endswith(".hotfix"): |
| _label += " [hotfix] " + _tag.rsplit('.', 1)[0] |
| else: |
| _label += " "*10 + _tag |
| |
| return _label |
| |
| |
| def _get_value_index(_di, value, header=None): |
    # Maintainer names often use non-ASCII chars,
    # so make sure the saved value is a str, not bytes
    # Python2 needed an explicit decode:
    # _val = str(value, 'utf-8') if isinstance(value, str) else value
    # Python3 values are always utf-8 decoded
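    # Illustrative shape of the index dict (keys are stringified counters):
    #   with header: {"1": {"header": "<tag>_...", "props": {...}}, ...}
    #   without:     {"1": "Some Maintainer <user@example.com>", ...}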
| _val = value |
| if header: |
| try: |
| _index = next(i for i in _di if header in _di[i]['header']) |
| except StopIteration: |
| _index = str(len(_di) + 1) |
| _di[_index] = { |
| "header": header, |
| "props": _val |
| } |
| finally: |
| return _index |
| else: |
| try: |
| _index = next(i for i in _di if _val in _di[i]) |
            # value already present, reuse its index
| except StopIteration: |
| _index = str(len(_di) + 1) |
| # on save, cast it as str |
| _di[_index] = _val |
| finally: |
| return _index |
| |
| |
| def _safe_load(_f, _a): |
| if _f in _a.list_files(): |
| logger_cli.debug( |
| "... loading '{}':'{}'".format( |
| _a.basefile, |
| _f |
| ) |
| ) |
| return json.loads(_a.get_file(_f, decode=True)) |
| else: |
| return {} |
| |
| |
| def _n_url(url): |
| if url[-1] == '/': |
| return url |
| else: |
| return url + '/' |
| |
| |
| class ReposInfo(object): |
| init_done = False |
| |
| def _init_vars(self): |
| self.repos = [] |
| |
| def _init_folders(self, arch_folder=None): |
| if arch_folder: |
| self._arch_folder = arch_folder |
| self._repofile = os.path.join(arch_folder, _repos_info_archive) |
| else: |
| self._arch_folder = os.path.join(pkg_dir, "versions") |
| self._repofile = os.path.join( |
| self._arch_folder, |
| _repos_info_archive |
| ) |
| |
| def __init__(self, arch_folder=None): |
| # perform inits |
| self._init_vars() |
| self._init_folders(arch_folder) |
| self.init_done = True |
| |
    def __call__(self, *args, **kwargs):
        if self.init_done:
            return self
        else:
            self.__init__(*args, **kwargs)
            return self
| |
| @staticmethod |
| def _ls_repo_page(url): |
| # Yes, this is ugly. But it works ok for small HTMLs. |
| _a = "<a" |
| _s = "href=" |
| _e = "\">" |
| try: |
| page = requests.get(url, timeout=60) |
        except ConnectionError as e:
            logger_cli.error("# ERROR: {}".format(e))
| return [], [] |
| a = page.text.splitlines() |
        # Comprehension for dirs: their anchors end with '-' (no size column)
| _dirs = [ll[ll.index(_s)+6:ll.index(_e)-1] |
| for ll in a if ll.startswith(_a) and ll.endswith('-')] |
        # Comprehension for files: their anchors end with the file size
| _files = [ll[ll.index(_s)+6:ll.index(_e)] |
| for ll in a if ll.startswith(_a) and not ll.endswith('-')] |
| |
| return _dirs, _files |
| |
| def search_pkg(self, url, _list): |
        # recursive method to walk the dists tree
| _dirs, _files = self._ls_repo_page(url) |
| |
| for _d in _dirs: |
| # Search only in dists, ignore the rest |
| if "dists" not in url and _d != "dists": |
| continue |
| _u = _n_url(url + _d) |
| self.search_pkg(_u, _list) |
| |
| for _f in _files: |
| if _f == "Packages.gz": |
| _list.append(url + _f) |
| logger.debug("... [F] '{}'".format(url + _f)) |
| |
| return _list |
| |
| @staticmethod |
| def _map_repo(_path_list, _r): |
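        # Illustrative mapping (values depend on the actual mirror layout):
        #   .../dists/xenial/main/binary-amd64/Packages.gz ->
        #     {"arch": "amd64", "type": "main",
        #      "ubuntu-release": "xenial", "filepath": <full path>}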
| for _pkg_path in _path_list: |
| _l = _pkg_path.split('/') |
| _kw = _l[_l.index('dists')+1:] |
| _kw.reverse() |
| _repo_item = { |
| "arch": _kw[1][7:] if "binary" in _kw[1] else _kw[1], |
| "type": _kw[2], |
| "ubuntu-release": _kw[3], |
| "filepath": _pkg_path |
| } |
| _r.append(_repo_item) |
| |
| def _find_tag(self, _t, _u, label=""): |
| if label: |
| _url = _n_url(_u + label) |
| _label = _t + '.' + label |
| else: |
| _url = _u |
| _label = _t |
| _ts, _ = self._ls_repo_page(_url) |
| if _t in _ts: |
| logger.debug( |
| "... found tag '{}' at '{}'".format( |
| _t, |
| _url |
| ) |
| ) |
| return { |
| _label: { |
| "baseurl": _n_url(_url + _t), |
| "all": {} |
| } |
| } |
| else: |
| return {} |
| |
| def fetch_repos(self, url, tag=None): |
| base_url = _n_url(url) |
| logger_cli.info("# Using '{}' as a repos source".format(base_url)) |
| |
| logger_cli.info("# Gathering repos info (i.e. links to 'packages.gz')") |
| # init repoinfo archive |
| _repotgz = TGZFile(self._repofile) |
| # prepare repo links |
| _repos = {} |
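        # _repos maps a tag label to repo info, e.g. (illustrative):
        #   {"2019.2.8.update": {"baseurl": "<base_url>update/2019.2.8/",
        #                        "all": {}}}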
| if tag: |
| # only one tag to process |
| _repos.update(self._find_tag(tag, base_url)) |
| _repos.update(self._find_tag(tag, base_url, label="hotfix")) |
| _repos.update(self._find_tag(tag, base_url, label="update")) |
| else: |
| # gather all of them |
| _tags, _ = self._ls_repo_page(base_url) |
| if "hotfix" in _tags: |
| _tags.remove('hotfix') |
| if "update" in _tags: |
| _tags.remove('update') |
| # Filter out not active tags |
| logger_cli.info("Active tags for mcp: {}".format( |
| ", ".join(active_tags) |
| )) |
| logger_cli.info("Active kaas ubuntu repos: {}".format( |
| ", ".join(kaas_ubuntu_active) |
| )) |
| _active_tags = [t for t in _tags if t in active_tags] |
| |
| # search tags in subfolders |
| _h_tags, _ = self._ls_repo_page(base_url + 'hotfix') |
| _u_tags, _ = self._ls_repo_page(base_url + 'update') |
| _active_tags.extend( |
| [t for t in _h_tags if t not in _tags and t in active_tags] |
| ) |
| _active_tags.extend( |
| [t for t in _u_tags if t not in _tags and t in active_tags] |
| ) |
| _progress = Progress(len(_active_tags)) |
| _index = 0 |
| for _tag in _active_tags: |
| _repos.update(self._find_tag(_tag, base_url)) |
| _repos.update(self._find_tag(_tag, base_url, label="hotfix")) |
| _repos.update(self._find_tag(_tag, base_url, label="update")) |
| _index += 1 |
| _progress.write_progress(_index) |
| _progress.end() |
| |
| # parse subtags |
| for _label in _repos.keys(): |
| logger_cli.info("-> processing tag '{}'".format(_label)) |
| _name = _label + ".json" |
| if _repotgz.has_file(_name) and not tag: |
| logger_cli.info( |
| "-> skipping, '{}' already has '{}'".format( |
| _repos_info_archive, |
| _name |
| ) |
| ) |
| continue |
| # process the tag |
| _repo = _repos[_label] |
| _baseurl = _repos[_label]["baseurl"] |
| # get the subtags |
| _sub_tags, _ = self._ls_repo_page(_baseurl) |
| _total_index = len(_sub_tags) |
| _index = 0 |
| _progress = Progress(_total_index) |
| logger_cli.debug( |
| "... found {} subtags for '{}'".format( |
| len(_sub_tags), |
| _label |
| ) |
| ) |
| # save the url and start search |
| for _stag in _sub_tags: |
| _u = _baseurl + _stag |
| _index += 1 |
| logger_cli.debug( |
| "... searching repos in '{}/{}'".format( |
| _label, |
| _stag |
| ) |
| ) |
| |
| # Searching Package collections |
| if _stag in ubuntu_releases or _stag in kaas_ubuntu_active: |
| # if stag is the release, this is all packages |
| _repo["all"][_stag] = [] |
| _repo["all"]["url"] = _n_url(_u) |
| _path_list = self.search_pkg(_n_url(_u), []) |
| self._map_repo(_path_list, _repo["all"][_stag]) |
| logger_cli.info( |
| "-> found {} dists".format( |
| len(_repo["all"][_stag]) |
| ) |
| ) |
| |
| else: |
| # each subtag might have any ubuntu release |
| # so iterate them |
| _repo[_stag] = { |
| "url": _n_url(_u) |
| } |
| _releases, _ = self._ls_repo_page(_n_url(_u)) |
| for _rel in _releases: |
| if _rel not in ubuntu_releases: |
| logger_cli.debug( |
| "... skipped unknown ubuntu release: " |
| "'{}' in '{}'".format( |
| _rel, |
| _u |
| ) |
| ) |
| else: |
| _rel_u = _n_url(_u) + _rel |
| _repo[_stag][_rel] = [] |
| _path_list = self.search_pkg(_n_url(_rel_u), []) |
| self._map_repo( |
| _path_list, |
| _repo[_stag][_rel] |
| ) |
| logger_cli.info( |
| "-> found {} dists for '{}'".format( |
| len(_repo[_stag][_rel]), |
| _rel |
| ) |
| ) |
| _progress.write_progress(_index) |
| |
| _progress.end() |
| _name = _label + ext |
| _repotgz.add_file(_name, buf=json.dumps(_repo, indent=2)) |
| logger_cli.info( |
| "-> archive '{}' updated with '{}'".format( |
| self._repofile, |
| _name |
| ) |
| ) |
| |
| return |
| |
| def list_tags(self, splitted=False): |
| _files = TGZFile(self._repofile).list_files() |
| # all files in archive with no '.json' part |
| _all = set([f.rsplit('.', 1)[0] for f in _files]) |
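        # Illustrative: "2019.2.8.json" and "2019.2.8.update.json" yield
        #   splitted=True  -> ({"2019.2.8"}, ["2019.2.8"], [])
        #   splitted=False -> both full tag names, digit tags sorted below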
| if splitted: |
            # files that end with '.update'
| _updates = set([f for f in _all if f.find('update') >= 0]) |
            # files that end with '.hotfix'
| _hotfix = set([f for f in _all if f.find('hotfix') >= 0]) |
| # remove updates and hotfix tags from all. The true magic of SETs |
| _all = _all - _updates - _hotfix |
| # cut updates and hotfix endings |
| _updates = [f.rsplit('.', 1)[0] for f in _updates] |
| _hotfix = [f.rsplit('.', 1)[0] for f in _hotfix] |
| |
| return _all, _updates, _hotfix |
| else: |
            _all = list(_all)
| # lexical tags |
| _lex = [s for s in _all if not s[0].isdigit()] |
| _lex.sort() |
| # tags with digits |
| _dig = [s for s in _all if s[0].isdigit()] |
| _dig = sorted( |
| _dig, |
| key=lambda x: tuple(int(i) for i in re.findall(r"\d+", x)[:3]) |
| ) |
| |
| return _dig + _lex |
| |
| def get_repoinfo(self, tag): |
| _tgz = TGZFile(self._repofile) |
| _buf = _tgz.get_file(tag + ext, decode=True) |
| return json.loads(_buf) |
| |
| |
| class RepoManager(object): |
| init_done = False |
| |
| def _init_folders(self, arch_folder=None): |
| logger_cli.info("# Loading package versions data") |
| # overide arch folder if needed |
| if arch_folder: |
| self._arch_folder = arch_folder |
| else: |
| self._arch_folder = os.path.join(pkg_dir, "versions") |
| |
| self._versions_arch = os.path.join( |
| self._arch_folder, |
| _repos_versions_archive |
| ) |
| self._desc_arch = os.path.join(self._arch_folder, _pkg_desc_archive) |
| |
| def _init_vars(self, info_class): |
| # RepoInfo instance init |
| if info_class: |
| self._info_class = info_class |
| else: |
| self._info_class = ReposInfo() |
| # archives |
| self._apps_filename = "apps.json" |
| |
| # repository index |
| self._repo_index = {} |
| self._mainteiners_index = {} |
| |
| self._apps = {} |
| |
| # init package versions storage |
| self._versions_mirantis = {} |
| self._versions_other = {} |
| |
| def _init_archives(self): |
| # Init version files |
| self.versionstgz = TGZFile( |
| self._versions_arch, |
| label="MCP Configuration Checker: Package versions archive" |
| ) |
| self.desctgz = TGZFile( |
| self._desc_arch, |
| label="MCP Configuration Checker: Package descriptions archive" |
| ) |
| |
| # section / app |
| self._apps = _safe_load( |
| self._apps_filename, |
| self.desctgz |
| ) |
| |
| # indices |
| self._repo_index = _safe_load( |
| _repos_index_filename, |
| self.versionstgz |
| ) |
| self._mainteiners_index = _safe_load( |
| _mainteiners_index_filename, |
| self.versionstgz |
| ) |
| |
| # versions |
| self._versions_mirantis = _safe_load( |
| _mirantis_versions_filename, |
| self.versionstgz |
| ) |
| self._versions_other = _safe_load( |
| _other_versions_filename, |
| self.versionstgz |
| ) |
| |
| def __init__(self, arch_folder=None, info_class=None): |
| # Perform inits |
| self._init_vars(info_class) |
| self._init_folders(arch_folder) |
| # Ensure that versions folder exists |
| logger_cli.debug(ensure_folder_exists(self._arch_folder)) |
| # Preload/create archives |
| self._init_archives() |
| self.init_done = True |
| |
    def __call__(self, *args, **kwargs):
        if self.init_done:
            return self
        else:
            self.__init__(*args, **kwargs)
            return self
| |
| def _create_repo_header(self, p): |
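        # Header: "<tag>_<subset>_<release>_<ubuntu-release>_<type>_<arch>"
        # e.g. (illustrative) "2019.2.8_all_xenial_xenial_main_amd64"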
| _header = "_".join([ |
| p['tag'], |
| p['subset'], |
| p['release'], |
| p['ubuntu-release'], |
| p['type'], |
| p['arch'] |
| ]) |
| return _get_value_index(self._repo_index, p, header=_header) |
| |
| def _get_indexed_values(self, pair): |
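        # 'pair' is "<repo_index>-<maintainer_index>",
        # as built in _update_pkg_version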
| _h, _m = pair.split('-') |
| return self._repo_index[_h], self._mainteiners_index[_m] |
| |
| def _update_pkg_version(self, _d, n, v, md5, s, a, h_index, m_index): |
| """Method updates package version record in global dict |
| """ |
        # Four chained 'if's get expensive when executed ~100k times in a row,
        # so try/except is a better way to go, even faster than 'reduce'
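        # Target structure of _d (illustrative):
        #   _d[name][version][md5] = {
        #       "repo": ["<repo_idx>-<maintainer_idx>", ...],
        #       "section": <section>,
        #       "app": <app>
        #   }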
| _pair = "-".join([h_index, m_index]) |
| _info = { |
| 'repo': [_pair], |
| 'section': s, |
| 'app': a |
| } |
| try: |
| # try to load list |
| _list = _d[n][v][md5]['repo'] |
| # cast it as set() and union() |
| _list = set(_list).union([_pair]) |
| # cast back as set() is not serializeable |
| _d[n][v][md5]['repo'] = list(_list) |
| return False |
| except KeyError: |
| # ok, this is fresh pkg. Do it slow way. |
| if n in _d: |
| # there is such pkg already |
| if v in _d[n]: |
| # there is such version, check md5 |
| if md5 in _d[n][v]: |
| # just add new repo header |
| if _pair not in _d[n][v][md5]['repo']: |
| _d[n][v][md5]['repo'].append(_pair) |
| else: |
| # check if such index is here... |
                        _existing = any(
                            _pair in _d[n][v][i]['repo']
                            for i in _d[n][v]
                        )
| if _existing: |
| # Yuck! Same version had different MD5 |
| _r, _m = self._get_indexed_values(_pair) |
| logger_cli.error( |
| "# ERROR: Package version has multiple MD5s " |
| "in '{}': {}:{}:{}".format( |
| _r, |
| n, |
| v, |
| md5 |
| ) |
| ) |
| _d[n][v][md5] = _info |
| else: |
| # this is new version for existing package |
| _d[n][v] = { |
| md5: _info |
| } |
| return False |
| else: |
            # this is a new package
| _d[n] = { |
| v: { |
| md5: _info |
| } |
| } |
| return True |
| |
| def _save_repo_descriptions(self, repo_props, desc): |
| # form the filename for the repo and save it |
| self.desctgz.add_file( |
| self._create_repo_header(repo_props), |
| json.dumps(desc) |
| ) |
| |
| # def get_description(self, repo_props, name, md5=None): |
| # """Gets target description |
| # """ |
| # _filename = self._create_repo_header(repo_props) |
| # # check if it is present in cache |
| # if _filename in self._desc_cache: |
| # _descs = self._desc_cache[_filename] |
| # else: |
| # # load data |
| # _descs = self.desctgz.get_file(_filename) |
| # # Serialize it |
| # _descs = json.loads(_descs) |
| # self._desc_cache[_filename] = _descs |
| # # return target desc |
| # if name in _descs and md5 in _descs[name]: |
| # return _descs[name][md5] |
| # else: |
| # return None |
| |
| def parse_tag(self, tag, descriptions=False, apps=False): |
| """Download and parse Package.gz files for specific tag |
| By default, descriptions not saved |
| due to huge resulting file size and slow processing |
| """ |
| # init gzip and downloader |
| _info = self._info_class.get_repoinfo(tag) |
| # calculate Packages.gz files to process |
| _baseurl = _info.pop("baseurl") |
| _total_components = len(_info.keys()) - 1 |
| _ubuntu_package_repos = 0 |
| _other_repos = 0 |
| for _c, _d in _info.items(): |
| for _ur, _l in _d.items(): |
| if _ur in ubuntu_releases or _ur in kaas_ubuntu_active: |
| _ubuntu_package_repos += len(_l) |
| elif _ur != 'url': |
| _other_repos += len(_l) |
| logger_cli.info( |
| "-> loaded repository info for '{}'.\n" |
| " '{}', {} components, {} ubuntu repos, {} other/uknown".format( |
| _baseurl, |
| tag, |
| _total_components, |
| _ubuntu_package_repos, |
| _other_repos |
| ) |
| ) |
| # init progress bar |
| _progress = Progress(_ubuntu_package_repos) |
| _index = 0 |
| _processed = 0 |
| _new = 0 |
| for _c, _d in _info.items(): |
| # we do not need url here, just get rid of it |
| if 'url' in _d: |
| _d.pop('url') |
| for _ur, _l in _d.items(): |
| # iterate package collections |
| for _p in _l: |
| # descriptions |
| if descriptions: |
| _descriptions = {} |
| # download and unzip |
| _index += 1 |
| _progress.write_progress( |
| _index, |
| note="/ {} {} {} {} {}, GET 'Packages.gz'".format( |
| _c, |
| _ur, |
| _p['ubuntu-release'], |
| _p['type'], |
| _p['arch'] |
| ) |
| ) |
| _raw = get_gzipped_file(_p['filepath']) |
| if not _raw: |
| # empty repo... |
| _progress.clearline() |
| logger_cli.warning( |
| "# WARNING: Empty file: '{}'".format( |
| _p['filepath'] |
| ) |
| ) |
| continue |
| else: |
| _raw = _raw.decode("utf-8") |
| _progress.write_progress( |
| _index, |
| note="/ {} {} {} {} {}, {}/{}".format( |
| _c, |
| _ur, |
| _p['ubuntu-release'], |
| _p['type'], |
| _p['arch'], |
| _processed, |
| _new |
| ) |
| ) |
| _lines = _raw.splitlines() |
| # break lines collection into isolated pkg data |
| _pkg = { |
| "tag": tag, |
| "subset": _c, |
| "release": _ur |
| } |
| _pkg.update(_p) |
| _desc = {} |
| _key = _value = "" |
| # if there is no empty line at end, add it |
| if _lines[-1] != '': |
| _lines.append('') |
| # Process lines |
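                    # Each stanza is "Key: value" lines ended by a blank line,
                    # e.g. (illustrative, not a real package):
                    #   Package: some-package
                    #   Version: 1.2.3-0ubuntu1
                    #   Maintainer: Some One <someone@mirantis.com>
                    #   MD5sum: <hash>
                    #   Section: net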
| for _line in _lines: |
| if not _line: |
| # if the line is empty, process pkg data gathered |
| _name = _desc['package'] |
| _md5 = _desc['md5sum'] |
| _version = _desc['version'] |
| _mainteiner = _desc['maintainer'] |
| |
| if 'source' in _desc: |
| _ap = _desc['source'].lower() |
| else: |
| _ap = "-" |
| |
| if apps: |
| # insert app |
| _sc = _desc['section'].lower() |
| |
| try: |
| _tmp = set(self._apps[_sc][_ap][_name]) |
| _tmp.add(_desc['architecture']) |
| self._apps[_sc][_ap][_name] = list(_tmp) |
| except KeyError: |
| nested_set( |
| self._apps, |
| [_sc, _ap, _name], |
| [_desc['architecture']] |
| ) |
| |
                            # Check if the maintainer is Mirantis
| if _mainteiner.endswith("@mirantis.com>"): |
| # update mirantis versions |
| if self._update_pkg_version( |
| self._versions_mirantis, |
| _name, |
| _version, |
| _md5, |
| _desc['section'].lower(), |
| _ap, |
| self._create_repo_header(_pkg), |
| _get_value_index( |
| self._mainteiners_index, |
| _mainteiner |
| ) |
| ): |
| _new += 1 |
| else: |
| # update other versions |
| if self._update_pkg_version( |
| self._versions_other, |
| _name, |
| _version, |
| _md5, |
| _desc['section'].lower(), |
| _ap, |
| self._create_repo_header(_pkg), |
| _get_value_index( |
| self._mainteiners_index, |
| _mainteiner |
| ) |
| ): |
| _new += 1 |
| |
| if descriptions: |
| _d_new = { |
| _md5: deepcopy(_desc) |
| } |
| try: |
| _descriptions[_name].update(_d_new) |
| except KeyError: |
| _descriptions[_name] = _d_new |
| # clear the data for next pkg |
| _processed += 1 |
| _desc = {} |
| _key = "" |
| _value = "" |
| elif _line.startswith(' '): |
| _desc[_key] += "\n{}".format(_line) |
| else: |
| if _line.endswith(":"): |
| _key = _line[:-1] |
| _value = "" |
| else: |
| _key, _value = _line.split(": ", 1) |
| _key = _key.lower() |
| _desc[_key] = _value |
| # save descriptions if needed |
| if descriptions: |
| _progress.clearline() |
| self._save_repo_descriptions(_pkg, _descriptions) |
| |
| _progress.end() |
| # backup headers to disk |
| self.versionstgz.add_file( |
| _repos_index_filename, |
| json.dumps(self._repo_index), |
| replace=True |
| ) |
| self.versionstgz.add_file( |
| _mainteiners_index_filename, |
| json.dumps(self._mainteiners_index), |
| replace=True |
| ) |
| if apps: |
| self.desctgz.add_file( |
| self._apps_filename, |
| json.dumps(self._apps), |
| replace=True |
| ) |
| |
| return |
| |
| def fetch_versions(self, tag, descriptions=False, apps=False): |
| """Executes parsing for specific tag |
| """ |
| if descriptions: |
| logger_cli.warning( |
| "\n\n# !!! WARNING: Saving repo descriptions " |
| "consumes huge amount of disk space\n\n" |
| ) |
| # if there is no such tag, parse it from repoinfo |
| logger_cli.info("# Fetching versions for {}".format(tag)) |
| self.parse_tag(tag, descriptions=descriptions, apps=apps) |
| logger_cli.info("-> saving updated versions") |
| self.versionstgz.add_file( |
| _mirantis_versions_filename, |
| json.dumps(self._versions_mirantis), |
| replace=True |
| ) |
| self.versionstgz.add_file( |
| _other_versions_filename, |
| json.dumps(self._versions_other), |
| replace=True |
| ) |
| |
| def build_repos(self, url, tag=None): |
| """Builds versions data for selected tag, or for all of them |
| """ |
        # recursively walk the mirrors
| # and gather all of the repos for 'tag' or all of the tags |
| self._info_class.fetch_repos(url, tag=tag) |
| |
| def _build_action(self, url, tags): |
| for t in tags: |
| logger_cli.info("# Building repo info for '{}'".format(t)) |
| self.build_repos(url, tag=t) |
| |
| def get_available_tags(self, tag=None): |
| # Populate action tags |
| major, updates, hotfix = self._info_class.list_tags(splitted=True) |
| |
| _tags = [] |
| if tag in major: |
| _tags.append(tag) |
| if tag in updates: |
| _tags.append(tag + ".update") |
| if tag in hotfix: |
| _tags.append(tag + ".hotfix") |
| |
| return _tags |
| |
| def action_for_tag( |
| self, |
| url, |
| tag, |
| action=None, |
| descriptions=None, |
| apps=None |
| ): |
| """Executes action for every tag from all collections |
| """ |
        if not action:
            logger_cli.info("# No action set, nothing to do")
            return
| # See if this is a list action |
| if action == "list": |
| _all = self._info_class.list_tags() |
| if _all: |
| # Print pretty list and exit |
| logger_cli.info("# Tags available at '{}':".format(url)) |
| for t in _all: |
| _ri = self._repo_index |
| _isparsed = any( |
| [k for k, v in _ri.items() |
| if v['props']['tag'] == t] |
| ) |
| if _isparsed: |
| logger_cli.info(get_tag_label(t, parsed=True)) |
| else: |
| logger_cli.info(get_tag_label(t)) |
| else: |
| logger_cli.info("# Not tags parsed yet for '{}':".format(url)) |
| |
| # exit |
| return |
| |
| if action == "build": |
| self._build_action(url, [tag]) |
| |
| # Populate action tags |
| _action_tags = self.get_available_tags(tag) |
| |
| if not _action_tags: |
| logger_cli.info( |
| "# Tag of '{}' not found. " |
| "Consider rebuilding repos info.".format(tag) |
| ) |
| else: |
| logger_cli.info( |
| "-> tags to process: {}".format( |
| ", ".join(_action_tags) |
| ) |
| ) |
| # Execute actions |
| if action == "fetch": |
| for t in _action_tags: |
| self.fetch_versions(t, descriptions=descriptions, apps=apps) |
| |
| logger_cli.info("# Done.") |
| |
| def show_package(self, name): |
| # get the package data |
| _p = self.get_package_versions(name) |
| if not _p: |
| logger_cli.warning( |
| "# WARNING: Package '{}' not found".format(name) |
| ) |
| else: |
| # print package info using sorted tags from headers |
| # Package: name |
| # [u/h] tag \t <version> |
| # \t <version> |
| # <10symbols> \t <md5> \t sorted headers with no tag |
| # ... |
| # section |
| for _s in sorted(_p): |
| # app |
| for _a in sorted(_p[_s]): |
| _o = "" |
| _mm = [] |
                    # get and sort versions
| for _v in sorted(_p[_s][_a]): |
| _o += "\n" + " "*8 + _v + ':\n' |
                        # get and sort md5 sums
| for _md5 in sorted(_p[_s][_a][_v]): |
| _o += " "*16 + _md5 + "\n" |
| # get and sort repo headers |
| for _r in sorted(_p[_s][_a][_v][_md5]): |
| _o += " "*24 + _r.replace('_', ' ') + '\n' |
| _m = _p[_s][_a][_v][_md5][_r]["maintainer"] |
| if _m not in _mm: |
| _mm.append(_m) |
| |
| logger_cli.info( |
| "\n# Package: {}/{}/{}\nMaintainers: {}".format( |
| _s, |
| _a, |
| name, |
| ", ".join(_mm) |
| ) |
| ) |
| |
| logger_cli.info(_o) |
| |
| @staticmethod |
| def get_apps(versions, name): |
        _all = name == '*'
| _s_max = _a_max = _p_max = _v_max = 0 |
| _rows = [] |
| for _p in versions.keys(): |
| _vs = versions[_p] |
| for _v, _d1 in _vs.items(): |
| for _md5, _info in _d1.items(): |
| if _all or name == _info['app']: |
| _s_max = max(len(_info['section']), _s_max) |
| _a_max = max(len(_info['app']), _a_max) |
| _p_max = max(len(_p), _p_max) |
| _v_max = max(len(_v), _v_max) |
| _rows.append([ |
| _info['section'], |
| _info['app'], |
| _p, |
| _v, |
| _md5, |
| len(_info['repo']) |
| ]) |
| # format columns |
| # section |
| _fmt = "{:"+str(_s_max)+"} " |
| # app |
| _fmt += "{:"+str(_a_max)+"} " |
| # package name |
| _fmt += "{:"+str(_p_max)+"} " |
| # version |
| _fmt += "{:"+str(_v_max)+"} " |
| # md5 and number of repos is fixed |
| _fmt += "{} in {} repos" |
| |
| # fill rows |
| _rows = [_fmt.format(s, a, p, v, m, l) for s, a, p, v, m, l in _rows] |
| _rows.sort() |
| return _rows |
| |
| def show_app(self, name): |
| c = 0 |
| rows = self.get_apps(self._versions_mirantis, name) |
| if rows: |
| logger_cli.info("\n# Mirantis packages for '{}'".format(name)) |
| logger_cli.info("\n".join(rows)) |
| c += 1 |
| rows = self.get_apps(self._versions_other, name) |
| if rows: |
| logger_cli.info("\n# Other packages for '{}'".format(name)) |
| logger_cli.info("\n".join(rows)) |
| c += 1 |
| if c == 0: |
| logger_cli.info("\n# No app found for '{}'".format(name)) |
| |
| def get_mirantis_pkg_names(self): |
| # Mirantis maintainers only |
| return set( |
| self._versions_mirantis.keys() |
| ) - set( |
| self._versions_other.keys() |
| ) |
| |
| def get_other_pkg_names(self): |
        # Non-Mirantis maintainers
| return set( |
| self._versions_other.keys() |
| ) - set( |
| self._versions_mirantis.keys() |
| ) |
| |
| def get_mixed_pkg_names(self): |
| # Mixed maintainers |
| return set( |
| self._versions_mirantis.keys() |
| ).intersection(set( |
| self._versions_other.keys() |
| )) |
| |
| def is_mirantis(self, name, tag=None): |
| """Method checks if this package is mainteined |
| by mirantis in target tag repo |
| """ |
| if name in self._versions_mirantis: |
| # check tag |
| if tag: |
| _pkg = self.get_package_versions( |
| name, |
| tagged=True |
| ) |
| _tags = [] |
| for s in _pkg.keys(): |
| for a in _pkg[s].keys(): |
| for t in _pkg[s][a].keys(): |
| _tags.append(t) |
| if any([t.startswith(tag) for t in _tags]): |
| return True |
| else: |
| return None |
| else: |
| return True |
| elif name in self._versions_other: |
| # check tag |
| if tag: |
| _pkg = self.get_package_versions( |
| name, |
| tagged=True |
| ) |
| _tags = [] |
| for s in _pkg.keys(): |
| for a in _pkg[s].keys(): |
| for t in _pkg[s][a].keys(): |
| _tags.append(t) |
| if any([t.startswith(tag) for t in _tags]): |
| return False |
| else: |
| return None |
| else: |
| return False |
| else: |
| logger.error( |
| "# ERROR: package '{}' not found " |
| "while determining maintainer".format( |
| name |
| ) |
| ) |
| return None |
| |
| def get_filtered_versions( |
| self, |
| name, |
| tag=None, |
| include=None, |
| exclude=None |
| ): |
| """Method gets all the versions for the package |
| and filters them using keys above |
| """ |
| if tag: |
| tag = str(tag) if not isinstance(tag, str) else tag |
| _out = {} |
| _vs = self.get_package_versions(name, tagged=True) |
| # iterate to filter out keywords |
| for s, apps in _vs.items(): |
| for a, _tt in apps.items(): |
| for t, vs in _tt.items(): |
| # filter tags |
| if tag and t != tag and t.rsplit('.', 1)[0] != tag: |
| continue |
| # Skip hotfix tag |
                    if tag and t == tag + ".hotfix":
| continue |
| for v, rp in vs.items(): |
| for h, p in rp.items(): |
| # filter headers with all keywords matching |
| _h = re.split(r"[\-\_]+", h) |
                            _included = all([kw in _h for kw in include or []])
                            _excluded = any([kw in _h for kw in exclude or []])
| if not _included or _excluded: |
| continue |
| else: |
| nested_set(_out, [s, a, v], []) |
| _dat = { |
| "header": h |
| } |
| _dat.update(p) |
| _out[s][a][v].append(_dat) |
| return _out |
| |
| def get_package_versions(self, name, tagged=False): |
| """Method builds package version structure |
| with repository properties included |
| """ |
| # get data |
| _vs = {} |
| |
| if name in self._versions_mirantis: |
| _vs.update(self._versions_mirantis[name]) |
| if name in self._versions_other: |
| _vs.update(self._versions_other[name]) |
| |
| # insert repo data, insert props into headers place |
| _package = {} |
| if tagged: |
| for _v, _d1 in _vs.items(): |
| # use tag as a next step |
| for _md5, _info in _d1.items(): |
| _s = _info['section'] |
| _a = _info['app'] |
| for _pair in _info['repo']: |
| _rp = {} |
| # extract props for a repo |
| _r, _m = self._get_indexed_values(_pair) |
| # get tag |
| _tag = _r["props"]["tag"] |
| # cut tag from the header |
| _cut_head = _r["header"].split("_", 1)[1] |
| # populate dict |
| _rp["maintainer"] = _m |
| _rp["md5"] = _md5 |
| _rp.update(_r["props"]) |
| nested_set( |
| _package, |
| [_s, _a, _tag, _v, _cut_head], |
| _rp |
| ) |
| else: |
| for _v, _d1 in _vs.items(): |
| for _md5, _info in _d1.items(): |
| _s = _info['section'] |
| _a = _info['app'] |
| for _pair in _info['repo']: |
| _r, _m = self._get_indexed_values(_pair) |
| _info["maintainer"] = _m |
| _info.update(_r["props"]) |
| nested_set( |
| _package, |
| [_s, _a, _v, _md5, _r["header"]], |
| _info |
| ) |
| |
| return _package |
| |
| def parse_repos(self): |
| # all tags to check |
| major, updates, hotfix = self._info_class.list_tags(splitted=True) |
| |
| # major tags |
| logger_cli.info("# Processing major tags") |
| for _tag in major: |
| self.fetch_versions(_tag) |
| |
| # updates tags |
| logger_cli.info("# Processing update tags") |
| for _tag in updates: |
| self.fetch_versions(_tag + ".update") |
| |
| # hotfix tags |
| logger_cli.info("# Processing hotfix tags") |
| for _tag in hotfix: |
| self.fetch_versions(_tag + ".hotfix") |