blob: dac460ab863fd9944991bc4405ee31e42f18538c [file] [log] [blame]
Max Rasskazov7f3c53c2014-12-09 14:19:17 +03001#!/usr/bin/env python
2#-*- coding: utf-8 -*-
3
4
5import datetime
Max Rasskazov11653ab2015-01-15 15:45:16 +03006import logging
Max Rasskazov7f3c53c2014-12-09 14:19:17 +03007import os
Max Rasskazove99d8372015-01-13 20:07:01 +03008import re
Max Rasskazov7f3c53c2014-12-09 14:19:17 +03009import subprocess
10import tempfile
Max Rasskazovd5b47eb2015-05-27 22:26:54 +030011import shutil
Max Rasskazov7f3c53c2014-12-09 14:19:17 +030012
13
Max Rasskazov11653ab2015-01-15 15:45:16 +030014logging.basicConfig(level=logging.INFO)
15logger = logging.getLogger('rsync_staging')
16
Max Rasskazov3fe42712015-01-15 15:34:22 +030017now = datetime.datetime.utcnow()
18staging_snapshot_stamp_format = r'%Y-%m-%d-%H%M%S'
19staging_snapshot_stamp_regexp = r'[0-9]{4}-[0-9]{2}-[0-9]{2}-[0-9]{6}'
20staging_snapshot_stamp = now.strftime(staging_snapshot_stamp_format)
Max Rasskazov7f3c53c2014-12-09 14:19:17 +030021
22
Max Rasskazovd5b47eb2015-05-27 22:26:54 +030023class RsyncHost(object):
Max Rasskazov7f3c53c2014-12-09 14:19:17 +030024 def __init__(self,
25 mirror_name,
26 host,
27 module='mirror-sync',
28 root_path='fwm',
29 files_dir='files',
30 save_last_days=61,
31 rsync_extra_params='-v',
Max Rasskazovd5b47eb2015-05-27 22:26:54 +030032 staging_postfix='staging',
33 init_directory_structure=True):
Max Rasskazov7f3c53c2014-12-09 14:19:17 +030034 self.mirror_name = mirror_name
35 self.host = host
36 self.module = module
37 self.root_path = root_path
38 self.files_dir = files_dir
39 self.save_last_days = save_last_days
40 self.rsync_extra_params = rsync_extra_params
Max Rasskazov7f3c53c2014-12-09 14:19:17 +030041 self.staging_postfix = staging_postfix
Max Rasskazov3fe42712015-01-15 15:34:22 +030042 self.staging_snapshot_stamp = staging_snapshot_stamp
43 self.staging_snapshot_stamp_format = staging_snapshot_stamp_format
44 if re.match(staging_snapshot_stamp_regexp,
45 self.staging_snapshot_stamp) \
46 is not None:
47 self.staging_snapshot_stamp_regexp = staging_snapshot_stamp_regexp
48 else:
49 raise RuntimeError('Wrong regexp for staging_snapshot_stamp\n'
50 'staging_snapshot_stamp = "{}"\n'
51 'staging_snapshot_stamp_regexp = "{}"'.
52 format(staging_snapshot_stamp,
53 staging_snapshot_stamp_regexp)
54 )
Max Rasskazov7f3c53c2014-12-09 14:19:17 +030055
Max Rasskazovd5b47eb2015-05-27 22:26:54 +030056 if init_directory_structure is True:
57 self.init_directory_structure()
58
Max Rasskazov7f3c53c2014-12-09 14:19:17 +030059 @property
60 def url(self):
61 return '{}::{}'.format(self.host, self.module)
62
63 @property
64 def root_url(self):
65 return '{}/{}'.format(self.url, self.root_path)
66
67 @property
68 def files_path(self):
69 return '{}/{}'.format(self.root_path, self.files_dir)
70
71 @property
72 def files_url(self):
73 return '{}/{}'.format(self.root_url, self.files_dir)
74
75 def http_url(self, path):
76 return 'http://{}/{}'.format(self.host, path)
77
78 def html_link(self, path, link_name):
79 return '<a href="{}">{}</a>'.format(self.http_url(path), link_name)
80
81 @property
82 def staging_dir(self):
83 return '{}-{}'.format(self.mirror_name, self.staging_snapshot_stamp)
84
85 @property
86 def staging_dir_path(self):
87 return '{}/{}'.format(self.files_path, self.staging_dir)
88
89 @property
90 def staging_dir_url(self):
91 return '{}/{}'.format(self.url, self.staging_dir_path)
92
93 @property
94 def staging_link(self):
95 return '{}-{}'.format(self.mirror_name, self.staging_postfix)
96
97 @property
98 def staging_link_path(self):
99 return '{}/{}'.format(self.files_path, self.staging_link)
100
101 @property
102 def staging_link_url(self):
103 return '{}/{}'.format(self.url, self.staging_link_path)
104
Max Rasskazovd5b47eb2015-05-27 22:26:54 +0300105 def init_directory_structure(self):
106 root_dir_present = self.rsync_ls_dirs(
107 '/',
108 pattern=r'^{}$'.format(self.root_path)
109 )[1]
110 root_dir_present = True if len(root_dir_present) > 0 else False
111 if root_dir_present is True:
112 files_dir_present = self.rsync_ls_dirs(
113 '{}/'.format(self.root_path),
114 pattern=r'^{}$'.format(self.files_dir)
115 )[1]
116 files_dir_present = True if len(files_dir_present) > 0 else False
117
118 if not root_dir_present or not files_dir_present:
119 dir_to_sync = tempfile.mkdtemp()
120 os.makedirs('{}/{}'.format(dir_to_sync, self.files_path))
121 self._do_rsync(
122 source='{}/'.format(dir_to_sync),
123 dest='{}/'.format(self.url),
124 opts='-a'
125 )
126 shutil.rmtree(dir_to_sync)
127
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300128 @property
129 def empty_dir(self):
130 if self.__dict__.get('_empty_dir') is None:
131 self._empty_dir = tempfile.mkdtemp()
132 return self._empty_dir
133
134 def symlink_to(self, target):
135 linkname = tempfile.mktemp()
136 os.symlink(target, linkname)
137 return linkname
138
139 def _shell(self, cmd, raise_error=True):
Max Rasskazov11653ab2015-01-15 15:45:16 +0300140 logger.info(cmd)
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300141 process = subprocess.Popen(cmd,
142 stdin=subprocess.PIPE,
143 stdout=subprocess.PIPE,
144 stderr=subprocess.PIPE,
145 shell=True)
146 out, err = process.communicate()
Max Rasskazov11653ab2015-01-15 15:45:16 +0300147 logger.debug(out)
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300148 exitcode = process.returncode
149 if process.returncode != 0 and raise_error:
150 msg = '"{cmd}" failed. Exit code == {exitcode}'\
151 '\n\nSTDOUT: \n{out}'\
152 '\n\nSTDERR: \n{err}'\
153 .format(**(locals()))
Max Rasskazov11653ab2015-01-15 15:45:16 +0300154 logger.error(msg)
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300155 raise RuntimeError(msg)
156 return exitcode, out, err
157
158 def _do_rsync(self, source='', dest=None, opts='', extra=None):
159 if extra is None:
160 extra = self.rsync_extra_params
161 cmd = 'rsync {opts} {extra} {source} {dest}'.format(**(locals()))
162 return self._shell(cmd)
163
Max Rasskazove99d8372015-01-13 20:07:01 +0300164 def _rsync_ls(self, dirname=None, pattern=r'.*', opts=''):
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300165 if dirname is None:
166 dirname = '{}/'.format(self.root_path)
167 dest = '{}/{}'.format(self.url, dirname)
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300168 extra = self.rsync_extra_params + ' --no-v'
169 exitcode, out, err = self._do_rsync(dest=dest, opts=opts, extra=extra)
Max Rasskazove99d8372015-01-13 20:07:01 +0300170 regexp = re.compile(pattern)
171 out = [_ for _ in out.splitlines()
172 if (_.split()[-1] != '.') and
173 (regexp.match(_.split()[-1]) is not None)]
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300174 return exitcode, out, err
175
Max Rasskazove99d8372015-01-13 20:07:01 +0300176 def rsync_ls(self, dirname, pattern=r'.*'):
177 exitcode, out, err = self._rsync_ls(dirname, pattern=pattern)
178 out = [_.split()[-1] for _ in out]
179 return exitcode, out, err
180
181 def rsync_ls_dirs(self, dirname, pattern=r'.*'):
182 exitcode, out, err = self._rsync_ls(dirname, pattern=pattern)
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300183 out = [_.split()[-1] for _ in out if _.startswith('d')]
184 return exitcode, out, err
185
Max Rasskazove99d8372015-01-13 20:07:01 +0300186 def rsync_ls_symlinks(self, dirname, pattern=r'.*'):
187 exitcode, out, err = self._rsync_ls(dirname,
188 pattern=pattern,
189 opts='-l')
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300190 out = [_.split()[-3:] for _ in out if _.startswith('l')]
191 out = [[_[0], _[-1]] for _ in out]
192 return exitcode, out, err
193
194 def rsync_delete_file(self, filename):
195 dirname, filename = os.path.split(filename)
196 source = '{}/'.format(self.empty_dir)
197 dest = '{}/{}/'.format(self.url, dirname)
198 opts = "-r --delete --include={} '--exclude=*'".format(filename)
199 return self._do_rsync(source=source, dest=dest, opts=opts)
200
201 def rsync_delete_dir(self, dirname):
202 source = '{}/'.format(self.empty_dir)
203 dest = '{}/{}/'.format(self.url, dirname)
204 opts = "-a --delete"
205 exitcode, out, err = self._do_rsync(source=source,
206 dest=dest,
207 opts=opts)
208 return self.rsync_delete_file(dirname)
209
210 def rsync_staging_transfer(self, source, tgt_symlink_name=None):
211 if tgt_symlink_name is None:
212 tgt_symlink_name = self.mirror_name
213 opts = '--archive --force --ignore-errors '\
214 '--delete-excluded --no-owner --no-group --delete '\
215 '--link-dest=/{}'.format(self.staging_link_path)
216 try:
217 exitcode, out, err = self._do_rsync(source=source,
218 dest=self.staging_dir_url,
219 opts=opts)
220 self.rsync_delete_file(self.staging_link_path)
221 self._do_rsync(source=self.symlink_to(self.staging_dir),
222 dest=self.staging_link_url,
223 opts='-l')
224 # cleaning of old snapshots
Max Rasskazov3fe42712015-01-15 15:34:22 +0300225 self._remove_old_snapshots()
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300226 return exitcode, out, err
227 except RuntimeError as e:
Max Rasskazov11653ab2015-01-15 15:45:16 +0300228 logger.error(e.message)
Max Rasskazov7f3c53c2014-12-09 14:19:17 +0300229 self.rsync_delete_dir(self.staging_dir_path)
230 raise
Max Rasskazov3fe42712015-01-15 15:34:22 +0300231
232 def _remove_old_snapshots(self, save_last_days=None):
233 if save_last_days is None:
234 save_last_days = self.save_last_days
235 if save_last_days is None \
236 or save_last_days is False \
237 or save_last_days == 0:
238 # skipping deletion if save_last_days == None or False or 0
Max Rasskazov11653ab2015-01-15 15:45:16 +0300239 logger.info('Skip deletion of old snapshots because of '
240 'save_last_days == {}'.format(save_last_days))
Max Rasskazov3fe42712015-01-15 15:34:22 +0300241 return
242 warn_date = now - datetime.timedelta(days=save_last_days)
243 warn_date = datetime.datetime.combine(warn_date, datetime.time(0))
244 dirs = self.rsync_ls_dirs(
245 '{}/'.format(self.files_path),
246 pattern='^{}-{}'.format(self.mirror_name,
247 self.staging_snapshot_stamp_regexp)
248 )[1]
249 links = self.rsync_ls_symlinks('{}/'.format(self.root_path))[1]
250 links += self.rsync_ls_symlinks('{}/'.format(self.files_path))[1]
251 for d in dirs:
252 dir_date = datetime.datetime.strptime(
253 d,
254 '{}-{}'.format(self.mirror_name,
255 self.staging_snapshot_stamp_format)
256 )
257 dir_date = datetime.datetime.combine(dir_date, datetime.time(0))
258 dir_path = '{}/{}'.format(self.files_path, d)
259 if dir_date < warn_date:
260 dir_links = [_[0] for _ in links
261 if _[1] == d
262 or _[1].endswith('/{}'.format(d))
263 ]
264 if not dir_links:
265 self.rsync_delete_dir(dir_path)
266 else:
Max Rasskazov11653ab2015-01-15 15:45:16 +0300267 logger.info('Skip deletion of "{}" because there are '
268 'symlinks found: {}'.format(d, dir_links))