Merge "additional healthcheck while doing ceph mon backups" into release/2019.2.0
diff --git a/ceph/files/backup/ceph-backup-client-runner.sh b/ceph/files/backup/ceph-backup-client-runner.sh
index 971f944..329494a 100644
--- a/ceph/files/backup/ceph-backup-client-runner.sh
+++ b/ceph/files/backup/ceph-backup-client-runner.sh
@@ -8,6 +8,7 @@
     TMPDIR="$( pwd )/tmp_ceph_backup"
     HOSTNAME="$( hostname )"
     TIMESTAMP="$( date +%m%d%H%M )"
+    HEALTH="$(ceph health)"   # checked below so the mon is only stopped when no mons are already down
 
     # Need write access to local directory to create dump file
     if [ ! -w $( pwd ) ]; then
@@ -45,9 +46,14 @@
     rsync -arv --exclude=osd/{{ common.get('cluster_name', 'ceph') }}-*/current /var/lib/ceph $TMPDIR/{{ common.get('cluster_name', 'ceph') }}-$HOSTNAME/
 {%- elif mon.get('enabled', False) %}
     cp -a /etc/ceph/ $TMPDIR/
-    service ceph-mon@$HOSTNAME stop
-    cp -a /var/lib/ceph/ $TMPDIR/{{ common.get('cluster_name', 'ceph') }}-$HOSTNAME/
-    service ceph-mon@$HOSTNAME start
+    if ! echo "$HEALTH" | grep -q "mons down"; then
+      service ceph-mon@$HOSTNAME stop
+      cp -a /var/lib/ceph/ $TMPDIR/{{ common.get('cluster_name', 'ceph') }}-$HOSTNAME/
+      service ceph-mon@$HOSTNAME start
+    else
+      printf "One or more monitor nodes are already stopped or not working correctly. Cannot continue"
+      exit 1
+    fi
 {%- endif %}
 
     tar -cvzf $BACKUPDIR/$HOSTNAME/{{ common.get('cluster_name', 'ceph') }}-$HOSTNAME-$TIMESTAMP.tgz $TMPDIR
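
A minimal standalone sketch of the guard this change introduces, with the Salt/Jinja templating removed; the hostname handling follows the script above, but the backup destination under /tmp is an illustrative assumption, not the module's real $TMPDIR layout:

    #!/bin/bash
    # Capture cluster health once; abort if any monitor is already reported down.
    HOSTNAME="$(hostname)"
    HEALTH="$(ceph health)"

    if echo "$HEALTH" | grep -q "mons down"; then
        printf "One or more monitor nodes are already stopped or not working correctly. Cannot continue.\n"
        exit 1
    fi

    # All monitors are up, so the local one can be stopped briefly for a consistent copy.
    service ceph-mon@"$HOSTNAME" stop
    mkdir -p "/tmp/ceph-backup-$HOSTNAME"                 # illustrative destination only
    cp -a /var/lib/ceph/ "/tmp/ceph-backup-$HOSTNAME/"
    service ceph-mon@"$HOSTNAME" start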