[ceph] Add warning for component version diffrence during upgrade
Change-Id: I66b9f2fdbe09ee01a0d102f1d85443b3da1547f1
Related-Prod: PROD-36790
diff --git a/ceph-upgrade.groovy b/ceph-upgrade.groovy
index 39695f2..a0d6a1f 100644
--- a/ceph-upgrade.groovy
+++ b/ceph-upgrade.groovy
@@ -6,7 +6,6 @@
* SALT_MASTER_URL URL of Salt master
* SALT_MASTER_CREDENTIALS Credentials to the Salt API
*
- * ADMIN_HOST Host (minion id) with admin keyring and /etc/crushmap file present
* CLUSTER_FLAGS Comma separated list of tags to apply to cluster
* WAIT_FOR_HEALTHY Wait for cluster rebalance before stoping daemons
* ASK_CONFIRMATION Ask for manual confirmation
@@ -31,14 +30,17 @@
pepperEnv = "pepperEnv"
flags = CLUSTER_FLAGS.tokenize(',')
+// sortbitwise is set by default on version >jewel.
+// For jewel upgrade we will set and keep it while for other cases shouldn't be there
+flags.removeElement('sortbitwise')
def backup(master, target) {
- stage("backup ${target}") {
+ stage("backup $target") {
if (target == 'osd') {
try {
salt.enforceState(master, "I@ceph:${target}", "ceph.backup", true)
- salt.cmdRun(master, "I@ceph:${target}", "su root -c '/usr/local/bin/ceph-backup-runner-call.sh'")
+ ceph.cmdRunOnTarget(master, "I@ceph:${target}", "su root -c '/usr/local/bin/ceph-backup-runner-call.sh'")
} catch (Exception e) {
common.errorMsg(e)
common.errorMsg("Make sure Ceph backup on OSD nodes is enabled")
@@ -58,24 +60,24 @@
def provider_pillar = salt.getPillar(master, "${kvm01}", "salt:control:cluster:internal:node:${minion_name}:provider")
def minionProvider = provider_pillar['return'][0].values()[0]
- ceph.waitForHealthy(master, ADMIN_HOST, flags)
+ ceph.waitForHealthy(master, flags)
try {
- salt.cmdRun(master, "${minionProvider}", "[ ! -f ${BACKUP_DIR}/${minion_name}.${domain}.qcow2.bak ] && virsh destroy ${minion_name}.${domain}")
+ ceph.cmdRunOnTarget(master, minionProvider, "[ ! -f ${BACKUP_DIR}/${minion_name}.${domain}.qcow2.bak ] && virsh destroy ${minion_name}.${domain}")
} catch (Exception e) {
common.warningMsg('Backup already exists')
}
try {
- salt.cmdRun(master, "${minionProvider}", "[ ! -f ${BACKUP_DIR}/${minion_name}.${domain}.qcow2.bak ] && cp /var/lib/libvirt/images/${minion_name}.${domain}/system.qcow2 ${BACKUP_DIR}/${minion_name}.${domain}.qcow2.bak")
+ ceph.cmdRunOnTarget(master, minionProvider, "[ ! -f ${BACKUP_DIR}/${minion_name}.${domain}.qcow2.bak ] && cp /var/lib/libvirt/images/${minion_name}.${domain}/system.qcow2 ${BACKUP_DIR}/${minion_name}.${domain}.qcow2.bak")
} catch (Exception e) {
common.warningMsg('Backup already exists')
}
try {
- salt.cmdRun(master, "${minionProvider}", "virsh start ${minion_name}.${domain}")
+ ceph.cmdRunOnTarget(master, minionProvider, "virsh start ${minion_name}.${domain}")
} catch (Exception e) {
common.warningMsg(e)
}
salt.minionsReachable(master, 'I@salt:master', "${minion_name}*")
- ceph.waitForHealthy(master, ADMIN_HOST, flags)
+ ceph.waitForHealthy(master, flags)
}
}
}
@@ -84,7 +86,7 @@
def upgrade(master, target) {
- stage("Change ${target} repos") {
+ stage("Change $target repos") {
salt.runSaltProcessStep(master, "I@ceph:${target}", 'saltutil.refresh_pillar', [], null, true, 5)
salt.enforceState(master, "I@ceph:${target}", 'linux.system.repo', true)
}
@@ -95,20 +97,34 @@
}
if (target == 'common') {
stage('Upgrade ceph-common pkgs') {
- salt.runSaltProcessStep(master, "I@ceph:${target}", 'pkg.install', ["ceph-common"], 'only_upgrade=True')
+ salt.runSaltProcessStep(master, "I@ceph:common", 'pkg.install', ["ceph-common"], 'only_upgrade=True')
}
} else {
minions = salt.getMinions(master, "I@ceph:${target}")
+ def ignoreDifferentSubversions = false
for (minion in minions) {
// upgrade pkgs
if (target == 'radosgw') {
- stage('Upgrade radosgw pkgs') {
- salt.runSaltProcessStep(master, "I@ceph:${target}", 'pkg.install', [target], 'only_upgrade=True')
+ stage("Upgrade radosgw pkgs on $minion") {
+ salt.runSaltProcessStep(master, minion, 'pkg.install', [target], 'only_upgrade=True')
}
} else {
- stage("Upgrade ${target} pkgs on ${minion}") {
- salt.runSaltProcessStep(master, "${minion}", 'pkg.install', ["ceph-${target}"], 'only_upgrade=True')
+ stage("Upgrade $target pkgs on $minion") {
+ salt.runSaltProcessStep(master, minion, 'pkg.install', ["ceph-${target}"], 'only_upgrade=True')
+ }
+ }
+ // check for subversion difference before restart
+ if (ignoreDifferentSubversions) {
+ targetVersion = ceph.cmdRun(master, "ceph versions | grep $TARGET_RELEASE | awk '{print \$3}' | sort -V | tail -1")
+ updatedVersion = ceph.cmdRunOnTarget(master, minion, "ceph version | awk '{print \$3}'")
+ if (targetVersion != updatedVersion) {
+ stage('Version differnce warning') {
+ common.warningMsg("A potential problem has been spotted.")
+ common.warningMsg("Some components already have $targetVersion version while ceph-$target has just been updated to $updatedVersion")
+ input message: "Do you want to proceed with restarts and silence this warning?"
+ ignoreDifferentSubversions = true
+ }
}
}
// restart services
@@ -116,29 +132,30 @@
if(target == 'osd') {
def ceph_disks = salt.getGrain(master, minion, 'ceph')['return'][0].values()[0].values()[0]['ceph_disk']
ceph_disks.each { osd, param ->
- salt.cmdRun(master, "${minion}", "systemctl restart ceph-${target}@${osd}")
+ ceph.cmdRunOnTarget(master, minion, "systemctl restart ceph-${target}@${osd}")
}
}
else {
- salt.cmdRun(master, "${minion}", "systemctl restart ceph-${target}.target")
+ ceph.cmdRunOnTarget(master, minion, "systemctl restart ceph-${target}.target")
}
- ceph.waitForHealthy(master, ADMIN_HOST, flags)
+ ceph.waitForHealthy(master, flags)
}
- stage("Verify services for ${minion}") {
+ stage("Verify services for $minion") {
sleep(10)
- salt.cmdRun(master, "${minion}", "systemctl status ceph-${target}.target")
+ ceph.cmdRunOnTarget(master, minion, "systemctl status ceph-${target}.target")
}
- if (askConfirmation) {
- stage('Ask for manual confirmation') {
- input message: "From the verification command above, please check Ceph ${target} joined the cluster correctly. If so, Do you want to continue to upgrade next node?"
+ stage('Verify Ceph status') {
+ ceph.cmdRun(master, "ceph -s", true, true)
+ if (askConfirmation) {
+ input message: "From the verification command above, please check Ceph $target joined the cluster correctly. If so, Do you want to continue to upgrade next node?"
}
}
}
}
- salt.cmdRun(master, ADMIN_HOST, "ceph versions")
+ ceph.cmdRun(master, "ceph versions")
sleep(5)
return
}
@@ -150,21 +167,21 @@
python.setupPepperVirtualenv(pepperEnv, SALT_MASTER_URL, SALT_MASTER_CREDENTIALS)
stage('Check user choices') {
- if (STAGE_UPGRADE_RGW.toBoolean() == true) {
+ if (STAGE_UPGRADE_RGW.toBoolean()) {
// if rgw, check if other stuff has required version
def mon_ok = true
- if (STAGE_UPGRADE_MON.toBoolean() == false) {
- def mon_v = salt.cmdRun(pepperEnv, ADMIN_HOST, "ceph mon versions")['return'][0].values()[0]
+ if (!STAGE_UPGRADE_MON.toBoolean()) {
+ def mon_v = ceph.cmdRun(pepperEnv, "ceph mon versions")
mon_ok = mon_v.contains("${TARGET_RELEASE}") && !mon_v.contains("${ORIGIN_RELEASE}")
}
def mgr_ok = true
- if (STAGE_UPGRADE_MGR.toBoolean() == false) {
- def mgr_v = salt.cmdRun(pepperEnv, ADMIN_HOST, "ceph mgr versions")['return'][0].values()[0]
+ if (!STAGE_UPGRADE_MGR.toBoolean()) {
+ def mgr_v = ceph.cmdRun(pepperEnv, "ceph mgr versions")
mgr_ok = mgr_v.contains("${TARGET_RELEASE}") && !mgr_v.contains("${ORIGIN_RELEASE}")
}
def osd_ok = true
- if (STAGE_UPGRADE_OSD.toBoolean() == false) {
- def osd_v = salt.cmdRun(pepperEnv, ADMIN_HOST, "ceph osd versions")['return'][0].values()[0]
+ if (!STAGE_UPGRADE_OSD.toBoolean()) {
+ def osd_v = ceph.cmdRun(pepperEnv, "ceph osd versions")
osd_ok = osd_v.contains("${TARGET_RELEASE}") && !osd_v.contains("${ORIGIN_RELEASE}")
}
if (!mon_ok || !osd_ok || !mgr_ok) {
@@ -186,14 +203,10 @@
}
}
- if (flags.size() > 0) {
- stage('Set cluster flags') {
- for (flag in flags) {
- salt.cmdRun(pepperEnv, ADMIN_HOST, 'ceph osd set ' + flag)
- }
- if (ORIGIN_RELEASE == 'jewel') {
- salt.cmdRun(pepperEnv, ADMIN_HOST, 'ceph osd set sortbitwise')
- }
+ stage('Set cluster flags') {
+ ceph.setFlags(pepperEnv, flags)
+ if (ORIGIN_RELEASE == 'jewel') {
+ ceph.setFlags('sortbitwise')
}
}
@@ -218,32 +231,25 @@
}
// remove cluster flags
- if (flags.size() > 0) {
- stage('Unset cluster flags') {
- for (flag in flags) {
- if (!flag.contains('sortbitwise')) {
- common.infoMsg('Removing flag ' + flag)
- salt.cmdRun(pepperEnv, ADMIN_HOST, 'ceph osd unset ' + flag)
- }
- }
- }
+ stage('Unset cluster flags') {
+ ceph.unsetFlags(flags)
}
if (STAGE_FINALIZE.toBoolean() == true) {
stage("Finalize ceph version upgrade") {
- salt.cmdRun(pepperEnv, ADMIN_HOST, "ceph osd require-osd-release ${TARGET_RELEASE}")
+ ceph.cmdRun(pepperEnv, "ceph osd require-osd-release ${TARGET_RELEASE}")
try {
- salt.cmdRun(pepperEnv, ADMIN_HOST, "ceph osd set-require-min-compat-client ${ORIGIN_RELEASE}")
+ ceph.cmdRun(pepperEnv, "ceph osd set-require-min-compat-client ${ORIGIN_RELEASE}")
} catch (Exception e) {
common.warningMsg(e)
}
try {
- salt.cmdRun(pepperEnv, ADMIN_HOST, "ceph osd crush tunables optimal")
+ ceph.cmdRun(pepperEnv, "ceph osd crush tunables optimal")
} catch (Exception e) {
common.warningMsg(e)
}
if (TARGET_RELEASE == 'nautilus' ) {
- salt.cmdRun(pepperEnv, ADMIN_HOST, "ceph mon enable-msgr2")
+ ceph.cmdRun(pepperEnv, "ceph mon enable-msgr2")
}
salt.enforceState(pepperEnv, "I@ceph:common", "ceph.common")
}
@@ -251,7 +257,7 @@
// wait for healthy cluster
if (WAIT_FOR_HEALTHY.toBoolean()) {
- ceph.waitForHealthy(pepperEnv, ADMIN_HOST, flags)
+ ceph.waitForHealthy(pepperEnv, flags)
}
}
}