blob: 7ca8d0c66210d65eb3d22a2a24581b870a060850 [file] [log] [blame]
/**
 * Verify and restore Galera cluster
 *
 * Expected parameters:
 *   SALT_MASTER_CREDENTIALS    Credentials to the Salt API.
 *   SALT_MASTER_URL            Full Salt API address [http://10.10.10.1:8000].
 *   ASK_CONFIRMATION           Ask for confirmation before backup and restore.
 *   VERIFICATION_RETRIES       Number of retries to verify the restoration.
 *   CHECK_TIME_SYNC            Set to true to check time synchronization across selected nodes.
 *   RESTORE_TYPE               Sets the restoration method (BACKUP_AND_RESTORE or ONLY_RESTORE).
 *
**/
13
// Helper objects from the shared pipeline library used throughout the script.
def common = new com.mirantis.mk.Common()
def salt = new com.mirantis.mk.Salt()
def galera = new com.mirantis.mk.Galera()
def python = new com.mirantis.mk.Python()

// Name of the Pepper virtualenv handed to every Salt/Galera helper call.
def pepperEnv = "pepperEnv"
// Placeholder until the first cluster verification overwrites it.
def resultCode = 99
def restoreType = env.RESTORE_TYPE
def runRestoreDb = false
def runBackupDb = false

// Both switches default to true when the parameter is missing or empty.
askConfirmation = (env.getProperty('ASK_CONFIRMATION') ?: true).toBoolean()
checkTimeSync = (env.getProperty('CHECK_TIME_SYNC') ?: true).toBoolean()

// Read the retry count through env so that a job without the parameter falls
// back to the default instead of failing on an undefined variable.
def retriesParam = env.getProperty('VERIFICATION_RETRIES')
if (retriesParam && retriesParam.isInteger()) {
    verificationRetries = retriesParam.toInteger()
} else {
    verificationRetries = 5
}

// '==' is null-safe in Groovy, so an unset RESTORE_TYPE simply selects
// neither backup nor restore instead of throwing a NullPointerException.
if (restoreType == "BACKUP_AND_RESTORE" || restoreType == "ONLY_RESTORE") {
    runRestoreDb = true
}
if (restoreType == "BACKUP_AND_RESTORE") {
    runBackupDb = true
}
Martin Polreich0d538262019-02-01 14:46:10 +010038
// Main pipeline: verify the Galera cluster, optionally trigger a backup job,
// optionally restore the cluster, and finally re-verify the cluster state.
timeout(time: 12, unit: 'HOURS') {
    node() {
        // Value passed to common.retry() between verification attempts; also
        // interpolated into the retry message so the two cannot drift apart.
        // NOTE(review): assumed to be a delay in seconds - confirm against common.retry().
        def verificationDelay = 15
        // Set when the cluster is healthy and nobody asked to continue anyway.
        def skipBackupAndRestore = false

        stage('Setup virtualenv for Pepper') {
            python.setupPepperVirtualenv(pepperEnv, SALT_MASTER_URL, SALT_MASTER_CREDENTIALS)
        }

        stage('Verify status') {
            def sysstatTargets = 'I@xtrabackup:client or I@xtrabackup:server'
            def sysstatTargetsNodes = salt.getMinions(pepperEnv, sysstatTargets)
            try {
                if (!salt.isPackageInstalled(['saltId': pepperEnv, 'target': sysstatTargets, 'packageName': 'sysstat', 'output': false])) {
                    if (askConfirmation) {
                        input message: "Do you want to install 'sysstat' package on targeted nodes: ${sysstatTargetsNodes}? Click to confirm"
                    }
                    salt.runSaltProcessStep(pepperEnv, sysstatTargets, 'pkg.install', ['sysstat'])
                }
            } catch (Exception e) {
                // Best effort: a failed package check does not stop the pipeline by itself.
                common.errorMsg("Unable to determine status of sysstat package on target nodes: ${sysstatTargetsNodes}.")
                if (askConfirmation) {
                    input message: "Do you want to continue? Click to confirm"
                }
            }

            resultCode = galera.verifyGaleraStatus(pepperEnv, false, checkTimeSync)
            if (resultCode == 128) {
                common.errorMsg("Unable to connect to Galera Master. Trying slaves...")
                // NOTE(review): the second argument presumably switches the check to slave nodes - confirm.
                resultCode = galera.verifyGaleraStatus(pepperEnv, true, checkTimeSync)
                // A plain 'return' would only leave this stage closure and let the
                // backup/restore stages run anyway, so fatal codes abort via error().
                if (resultCode == 129) {
                    error("Unable to obtain Galera slave minions list. Without fixing this issue, pipeline cannot continue in verification, backup and restoration.")
                } else if (resultCode == 130) {
                    error("Neither master or slaves are reachable. Without fixing this issue, pipeline cannot continue in verification, backup and restoration.")
                }
            }
            if (resultCode == 131) {
                error("Time desynced - Please fix this issue and rerun the pipeline.")
            }
            if (resultCode == 140 || resultCode == 141) {
                error("Disk utilization check failed - Please fix this issue and rerun the pipeline.")
            }

            if (resultCode == 1) {
                if (askConfirmation) {
                    input message: "There was a problem with parsing the status output or with determining it. Do you want to run a restore?"
                } else {
                    common.warningMsg("There was a problem with parsing the status output or with determining it. Try to restore.")
                }
            } else if (resultCode > 1) {
                if (askConfirmation) {
                    input message: "There's something wrong with the cluster, do you want to continue with backup and/or restore?"
                } else {
                    common.warningMsg("There's something wrong with the cluster, try to backup and/or restore.")
                }
            } else {
                if (askConfirmation) {
                    input message: "There seems to be everything alright with the cluster, do you still want to continue with backup and/or restore?"
                } else {
                    common.warningMsg("There seems to be everything alright with the cluster, no backup and no restoration will be done.")
                    currentBuild.result = "SUCCESS"
                    // Remember the decision; it is acted upon outside the stage closure.
                    skipBackupAndRestore = true
                }
            }
        }

        // Leaving the node closure here ends the pipeline, which makes the
        // "no backup and no restoration" message above actually true.
        if (skipBackupAndRestore) {
            return
        }

        if (runBackupDb) {
            if (askConfirmation) {
                input message: "Are you sure you want to run a backup? Click to confirm"
            }
            stage('Backup') {
                build(job: 'galera_backup_database', parameters: [
                        [$class: 'StringParameterValue', name: 'SALT_MASTER_URL', value: SALT_MASTER_URL],
                        [$class: 'StringParameterValue', name: 'SALT_MASTER_CREDENTIALS', value: SALT_MASTER_CREDENTIALS],
                        [$class: 'StringParameterValue', name: 'OVERRIDE_BACKUP_NODE', value: "none"],
                    ]
                )
            }
        }

        if (runRestoreDb) {
            stage('Restore') {
                if (askConfirmation) {
                    input message: "Are you sure you want to run a restore? Click to confirm"
                }
                try {
                    // Without confirmation, only restore when verification reported a problem.
                    if (askConfirmation || resultCode > 0) {
                        galera.restoreGaleraCluster(pepperEnv, runRestoreDb)
                    }
                } catch (Exception e) {
                    // Deliberately not rethrown: the verification stage below decides
                    // the final outcome. Log the cause so the failure can be diagnosed.
                    common.errorMsg("Restoration process has failed. Reason: ${e}")
                }
            }
            stage('Verify restoration result') {
                common.retry(verificationRetries, verificationDelay) {
                    def exitCode = galera.verifyGaleraStatus(pepperEnv, false, false)
                    if (exitCode >= 1) {
                        // Throwing makes common.retry() schedule another attempt.
                        error("Verification attempt finished with an error. This may be caused by cluster not having enough time to come up or to sync. Next verification attempt in ${verificationDelay} seconds.")
                    } else {
                        common.infoMsg("Restoration procedure seems to be successful. See verification report to be sure.")
                        currentBuild.result = "SUCCESS"
                    }
                }
            }
        }
    }
}