| Tomáš Kukrál | f72096d | 2017-08-11 12:58:03 +0200 | [diff] [blame] | 1 | /** | 
|  | 2 | * | 
|  | 3 | * Remove OSD from existing cluster | 
|  | 4 | * | 
|  | 5 | * Required parameters: | 
|  | 6 | *  SALT_MASTER_URL             URL of Salt master | 
|  | 7 | *  SALT_MASTER_CREDENTIALS     Credentials to the Salt API | 
|  | 8 | * | 
|  | 9 | *  HOST                        Host (minion id) to be removed | 
| Jiri Broulik | 2c00f4c | 2017-10-26 13:23:11 +0200 | [diff] [blame] | 10 | *  OSD                         Comma separated list of osd ids to be removed | 
| Tomáš Kukrál | f72096d | 2017-08-11 12:58:03 +0200 | [diff] [blame] | 11 | *  ADMIN_HOST                  Host (minion id) with admin keyring | 
|  | 12 | *  CLUSTER_FLAGS               Comma separated list of tags to apply to cluster | 
|  | 13 | *  WAIT_FOR_HEALTHY            Wait for cluster rebalance before stopping daemons | 
|  | 14 | * | 
|  | 15 | */ | 
|  | 16 |  | 
// Shared library helpers. `common` and `salt` are assigned without `def` so they
// land in the script binding and stay visible inside the methods defined below.
common = new com.mirantis.mk.Common()
salt = new com.mirantis.mk.Salt()
def python = new com.mirantis.mk.Python()

def pepperEnv = "pepperEnv"
// tokenize() treats every character of its argument as a delimiter, so ', '
// splits on commas AND blanks: "1, 2" yields ['1', '2'] instead of ['1', ' 2'].
def flags = CLUSTER_FLAGS.tokenize(', ')
def osds = OSD.tokenize(', ')
| Tomáš Kukrál | f72096d | 2017-08-11 12:58:03 +0200 | [diff] [blame] | 24 |  | 
/**
 * Remove the partition identified by a partition UUID from its parent disk.
 *
 * The partition is looked up with `blkid` on the target and, when found,
 * deleted with `parted <disk> rm <number>`. An exception raised by the lookup
 * is logged as a warning and nothing is removed.
 *
 * @param master          Salt connection (pepper env) handed to runCephCommand
 * @param target          Salt target (minion id) the partition lives on
 * @param partition_uuid  partition UUID to search for in the blkid output
 */
def removePartition(master, target, partition_uuid) {
    def partition = ""
    try {
        // blkid prints "<device>: KEY=value ...", e.g. "/dev/sdi2: PARTUUID=...".
        // Keep everything before the first ':' of the first line, so multi-digit
        // partition numbers (/dev/sdi12) are not truncated.
        def blkid = runCephCommand(master, target, "blkid | grep ${partition_uuid} ")['return'][0].values()[0]
        partition = blkid.toString().split("\n")[0].split(":")[0].trim()
    } catch (Exception e) {
        common.warningMsg(e)
    }

    if (partition?.trim()) {
        // dev = /dev/sdi
        def dev = partition.replaceAll('\\d+$', "")
        // part_id = 2 (all trailing digits of the device path)
        def part_id = partition.substring(dev.length())
        // Names whose disk part ends in a digit use a "p" separator
        // (/dev/nvme0n1p2, /dev/mmcblk0p1); drop it to get the disk itself.
        if (dev.matches('.*\\dp')) {
            dev = dev.substring(0, dev.length() - 1)
        }
        if (part_id) {
            runCephCommand(master, target, "parted ${dev} rm ${part_id}")
        } else {
            common.warningMsg('Cannot determine partition number of ' + partition + ', skipping removal')
        }
    }
    return
}
|  | 43 |  | 
/**
 * Run a shell command on a Salt target and hand back the Salt response.
 *
 * @param master  Salt connection (pepper env) passed through to salt.cmdRun
 * @param target  Salt target (minion id) to run the command on
 * @param cmd     shell command line to execute
 * @return        whatever salt.cmdRun returns for this call
 */
def runCephCommand(master, target, cmd) {
    def response = salt.cmdRun(master, target, cmd)
    return response
}
|  | 47 |  | 
/**
 * Poll `ceph health` on ADMIN_HOST until it reports HEALTH_OK.
 *
 * The check is repeated every 10 seconds until the output contains HEALTH_OK
 * or `attempts` is reached. Running out of attempts does not fail the
 * pipeline; it is only reported with a warning so the log shows that the
 * following steps ran against a cluster that never became healthy.
 *
 * @param master    Salt connection (pepper env) handed to runCephCommand
 * @param count     attempt counter to start from
 * @param attempts  upper bound for the attempt counter
 */
def waitForHealthy(master, count=0, attempts=300) {
    // wait for healthy cluster
    while (count < attempts) {
        def health = runCephCommand(master, ADMIN_HOST, 'ceph health')['return'][0].values()[0]
        if (health.contains('HEALTH_OK')) {
            common.infoMsg('Cluster is healthy')
            return
        }
        count++
        sleep(10)
    }
    common.warningMsg('Cluster did not report HEALTH_OK within ' + attempts + ' attempts, continuing anyway')
    return
}
/**
 * Return the partition UUID that a symlink in an OSD data directory points to.
 *
 * Lists /var/lib/ceph/osd/ceph-<id>/ on the target, keeps the entries matching
 * `pattern` and "partuuid", and returns the text after the last "/" of the
 * first matching line. Any exception raised on the way is logged with infoMsg
 * and reported as an empty string.
 *
 * @param master   Salt connection (pepper env) handed to runCephCommand
 * @param target   Salt target (minion id) hosting the OSD
 * @param id       numeric OSD id
 * @param pattern  grep pattern selecting the symlink, inserted verbatim into the command
 * @return         partition UUID, or "" when it could not be determined
 */
def findPartitionUuid(master, target, id, pattern) {
    def uuid = ""
    try {
        // take the command output itself (same extraction as the dmcrypt check)
        // instead of the string form of the whole Salt response
        def listing = runCephCommand(master, target, "ls -la /var/lib/ceph/osd/ceph-${id}/ | grep ${pattern} | grep partuuid")['return'][0].values()[0]
        // look for the last "/" in the same line the UUID is cut from
        def link = listing.toString().trim().split("\n")[0]
        uuid = link.substring(link.lastIndexOf("/") + 1).trim()
    } catch (Exception e) {
        common.infoMsg(e)
    }
    return uuid
}

timeout(time: 12, unit: 'HOURS') {
    node("python") {

        // create connection to salt master
        python.setupPepperVirtualenv(pepperEnv, SALT_MASTER_URL, SALT_MASTER_CREDENTIALS)

        if (flags.size() > 0) {
            stage('Set cluster flags') {
                for (flag in flags) {
                    runCephCommand(pepperEnv, ADMIN_HOST, 'ceph osd set ' + flag)
                }
            }
        }

        def osd_ids = []

        // get list of osd disks of the host
        salt.runSaltProcessStep(pepperEnv, HOST, 'saltutil.sync_grains', [], null, true, 5)
        def ceph_disks = salt.getGrain(pepperEnv, HOST, 'ceph')['return'][0].values()[0].values()[0]['ceph_disk']
        common.prettyPrint(ceph_disks)

        // select the requested OSDs ('*' selects every OSD listed in the grain)
        for (i in ceph_disks) {
            def osd_id = i.getKey().toString()
            if (osd_id in osds || OSD == '*') {
                osd_ids.add('osd.' + osd_id)
                print("Will delete " + osd_id)
            } else {
                print("Skipping " + osd_id)
            }
        }

        if (osd_ids.isEmpty()) {
            // nothing selected: do not issue `ceph osd out` without ids, but still
            // fall through to the flag cleanup below
            common.warningMsg('No OSD on ' + HOST + ' matches OSD=' + OSD + ', nothing to remove')
        } else {

            // wait for healthy cluster
            if (WAIT_FOR_HEALTHY.toBoolean() == true) {
                waitForHealthy(pepperEnv)
            }

            // `ceph osd out <id> <id>`
            stage('Set OSDs out') {
                runCephCommand(pepperEnv, ADMIN_HOST, 'ceph osd out ' + osd_ids.join(' '))
            }

            // wait for healthy cluster
            if (WAIT_FOR_HEALTHY.toBoolean() == true) {
                sleep(5)
                waitForHealthy(pepperEnv)
            }

            // stop osd daemons
            stage('Stop OSD daemons') {
                for (i in osd_ids) {
                    // replace() is literal, so the '.' in 'osd.' is not a regex wildcard
                    salt.runSaltProcessStep(pepperEnv, HOST, 'service.stop', ['ceph-osd@' + i.replace('osd.', '')],  null, true)
                }
            }

            // `ceph osd crush remove osd.2`
            stage('Remove OSDs from CRUSH') {
                for (i in osd_ids) {
                    runCephCommand(pepperEnv, ADMIN_HOST, 'ceph osd crush remove ' + i)
                }
            }

            // remove keyring `ceph auth del osd.3`
            stage('Remove OSD keyrings from auth') {
                for (i in osd_ids) {
                    runCephCommand(pepperEnv, ADMIN_HOST, 'ceph auth del ' + i)
                }
            }

            // remove osd `ceph osd rm osd.3`
            stage('Remove OSDs') {
                for (i in osd_ids) {
                    runCephCommand(pepperEnv, ADMIN_HOST, 'ceph osd rm ' + i)
                }
            }

            for (osd_id in osd_ids) {

                def id = osd_id.replace('osd.', '')
                def dmcrypt = ""
                try {
                    dmcrypt = runCephCommand(pepperEnv, HOST, "ls -la /var/lib/ceph/osd/ceph-${id}/ | grep dmcrypt")['return'][0].values()[0]
                } catch (Exception e) {
                    common.warningMsg(e)
                }

                if (dmcrypt?.trim()) {
                    def mount = runCephCommand(pepperEnv, HOST, "lsblk -rp | grep /var/lib/ceph/osd/ceph-${id} -B1")['return'][0].values()[0]
                    // first column of the first line, presumably the partition backing
                    // the dmcrypt mapping (e.g. /dev/sdb1) - TODO confirm against lsblk output
                    def part = mount.split()[0]
                    // strip only the trailing partition number; stripping every digit
                    // would mangle names such as /dev/nvme0n1p1
                    def dev = part.replaceAll('\\d+$', "")
                    // drop the "p" separator used when the disk name itself ends in a digit
                    if (dev.matches('.*\\dp')) {
                        dev = dev.substring(0, dev.length() - 1)
                    }

                    // remove partition tables
                    stage("dd part table on ${dev}") {
                        runCephCommand(pepperEnv, HOST, "dd if=/dev/zero of=${dev} bs=512 count=1 conv=notrunc")
                    }

                }
                // remove journal, block_db, block_wal partition `parted /dev/sdj rm 3`
                stage('Remove journal / block_db / block_wal partition') {
                    def journal_partition_uuid = findPartitionUuid(pepperEnv, HOST, id, "journal")
                    def block_db_partition_uuid = findPartitionUuid(pepperEnv, HOST, id, "'block.db'")
                    def block_wal_partition_uuid = findPartitionUuid(pepperEnv, HOST, id, "'block.wal'")

                    // set partition_uuid = 2c76f144-f412-481e-b150-4046212ca932
                    def partition_uuid = ""
                    if (journal_partition_uuid?.trim()) {
                        partition_uuid = journal_partition_uuid
                    } else if (block_db_partition_uuid?.trim()) {
                        partition_uuid = block_db_partition_uuid
                    }

                    // if disk has journal, block_db or block_wal on different disk, then remove the partition
                    if (partition_uuid?.trim()) {
                        removePartition(pepperEnv, HOST, partition_uuid)
                    }
                    if (block_wal_partition_uuid?.trim()) {
                        removePartition(pepperEnv, HOST, block_wal_partition_uuid)
                    }
                }
            }
        }

        // remove cluster flags
        if (flags.size() > 0) {
            stage('Unset cluster flags') {
                for (flag in flags) {
                    common.infoMsg('Removing flag ' + flag)
                    runCephCommand(pepperEnv, ADMIN_HOST, 'ceph osd unset ' + flag)
                }
            }
        }
    }
}