ceph-ansible.git / commitdiff
Reworked purge cluster playbook (1008/head)
author Ivan Font <ivan.font@redhat.com>
Thu, 6 Oct 2016 04:32:38 +0000 (21:32 -0700)
committer Ivan Font <ivan.font@redhat.com>
Thu, 6 Oct 2016 04:32:38 +0000 (21:32 -0700)
- Separated out one large playbook into multiple playbooks that run
  host type by host type, i.e. mdss, rgws, rbdmirrors, nfss, osds,
  mons (see the sketch below).
- Combined common tasks into one shared task for all hosts where
  applicable
- Fixed various bugs

Signed-off-by: Ivan Font <ivan.font@redhat.com>
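
For orientation, here is a minimal sketch of the reworked layout, condensed from the diff below; literal group names stand in for the *_group_name variables the playbook actually uses, and most tasks are omitted. A shared play records whether systemd is in use, and each host type then gets its own purge play that reuses that result:

    - name: gather facts and check if using systemd
      hosts: mons:osds:mdss:rgws:rbdmirrors:nfss
      become: true
      tasks:
        - name: are we using systemd
          shell: "if [ -d /usr/lib/systemd ] ; then find /usr/lib/systemd/system -name 'ceph*' | wc -l ; else echo 0 ; fi"
          register: systemd_unit_files

    - name: purge ceph mds cluster
      hosts: mdss
      gather_facts: false   # facts and systemd_unit_files come from the play above
      become: true
      tasks:
        - name: stop ceph mdss with systemd
          service:
            name: "ceph-mds@{{ ansible_hostname }}"
            state: stopped
            enabled: no
          when: ansible_os_family == 'RedHat' and systemd_unit_files.stdout != "0"

    # ...one analogous play per host type (rgws, rbdmirrors, nfss, osds, mons),
    # followed by a final cleanup play over all groups and a localhost play
    # that purges the fetch directory.

Registered variables such as systemd_unit_files persist per host across plays in the same run, which is why the later plays can skip fact gathering and still test the result of the systemd check from the first play.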
infrastructure-playbooks/purge-cluster.yml

index 9c82503662abafbe9c4955ad790f95f47769ee46..bfe310d16b745cc3d72af64d105003cc80a6d3d2 100644 (file)
@@ -13,6 +13,7 @@
 
 - name: confirm whether user really meant to purge the cluster
   hosts: localhost
+  gather_facts: false
 
   vars_prompt:
     - name: ireallymeanit
          invoking the playbook"
     when: ireallymeanit != 'yes'
 
-- name: stop ceph cluster
-  hosts:
-    - mons
-    - osds
-    - mdss
-    - rgws
-    - nfss
 
-  become: yes
+- name: gather facts and check if using systemd
 
   vars:
-    osd_group_name: osds
-    mon_group_name: mons
-    rgw_group_name: rgws
-    mds_group_name: mdss
-    nfs_group_name: nfss
+    mon_group_name:       mons
+    osd_group_name:       osds
+    mds_group_name:       mdss
+    rgw_group_name:       rgws
     rbdmirror_group_name: rbdmirrors
+    nfs_group_name:       nfss
 
-# When set to true both groups of packages are purged.
-# This can cause problem with qemu-kvm
-    purge_all_packages: true
+  hosts:
+    - "{{ mon_group_name }}"
+    - "{{ osd_group_name }}"
+    - "{{ mds_group_name }}"
+    - "{{ rgw_group_name }}"
+    - "{{ rbdmirror_group_name }}"
+    - "{{ nfs_group_name }}"
 
-# When set to true and raw _multi_journal is used then block devices are also zapped
-    zap_block_devs: true
+  become: true
 
-    ceph_packages:
-      - ceph
-      - ceph-common
-      - ceph-fs-common
-      - ceph-fuse
-      - ceph-mds
-      - ceph-release
-      - ceph-radosgw
+  tasks:
+  - name: are we using systemd
+    shell: "if [ -d /usr/lib/systemd ] ; then find /usr/lib/systemd/system -name 'ceph*' | wc -l ; else echo 0 ; fi"
+    register: systemd_unit_files
 
-    ceph_remaining_packages:
-      - libcephfs1
-      - librados2
-      - libradosstriper1
-      - librbd1
-      - python-cephfs
-      - python-rados
-      - python-rbd
 
-    cluster: ceph # name of the cluster
-    monitor_name: "{{ ansible_hostname }}"
-    mds_name: "{{ ansible_hostname }}"
-    osd_auto_discovery: false
+- name: purge ceph mds cluster
 
+  vars:
+    mds_group_name: mdss
 
-  handlers:
-  - name: restart machine
-    shell: sleep 2 && shutdown -r now "Ansible updates triggered"
-    async: 1
-    poll: 0
-    ignore_errors: true
+  hosts:
+    - "{{ mds_group_name }}"
 
-  - name: wait for server to boot
-    become: false
-    local_action: wait_for port=22 host={{ inventory_hostname }} state=started delay=10 timeout=500
+  gather_facts: false # Already gathered previously
 
-  - name: remove data
-    file:
-     path: /var/lib/ceph
-     state: absent
+  become: true
 
   tasks:
-  - name: check for a device list
-    fail:
-      msg: "OSD automatic discovery was detected, purge cluster does not support this scenario. If you want to purge the cluster, manually provide the list of devices in group_vars/osds using the devices variable."
-    when:
-      osd_group_name in group_names and
-      devices is not defined and
-      osd_auto_discovery
-
-  - name: get osd numbers
-    shell: "if [ -d /var/lib/ceph/osd ] ; then ls /var/lib/ceph/osd | cut -d '-' -f 2 ; fi"
-    register: osd_ids
-    changed_when: false
-
-  - name: are we using systemd
-    shell: "if [ -d /usr/lib/systemd ] ; then find /usr/lib/systemd/system -name 'ceph*' | wc -l ; else echo 0 ; fi"
-    register: systemd_unit_files
-
-# after Hammer release
+  - include_vars: ../roles/ceph-common/defaults/main.yml
+  - include_vars: ../roles/ceph-mds/defaults/main.yml
+  - include_vars: ../group_vars/all
+    failed_when: false
+  - include_vars: ../group_vars/mdss
+    failed_when: false
 
   - name: stop ceph.target with systemd
     service:
       ansible_os_family == 'RedHat' and
       systemd_unit_files.stdout != "0"
 
-  - name: stop ceph-osd with systemd
+  - name: stop ceph mdss with systemd
     service:
-      name: ceph-osd@{{item}}
+      name: ceph-mds@{{ ansible_hostname }}
       state: stopped
       enabled: no
-    with_items: "{{ osd_ids.stdout_lines }}"
     when:
       ansible_os_family == 'RedHat' and
-      systemd_unit_files.stdout != "0" and
-      osd_group_name in group_names
+      systemd_unit_files.stdout != "0"
 
-  - name: stop ceph mons with systemd
-    service:
-      name: ceph-mon@{{ ansible_hostname }}
-      state: stopped
-      enabled: no
+  - name: stop ceph mdss
+    shell: "service ceph status mds ; if [ $? == 0 ] ; then service ceph stop mds ; else echo ; fi"
     when:
-      ansible_os_family == 'RedHat' and
-      systemd_unit_files.stdout != "0" and
-      mon_group_name in group_names
+      ansible_os_family == 'RedHat'
 
-  - name: stop ceph mdss with systemd
+# Ubuntu 14.04
+  - name: stop ceph mdss on ubuntu
+    command: initctl stop ceph-mds cluster={{ cluster }} id={{ ansible_hostname }}
+    failed_when: false
+    when:
+      ansible_distribution == 'Ubuntu'
+
+
+- name: purge ceph rgw cluster
+
+  vars:
+    rgw_group_name: rgws
+
+  hosts:
+    - "{{ rgw_group_name }}"
+
+  gather_facts: false # Already gathered previously
+
+  become: true
+
+  tasks:
+  - include_vars: ../roles/ceph-common/defaults/main.yml
+  - include_vars: ../roles/ceph-rgw/defaults/main.yml
+  - include_vars: ../group_vars/all
+    failed_when: false
+  - include_vars: ../group_vars/rgws
+    failed_when: false
+
+  - name: stop ceph.target with systemd
     service:
-      name: ceph-mds@{{ ansible_hostname }}
+      name: ceph.target
       state: stopped
+      enabled: no
     when:
       ansible_os_family == 'RedHat' and
-      systemd_unit_files.stdout != "0" and
-      mds_group_name in group_names
+      systemd_unit_files.stdout != "0"
 
   - name: stop ceph rgws with systemd
     service:
       name: ceph-radosgw@rgw.{{ ansible_hostname }}
       state: stopped
+      enabled: no
     when:
       ansible_os_family == 'RedHat' and
-      systemd_unit_files.stdout != "0" and
-      rgw_group_name in group_names
+      systemd_unit_files.stdout != "0"
 
-  - name: stop ceph nfss with systemd
+  - name: stop ceph rgws
+    shell: "service ceph-radosgw status ; if [ $? == 0 ] ; then service ceph-radosgw stop ; else echo ; fi"
+    when:
+      ansible_os_family == 'RedHat'
+
+# Ubuntu 14.04
+  - name: stop ceph rgws on ubuntu
+    command: initctl stop radosgw cluster={{ cluster }} id={{ ansible_hostname }}
+    failed_when: false
+    when:
+      ansible_distribution == 'Ubuntu'
+
+
+- name: purge ceph rbd-mirror cluster
+
+  vars:
+    rbdmirror_group_name: rbdmirrors
+
+  hosts:
+    - "{{ rbdmirror_group_name }}"
+
+  gather_facts: false # Already gathered previously
+
+  become: true
+
+  tasks:
+  - include_vars: ../roles/ceph-common/defaults/main.yml
+  - include_vars: ../roles/ceph-rbd-mirror/defaults/main.yml
+  - include_vars: ../group_vars/all
+    failed_when: false
+  - include_vars: ../group_vars/rbd-mirrors
+    failed_when: false
+
+  - name: stop ceph.target with systemd
     service:
-      name: nfs-ganesha
+      name: ceph.target
       state: stopped
+      enabled: no
     when:
       ansible_os_family == 'RedHat' and
-      systemd_unit_files.stdout != "0" and
-      nfs_group_name in group_names
+      systemd_unit_files.stdout != "0"
 
   - name: stop ceph rbd mirror with systemd
     service:
       state: stopped
     when:
       ansible_os_family == 'RedHat' and
-      systemd_unit_files.stdout != "0" and
-      rbdmirror_group_name in group_names
-
-# before infernalis release, using sysvinit scripts
-# we use this test so we do not have to know which RPM contains the boot script
-# or where it is placed.
+      systemd_unit_files.stdout != "0"
 
-  - name: stop ceph osds
-    shell: "service ceph status osd ; if [ $? == 0 ] ; then service ceph stop osd ; else echo ; fi"
+# Ubuntu 14.04
+  - name: stop ceph rbd mirror on ubuntu
+    command: initctl stop ceph-rbd-mirror cluster={{ cluster }} id=admin
+    failed_when: false
     when:
-      ansible_os_family == 'RedHat' and
-      osd_group_name in group_names
+      ansible_distribution == 'Ubuntu'
 
-  - name: stop ceph mons
-    shell: "service ceph status mon ; if [ $? == 0 ] ; then service ceph stop mon ; else echo ; fi"
-    when:
-      ansible_os_family == 'RedHat' and
-      mon_group_name in group_names
 
-  - name: stop ceph mdss
-    shell: "service ceph status mds ; if [ $? == 0 ] ; then service ceph stop mds ; else echo ; fi"
+- name: purge ceph nfs cluster
+
+  vars:
+    nfs_group_name: nfss
+
+  hosts:
+    - "{{ nfs_group_name }}"
+
+  gather_facts: false # Already gathered previously
+
+  become: true
+
+  tasks:
+  - include_vars: ../roles/ceph-common/defaults/main.yml
+  - include_vars: ../roles/ceph-nfs/defaults/main.yml
+  - include_vars: ../group_vars/all
+    failed_when: false
+  - include_vars: ../group_vars/nfss
+    failed_when: false
+
+  - name: stop ceph.target with systemd
+    service:
+      name: ceph.target
+      state: stopped
+      enabled: no
     when:
       ansible_os_family == 'RedHat' and
-      mds_group_name in group_names
+      systemd_unit_files.stdout != "0"
 
-  - name: stop ceph rgws
-    shell: "service ceph-radosgw status ; if [ $? == 0 ] ; then service ceph-radosgw stop ; else echo ; fi"
+  - name: stop ceph nfss with systemd
+    service:
+      name: nfs-ganesha
+      state: stopped
     when:
       ansible_os_family == 'RedHat' and
-      rgw_group_name in group_names
+      systemd_unit_files.stdout != "0"
 
   - name: stop ceph nfss
     shell: "service nfs-ganesha status ; if [ $? == 0 ] ; then service nfs-ganesha stop ; else echo ; fi"
     when:
-      ansible_os_family == 'RedHat' and
-      nfs_group_name in group_names
+      ansible_os_family == 'RedHat'
 
 # Ubuntu 14.04
-  - name: stop ceph osds on ubuntu
-    shell: |
-      for id in $(ls /var/lib/ceph/osd/ |grep -oh '[0-9]*'); do
-        initctl stop ceph-osd cluster={{ cluster }} id=$id
-      done
+  - name: stop ceph nfss on ubuntu
+    command: initctl stop nfs-ganesha
     failed_when: false
     when:
-      ansible_distribution == 'Ubuntu' and
-      osd_group_name in group_names
-    with_items: "{{ osd_ids.stdout_lines }}"
+      ansible_distribution == 'Ubuntu'
 
-  - name: stop ceph mons on ubuntu
-    command: initctl stop ceph-mon cluster={{ cluster }} id={{ monitor_name }}
+
+- name: purge ceph osd cluster
+
+  vars:
+    osd_group_name: osds
+
+# When set to true and raw_multi_journal is used then block devices are also zapped
+    zap_block_devs: true
+
+  hosts:
+    - "{{ osd_group_name }}"
+
+  gather_facts: false # Already gathered previously
+
+  become: true
+
+  handlers:
+  - name: restart machine
+    shell: sleep 2 && shutdown -r now "Ansible updates triggered"
+    async: 1
+    poll: 0
+    ignore_errors: true
+
+  - name: wait for server to boot
+    become: false
+    local_action: wait_for port=22 host={{ inventory_hostname }} state=started delay=10 timeout=500
+
+  - name: remove data
+    file:
+     path: /var/lib/ceph
+     state: absent
+
+  tasks:
+  - include_vars: ../roles/ceph-common/defaults/main.yml
+  - include_vars: ../roles/ceph-osd/defaults/main.yml
+  - include_vars: ../group_vars/all
     failed_when: false
+  - include_vars: ../group_vars/osds
+    failed_when: false
+
+  - name: check for a device list
+    fail:
+      msg: "OSD automatic discovery was detected, purge cluster does not support this scenario. If you want to purge the cluster, manually provide the list of devices in group_vars/osds using the devices variable."
     when:
-      ansible_distribution == 'Ubuntu' and
-      mon_group_name in group_names
+      devices is not defined and
+      osd_auto_discovery
 
-  - name: stop ceph mdss on ubuntu
-    command: initctl stop ceph-mds cluster={{ cluster }} id={{ mds_name }}
-    failed_when: false
+  - name: get osd numbers
+    shell: "if [ -d /var/lib/ceph/osd ] ; then ls /var/lib/ceph/osd | cut -d '-' -f 2 ; fi"
+    register: osd_ids
+    changed_when: false
+
+  - name: stop ceph.target with systemd
+    service:
+      name: ceph.target
+      state: stopped
+      enabled: no
     when:
-      ansible_distribution == 'Ubuntu' and
-      mds_group_name in group_names
+      ansible_os_family == 'RedHat' and
+      systemd_unit_files.stdout != "0"
 
-  - name: stop ceph rgws on ubuntu
-    command: initctl stop radosgw cluster={{ cluster }} id={{ ansible_hostname }}
-    failed_when: false
+  - name: stop ceph-osd with systemd
+    service:
+      name: ceph-osd@{{item}}
+      state: stopped
+      enabled: no
+    with_items: "{{ osd_ids.stdout_lines }}"
     when:
-      ansible_distribution == 'Ubuntu' and
-      rgw_group_name in group_names
+      ansible_os_family == 'RedHat' and
+      systemd_unit_files.stdout != "0"
 
-  - name: stop ceph nfss on ubuntu
-    command: initctl stop nfs-ganesha
-    failed_when: false
+# before infernalis release, using sysvinit scripts
+# we use this test so we do not have to know which RPM contains the boot script
+# or where it is placed.
+
+  - name: stop ceph osds
+    shell: "service ceph status osd ; if [ $? == 0 ] ; then service ceph stop osd ; else echo ; fi"
     when:
-      ansible_distribution == 'Ubuntu' and
-      nfs_group_name in group_names
+      ansible_os_family == 'RedHat'
 
-  - name: stop ceph rbd mirror on ubuntu
-    command: initctl stop ceph-rbd-mirorr cluster={{ cluster }} id=admin
+# Ubuntu 14.04
+  - name: stop ceph osds on ubuntu
+    shell: |
+      for id in $(ls /var/lib/ceph/osd/ |grep -oh '[0-9]*'); do
+        initctl stop ceph-osd cluster={{ cluster }} id=$id
+      done
     failed_when: false
     when:
-      ansible_distribution == 'Ubuntu' and
-      rbdmirror_group_name in group_names
-
-  - name: check for anything running ceph
-    shell: "ps awux | grep -- /usr/bin/[c]eph-"
-    register: check_for_running_ceph
-    failed_when: check_for_running_ceph.rc == 0
+      ansible_distribution == 'Ubuntu'
+    with_items: "{{ osd_ids.stdout_lines }}"
 
   - name: see if ceph-disk-created data partitions are present
     shell: |
     shell: "(grep /var/lib/ceph/osd /proc/mounts || echo -n) | awk '{ print $2 }'"
     register: mounted_osd
     changed_when: false
-    when:
-      osd_group_name in group_names
 
   - name: drop all cache
     shell: "sync && sleep 1 && echo 3 > /proc/sys/vm/drop_caches"
-    when:
-      osd_group_name in group_names
 
   - name: umount osd data partition
     shell: umount {{ item }}
     with_items:
      - "{{ mounted_osd.stdout_lines }}"
-    when:
-     osd_group_name in group_names
 
   - name: remove osd mountpoint tree
     file:
       state: absent
     register: remove_osd_mountpoints
     ignore_errors: true
-    when:
-      osd_group_name in group_names
-
-  - name: remove monitor store and bootstrap keys
-    file:
-      path: /var/lib/ceph/
-      state: absent
-    when:
-      mon_group_name in group_names
 
   - name: is reboot needed
     local_action: shell echo requesting reboot
       - wait for server to boot
       - remove data
     when:
-      osd_group_name in group_names and
       remove_osd_mountpoints.failed is defined
 
   - name: see if ceph-disk is installed
     shell: ceph-disk zap "{{ item }}"
     with_items: "{{ devices | default([]) }}"
     when:
-     osd_group_name in group_names and
      ceph_disk_present.rc == 0 and
      ceph_data_partlabels.rc == 0 and
      zap_block_devs
       sgdisk --delete $partition_nb $raw_device
     with_items: "{{ceph_journal_partition_to_erase_path.stdout_lines}}"
     when:
-      osd_group_name in group_names and
       ceph_journal_partlabels.rc == 0 and
       zap_block_devs
 
+
+- name: purge ceph mon cluster
+
+  vars:
+    mon_group_name: mons
+
+  hosts:
+    - "{{ mon_group_name }}"
+
+  gather_facts: false # Already gathered previously
+
+  become: true
+
+  tasks:
+  - include_vars: ../roles/ceph-common/defaults/main.yml
+  - include_vars: ../roles/ceph-mon/defaults/main.yml
+  - include_vars: ../roles/ceph-restapi/defaults/main.yml
+  - include_vars: ../group_vars/all
+    failed_when: false
+  - include_vars: ../group_vars/mons
+    failed_when: false
+  - include_vars: ../group_vars/restapis
+    failed_when: false
+
+  - name: stop ceph.target with systemd
+    service:
+      name: ceph.target
+      state: stopped
+      enabled: no
+    when:
+      ansible_os_family == 'RedHat' and
+      systemd_unit_files.stdout != "0"
+
+  - name: stop ceph mons with systemd
+    service:
+      name: ceph-mon@{{ ansible_hostname }}
+      state: stopped
+      enabled: no
+    when:
+      ansible_os_family == 'RedHat' and
+      systemd_unit_files.stdout != "0"
+
+  - name: stop ceph mons
+    shell: "service ceph status mon ; if [ $? == 0 ] ; then service ceph stop mon ; else echo ; fi"
+    when:
+      ansible_os_family == 'RedHat'
+
+  - name: stop ceph mons on ubuntu
+    command: initctl stop ceph-mon cluster={{ cluster }} id={{ ansible_hostname }}
+    failed_when: false
+    when:
+      ansible_distribution == 'Ubuntu'
+
+  - name: remove monitor store and bootstrap keys
+    file:
+      path: /var/lib/ceph/
+      state: absent
+
+- name: final cleanup - check any running ceph, purge ceph packages, purge config and remove data
+
+  vars:
+    mon_group_name:       mons
+    osd_group_name:       osds
+    mds_group_name:       mdss
+    rgw_group_name:       rgws
+    rbdmirror_group_name: rbdmirrors
+    nfs_group_name:       nfss
+
+# When set to true both groups of packages are purged.
+# This can cause problems with qemu-kvm
+    purge_all_packages: true
+
+    ceph_packages:
+      - ceph
+      - ceph-common
+      - ceph-fs-common
+      - ceph-fuse
+      - ceph-mds
+      - ceph-release
+      - ceph-radosgw
+
+    ceph_remaining_packages:
+      - libcephfs1
+      - librados2
+      - libradosstriper1
+      - librbd1
+      - python-cephfs
+      - python-rados
+      - python-rbd
+
+  hosts:
+    - "{{ mon_group_name }}"
+    - "{{ osd_group_name }}"
+    - "{{ mds_group_name }}"
+    - "{{ rgw_group_name }}"
+    - "{{ rbdmirror_group_name }}"
+    - "{{ nfs_group_name }}"
+
+  gather_facts: false # Already gathered previously
+
+  become: true
+
+  handlers:
+  - name: remove data
+    file:
+     path: /var/lib/ceph
+     state: absent
+
+  tasks:
+  - name: check for anything running ceph
+    shell: "ps awux | grep -- /usr/bin/[c]eph-"
+    register: check_for_running_ceph
+    failed_when: check_for_running_ceph.rc == 0
+
   - name: purge ceph packages with yum
     yum:
       name: "{{ item }}"
       state: absent
     when:
       ansible_os_family == 'RedHat'
+
+
+- name: purge fetch directory
+
+  hosts:
+    - localhost
+
+  gather_facts: false
+
+  tasks:
+  - include_vars: ../roles/ceph-common/defaults/main.yml
+  - include_vars: ../group_vars/all
+    failed_when: false
+  - include_vars: ../group_vars/mdss
+    failed_when: false
+  - include_vars: ../group_vars/rgws
+    failed_when: false
+  - include_vars: ../group_vars/rbd-mirrors
+    failed_when: false
+  - include_vars: ../group_vars/nfss
+    failed_when: false
+  - include_vars: ../group_vars/osds
+    failed_when: false
+  - include_vars: ../group_vars/mons
+    failed_when: false
+  - include_vars: ../group_vars/restapis
+    failed_when: false
+
+  - name: purge fetch directory for localhost
+    file:
+      path: "{{ fetch_directory }}"
+      state: absent