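Restart all OSDs instead of stopping after the first one: check_pgs now returns instead of exiting the whole script, and the socket wait loop moves on to the next OSD once check_pgs succeeds.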

author Christian Zunker <christian.zunker@codecentric.de>

Mon, 12 Jun 2017 08:30:22 +0000 (08:30 +0000)

committer Christian Zunker <christian.zunker@codecentric.de>

Wed, 14 Jun 2017 09:38:07 +0000 (09:38 +0000)
author Christian Zunker <christian.zunker@codecentric.de>
Mon, 12 Jun 2017 08:30:22 +0000 (08:30 +0000)
committer Christian Zunker <christian.zunker@codecentric.de>
Wed, 14 Jun 2017 09:38:07 +0000 (09:38 +0000)
diff --git a/roles/ceph-common/templates/restart_osd_daemon.sh.j2 b/roles/ceph-common/templates/restart_osd_daemon.sh.j2
index 5d1d04597b52a9de9eeae84855f5ea949c314ed4..f027574cf6d2c7244203f0a9a81c01f37e727d1d 100644
--- a/roles/ceph-common/templates/restart_osd_daemon.sh.j2
+++ b/roles/ceph-common/templates/restart_osd_daemon.sh.j2
@@ -8,7 +8,7 @@ check_pgs() {
    while [ $RETRIES -ne 0 ]; do
      test "[""$(ceph $CEPH_CLI -s -f json | python -c 'import sys, json; print(json.load(sys.stdin)["pgmap"]["num_pgs"])')""]" == "$(ceph $CEPH_CLI -s -f json | python -c 'import sys, json; print [ i["count"] for i in json.load(sys.stdin)["pgmap"]["pgs_by_state"] if i["state_name"] == "active+clean"]')"
      RET=$?
-    test $RET -eq 0 && exit 0
+    test $RET -eq 0 && return 0
      sleep $DELAY
      let RETRIES=RETRIES-1
    done
@@ -28,7 +28,7 @@ for id in $(ls /var/lib/ceph/osd/ | sed 's/.*-//'); do
    # Wait and ensure the socket exists after restarting the daemon
    SOCKET=/var/run/ceph/{{ cluster }}-osd.${id}.asok
    while [ $COUNT -ne 0 ]; do
-    test -S $SOCKET && check_pgs
+    test -S $SOCKET && check_pgs && continue 2
      sleep 1
      let COUNT=COUNT-1
    done
author	Christian Zunker <christian.zunker@codecentric.de>
	Mon, 12 Jun 2017 08:30:22 +0000 (08:30 +0000)
committer	Christian Zunker <christian.zunker@codecentric.de>
	Wed, 14 Jun 2017 09:38:07 +0000 (09:38 +0000)