ceph-ansible/roles/ceph-common/templates/restart_osd_daemon.sh.j2

#!/bin/bash

# The double-brace placeholders below are substituted when this .j2 template
# is rendered; the resulting script sees plain values.

# Number of times check_pgs polls the cluster status before giving up.
RETRIES="{{ handler_health_osd_check_retries }}"
# Pause handed to `sleep` between two consecutive polls in check_pgs.
DELAY="{{ handler_health_osd_check_delay }}"
# Arguments prepended to every `ceph` call: client name, keyring path and
# cluster name. Expanded unquoted on purpose so it splits into separate words.
CEPH_CLI="--name client.bootstrap-osd --keyring /var/lib/ceph/bootstrap-osd/{{ cluster }}.keyring --cluster {{ cluster }}"

#######################################
# Poll the cluster status until it reports 'active+clean'.
# Terminates the calling shell: it never returns to the caller.
# Globals:
#   RETRIES  (read, decremented) - remaining number of polls
#   DELAY    (read)              - pause between polls, passed to sleep
#   CEPH_CLI (read)              - extra arguments for the ceph command
#   RET      (written)           - exit status of the last status probe
# Outputs:
#   Prints an error line to stdout once the retries are exhausted.
# Exit status:
#   0 as soon as the status output contains 'active+clean',
#   1 when RETRIES reaches zero without a match.
#######################################
check_pgs() {
  while [ "$RETRIES" -ne 0 ]; do
    # CEPH_CLI is left unquoted deliberately: it holds several arguments.
    # NOTE(review): a single matching line is enough for success; this does
    # not prove that every PG is active+clean.
    ceph $CEPH_CLI -s | grep -sq 'active+clean'
    RET=$?
    if [ "$RET" -eq 0 ]; then
      exit 0
    fi
    sleep "$DELAY"
    RETRIES=$((RETRIES - 1))
  done
  # Retries exhausted without seeing clean PGs: abort with status 1.
  echo "Error with PGs, check config"
  exit 1
}


# Restart every OSD that has an entry under /var/lib/ceph/osd/, one at a time.
# After each restart, wait for the daemon's admin socket and then for the PGs
# to be reported clean before moving on to the next OSD. The script stops with
# status 1 as soon as one OSD fails either check.
for osd_path in /var/lib/ceph/osd/*; do
  # An unmatched glob stays literal; skipping it makes an empty or missing
  # directory a no-op instead of restarting a bogus unit.
  [ -e "$osd_path" ] || continue

  # The OSD id is whatever follows the last '-' in the entry name.
  osd_name=${osd_path##*/}
  id=${osd_name##*-}

  # First, restart the daemon.
  systemctl restart "ceph-osd@${id}"

  # It may take some time for the socket to actually exist, so poll for it
  # once per second, at most COUNT times.
  COUNT=10
  SOCKET="/var/run/ceph/{{ cluster }}-osd.${id}.asok"
  while [ "$COUNT" -ne 0 ]; do
    if [ -S "$SOCKET" ]; then
      # check_pgs terminates its shell instead of returning. Running it in a
      # subshell keeps a successful check from ending the whole script after
      # the first OSD, and leaves RETRIES untouched for the next one.
      ( check_pgs ) || exit 1
      # Socket present and PGs clean: proceed with the next OSD.
      continue 2
    fi
    sleep 1
    COUNT=$((COUNT - 1))
  done

  # If we reach this point, the socket never showed up.
  echo "Error while restarting osd daemon ${id}: socket ${SOCKET} not found"
  exit 1
done
Common: Fix handlers that are not properly triggered. Until now, only the first task was executed. The idea here is to use the `listen` statement to be able to notify multiple handlers and regroup all of them in `./handlers/main.yml`, as notifying an included handler task is not possible. Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com> 2017-04-04 01:55:11 +08:00			`#!/bin/bash`

			`RETRIES="{{ handler_health_osd_check_retries }}"`
			`DELAY="{{ handler_health_osd_check_delay }}"`
			`CEPH_CLI="--name client.bootstrap-osd --keyring /var/lib/ceph/bootstrap-osd/{{ cluster }}.keyring --cluster {{ cluster }}"`

			`check_pgs() {`
			`while [ $RETRIES -ne 0 ]; do`
			`ceph $CEPH_CLI -s \| grep -sq 'active+clean'`
			`RET=$?`
			`test $RET -eq 0 && exit 0`
			`sleep $DELAY`
			`let RETRIES=RETRIES-1`
			`done`
			`# PGs not clean, exiting with return code 1`
			`echo "Error with PGs, check config"`
			`exit 1`
			`}`


			`for id in $(ls /var/lib/ceph/osd/ \| sed 's/.*-//'); do`
			`# First, restart daemon(s)`
			`systemctl restart ceph-osd@${id}`
			`# We need to wait because it may take some time for the socket to actually exists`
			`COUNT=10`
			`# Wait and ensure the socket exists after restarting the daemon`
			`SOCKET=/var/run/ceph/{{ cluster }}-osd.${id}.asok`
			`while [ $COUNT -ne 0 ]; do`
			`test -S $SOCKET && check_pgs`
			`sleep 1`
			`let COUNT=COUNT-1`
			`done`
			`# If we reach this point, it means the socket is not present.`
			`echo "Error while restarting mon daemon"`
			`exit 1`
			`done`