2017-09-27 08:08:40 +08:00
|
|
|
#!/bin/bash
#
# Restart the ceph-mgr systemd unit on this host, then poll until the
# manager's admin socket exists.
#
# This file is a Jinja2 template: the curly-brace expressions and tags are
# substituted by Ansible before the script runs. Keep template opening
# delimiters out of comments and shell code, or rendering will fail.
#
# Exit status:
#   0 - the admin socket was found within RETRIES checks
#   1 - the socket never appeared; the ceph-mgr unit journal is printed

# Number of socket checks to attempt and the pause between two checks
# (passed verbatim to sleep).
RETRIES="{{ handler_health_mgr_check_retries }}"
DELAY="{{ handler_health_mgr_check_delay }}"
MGR_NAME="{{ ansible_facts['hostname'] }}"
{% if containerized_deployment | bool %}
# Prefix that runs the socket tests inside the mgr container. It is only
# defined for containerized deployments; elsewhere it expands to nothing.
# It must stay unquoted where it is used so that it word-splits into a
# command plus its arguments.
DOCKER_EXEC="{{ container_binary }} exec ceph-mgr-{{ ansible_facts['hostname'] }}"
{% endif %}

# Backward compatibility: the admin socket may be named after either the
# FQDN or the short hostname, so both paths are candidates.
FQDN_SOCKET="/var/run/ceph/{{ cluster }}-mgr.{{ ansible_facts['fqdn'] }}.asok"
HOSTNAME_SOCKET="/var/run/ceph/{{ cluster }}-mgr.{{ ansible_facts['hostname'] }}.asok"

# Point SOCKET at whichever candidate currently exists. The short-hostname
# path is probed last, so it wins when both are present. SOCKET is left
# untouched when neither candidate exists.
detect_socket() {
  if $DOCKER_EXEC test -S "$FQDN_SOCKET"; then
    SOCKET="$FQDN_SOCKET"
  fi
  if $DOCKER_EXEC test -S "$HOSTNAME_SOCKET"; then
    SOCKET="$HOSTNAME_SOCKET"
  fi
}

# Probe once before the restart to learn which name a running daemon uses.
detect_socket

systemctl reset-failed "ceph-mgr@${MGR_NAME}"
# First, restart the daemon
systemctl restart "ceph-mgr@${MGR_NAME}"

# Wait and ensure the socket exists after restarting the daemon
while [ "$RETRIES" -gt 0 ]; do
  # If the daemon was down before the restart, no socket was detected above.
  # Probe again here: an empty operand must never reach "test -S", because a
  # one-argument test is true for any non-empty string and would report
  # success without checking anything.
  [ -n "$SOCKET" ] || detect_socket
  if [ -n "$SOCKET" ] && $DOCKER_EXEC test -S "$SOCKET"; then
    exit 0
  fi
  sleep "$DELAY"
  RETRIES=$((RETRIES - 1))
done

# If we reach this point, it means the socket is not present.
# Name both candidates when no socket path was ever detected, so the message
# does not contain an empty path.
missing_socket="$SOCKET"
if [ -z "$missing_socket" ]; then
  missing_socket="${FQDN_SOCKET} or ${HOSTNAME_SOCKET}"
fi
echo "Socket file ${missing_socket} could not be found, which means ceph manager is not running. Showing ceph-mgr unit logs now:"
journalctl -u "ceph-mgr@${MGR_NAME}"
exit 1
|