#!/bin/bash RETRIES="{{ handler_health_rgw_check_retries }}" DELAY="{{ handler_health_rgw_check_delay }}" HOST_NAME="{{ ansible_hostname }}" RGW_NUMS={{ radosgw_num_instances }} RGW_BASE_PORT={{ radosgw_frontend_port }} RGW_FRONTEND_SSL_CERT={{ radosgw_frontend_ssl_certificate }} if [ -n "$RGW_FRONTEND_SSL_CERT" ]; then RGW_PROTOCOL=https else RGW_PROTOCOL=http fi declare -a DOCKER_EXECS for ((i=0; i<${RGW_NUMS}; i++)); do DOCKER_EXECS[i]="" {% if containerized_deployment %} CONTAINER_NAME="ceph-rgw-${HOST_NAME}-rgw${i}" DOCKER_EXECS[i]="{{ container_binary }} exec ${CONTAINER_NAME}" {% endif %} done declare -a SOCKETS # Backward compatibility for ((i=0; i<${RGW_NUMS}; i++)); do SOCKET[i]="EMPTY_SOCKET" ${DOCKER_EXECS[i]} test -S /var/run/ceph/{{ cluster }}-client.rgw.{{ ansible_fqdn }}.asok && SOCKETS[i]=/var/run/ceph/{{ cluster }}-client.rgw.{{ ansible_fqdn }}.asok ${DOCKER_EXECS[i]} test -S /var/run/ceph/{{ cluster }}-client.rgw.${HOST_NAME}.rgw${i}.asok && SOCKETS[i]=/var/run/ceph/{{ cluster }}-client.rgw.${HOST_NAME}.rgw${i}.asok done RGW_IP={{ hostvars[inventory_hostname]['_radosgw_address'] }} check_socket() { local i=$1 local succ=0 local count=10 # Wait and ensure the socket exists after restarting the daemon while [ $count -ne 0 ]; do ${DOCKER_EXECS[i]} test -S ${SOCKETS[i]} && succ=$((succ+1)) && break sleep $DELAY let count=count-1 done if [ $succ -ne 1 ]; then echo "Socket file ${SOCKETS[i]} could not be found, which means Rados Gateway is not running. Showing ceph-rgw unit logs now:" journalctl -u ceph-radosgw@rgw.${HOST_NAME}.rgw${i} exit 1 fi } check_for_curl_or_wget() { local i=$1 if ${DOCKER_EXECS[i]} command -v wget &>/dev/null; then rgw_test_command="wget --quiet" elif ${DOCKER_EXECS[i]} command -v curl &>/dev/null; then rgw_test_command="curl --fail --silent --output /dev/null" else echo "It seems that neither curl or wget are available on your system." echo "Cannot test rgw connection." exit 0 fi } check_rest() { local i=$1 check_for_curl_or_wget ${i} local succ=0 while [ $RETRIES -ne 0 ]; do test "$rgw_test_command $RGW_PROTOCOL://$RGW_IP:$((RGW_BASE_PORT+i))" && succ=$((succ+1)) && break sleep $DELAY let RETRIES=RETRIES-1 done if [ $succ -ne 1 ]; then # If we reach this point, it means there is a problem with the connection to rgw echo "Error connecting locally to Rados Gateway service: $RGW_PROTOCOL://$rgw_listen" exit 1 fi } # First, restart the daemon for ((i=0; i<${RGW_NUMS}; i++)); do systemctl restart ceph-radosgw@rgw.${HOST_NAME}.rgw${i} done # Check socket files for ((i=0; i<${RGW_NUMS}; i++)); do check_socket ${i} done # Check rest for ((i=0; i<${RGW_NUMS}; i++)); do check_rest ${i} done