#!/bin/bash
#
#
# OpenStack Ceilometer Compute Agent Service (ceilometer-agent-compute)
#
# Description: Manages an OpenStack Ceilometer Compute Agent Service (ceilometer-agent-compute) process as an HA resource
#
# Authors: Emilien Macchi
# Mainly inspired by the Nova Scheduler resource agent written by Sebastien Han
#
# Support: openstack@lists.launchpad.net
# License: Apache Software License (ASL) 2.0
#
#
# See usage() function below for more details ...
#
# OCF instance parameters:
# OCF_RESKEY_binary
# OCF_RESKEY_config
# OCF_RESKEY_user
# OCF_RESKEY_pid
# OCF_RESKEY_monitor_binary
# OCF_RESKEY_amqp_server_port
# OCF_RESKEY_additional_parameters
#######################################################################
# Initialization:

: ${OCF_FUNCTIONS_DIR=${OCF_ROOT}/lib/heartbeat}
. ${OCF_FUNCTIONS_DIR}/ocf-shellfuncs
: ${OCF_FUEL_FUNCTIONS_DIR=${OCF_ROOT}/resource.d/fuel}
. ${OCF_FUEL_FUNCTIONS_DIR}/ocf-fuel-funcs

#######################################################################

# Fill in some defaults if no values are specified

OCF_RESKEY_binary_default="ceilometer-polling"
OCF_RESKEY_config_default="/etc/ceilometer/ceilometer.conf"
OCF_RESKEY_user_default="ceilometer"
OCF_RESKEY_pid_default="$HA_RSCTMP/$OCF_RESOURCE_INSTANCE.pid"
OCF_RESKEY_amqp_server_port_default="5673"

: ${HA_LOGTAG="ocf-ceilometer-agent-compute"}
: ${HA_LOGFACILITY="daemon"}
: ${OCF_RESKEY_binary=${OCF_RESKEY_binary_default}}
: ${OCF_RESKEY_config=${OCF_RESKEY_config_default}}
: ${OCF_RESKEY_user=${OCF_RESKEY_user_default}}
: ${OCF_RESKEY_pid=${OCF_RESKEY_pid_default}}
: ${OCF_RESKEY_amqp_server_port=${OCF_RESKEY_amqp_server_port_default}}

#######################################################################

usage() {
    cat <<UEND
        usage: $0 (start|stop|validate-all|meta-data|status|monitor)

        $0 manages an OpenStack Ceilometer Compute Agent Service (ceilometer-agent-compute) process as an HA resource

        The 'start' operation starts the scheduler service.
        The 'stop' operation stops the scheduler service.
        The 'validate-all' operation reports whether the parameters are valid
        The 'meta-data' operation reports this RA's meta-data information
        The 'status' operation reports whether the scheduler service is running
        The 'monitor' operation reports whether the scheduler service seems to be working

UEND
}

meta_data() {
    cat <<END
<?xml version="1.0"?>
<!DOCTYPE resource-agent SYSTEM "ra-api-1.dtd">
<resource-agent name="ceilometer-agent-compute">
<version>1.0</version>

<longdesc lang="en">
Resource agent for the OpenStack Ceilometer Compute Agent Service (ceilometer-agent-compute)
May manage a ceilometer-agent-compute instance or a clone set that
creates a distributed ceilometer-agent-compute cluster.
</longdesc>
<shortdesc lang="en">Manages the OpenStack Ceilometer Compute Agent Service (ceilometer-agent-compute)</shortdesc>
<parameters>

<parameter name="binary" unique="0" required="0">
<longdesc lang="en">
Location of the OpenStack Ceilometer Compute Agent server binary (ceilometer-agent-compute)
</longdesc>
<shortdesc lang="en">OpenStack Ceilometer Compute Agent server binary (ceilometer-agent-compute)</shortdesc>
<content type="string" default="${OCF_RESKEY_binary_default}" />
</parameter>

<parameter name="config" unique="0" required="0">
<longdesc lang="en">
Location of the OpenStack Ceilometer Compute Agent Compute (ceilometer-agent-compute) configuration file
</longdesc>
<shortdesc lang="en">OpenStack Ceilometer Compute Agent (ceilometer-agent-compute registry) config file</shortdesc>
<content type="string" default="${OCF_RESKEY_config_default}" />
</parameter>

<parameter name="user" unique="0" required="0">
<longdesc lang="en">
User running OpenStack Ceilometer Compute Agent Service (ceilometer-agent-compute)
</longdesc>
<shortdesc lang="en">OpenStack Ceilometer Compute Agent Service (ceilometer-agent-compute) user</shortdesc>
<content type="string" default="${OCF_RESKEY_user_default}" />
</parameter>

<parameter name="pid" unique="0" required="0">
<longdesc lang="en">
The pid file to use for this OpenStack Ceilometer Compute Agent Service (ceilometer-agent-compute) instance
</longdesc>
<shortdesc lang="en">OpenStack Ceilometer Compute Agent Service (ceilometer-agent-compute) pid file</shortdesc>
<content type="string" default="${OCF_RESKEY_pid_default}" />
</parameter>

<parameter name="amqp_server_port" unique="0" required="0">
<longdesc lang="en">
The listening port number of the AMQP server. Use for monitoring purposes
</longdesc>
<shortdesc lang="en">AMQP listening port</shortdesc>
<content type="integer" default="${OCF_RESKEY_amqp_server_port_default}" />
</parameter>

<parameter name="additional_parameters" unique="0" required="0">
<longdesc lang="en">
Additional parameters to pass on to the OpenStack Ceilometer Compute Agent Service (ceilometer-agent-compute)
</longdesc>
<shortdesc lang="en">Additional parameters for ceilometer-agent-compute</shortdesc>
<content type="string" />
</parameter>

</parameters>

<actions>
<action name="start" timeout="20" />
<action name="stop" timeout="20" />
<action name="status" timeout="20" />
<action name="monitor" timeout="30" interval="20" />
<action name="validate-all" timeout="5" />
<action name="meta-data" timeout="5" />
</actions>
</resource-agent>
END
}

#######################################################################
# Functions invoked by resource manager actions

ceilometer_agent_compute_validate() {
    local rc

    check_binary $OCF_RESKEY_binary
    check_binary netstat

    if ! validate_port $OCF_RESKEY_amqp_server_port; then
      return ${OCF_ERR_CONFIGURED}
    fi

    # A config file on shared storage that is not available
    # during probes is OK.
    if [ ! -f $OCF_RESKEY_config ]; then
        if ! ocf_is_probe; then
            ocf_log err "Config $OCF_RESKEY_config doesn't exist"
            return $OCF_ERR_INSTALLED
        fi
        ocf_log_warn "Config $OCF_RESKEY_config not available during a probe"
    fi

    getent passwd $OCF_RESKEY_user >/dev/null 2>&1
    rc=$?
    if [ $rc -ne 0 ]; then
        ocf_log err "User $OCF_RESKEY_user doesn't exist"
        return $OCF_ERR_INSTALLED
    fi

    return ${OCF_SUCCESS}
}

ceilometer_agent_compute_status() {
    local pid
    local rc

    if [ ! -f $OCF_RESKEY_pid ]; then
        ocf_log info "OpenStack Ceilometer Compute Agent (ceilometer-agent-compute) is not running"
        return $OCF_NOT_RUNNING
    else
        pid=`cat $OCF_RESKEY_pid`
    fi

    ocf_run -warn kill -s 0 $pid
    rc=$?
    if [ $rc -eq 0 ]; then
        return $OCF_SUCCESS
    else
        ocf_log info "Old PID file found, but OpenStack Ceilometer Compute Agent (ceilometer-agent-compute) is not running"
        return $OCF_NOT_RUNNING
    fi
}

ceilometer_agent_compute_monitor() {
    local rc
    local pid
    local scheduler_amqp_check

    ceilometer_agent_compute_status
    rc=$?

    # If status returned anything but success, return that immediately
    if [ $rc -ne $OCF_SUCCESS ]; then
        return $rc
    fi

    # Check the connections according to the PID.
    # We are sure to hit the scheduler process and not other process with the same connection behavior
    pid=`cat $OCF_RESKEY_pid`
    scheduler_amqp_check=`netstat -punt | grep -s "$OCF_RESKEY_amqp_server_port" | grep -s "$pid" | grep -qs "ESTABLISHED"`
    rc=$?
    ocf_log debug "OpenStack Ceilometer Compute Agent (ceilometer-agent-compute) monitor succeeded"
    return $OCF_SUCCESS
}

ceilometer_agent_compute_start() {
    local rc

    ceilometer_agent_compute_status
    rc=$?
    if [ $rc -eq $OCF_SUCCESS ]; then
        ocf_log info "OpenStack Ceilometer Compute Agent (ceilometer-agent-compute) already running"
        return $OCF_SUCCESS
    fi

    # run the actual ceilometer-agent-compute daemon. Don't use ocf_run as we're sending the tool's output
    # straight to /dev/null anyway and using ocf_run would break stdout-redirection here.
    su ${OCF_RESKEY_user} -s /bin/sh -c "${OCF_RESKEY_binary} --polling-namespaces compute --config-file=$OCF_RESKEY_config \
       $OCF_RESKEY_additional_parameters"' >> /dev/null 2>&1 & echo $!' > $OCF_RESKEY_pid

    # Spin waiting for the server to come up.
    while true; do
    ceilometer_agent_compute_monitor
    rc=$?
    [ $rc -eq $OCF_SUCCESS ] && break
    if [ $rc -ne $OCF_NOT_RUNNING ]; then
        ocf_log err "OpenStack Ceilometer Compute Agent (ceilometer-agent-compute) start failed"
        exit $OCF_ERR_GENERIC
    fi
    sleep 1
    done

    ocf_log info "OpenStack Ceilometer Compute Agent (ceilometer-agent-compute) started"
    return $OCF_SUCCESS
}

ceilometer_agent_compute_stop() {
    local rc
    local shutdown_timeout=15
    if [ -n "$OCF_RESKEY_CRM_meta_timeout" ]; then
        shutdown_timeout=$(( ($OCF_RESKEY_CRM_meta_timeout/1000) ))
    fi

    ceilometer_agent_compute_status
    rc="${?}"
    if [ "${rc}" -eq "${OCF_NOT_RUNNING}" ]; then
        ocf_log info "OpenStack Compute Compute Agent (${OCF_RESKEY_binary}) already stopped"
        return "${OCF_SUCCESS}"
    fi

    proc_stop "${OCF_RESKEY_pid}" "${OCF_RESKEY_binary}" $shutdown_timeout
    return "${?}"
}

#######################################################################

case "$1" in
  meta-data) meta_data
                exit $OCF_SUCCESS;;
  usage|help) usage
                exit $OCF_SUCCESS;;
esac

# Anything except meta-data and help must pass validation
ceilometer_agent_compute_validate || exit $?

# What kind of method was invoked?
case "$1" in
  start) ceilometer_agent_compute_start;;
  stop) ceilometer_agent_compute_stop;;
  status) ceilometer_agent_compute_status;;
  monitor) ceilometer_agent_compute_monitor;;
  validate-all) ;;
  *) usage
                exit $OCF_ERR_UNIMPLEMENTED;;
esac
