#!/bin/sh
#
#
# OpenStack Ceilometer Alarm Evaluator Service (ceilometer-alarm-evaluator)
#
# Description:  Manages an OpenStack Ceilometer Alarm Evaluator Service
#               (ceilometer-alarm-evaluator) process as an HA resource
#
# Authors:      Emilien Macchi
# Mainly inspired by the Nova Scheduler resource agent written by Sebastien Han
#
# Support:      openstack@lists.launchpad.net
# License:      Apache Software License (ASL) 2.0
#
#
# See usage() function below for more details ...
#
# OCF instance parameters:
#   OCF_RESKEY_binary
#   OCF_RESKEY_config
#   OCF_RESKEY_user
#   OCF_RESKEY_pid
#   OCF_RESKEY_additional_parameters
#######################################################################
# Initialization:

: "${OCF_FUNCTIONS_DIR=${OCF_ROOT}/lib/heartbeat}"
. "${OCF_FUNCTIONS_DIR}/ocf-shellfuncs"

#######################################################################

# Fill in some defaults if no values are specified

OCF_RESKEY_binary_default="ceilometer-alarm-evaluator"
OCF_RESKEY_config_default="/etc/ceilometer/ceilometer.conf"
OCF_RESKEY_user_default="ceilometer"
OCF_RESKEY_pid_default="${HA_RSCTMP}/${__SCRIPT_NAME}/${__SCRIPT_NAME}.pid"

: "${HA_LOGTAG="ocf-ceilometer-alarm-evaluator"}"
: "${HA_LOGFACILITY="daemon"}"
: "${OCF_RESKEY_binary=${OCF_RESKEY_binary_default}}"
: "${OCF_RESKEY_config=${OCF_RESKEY_config_default}}"
: "${OCF_RESKEY_user=${OCF_RESKEY_user_default}}"
: "${OCF_RESKEY_pid=${OCF_RESKEY_pid_default}}"

#######################################################################

# Print a short description of the actions this agent accepts.
usage() {
    cat <<UEND
        usage: $0 (start|stop|validate-all|meta-data|status|monitor)

        $0 manages an OpenStack Ceilometer Alarm Evaluator Service (ceilometer-alarm-evaluator) process as an HA resource

        The 'start' operation starts the alarm evaluator service.
        The 'stop' operation stops the alarm evaluator service.
        The 'validate-all' operation reports whether the parameters are valid
        The 'meta-data' operation reports this RA's meta-data information
        The 'status' operation reports whether the alarm evaluator service is running
        The 'monitor' operation reports whether the alarm evaluator service seems to be working

UEND
}

# Print the OCF resource-agent meta-data (XML) on stdout.
# The here-document is unquoted on purpose so the *_default values are
# expanded into the "default" attributes.
meta_data() {
    cat <<END
<?xml version="1.0"?>
<!DOCTYPE resource-agent SYSTEM "ra-api-1.dtd">
<resource-agent name="ceilometer-alarm-evaluator">
<version>1.0</version>

<longdesc lang="en">
Resource agent for the OpenStack Ceilometer Alarm Evaluator Service (ceilometer-alarm-evaluator)
May manage a ceilometer-alarm-evaluatorinstance or a clone set that
creates a distributed ceilometer-alarm-evaluator cluster.
</longdesc>
<shortdesc lang="en">Manages the OpenStack Ceilometer Alarm Evaluator Service (ceilometer-alarm-evaluator)</shortdesc>
<parameters>

<parameter name="binary" unique="0" required="0">
<longdesc lang="en">
Location of the OpenStack Ceilometer Alarm Evaluator server binary (ceilometer-alarm-evaluator)
</longdesc>
<shortdesc lang="en">OpenStack Ceilometer Alarm Evaluator server binary (ceilometer-alarm-evaluator)</shortdesc>
<content type="string" default="${OCF_RESKEY_binary_default}" />
</parameter>

<parameter name="config" unique="0" required="0">
<longdesc lang="en">
Location of the OpenStack Ceilometer Alarm Evaluator Service (ceilometer-alarm-evaluator) configuration file
</longdesc>
<shortdesc lang="en">OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) config file</shortdesc>
<content type="string" default="${OCF_RESKEY_config_default}" />
</parameter>

<parameter name="user" unique="0" required="0">
<longdesc lang="en">
User running OpenStack Ceilometer Alarm Evaluator Service (ceilometer-alarm-evaluator)
</longdesc>
<shortdesc lang="en">OpenStack Ceilometer Alarm Evaluator Service (ceilometer-alarm-evaluator) user</shortdesc>
<content type="string" default="${OCF_RESKEY_user_default}" />
</parameter>

<parameter name="pid" unique="0" required="0">
<longdesc lang="en">
The pid file to use for this OpenStack Ceilometer Alarm Evaluator Service (ceilometer-alarm-evaluator) instance
</longdesc>
<shortdesc lang="en">OpenStack Ceilometer Alarm Evaluator Service (ceilometer-alarm-evaluator) pid file</shortdesc>
<content type="string" default="${OCF_RESKEY_pid_default}" />
</parameter>

<parameter name="additional_parameters" unique="0" required="0">
<longdesc lang="en">
Additional parameters to pass on to the OpenStack Ceilometer Alarm Evaluator Service (ceilometer-alarm-evaluator)
</longdesc>
<shortdesc lang="en">Additional parameters for ceilometer-alarm-evaluator</shortdesc>
<content type="string" />
</parameter>

</parameters>

<actions>
<action name="start" timeout="20" />
<action name="stop" timeout="20" />
<action name="status" timeout="20" />
<action name="monitor" timeout="30" interval="20" />
<action name="validate-all" timeout="5" />
<action name="meta-data" timeout="5" />
</actions>
</resource-agent>
END
}

#######################################################################
# Functions invoked by resource manager actions

# Validate a port specification passed as $1.
# This function has been taken from the squid RA and improved a bit.
# The value must match the digits / "lo:hi" / comma-separated-list pattern
# below AND be exactly 4 characters long; otherwise the agent logs an error
# and exits with $OCF_ERR_CONFIGURED.
#   Examples accepted: "1080", "0080"
#   Examples rejected: "1080bad", "0", ""
# NOTE(review): nothing in this script calls this helper.
ceilometer_alarm_evaluator_check_port() {
    local int
    local cnt

    int="$1"
    cnt=${#int}

    # grep -E replaces the obsolescent egrep; printf avoids echo's option
    # and backslash handling on arbitrary input.
    if ! printf '%s\n' "$int" | grep -Eqx '[0-9]+(:[0-9]+)?(,[0-9]+(:[0-9]+)?)*' \
        || [ "$cnt" -ne 4 ]; then
        ocf_log err "Invalid port number: $1"
        exit $OCF_ERR_CONFIGURED
    fi
}

# Check that the configured binary, config file and user are usable.
# Returns $OCF_ERR_INSTALLED when the config file (outside of a probe) or
# the user is missing; returns success otherwise.
ceilometer_alarm_evaluator_validate() {
    local rc

    check_binary "$OCF_RESKEY_binary"

    # A config file on shared storage that is not available
    # during probes is OK.
    if [ ! -f "$OCF_RESKEY_config" ]; then
        if ! ocf_is_probe; then
            ocf_log err "Config $OCF_RESKEY_config doesn't exist"
            return $OCF_ERR_INSTALLED
        fi
        ocf_log warn "Config $OCF_RESKEY_config not available during a probe"
    fi

    getent passwd "$OCF_RESKEY_user" >/dev/null 2>&1
    rc=$?
    if [ $rc -ne 0 ]; then
        ocf_log err "User $OCF_RESKEY_user doesn't exist"
        return $OCF_ERR_INSTALLED
    fi

    true
}

# Report whether the process recorded in the pid file is alive.
# Side effect: creates the pid file directory (owned by the service user)
# when it does not exist yet.
# Returns:
#   $OCF_SUCCESS      the pid in the pid file answers to signal 0
#   $OCF_NOT_RUNNING  no pid file, or the recorded pid is not alive
#   $OCF_ERR_GENERIC  the pid file exists but is empty
ceilometer_alarm_evaluator_status() {
    local pid
    local rc
    local pid_dir

    # check and make PID file dir
    pid_dir="$(dirname "${OCF_RESKEY_pid}")"
    if [ ! -d "${pid_dir}" ]; then
        ocf_log debug "Create pid file dir: ${pid_dir} and chown to ${OCF_RESKEY_user}"
        mkdir -p "${pid_dir}"
        chown -R "${OCF_RESKEY_user}" "${pid_dir}"
        chmod 755 "${pid_dir}"
    fi

    if [ ! -f "$OCF_RESKEY_pid" ]; then
        ocf_log info "OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) is not running"
        return $OCF_NOT_RUNNING
    fi
    pid=$(cat "$OCF_RESKEY_pid")

    if [ -z "${pid}" ]; then
        ocf_log err "PID file ${OCF_RESKEY_pid} is empty!"
        return $OCF_ERR_GENERIC
    fi

    # Signal 0 only tests whether the process exists and can be signalled.
    ocf_run -warn kill -s 0 "$pid"
    rc=$?

    if [ $rc -eq 0 ]; then
        return $OCF_SUCCESS
    fi

    ocf_log info "Old PID file found, but OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) is not running"
    return $OCF_NOT_RUNNING
}

# Monitor action: currently identical to the status check, plus a debug
# log line on success. Returns whatever the status check returned.
ceilometer_alarm_evaluator_monitor() {
    local rc

    ceilometer_alarm_evaluator_status
    rc=$?

    # If status returned anything but success, return that immediately
    if [ $rc -ne $OCF_SUCCESS ]; then
        return $rc
    fi

    ocf_log debug "OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) monitor succeeded"
    return $OCF_SUCCESS
}

# Start action: launch the daemon as the service user, record its pid and
# wait until the monitor reports success.
# Returns $OCF_SUCCESS once running (or if it was already running); exits
# with $OCF_ERR_GENERIC if the monitor reports a hard error while waiting.
ceilometer_alarm_evaluator_start() {
    local rc

    ceilometer_alarm_evaluator_status
    rc=$?
    if [ $rc -eq $OCF_SUCCESS ]; then
        ocf_log info "OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) already running"
        return $OCF_SUCCESS
    fi

    # run the actual ceilometer-alarm-evaluator daemon. Don't use ocf_run as we're sending the tool's output
    # straight to /dev/null anyway and using ocf_run would break stdout-redirection here.
    # The single-quoted tail is evaluated by the inner shell, so "$!" is the
    # pid of the backgrounded daemon and is what lands in the pid file.
    su ${OCF_RESKEY_user} -s /bin/sh -c "${OCF_RESKEY_binary} --config-file=$OCF_RESKEY_config \
        $OCF_RESKEY_additional_parameters"' >> /dev/null 2>&1 & echo $!' > "$OCF_RESKEY_pid"
    ocf_log debug "Create pid file: ${OCF_RESKEY_pid} with content $(cat "${OCF_RESKEY_pid}")"

    # Spin waiting for the server to come up.
    # There is no local deadline in this loop; it only ends on success or
    # on a monitor result other than "not running".
    while true; do
        ceilometer_alarm_evaluator_monitor
        rc=$?
        [ $rc -eq $OCF_SUCCESS ] && break
        if [ $rc -ne $OCF_NOT_RUNNING ]; then
            ocf_log err "OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) start failed"
            exit $OCF_ERR_GENERIC
        fi
        sleep 1
    done

    ocf_log info "OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) started"
    return $OCF_SUCCESS
}

# Stop action: send SIGTERM, wait for the process to disappear, fall back
# to SIGKILL, then remove the pid file.
# The wait is 15 seconds by default, or the operation timeout
# ($OCF_RESKEY_CRM_meta_timeout, in milliseconds) minus 5 seconds when set.
# Returns $OCF_SUCCESS; exits with $OCF_ERR_GENERIC if SIGTERM cannot be sent.
ceilometer_alarm_evaluator_stop() {
    local rc
    local pid
    local shutdown_timeout
    local count

    ceilometer_alarm_evaluator_status
    rc=$?
    if [ $rc -eq $OCF_NOT_RUNNING ]; then
        ocf_log info "OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) already stopped"
        return $OCF_SUCCESS
    fi

    # Try SIGTERM
    pid=$(cat "$OCF_RESKEY_pid")
    ocf_run kill -s TERM "$pid"
    rc=$?
    if [ $rc -ne 0 ]; then
        ocf_log err "OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) couldn't be stopped"
        exit $OCF_ERR_GENERIC
    fi

    # stop waiting
    shutdown_timeout=15
    if [ -n "$OCF_RESKEY_CRM_meta_timeout" ]; then
        shutdown_timeout=$(( (OCF_RESKEY_CRM_meta_timeout / 1000) - 5 ))
    fi
    count=0
    while [ "$count" -lt "$shutdown_timeout" ]; do
        ceilometer_alarm_evaluator_status
        rc=$?
        if [ $rc -eq $OCF_NOT_RUNNING ]; then
            break
        fi
        count=$((count + 1))
        sleep 1
        ocf_log debug "OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) still hasn't stopped yet. Waiting ..."
    done

    ceilometer_alarm_evaluator_status
    rc=$?
    if [ $rc -ne $OCF_NOT_RUNNING ]; then
        # SIGTERM didn't help either, try SIGKILL
        ocf_log info "OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) failed to stop after ${shutdown_timeout}s \
          using SIGTERM. Trying SIGKILL ..."
        ocf_run kill -s KILL "$pid"
    fi

    ocf_log info "OpenStack Ceilometer Alarm Evaluator (ceilometer-alarm-evaluator) stopped"

    ocf_log debug "Delete pid file: ${OCF_RESKEY_pid} with content $(cat "${OCF_RESKEY_pid}")"
    rm -f "$OCF_RESKEY_pid"

    return $OCF_SUCCESS
}

#######################################################################

# meta-data and usage/help are answered before validation so they work
# even when the service is not installed or configured.
case "$1" in
  meta-data)    meta_data
                exit $OCF_SUCCESS;;
  usage|help)   usage
                exit $OCF_SUCCESS;;
esac

# Anything except meta-data and help must pass validation
ceilometer_alarm_evaluator_validate || exit $?

# What kind of method was invoked?
case "$1" in
  start)        ceilometer_alarm_evaluator_start;;
  stop)         ceilometer_alarm_evaluator_stop;;
  status)       ceilometer_alarm_evaluator_status;;
  monitor)      ceilometer_alarm_evaluator_monitor;;
  validate-all) ;;
  *)            usage
                exit $OCF_ERR_UNIMPLEMENTED;;
esac