diff --color -uNr a/doc/man/Makefile.am b/doc/man/Makefile.am --- a/doc/man/Makefile.am 2021-08-25 09:51:53.037906134 +0200 +++ b/doc/man/Makefile.am 2021-08-25 09:48:44.578408475 +0200 @@ -97,6 +97,8 @@ ocf_heartbeat_ManageRAID.7 \ ocf_heartbeat_ManageVE.7 \ ocf_heartbeat_NodeUtilization.7 \ + ocf_heartbeat_nova-compute-wait.7 \ + ocf_heartbeat_NovaEvacuate.7 \ ocf_heartbeat_Pure-FTPd.7 \ ocf_heartbeat_Raid1.7 \ ocf_heartbeat_Route.7 \ diff --color -uNr a/heartbeat/Makefile.am b/heartbeat/Makefile.am --- a/heartbeat/Makefile.am 2021-08-25 09:51:53.038906137 +0200 +++ b/heartbeat/Makefile.am 2021-08-25 09:48:44.588408501 +0200 @@ -29,6 +29,8 @@ ocfdir = $(OCF_RA_DIR_PREFIX)/heartbeat +ospdir = $(OCF_RA_DIR_PREFIX)/openstack + dtddir = $(datadir)/$(PACKAGE_NAME) dtd_DATA = ra-api-1.dtd metadata.rng @@ -50,6 +52,9 @@ send_ua_SOURCES = send_ua.c IPv6addr_utils.c send_ua_LDADD = $(LIBNETLIBS) +osp_SCRIPTS = nova-compute-wait \ + NovaEvacuate + ocf_SCRIPTS = AoEtarget \ AudibleAlarm \ ClusterMon \ diff --color -uNr a/heartbeat/nova-compute-wait b/heartbeat/nova-compute-wait --- a/heartbeat/nova-compute-wait 1970-01-01 01:00:00.000000000 +0100 +++ b/heartbeat/nova-compute-wait 2021-08-25 09:50:14.626646141 +0200 @@ -0,0 +1,345 @@ +#!/bin/sh +# +# +# nova-compute-wait agent manages compute daemons. +# +# Copyright (c) 2015 +# +# This program is free software; you can redistribute it and/or modify +# it under the terms of version 2 of the GNU General Public License as +# published by the Free Software Foundation. +# +# This program is distributed in the hope that it would be useful, but +# WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. +# +# Further, this software is distributed without any warranty that it is +# free of the rightful claim of any third person regarding infringement +# or the like. Any license provided herein, whether implied or +# otherwise, applies only to this software file. Patent licenses, if +# any, provided herein do not apply to combinations of this program with +# other software, or any other product whatsoever. +# +# You should have received a copy of the GNU General Public License +# along with this program; if not, write the Free Software Foundation, +# Inc., 59 Temple Place - Suite 330, Boston MA 02111-1307, USA. +# + +####################################################################### +# Initialization: + + +### +: ${OCF_FUNCTIONS_DIR=${OCF_ROOT}/lib/heartbeat} +. ${OCF_FUNCTIONS_DIR}/ocf-shellfuncs +### + +: ${__OCF_ACTION=$1} + +####################################################################### + +meta_data() { + cat < + + +1.0 + + +OpenStack Nova Compute Server. + +OpenStack Nova Compute Server + + + + + +Deprecated option not in use + +Deprecated + + + + + +Deprecated option not in use + +Deprecated + + + + +Deprecated option not in use + +Deprecated + + + + + +Deprecated option not in use + +Deprecated + + + + + +DNS domain in which hosts live, useful when the cluster uses short names and nova uses FQDN + +DNS domain + + + + + +Deprecated option not in use + +Deprecated + + + + + +Deprecated option not in use + +Deprecated + + + + + +How long to wait for nova to finish evacuating instances elsewhere +before starting nova-compute. Only used when the agent detects +evacuations might be in progress. + +You may need to increase the start timeout when increasing this value. + +Delay to allow evacuations time to complete + + + + + + + + + + + + + +END +} + +####################################################################### + +# don't exit on TERM, to test that lrmd makes sure that we do exit +trap sigterm_handler TERM +sigterm_handler() { + ocf_log info "They use TERM to bring us down. No such luck." + return +} + +nova_usage() { + cat </run/systemd/system/openstack-nova-compute.service.d/unfence-20.conf +[Service] +ExecStartPost=/sbin/fence_compute ${fence_options} -o on -n ${NOVA_HOST} +EOF +} + +nova_validate() { + rc=$OCF_SUCCESS + + check_binary crudini + check_binary nova-compute + check_binary fence_compute + + if [ ! -f /etc/nova/nova.conf ]; then + ocf_exit_reason "/etc/nova/nova.conf not found" + exit $OCF_ERR_CONFIGURED + fi + + # Is the state directory writable? + state_dir=$(dirname $statefile) + touch "$state_dir/$$" + if [ $? != 0 ]; then + ocf_exit_reason "Invalid state directory: $state_dir" + return $OCF_ERR_ARGS + fi + rm -f "$state_dir/$$" + + NOVA_HOST=$(crudini --get /etc/nova/nova.conf DEFAULT host 2>/dev/null) + if [ $? = 1 ]; then + short_host=$(uname -n | awk -F. '{print $1}') + if [ "x${OCF_RESKEY_domain}" != x ]; then + NOVA_HOST=${short_host}.${OCF_RESKEY_domain} + else + NOVA_HOST=$(uname -n) + fi + fi + + if [ $rc != $OCF_SUCCESS ]; then + exit $rc + fi + return $rc +} + +statefile="${HA_RSCTMP}/${OCF_RESOURCE_INSTANCE}.active" + +: ${OCF_RESKEY_evacuation_delay=120} +case $__OCF_ACTION in +meta-data) meta_data + exit $OCF_SUCCESS + ;; +usage|help) nova_usage + exit $OCF_SUCCESS + ;; +esac + +case $__OCF_ACTION in +start) nova_validate; nova_start;; +stop) nova_stop;; +monitor) nova_validate; nova_monitor;; +notify) nova_notify;; +validate-all) exit $OCF_SUCCESS;; +*) nova_usage + exit $OCF_ERR_UNIMPLEMENTED + ;; +esac +rc=$? +ocf_log debug "${OCF_RESOURCE_INSTANCE} $__OCF_ACTION : $rc" +exit $rc + diff --color -uNr a/heartbeat/NovaEvacuate b/heartbeat/NovaEvacuate --- a/heartbeat/NovaEvacuate 1970-01-01 01:00:00.000000000 +0100 +++ b/heartbeat/NovaEvacuate 2021-08-25 09:50:23.780670326 +0200 @@ -0,0 +1,400 @@ +#!/bin/bash +# +# Copyright 2015 Red Hat, Inc. +# +# Description: Manages evacuation of nodes running nova-compute +# +# Authors: Andrew Beekhof +# +# Support: openstack@lists.openstack.org +# License: Apache Software License (ASL) 2.0 +# + + +####################################################################### +# Initialization: + +### +: ${OCF_FUNCTIONS_DIR=${OCF_ROOT}/lib/heartbeat} +. ${OCF_FUNCTIONS_DIR}/ocf-shellfuncs +### + +: ${__OCF_ACTION=$1} + +####################################################################### + +meta_data() { + cat < + + +1.0 + + +Facility for tacking a list of compute nodes and reliably evacuating the ones that fence_evacuate has flagged. + +Evacuator for OpenStack Nova Compute Server + + + + + +Authorization URL for connecting to keystone in admin context + +Authorization URL + + + + + +Username for connecting to keystone in admin context + +Username + + + + + +Password for connecting to keystone in admin context + +Password + + + + + +Tenant name for connecting to keystone in admin context. +Note that with Keystone V3 tenant names are only unique within a domain. + +Tenant name + + + + + +DNS domain in which hosts live, useful when the cluster uses short names and nova uses FQDN + +DNS domain + + + + + +Nova API location (internal, public or admin URL) + +Nova API location (internal, public or admin URL) + + + + + +Region name for connecting to nova. + +Region name + + + + + +Explicitly allow client to perform "insecure" TLS (https) requests. +The server's certificate will not be verified against any certificate authorities. +This option should be used with caution. + +Allow insecure TLS requests + + + + + +Indicate that nova storage for instances is not shared across compute +nodes. This must match the reality of how nova storage is configured! +Otherwise VMs could end up in error state upon evacuation. When +storage is non-shared, instances on dead hypervisors will be rebuilt +from their original image or volume, so anything on ephemeral storage +will be lost. + +Disable shared storage recovery for instances + + + + + +Enable extra logging from the evacuation process + +Enable debug logging + + + + + +Allows delaying the nova evacuate API call, e.g. to give a storage array time to clean +up eventual locks/leases. + +Nova evacuate delay + + + + + + + + + + + + + +END +} + +####################################################################### + +# don't exit on TERM, to test that lrmd makes sure that we do exit +trap sigterm_handler TERM +sigterm_handler() { + ocf_log info "They use TERM to bring us down. No such luck." + return +} + +evacuate_usage() { + cat < >(grep -v "attribute does not exist" 1>&2) | + sed 's/ value=""/ value="no"/' | + tr '="' ' ' | + awk '{print $4" "$6}' + ) + return $OCF_SUCCESS +} + +evacuate_validate() { + rc=$OCF_SUCCESS + fence_options="" + + if ! have_binary fence_evacuate; then + check_binary fence_compute + fi + + # Is the state directory writable? + state_dir=$(dirname $statefile) + touch "$state_dir/$$" + if [ $? != 0 ]; then + ocf_exit_reason "Invalid state directory: $state_dir" + return $OCF_ERR_ARGS + fi + rm -f "$state_dir/$$" + + if [ -z "${OCF_RESKEY_auth_url}" ]; then + ocf_exit_reason "auth_url not configured" + exit $OCF_ERR_CONFIGURED + fi + + fence_options="${fence_options} -k ${OCF_RESKEY_auth_url}" + + if [ -z "${OCF_RESKEY_username}" ]; then + ocf_exit_reason "username not configured" + exit $OCF_ERR_CONFIGURED + fi + + fence_options="${fence_options} -l ${OCF_RESKEY_username}" + + if [ -z "${OCF_RESKEY_password}" ]; then + ocf_exit_reason "password not configured" + exit $OCF_ERR_CONFIGURED + fi + + fence_options="${fence_options} -p ${OCF_RESKEY_password}" + + if [ -z "${OCF_RESKEY_tenant_name}" ]; then + ocf_exit_reason "tenant_name not configured" + exit $OCF_ERR_CONFIGURED + fi + + fence_options="${fence_options} -t ${OCF_RESKEY_tenant_name}" + + if [ -n "${OCF_RESKEY_domain}" ]; then + fence_options="${fence_options} -d ${OCF_RESKEY_domain}" + fi + + if [ -n "${OCF_RESKEY_region_name}" ]; then + fence_options="${fence_options} \ + --region-name ${OCF_RESKEY_region_name}" + fi + + if [ -n "${OCF_RESKEY_insecure}" ]; then + if ocf_is_true "${OCF_RESKEY_insecure}"; then + fence_options="${fence_options} --insecure" + fi + fi + + if [ -n "${OCF_RESKEY_no_shared_storage}" ]; then + if ocf_is_true "${OCF_RESKEY_no_shared_storage}"; then + fence_options="${fence_options} --no-shared-storage" + fi + fi + + if [ -n "${OCF_RESKEY_verbose}" ]; then + if ocf_is_true "${OCF_RESKEY_verbose}"; then + fence_options="${fence_options} --verbose" + fi + fi + + if [ -n "${OCF_RESKEY_endpoint_type}" ]; then + case ${OCF_RESKEY_endpoint_type} in + adminURL|publicURL|internalURL) + ;; + *) + ocf_exit_reason "endpoint_type ${OCF_RESKEY_endpoint_type}" \ + "not valid. Use adminURL or publicURL or internalURL" + exit $OCF_ERR_CONFIGURED + ;; + esac + fence_options="${fence_options} -e ${OCF_RESKEY_endpoint_type}" + fi + + if [ $rc != $OCF_SUCCESS ]; then + exit $rc + fi + return $rc +} + +statefile="${HA_RSCTMP}/${OCF_RESOURCE_INSTANCE}.active" + +case $__OCF_ACTION in + start) + evacuate_validate + evacuate_start + ;; + stop) + evacuate_stop + ;; + monitor) + evacuate_validate + evacuate_monitor + ;; + meta-data) + meta_data + exit $OCF_SUCCESS + ;; + usage|help) + evacuate_usage + exit $OCF_SUCCESS + ;; + validate-all) + exit $OCF_SUCCESS + ;; + *) + evacuate_usage + exit $OCF_ERR_UNIMPLEMENTED + ;; +esac +rc=$? +ocf_log debug "${OCF_RESOURCE_INSTANCE} $__OCF_ACTION : $rc" +exit $rc