author    Kaleb S. KEITHLEY <kkeithle@redhat.com>    2017-01-06 10:37:54 -0500
committer Kaleb KEITHLEY <kkeithle@redhat.com>       2017-01-17 16:53:30 -0800
commit    c822e354e16646adf18bbc5123798663faa543b2 (patch)
tree      f22b87c6711639135f991293f5c406f06466ec92 /extras/ganesha/scripts/ganesha-ha.sh
parent    7b61434257f68749bfceee481fa505de7f945747 (diff)
storhaug HA: first step, remove resource agents and setup script

resource agents and setup script(s) are now in storhaug. This is a
phased switch-over to storhaug. Ultimately all components here should
be (re)moved to the storhaug project and its packages. But for now
some will linger here.

Change-Id: Ied3956972b14b14d8a76e22c583b1fe25869f8e7
BUG: 1410843
Signed-off-by: Kaleb S. KEITHLEY <kkeithle@redhat.com>
Reviewed-on: http://review.gluster.org/16349
Smoke: Gluster Build System <jenkins@build.gluster.org>
NetBSD-regression: NetBSD Build System <jenkins@build.gluster.org>
CentOS-regression: Gluster Build System <jenkins@build.gluster.org>
Diffstat (limited to 'extras/ganesha/scripts/ganesha-ha.sh')
-rw-r--r-- extras/ganesha/scripts/ganesha-ha.sh | 1126
1 file changed, 0 insertions, 1126 deletions
diff --git a/extras/ganesha/scripts/ganesha-ha.sh b/extras/ganesha/scripts/ganesha-ha.sh
deleted file mode 100644
index e4135ba4776..00000000000
--- a/extras/ganesha/scripts/ganesha-ha.sh
+++ /dev/null
@@ -1,1126 +0,0 @@
-#!/bin/bash
-
-# Copyright 2015-2016 Red Hat Inc. All Rights Reserved
-#
-# Pacemaker+Corosync High Availability for NFS-Ganesha
-#
-# setup, teardown, add, delete, refresh-config, and status
-#
-# Each participating node in the cluster is assigned a virtual IP (VIP)
-# which fails over to another node when its associated ganesha.nfsd dies
-# for any reason. After the VIP is moved to another node, all the
-# ganesha.nfsds are sent a signal using DBUS to put them into NFS GRACE.
-#
-# There are six resource agent types used: ganesha_mon, ganesha_grace,
-# ganesha_nfsd, IPaddr, portblock, and Dummy. ganesha_mon is used to
-# monitor the ganesha.nfsd. ganesha_grace is used to send the DBUS
-# signal to put the remaining ganesha.nfsds into grace. ganesha_nfsd is
-# used to start and stop the ganesha.nfsd during setup and teardown.
-# IPaddr manages the VIP. portblock blocks and unblocks the NFS port
-# (2049) while a VIP moves. A Dummy resource named $hostname-trigger_ip-1
-# is used to ensure that the NFS GRACE DBUS signal is sent after the VIP
-# moves to the new host.
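-#
-# For orientation, a ganesha-ha.conf of the shape this script parses
-# (it greps for HA_NAME=, HA_CLUSTER_NODES= and VIP_<node>= entries)
-# might look like the following sketch; the host names and addresses
-# are illustrative, not taken from any real deployment:
-#
-#   HA_NAME="ganesha-ha-demo"
-#   HA_CLUSTER_NODES="node1.example.com,node2.example.com,node3.example.com"
-#   VIP_node1.example.com="10.7.6.5"
-#   VIP_node2.example.com="10.7.6.6"
-#   VIP_node3.example.com="10.7.6.7"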
-
-HA_NUM_SERVERS=0
-HA_SERVERS=""
-HA_VOL_NAME="gluster_shared_storage"
-HA_VOL_MNT="/var/run/gluster/shared_storage"
-HA_CONFDIR=$HA_VOL_MNT"/nfs-ganesha"
-SERVICE_MAN="DISTRO_NOT_FOUND"
-
-RHEL6_PCS_CNAME_OPTION="--name"
-SECRET_PEM="/var/lib/glusterd/nfs/secret.pem"
-
-# The UNBLOCK RA uses shared_storage, which may become unavailable
-# while any of the nodes reboots. Hence the increased timeout value.
-PORTBLOCK_UNBLOCK_TIMEOUT="60s"
-
-# Try loading the config from any of the distro-specific
-# configuration locations
-if [ -f /etc/sysconfig/ganesha ]
- then
- . /etc/sysconfig/ganesha
-fi
-if [ -f /etc/conf.d/ganesha ]
- then
- . /etc/conf.d/ganesha
-fi
-if [ -f /etc/default/ganesha ]
- then
- . /etc/default/ganesha
-fi
-
-GANESHA_CONF=
-
-function find_rhel7_conf
-{
-    while [[ $# -gt 0 ]]
- do
- key="$1"
- case $key in
- -f)
- CONFFILE="$2"
- break;
- ;;
- *)
- ;;
- esac
- shift
- done
-}
-
-if [ -z "$CONFFILE" ]
- then
- find_rhel7_conf $OPTIONS
-
-fi
-
-GANESHA_CONF=${CONFFILE:-/etc/ganesha/ganesha.conf}
-
-usage() {
-
- echo "Usage : add|delete|refresh-config|status"
- echo "Add-node : ganesha-ha.sh --add <HA_CONF_DIR> \
-<NODE-HOSTNAME> <NODE-VIP>"
- echo "Delete-node: ganesha-ha.sh --delete <HA_CONF_DIR> \
-<NODE-HOSTNAME>"
- echo "Refresh-config : ganesha-ha.sh --refresh-config <HA_CONFDIR> \
-<volume>"
- echo "Status : ganesha-ha.sh --status <HA_CONFDIR>"
-}
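-
-# Illustrative invocations matching the usage text above; the path is
-# an example only (the default HA_CONFDIR, ${HA_VOL_MNT}/nfs-ganesha),
-# and the node/VIP values are made up:
-#
-#   ganesha-ha.sh --add    /var/run/gluster/shared_storage/nfs-ganesha node4.example.com 10.7.6.8
-#   ganesha-ha.sh --delete /var/run/gluster/shared_storage/nfs-ganesha node4.example.com
-#   ganesha-ha.sh --status /var/run/gluster/shared_storage/nfs-ganesha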
-
-determine_service_manager () {
-
- if [ -e "/usr/bin/systemctl" ];
- then
- SERVICE_MAN="/usr/bin/systemctl"
- elif [ -e "/sbin/invoke-rc.d" ];
- then
- SERVICE_MAN="/sbin/invoke-rc.d"
- elif [ -e "/sbin/service" ];
- then
- SERVICE_MAN="/sbin/service"
- fi
- if [ "$SERVICE_MAN" == "DISTRO_NOT_FOUND" ]
- then
- echo "Service manager not recognized, exiting"
- exit 1
- fi
-}
-
-manage_service ()
-{
- local action=${1}
- local new_node=${2}
- local option=
-
- if [ "$action" == "start" ]; then
- option="yes"
- else
- option="no"
- fi
- ssh -oPasswordAuthentication=no -oStrictHostKeyChecking=no -i \
-${SECRET_PEM} root@${new_node} "/usr/libexec/ganesha/ganesha-ha.sh --setup-ganesha-conf-files $HA_CONFDIR $option"
-
- if [ "$SERVICE_MAN" == "/usr/bin/systemctl" ]
- then
- ssh -oPasswordAuthentication=no -oStrictHostKeyChecking=no -i \
-${SECRET_PEM} root@${new_node} "$SERVICE_MAN ${action} nfs-ganesha"
- else
- ssh -oPasswordAuthentication=no -oStrictHostKeyChecking=no -i \
-${SECRET_PEM} root@${new_node} "$SERVICE_MAN nfs-ganesha ${action}"
- fi
-}
-
-
-check_cluster_exists()
-{
- local name=${1}
- local cluster_name=""
-
- if [ -e /var/run/corosync.pid ]; then
- cluster_name=$(pcs status | grep "Cluster name:" | cut -d ' ' -f 3)
-        if [ -n "${cluster_name}" -a "${cluster_name}" = "${name}" ]; then
- logger "$name already exists, exiting"
- exit 0
- fi
- fi
-}
-
-
-determine_servers()
-{
- local cmd=${1}
- local num_servers=0
- local tmp_ifs=${IFS}
- local ha_servers=""
-
- if [ "X${cmd}X" != "XsetupX" -a "X${cmd}X" != "XstatusX" ]; then
- ha_servers=$(pcs status | grep "Online:" | grep -o '\[.*\]' | sed -e 's/\[//' | sed -e 's/\]//')
- IFS=$' '
- for server in ${ha_servers} ; do
- num_servers=$(expr ${num_servers} + 1)
- done
- IFS=${tmp_ifs}
- HA_NUM_SERVERS=${num_servers}
- HA_SERVERS="${ha_servers}"
- else
- IFS=$','
- for server in ${HA_CLUSTER_NODES} ; do
- num_servers=$(expr ${num_servers} + 1)
- done
- IFS=${tmp_ifs}
- HA_NUM_SERVERS=${num_servers}
- HA_SERVERS="${HA_CLUSTER_NODES//,/ }"
- fi
-}
-
-
-setup_cluster()
-{
- local name=${1}
- local num_servers=${2}
- local servers=${3}
- local unclean=""
- local quorum_policy="stop"
-
- logger "setting up cluster ${name} with the following ${servers}"
-
- pcs cluster auth ${servers}
- # pcs cluster setup --name ${name} ${servers}
- pcs cluster setup ${RHEL6_PCS_CNAME_OPTION} ${name} --transport udpu ${servers}
- if [ $? -ne 0 ]; then
- logger "pcs cluster setup ${RHEL6_PCS_CNAME_OPTION} ${name} ${servers} failed"
- exit 1;
- fi
- pcs cluster start --all
- if [ $? -ne 0 ]; then
- logger "pcs cluster start failed"
- exit 1;
- fi
-
- sleep 1
- # wait for the cluster to elect a DC before querying or writing
- # to the CIB. BZ 1334092
- crmadmin --dc_lookup --timeout=5000 > /dev/null 2>&1
- while [ $? -ne 0 ]; do
- crmadmin --dc_lookup --timeout=5000 > /dev/null 2>&1
- done
-
-    # wait until pcs status no longer reports any UNCLEAN nodes
-    while pcs status | grep -q "UNCLEAN"; do
-        sleep 1
-    done
- sleep 1
-
- if [ ${num_servers} -lt 3 ]; then
- quorum_policy="ignore"
- fi
- pcs property set no-quorum-policy=${quorum_policy}
- if [ $? -ne 0 ]; then
- logger "warning: pcs property set no-quorum-policy=${quorum_policy} failed"
- fi
-
- pcs property set stonith-enabled=false
- if [ $? -ne 0 ]; then
- logger "warning: pcs property set stonith-enabled=false failed"
- fi
-}
-
-
-setup_finalize_ha()
-{
- local cibfile=${1}
-    # wait until pcs status no longer reports any Stopped resources
-    while pcs status | grep -q "Stopped"; do
-        sleep 1
-    done
-}
-
-
-refresh_config ()
-{
-    local VOL=${1}
-    local HA_CONFDIR=${2}
-    local short_host=$(hostname -s)
-
- local export_id=$(grep ^[[:space:]]*Export_Id $HA_CONFDIR/exports/export.$VOL.conf |\
- awk -F"[=,;]" '{print $2}' | tr -d '[[:space:]]')
-
-
- if [ -e ${SECRET_PEM} ]; then
- while [[ ${3} ]]; do
- current_host=`echo ${3} | cut -d "." -f 1`
- if [ ${short_host} != ${current_host} ]; then
- output=$(ssh -oPasswordAuthentication=no \
--oStrictHostKeyChecking=no -i ${SECRET_PEM} root@${current_host} \
-"dbus-send --print-reply --system --dest=org.ganesha.nfsd \
-/org/ganesha/nfsd/ExportMgr org.ganesha.nfsd.exportmgr.UpdateExport \
-string:$HA_CONFDIR/exports/export.$VOL.conf \
-string:\"EXPORT(Export_Id=$export_id)\" 2>&1")
- ret=$?
- logger <<< "${output}"
- if [ ${ret} -ne 0 ]; then
- echo "Error: refresh-config failed on ${current_host}."
- exit 1
- else
- echo "Refresh-config completed on ${current_host}."
- fi
-
- fi
- shift
- done
- else
- echo "Error: refresh-config failed. Passwordless ssh is not enabled."
- exit 1
- fi
-
-    # Run the same command on the localhost.
- output=$(dbus-send --print-reply --system --dest=org.ganesha.nfsd \
-/org/ganesha/nfsd/ExportMgr org.ganesha.nfsd.exportmgr.UpdateExport \
-string:$HA_CONFDIR/exports/export.$VOL.conf \
-string:"EXPORT(Export_Id=$export_id)" 2>&1)
- ret=$?
- logger <<< "${output}"
- if [ ${ret} -ne 0 ] ; then
- echo "Error: refresh-config failed on localhost."
- exit 1
- else
- echo "Success: refresh-config completed."
- fi
-}
-
-
-teardown_cluster()
-{
- local name=${1}
-
- for server in ${HA_SERVERS} ; do
- if [[ ${HA_CLUSTER_NODES} != *${server}* ]]; then
- logger "info: ${server} is not in config, removing"
-
- pcs cluster stop ${server} --force
- if [ $? -ne 0 ]; then
- logger "warning: pcs cluster stop ${server} failed"
- fi
-
- pcs cluster node remove ${server}
- if [ $? -ne 0 ]; then
- logger "warning: pcs cluster node remove ${server} failed"
- fi
- fi
- done
-
-    # BZ 1193433 - pcs doesn't reload cluster.conf after modification
-    # after teardown completes, a subsequent setup will appear to have
-    # 'remembered' the deleted node. You can work around this by
-    # issuing another `pcs cluster node remove $node`,
-    # `crm_node -f -R $server`, or
-    # `cibadmin --delete --xml-text '<node id="$server"
-    # uname="$server"/>'`
-
- pcs cluster stop --all
- if [ $? -ne 0 ]; then
- logger "warning pcs cluster stop --all failed"
- fi
-
- pcs cluster destroy
- if [ $? -ne 0 ]; then
- logger "error pcs cluster destroy failed"
- exit 1
- fi
-}
-
-
-cleanup_ganesha_config ()
-{
- rm -f /etc/corosync/corosync.conf
- rm -rf /etc/cluster/cluster.conf*
- rm -rf /var/lib/pacemaker/cib/*
-}
-
-do_create_virt_ip_constraints()
-{
- local cibfile=${1}; shift
- local primary=${1}; shift
- local weight="1000"
-
- # first a constraint location rule that says the VIP must be where
- # there's a ganesha.nfsd running
- pcs -f ${cibfile} constraint location ${primary}-group rule score=-INFINITY ganesha-active ne 1
- if [ $? -ne 0 ]; then
- logger "warning: pcs constraint location ${primary}-group rule score=-INFINITY ganesha-active ne 1 failed"
- fi
-
-    # then a set of constraint location prefers to set the preferred
-    # order for where a VIP should move
- while [[ ${1} ]]; do
- pcs -f ${cibfile} constraint location ${primary}-group prefers ${1}=${weight}
- if [ $? -ne 0 ]; then
- logger "warning: pcs constraint location ${primary}-group prefers ${1}=${weight} failed"
- fi
- weight=$(expr ${weight} + 1000)
- shift
- done
-    # and finally set the highest preference for the VIP's home node.
-    # The default weight when created is/was 100. On Fedora the setting
-    # appears to be additive, so to get the desired value we adjust the
-    # weight
-    # weight=$(expr ${weight} - 100)
- pcs -f ${cibfile} constraint location ${primary}-group prefers ${primary}=${weight}
- if [ $? -ne 0 ]; then
- logger "warning: pcs constraint location ${primary}-group prefers ${primary}=${weight} failed"
- fi
-}
-
-
-wrap_create_virt_ip_constraints()
-{
- local cibfile=${1}; shift
- local primary=${1}; shift
- local head=""
- local tail=""
-
-    # build a list of peers, e.g. for a four node cluster, for node1,
-    # the result is "node2 node3 node4"; for node2, "node3 node4 node1"
-    # and so on (a worked example of the resulting weights follows this
-    # function)
- while [[ ${1} ]]; do
- if [ "${1}" = "${primary}" ]; then
- shift
- while [[ ${1} ]]; do
- tail=${tail}" "${1}
- shift
- done
- else
- head=${head}" "${1}
- fi
- shift
- done
- do_create_virt_ip_constraints ${cibfile} ${primary} ${tail} ${head}
-}
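-
-# Worked example of the weights computed above, for a hypothetical
-# cluster HA_SERVERS="node1 node2 node3 node4". For primary node2 the
-# peer list built here is "node3 node4 node1", so
-# do_create_virt_ip_constraints emits:
-#
-#   node2-group prefers node3=1000
-#   node2-group prefers node4=2000
-#   node2-group prefers node1=3000
-#   node2-group prefers node2=4000   (the home node wins)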
-
-
-create_virt_ip_constraints()
-{
- local cibfile=${1}; shift
-
- while [[ ${1} ]]; do
- wrap_create_virt_ip_constraints ${cibfile} ${1} ${HA_SERVERS}
- shift
- done
-}
-
-
-setup_create_resources()
-{
- local cibfile=$(mktemp -u)
-
- # fixup /var/lib/nfs
- logger "pcs resource create nfs_setup ocf:heartbeat:ganesha_nfsd ha_vol_mnt=${HA_VOL_MNT} --clone"
- pcs resource create nfs_setup ocf:heartbeat:ganesha_nfsd ha_vol_mnt=${HA_VOL_MNT} --clone
- if [ $? -ne 0 ]; then
- logger "warning: pcs resource create nfs_setup ocf:heartbeat:ganesha_nfsd ha_vol_mnt=${HA_VOL_MNT} --clone failed"
- fi
-
- pcs resource create nfs-mon ocf:heartbeat:ganesha_mon --clone
- if [ $? -ne 0 ]; then
- logger "warning: pcs resource create nfs-mon ocf:heartbeat:ganesha_mon --clone failed"
- fi
-
-    # see the comment in the start method of
-    # /usr/lib/ocf/resource.d/heartbeat/ganesha_grace. Allow time for
-    # ganesha_mon to start and set the ganesha-active crm_attribute
- sleep 5
-
- pcs resource create nfs-grace ocf:heartbeat:ganesha_grace --clone meta notify=true
- if [ $? -ne 0 ]; then
- logger "warning: pcs resource create nfs-grace ocf:heartbeat:ganesha_grace --clone failed"
- fi
-
- pcs constraint location nfs-grace-clone rule score=-INFINITY grace-active ne 1
- if [ $? -ne 0 ]; then
- logger "warning: pcs constraint location nfs-grace-clone rule score=-INFINITY grace-active ne 1"
- fi
-
- pcs cluster cib ${cibfile}
-
- while [[ ${1} ]]; do
-
-        # this is variable indirection
-        # from an nvs like 'VIP_host1=10.7.6.5' or 'VIP_host1="10.7.6.5"'
- # (or VIP_host-1=..., or VIP_host-1.my.domain.name=...)
- # a variable 'clean_name' is created (e.g. w/ value 'VIP_host_1')
- # and a clean nvs (e.g. w/ value 'VIP_host_1="10_7_6_5"')
- # after the `eval ${clean_nvs}` there is a variable VIP_host_1
- # with the value '10_7_6_5', and the following \$$ magic to
- # reference it, i.e. `eval tmp_ipaddr=\$${clean_name}` gives us
- # ${tmp_ipaddr} with 10_7_6_5 and then convert the _s back to .s
- # to give us ipaddr="10.7.6.5". whew!
- name="VIP_${1}"
- clean_name=${name//[-.]/_}
- nvs=$(grep "^${name}=" ${HA_CONFDIR}/ganesha-ha.conf)
- clean_nvs=${nvs//[-.]/_}
- eval ${clean_nvs}
- eval tmp_ipaddr=\$${clean_name}
- ipaddr=${tmp_ipaddr//_/.}
-
- pcs -f ${cibfile} resource create ${1}-nfs_block ocf:heartbeat:portblock protocol=tcp \
- portno=2049 action=block ip=${ipaddr} --group ${1}-group
- if [ $? -ne 0 ]; then
- logger "warning pcs resource create ${1}-nfs_block failed"
- fi
- pcs -f ${cibfile} resource create ${1}-cluster_ip-1 ocf:heartbeat:IPaddr ip=${ipaddr} \
- cidr_netmask=32 op monitor interval=15s --group ${1}-group --after ${1}-nfs_block
- if [ $? -ne 0 ]; then
- logger "warning pcs resource create ${1}-cluster_ip-1 ocf:heartbeat:IPaddr ip=${ipaddr} \
- cidr_netmask=32 op monitor interval=15s failed"
- fi
-
- pcs -f ${cibfile} constraint order nfs-grace-clone then ${1}-cluster_ip-1
- if [ $? -ne 0 ]; then
- logger "warning: pcs constraint order nfs-grace-clone then ${1}-cluster_ip-1 failed"
- fi
-
- pcs -f ${cibfile} resource create ${1}-nfs_unblock ocf:heartbeat:portblock protocol=tcp \
- portno=2049 action=unblock ip=${ipaddr} reset_local_on_unblock_stop=true \
- tickle_dir=${HA_VOL_MNT}/nfs-ganesha/tickle_dir/ --group ${1}-group --after ${1}-cluster_ip-1 \
- op stop timeout=${PORTBLOCK_UNBLOCK_TIMEOUT} op start timeout=${PORTBLOCK_UNBLOCK_TIMEOUT} \
- op monitor interval=10s timeout=${PORTBLOCK_UNBLOCK_TIMEOUT}
- if [ $? -ne 0 ]; then
- logger "warning pcs resource create ${1}-nfs_unblock failed"
- fi
-
-
- shift
- done
-
- create_virt_ip_constraints ${cibfile} ${HA_SERVERS}
-
- pcs cluster cib-push ${cibfile}
- if [ $? -ne 0 ]; then
- logger "warning pcs cluster cib-push ${cibfile} failed"
- fi
- rm -f ${cibfile}
-}
-
-
-teardown_resources()
-{
- # local mntpt=$(grep ha-vol-mnt ${HA_CONFIG_FILE} | cut -d = -f 2)
-
- # restore /var/lib/nfs
- logger "notice: pcs resource delete nfs_setup-clone"
- pcs resource delete nfs_setup-clone
- if [ $? -ne 0 ]; then
- logger "warning: pcs resource delete nfs_setup-clone failed"
- fi
-
- # delete -clone resource agents
- # in particular delete the ganesha monitor so we don't try to
- # trigger anything when we shut down ganesha next.
- pcs resource delete nfs-mon-clone
- if [ $? -ne 0 ]; then
- logger "warning: pcs resource delete nfs-mon-clone failed"
- fi
-
- pcs resource delete nfs-grace-clone
- if [ $? -ne 0 ]; then
- logger "warning: pcs resource delete nfs-grace-clone failed"
- fi
-
- while [[ ${1} ]]; do
- pcs resource delete ${1}-group
- if [ $? -ne 0 ]; then
- logger "warning: pcs resource delete ${1}-group failed"
- fi
- shift
- done
-
-}
-
-
-recreate_resources()
-{
- local cibfile=${1}; shift
-
- while [[ ${1} ]]; do
-        # this is variable indirection
-        # see the comment on the same pattern in setup_create_resources() above
- name="VIP_${1}"
- clean_name=${name//[-.]/_}
- nvs=$(grep "^${name}=" ${HA_CONFDIR}/ganesha-ha.conf)
- clean_nvs=${nvs//[-.]/_}
- eval ${clean_nvs}
- eval tmp_ipaddr=\$${clean_name}
- ipaddr=${tmp_ipaddr//_/.}
-
- pcs -f ${cibfile} resource create ${1}-nfs_block ocf:heartbeat:portblock protocol=tcp \
- portno=2049 action=block ip=${ipaddr} --group ${1}-group
- if [ $? -ne 0 ]; then
- logger "warning pcs resource create ${1}-nfs_block failed"
- fi
- pcs -f ${cibfile} resource create ${1}-cluster_ip-1 ocf:heartbeat:IPaddr ip=${ipaddr} \
- cidr_netmask=32 op monitor interval=15s --group ${1}-group --after ${1}-nfs_block
- if [ $? -ne 0 ]; then
- logger "warning pcs resource create ${1}-cluster_ip-1 ocf:heartbeat:IPaddr ip=${ipaddr} \
- cidr_netmask=32 op monitor interval=15s failed"
- fi
-
- pcs -f ${cibfile} constraint order nfs-grace-clone then ${1}-cluster_ip-1
- if [ $? -ne 0 ]; then
- logger "warning: pcs constraint order nfs-grace-clone then ${1}-cluster_ip-1 failed"
- fi
-
- pcs -f ${cibfile} resource create ${1}-nfs_unblock ocf:heartbeat:portblock protocol=tcp \
- portno=2049 action=unblock ip=${ipaddr} reset_local_on_unblock_stop=true \
- tickle_dir=${HA_VOL_MNT}/nfs-ganesha/tickle_dir/ --group ${1}-group --after ${1}-cluster_ip-1 \
- op stop timeout=${PORTBLOCK_UNBLOCK_TIMEOUT} op start timeout=${PORTBLOCK_UNBLOCK_TIMEOUT} \
- op monitor interval=10s timeout=${PORTBLOCK_UNBLOCK_TIMEOUT}
- if [ $? -ne 0 ]; then
- logger "warning pcs resource create ${1}-nfs_unblock failed"
- fi
-
- shift
- done
-}
-
-
-addnode_recreate_resources()
-{
- local cibfile=${1}; shift
- local add_node=${1}; shift
- local add_vip=${1}; shift
-
- recreate_resources ${cibfile} ${HA_SERVERS}
-
- pcs -f ${cibfile} resource create ${add_node}-nfs_block ocf:heartbeat:portblock \
- protocol=tcp portno=2049 action=block ip=${add_vip} --group ${add_node}-group
- if [ $? -ne 0 ]; then
- logger "warning pcs resource create ${add_node}-nfs_block failed"
- fi
- pcs -f ${cibfile} resource create ${add_node}-cluster_ip-1 ocf:heartbeat:IPaddr \
- ip=${add_vip} cidr_netmask=32 op monitor interval=15s --group ${add_node}-group \
- --after ${add_node}-nfs_block
- if [ $? -ne 0 ]; then
- logger "warning pcs resource create ${add_node}-cluster_ip-1 ocf:heartbeat:IPaddr \
- ip=${add_vip} cidr_netmask=32 op monitor interval=15s failed"
- fi
-
- pcs -f ${cibfile} constraint order nfs-grace-clone then ${add_node}-cluster_ip-1
- if [ $? -ne 0 ]; then
- logger "warning: pcs constraint order nfs-grace-clone then ${add_node}-cluster_ip-1 failed"
- fi
- pcs -f ${cibfile} resource create ${add_node}-nfs_unblock ocf:heartbeat:portblock \
- protocol=tcp portno=2049 action=unblock ip=${add_vip} reset_local_on_unblock_stop=true \
- tickle_dir=${HA_VOL_MNT}/nfs-ganesha/tickle_dir/ --group ${add_node}-group --after \
- ${add_node}-cluster_ip-1 op stop timeout=${PORTBLOCK_UNBLOCK_TIMEOUT} op start \
- timeout=${PORTBLOCK_UNBLOCK_TIMEOUT} op monitor interval=10s \
- timeout=${PORTBLOCK_UNBLOCK_TIMEOUT}
- if [ $? -ne 0 ]; then
- logger "warning pcs resource create ${add_node}-nfs_unblock failed"
- fi
-}
-
-
-clear_resources()
-{
- local cibfile=${1}; shift
-
- while [[ ${1} ]]; do
- pcs -f ${cibfile} resource delete ${1}-group
- if [ $? -ne 0 ]; then
- logger "warning: pcs -f ${cibfile} resource delete ${1}-group"
- fi
-
- shift
- done
-}
-
-
-addnode_create_resources()
-{
- local add_node=${1}; shift
- local add_vip=${1}; shift
- local cibfile=$(mktemp -u)
-
- # start HA on the new node
- pcs cluster start ${add_node}
- if [ $? -ne 0 ]; then
- logger "warning: pcs cluster start ${add_node} failed"
- fi
-
- pcs cluster cib ${cibfile}
- if [ $? -ne 0 ]; then
- logger "warning: pcs cluster cib ${cibfile} failed"
- fi
-
-    # delete all the per-node -group resources, clearing
-    # their constraints, then create them again so we can
-    # recompute their constraints
- clear_resources ${cibfile} ${HA_SERVERS}
- addnode_recreate_resources ${cibfile} ${add_node} ${add_vip}
-
- HA_SERVERS="${HA_SERVERS} ${add_node}"
- create_virt_ip_constraints ${cibfile} ${HA_SERVERS}
-
- pcs cluster cib-push ${cibfile}
- if [ $? -ne 0 ]; then
- logger "warning: pcs cluster cib-push ${cibfile} failed"
- fi
- rm -f ${cibfile}
-}
-
-
-deletenode_delete_resources()
-{
- local node=${1}; shift
- local ha_servers=$(echo "${HA_SERVERS}" | sed s/${node}//)
- local cibfile=$(mktemp -u)
-
- pcs cluster cib ${cibfile}
- if [ $? -ne 0 ]; then
- logger "warning: pcs cluster cib ${cibfile} failed"
- fi
-
-    # delete all the per-node -group resources (VIP and portblock),
-    # clearing their constraints, then create them again so we can
-    # recompute their constraints
- clear_resources ${cibfile} ${HA_SERVERS}
- recreate_resources ${cibfile} ${ha_servers}
-    HA_SERVERS=$(echo "${ha_servers}" | sed -e "s/  / /")
-
- create_virt_ip_constraints ${cibfile} ${HA_SERVERS}
-
- pcs cluster cib-push ${cibfile}
- if [ $? -ne 0 ]; then
- logger "warning: pcs cluster cib-push ${cibfile} failed"
- fi
- rm -f ${cibfile}
-
-}
-
-
-deletenode_update_haconfig()
-{
- local name="VIP_${1}"
- local clean_name=${name//[-.]/_}
-
-    ha_servers=${HA_SERVERS// /,}
-    sed -i -e "s/^HA_CLUSTER_NODES=.*$/HA_CLUSTER_NODES=\"${ha_servers}\"/" -e "s/^${name}=.*$//" -e "/^$/d" ${HA_CONFDIR}/ganesha-ha.conf
-}
-
-
-setup_state_volume()
-{
- local mnt=${HA_VOL_MNT}
- local longname=""
- local shortname=""
- local dname=""
- local dirname=""
-
- longname=$(hostname)
- dname=${longname#$(hostname -s)}
-
- while [[ ${1} ]]; do
-
- if [[ ${1} == *${dname} ]]; then
- dirname=${1}
- else
- dirname=${1}${dname}
- fi
-
- if [ ! -d ${mnt}/nfs-ganesha/tickle_dir ]; then
- mkdir ${mnt}/nfs-ganesha/tickle_dir
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname} ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/statd ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/statd
- fi
- if [ ! -e ${mnt}/nfs-ganesha/${dirname}/nfs/state ]; then
- touch ${mnt}/nfs-ganesha/${dirname}/nfs/state
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha/v4recov ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha/v4recov
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha/v4old ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha/v4old
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/statd/sm ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/statd/sm
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/statd/sm.bak ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/statd/sm.bak
- fi
- if [ ! -e ${mnt}/nfs-ganesha/${dirname}/nfs/statd/state ]; then
- touch ${mnt}/nfs-ganesha/${dirname}/nfs/statd/state
- fi
- for server in ${HA_SERVERS} ; do
- if [ ${server} != ${dirname} ]; then
- ln -s ${mnt}/nfs-ganesha/${server}/nfs/ganesha ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha/${server}
- ln -s ${mnt}/nfs-ganesha/${server}/nfs/statd ${mnt}/nfs-ganesha/${dirname}/nfs/statd/${server}
- fi
- done
- shift
- done
-
-}
-
-
-addnode_state_volume()
-{
- local newnode=${1}; shift
- local mnt=${HA_VOL_MNT}
- local longname=""
- local dname=""
- local dirname=""
-
- longname=$(hostname)
- dname=${longname#$(hostname -s)}
-
- if [[ ${newnode} == *${dname} ]]; then
- dirname=${newnode}
- else
- dirname=${newnode}${dname}
- fi
-
- if [ ! -d ${mnt}/nfs-ganesha/${dirname} ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/statd ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/statd
- fi
- if [ ! -e ${mnt}/nfs-ganesha/${dirname}/nfs/state ]; then
- touch ${mnt}/nfs-ganesha/${dirname}/nfs/state
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha/v4recov ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha/v4recov
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha/v4old ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha/v4old
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/statd/sm ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/statd/sm
- fi
- if [ ! -d ${mnt}/nfs-ganesha/${dirname}/nfs/statd/sm.bak ]; then
- mkdir ${mnt}/nfs-ganesha/${dirname}/nfs/statd/sm.bak
- fi
- if [ ! -e ${mnt}/nfs-ganesha/${dirname}/nfs/statd/state ]; then
- touch ${mnt}/nfs-ganesha/${dirname}/nfs/statd/state
- fi
-
- for server in ${HA_SERVERS} ; do
-
- if [[ ${server} != ${dirname} ]]; then
- ln -s ${mnt}/nfs-ganesha/${server}/nfs/ganesha ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha/${server}
- ln -s ${mnt}/nfs-ganesha/${server}/nfs/statd ${mnt}/nfs-ganesha/${dirname}/nfs/statd/${server}
-
- ln -s ${mnt}/nfs-ganesha/${dirname}/nfs/ganesha ${mnt}/nfs-ganesha/${server}/nfs/ganesha/${dirname}
- ln -s ${mnt}/nfs-ganesha/${dirname}/nfs/statd ${mnt}/nfs-ganesha/${server}/nfs/statd/${dirname}
- fi
- done
-
-}
-
-
-delnode_state_volume()
-{
- local delnode=${1}; shift
- local mnt=${HA_VOL_MNT}
- local longname=""
- local dname=""
- local dirname=""
-
- longname=$(hostname)
- dname=${longname#$(hostname -s)}
-
- if [[ ${delnode} == *${dname} ]]; then
- dirname=${delnode}
- else
- dirname=${delnode}${dname}
- fi
-
- rm -rf ${mnt}/nfs-ganesha/${dirname}
-
- for server in ${HA_SERVERS} ; do
- if [[ "${server}" != "${dirname}" ]]; then
- rm -f ${mnt}/nfs-ganesha/${server}/nfs/ganesha/${dirname}
- rm -f ${mnt}/nfs-ganesha/${server}/nfs/statd/${dirname}
- fi
- done
-}
-
-
-status()
-{
- local scratch=$(mktemp)
- local regex_str="^${1}-cluster_ip-1"
- local healthy=0
- local index=1
- local nodes
-
- # change tabs to spaces, strip leading spaces
- pcs status | sed -e "s/\t/ /g" -e "s/^[ ]*//" > ${scratch}
-
- nodes[0]=${1}; shift
-
-    # make a regex of the configured nodes
-    # and initialize the nodes array for later
- while [[ ${1} ]]; do
-
- regex_str="${regex_str}|^${1}-cluster_ip-1"
- nodes[${index}]=${1}
- ((index++))
- shift
- done
-
- # print the nodes that are expected to be online
- grep -E "^Online:" ${scratch}
-
- echo
-
- # print the VIPs and which node they are on
- grep -E "${regex_str}" < ${scratch} | cut -d ' ' -f 1,4
-
- echo
-
- # check if the VIP and port block/unblock RAs are on the expected nodes
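-    # (illustrative) after the normalization above, a healthy entry in
-    # ${scratch} reads like:
-    #   node1-cluster_ip-1 (ocf::heartbeat:IPaddr): Started node1
-    # which is exactly the shape the -x patterns below match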
- for n in ${nodes[*]}; do
-
- grep -E -x "${n}-nfs_block \(ocf::heartbeat:portblock\): Started ${n}" > /dev/null 2>&1 ${scratch}
- result=$?
- ((healthy+=${result}))
- grep -E -x "${n}-cluster_ip-1 \(ocf::heartbeat:IPaddr\): Started ${n}" > /dev/null 2>&1 ${scratch}
- result=$?
- ((healthy+=${result}))
- grep -E -x "${n}-nfs_unblock \(ocf::heartbeat:portblock\): Started ${n}" > /dev/null 2>&1 ${scratch}
- result=$?
- ((healthy+=${result}))
- done
-
- grep -E "\):\ Stopped|FAILED" > /dev/null 2>&1 ${scratch}
- result=$?
-
- if [ ${result} -eq 0 ]; then
- echo "Cluster HA Status: BAD"
- elif [ ${healthy} -eq 0 ]; then
- echo "Cluster HA Status: HEALTHY"
- else
- echo "Cluster HA Status: FAILOVER"
- fi
-
- rm -f ${scratch}
-}
-
-create_ganesha_conf_file()
-{
- if [ $1 == "yes" ];
- then
- if [ -e $GANESHA_CONF ];
- then
- rm -rf $GANESHA_CONF
- fi
-        # The symlink /etc/ganesha/ganesha.conf needs to be
-        # created to point at the ganesha conf file kept on the
-        # shared storage. Every node holds only this link while
-        # the actual file is stored on the shared storage, which
-        # makes editing ganesha.conf easier and keeps the nodes
-        # consistent.
-
- ln -s $HA_CONFDIR/ganesha.conf $GANESHA_CONF
- else
- # Restoring previous file
- rm -rf $GANESHA_CONF
- cp $HA_CONFDIR/ganesha.conf $GANESHA_CONF
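-        # (illustrative) this strips %include lines such as:
-        #   %include "/var/run/gluster/shared_storage/nfs-ganesha/exports/export.demo.conf"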
- sed -r -i -e '/^%include[[:space:]]+".+\.conf"$/d' $GANESHA_CONF
- fi
-}
-
-set_quorum_policy()
-{
- local quorum_policy="stop"
- local num_servers=${1}
-
- if [ ${num_servers} -lt 3 ]; then
- quorum_policy="ignore"
- fi
- pcs property set no-quorum-policy=${quorum_policy}
- if [ $? -ne 0 ]; then
- logger "warning: pcs property set no-quorum-policy=${quorum_policy} failed"
- fi
-}
-
-main()
-{
-
- local cmd=${1}; shift
- if [[ ${cmd} == *help ]]; then
- usage
- exit 0
- fi
- HA_CONFDIR=${1%/}; shift
- local ha_conf=${HA_CONFDIR}/ganesha-ha.conf
- local node=""
- local vip=""
-
- # ignore any comment lines
- cfgline=$(grep ^HA_NAME= ${ha_conf})
- eval $(echo ${cfgline} | grep -F HA_NAME=)
- cfgline=$(grep ^HA_CLUSTER_NODES= ${ha_conf})
- eval $(echo ${cfgline} | grep -F HA_CLUSTER_NODES=)
-
- case "${cmd}" in
-
- setup | --setup)
- logger "setting up ${HA_NAME}"
-
- check_cluster_exists ${HA_NAME}
-
- determine_servers "setup"
-
- if [ "X${HA_NUM_SERVERS}X" != "X1X" ]; then
-
- setup_cluster ${HA_NAME} ${HA_NUM_SERVERS} "${HA_SERVERS}"
-
- setup_create_resources ${HA_SERVERS}
-
- setup_finalize_ha
-
- setup_state_volume ${HA_SERVERS}
-
- else
-
- logger "insufficient servers for HA, aborting"
- fi
- ;;
-
- teardown | --teardown)
- logger "tearing down ${HA_NAME}"
-
- determine_servers "teardown"
-
- teardown_resources ${HA_SERVERS}
-
- teardown_cluster ${HA_NAME}
-
- cleanup_ganesha_config ${HA_CONFDIR}
- ;;
-
- cleanup | --cleanup)
- cleanup_ganesha_config ${HA_CONFDIR}
- ;;
-
- add | --add)
- node=${1}; shift
- vip=${1}; shift
-
- logger "adding ${node} with ${vip} to ${HA_NAME}"
-
- determine_service_manager
-
- manage_service "start" ${node}
-
- determine_servers "add"
-
- pcs cluster node add ${node}
- if [ $? -ne 0 ]; then
- logger "warning: pcs cluster node add ${node} failed"
- fi
-
- addnode_create_resources ${node} ${vip}
-        # Subsequent add-node runs recreate resources for all the nodes
-        # that already exist in the cluster. The nodes are picked up
-        # from the entries in the ganesha-ha.conf file. Add the
-        # newly added node to the file so that the resources specific
-        # to this node are correctly recreated in the future.
- clean_node=${node//[-.]/_}
- echo "VIP_${node}=\"${vip}\"" >> ${HA_CONFDIR}/ganesha-ha.conf
-
- NEW_NODES="$HA_CLUSTER_NODES,${node}"
-
- sed -i s/HA_CLUSTER_NODES.*/"HA_CLUSTER_NODES=\"$NEW_NODES\""/ \
-$HA_CONFDIR/ganesha-ha.conf
-
- addnode_state_volume ${node}
-
- # addnode_create_resources() already appended ${node} to
- # HA_SERVERS, so only need to increment HA_NUM_SERVERS
- # and set quorum policy
- HA_NUM_SERVERS=$(expr ${HA_NUM_SERVERS} + 1)
- set_quorum_policy ${HA_NUM_SERVERS}
- ;;
-
- delete | --delete)
- node=${1}; shift
-
- logger "deleting ${node} from ${HA_NAME}"
-
- determine_servers "delete"
-
- deletenode_delete_resources ${node}
-
- pcs cluster node remove ${node}
- if [ $? -ne 0 ]; then
- logger "warning: pcs cluster node remove ${node} failed"
- fi
-
- deletenode_update_haconfig ${node}
-
- delnode_state_volume ${node}
-
- determine_service_manager
-
- manage_service "stop" ${node}
-
- HA_NUM_SERVERS=$(expr ${HA_NUM_SERVERS} - 1)
- set_quorum_policy ${HA_NUM_SERVERS}
- ;;
-
- status | --status)
- determine_servers "status"
-
- status ${HA_SERVERS}
- ;;
-
- refresh-config | --refresh-config)
- VOL=${1}
-
- determine_servers "refresh-config"
-
- refresh_config ${VOL} ${HA_CONFDIR} ${HA_SERVERS}
- ;;
-
- setup-ganesha-conf-files | --setup-ganesha-conf-files)
-
- create_ganesha_conf_file ${1}
- ;;
-
- *)
- # setup and teardown are not intended to be used by a
- # casual user
- usage
- logger "Usage: ganesha-ha.sh add|delete|status"
- ;;
-
- esac
-}
-
-main "$@"
-