#!/bin/sh
#
#
#   HealthLUSTRE OCF RA that utilizes the lustre /proc/fs/lustre/health_check
#
# License:      GNU General Public License (GPL)v2
# Description:  Manages ZFS and Lustre on a shared storage
# Written by:   Gabriele Paciucci
# Release Date: 01 June 2016
# Release Version: 0.97
# Copyright (c) 2009 Andrew Beekhof
# Copyright © 2016, Intel Corporation
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of version 2 of the GNU General Public License as
# published by the Free Software Foundation.
#
# This program is distributed in the hope that it would be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
#
# Further, this software is distributed without any warranty that it is
# free of the rightful claim of any third person regarding infringement
# or the like.  Any license provided herein, whether implied or
# otherwise, applies only to this software file.  Patent licenses, if
# any, provided herein do not apply to combinations of this program with
# other software, or any other product whatsoever.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write the Free Software Foundation,
# Inc., 59 Temple Place - Suite 330, Boston MA 02111-1307, USA.
#

#######################################################################
# Initialization:

# Source the OCF shell helper library; this script relies on it for
# ocf_log, ocf_is_true and the OCF_* return-code variables.
: ${OCF_FUNCTIONS=${OCF_ROOT}/resource.d/heartbeat/.ocf-shellfuncs}
. ${OCF_FUNCTIONS}
# The requested action defaults to the first command-line argument.
: ${__OCF_ACTION=$1}

#######################################################################

# meta_data
#   Print the resource agent meta-data (XML) on stdout.
#
#   NOTE(review): the XML markup of this here-document was lost in the
#   copy under review; only the description texts survived.  The element
#   structure, attribute values and action timeouts below were rebuilt
#   from the parameter defaults and the action dispatcher in this file,
#   following the layout of the Pacemaker "ping" agent.  Verify them
#   against the pristine file before shipping.
meta_data() {
    cat <<END
<?xml version="1.0"?>
<!DOCTYPE resource-agent SYSTEM "ra-api-1.dtd">
<resource-agent name="healthLUSTRE">
<version>1.0</version>

<longdesc lang="en">
Every time the monitor action is run, this resource agent records (in the CIB) the current number of healthy lustre server
</longdesc>
<shortdesc lang="en">lustre servers healthy</shortdesc>

<parameters>

<parameter name="pidfile" unique="0">
<longdesc lang="en">PID file</longdesc>
<shortdesc lang="en">PID file</shortdesc>
<content type="string" default="$HA_VARRUN/healthLUSTRE-${OCF_RESOURCE_INSTANCE}" />
</parameter>

<parameter name="dampen" unique="0">
<longdesc lang="en">
The time to wait (dampening) further changes occur
</longdesc>
<shortdesc lang="en">Dampening interval</shortdesc>
<content type="integer" default="5s"/>
</parameter>

<parameter name="name" unique="0">
<longdesc lang="en">
The name of the attributes to set.  This is the name to be used in the constraints.
</longdesc>
<shortdesc lang="en">Attribute name</shortdesc>
<content type="string" default="lustred"/>
</parameter>

<parameter name="debug" unique="0">
<longdesc lang="en">
Enables to use default attrd_updater verbose logging on every call.
</longdesc>
<shortdesc lang="en">Verbose logging</shortdesc>
<content type="string" default="false"/>
</parameter>

</parameters>

<actions>
<action name="start"   timeout="60" />
<action name="stop"    timeout="20" />
<action name="reload"  timeout="100" />
<action name="monitor" depth="0"  timeout="60" interval="10"/>
<action name="meta-data"  timeout="5" />
<action name="validate-all"  timeout="30" />
</actions>
</resource-agent>
END
}

#######################################################################

# lustre_conditional_log LEVEL MESSAGE...
#   Forward MESSAGE to ocf_log at LEVEL, but only when OCF_RESKEY_debug
#   is exactly "true"; otherwise do nothing.
lustre_conditional_log() {
    level=$1; shift
    if [ "${OCF_RESKEY_debug}" = "true" ]; then
        ocf_log "$level" "$*"
    fi
}

# lustre_usage
#   Print a short usage summary on stdout.
#
#   NOTE(review): the original usage text was lost in the copy under
#   review; this text lists the actions handled by the dispatcher at the
#   bottom of this file.
lustre_usage() {
    cat <<END
usage: $0 {start|stop|monitor|reload|validate-all|meta-data}

Expects to have a fully populated OCF RA-compliant environment set.
END
}

# lustre_start
#   Mark the resource as started (create the pidfile) and publish the
#   first health value.  Returns OCF_SUCCESS immediately when the
#   resource is already running, otherwise the status of lustre_update.
#
#   NOTE(review): the body of this function was lost in the copy under
#   review and has been reconstructed from the Pacemaker "ping" agent
#   pattern this agent follows -- confirm against the pristine file.
lustre_start() {
    lustre_monitor
    if [ $? -eq "$OCF_SUCCESS" ]; then
        return "$OCF_SUCCESS"
    fi
    touch "${OCF_RESKEY_pidfile}"
    lustre_update
}

# lustre_stop
#   Remove the pidfile and delete the node attribute.  Always returns
#   OCF_SUCCESS.
#
#   NOTE(review): reconstructed (see lustre_start) -- confirm against the
#   pristine file.
lustre_stop() {
    rm -f "${OCF_RESKEY_pidfile}"
    # $attrd_options is deliberately unquoted: it is either '-q' or
    # empty, and an empty value must not become an empty argument.
    # shellcheck disable=SC2086
    attrd_updater -D -n "$OCF_RESKEY_name" -d "$OCF_RESKEY_dampen" $attrd_options
    return "$OCF_SUCCESS"
}

# lustre_monitor
#   Returns OCF_NOT_RUNNING when the pidfile is absent.  Otherwise
#   refreshes the node attribute and returns OCF_SUCCESS if that worked,
#   OCF_ERR_GENERIC if it did not.
#
#   NOTE(review): reconstructed (see lustre_start) -- confirm against the
#   pristine file.
lustre_monitor() {
    if [ -f "${OCF_RESKEY_pidfile}" ]; then
        lustre_update
        if [ $? -eq 0 ]; then
            return "$OCF_SUCCESS"
        fi
        return "$OCF_ERR_GENERIC"
    fi
    return "$OCF_NOT_RUNNING"
}

# lustre_check
#   Probe /proc/fs/lustre/health_check.
#   Sets the globals: active (1 when healthy, else 0), l_out (probe
#   output) and rc (probe exit status).
#   Returns: $active as the exit status, i.e. 1 means healthy and 0
#   means not healthy -- the reverse of the usual shell convention; the
#   caller reads it through $?.
#
#   NOTE(review): the first statements of this function (up to the
#   "2>&1" redirection) were lost in the copy under review.  The probe
#   below is reconstructed so that its exit status matches the three
#   visible case arms: 0 = "healthy" found, 1 = not found, anything
#   else = the file could not be read.  Confirm against the pristine
#   file.
lustre_check() {
    active=0
    l_out=$(grep -w healthy /proc/fs/lustre/health_check 2>&1); rc=$?
    case $rc in
        0) active=$((active + 1));;
        1) lustre_conditional_log warn "Lustre is not healthy: $l_out";;
        *) ocf_log err "Unexpected result for '/proc/fs/lustre/health_check' $rc: $l_out";;
    esac
    return $active
}

# lustre_update
#   Run lustre_check and push the result into the node attribute named
#   $OCF_RESKEY_name through attrd_updater, using $OCF_RESKEY_dampen as
#   the dampening interval.
#   Returns: the exit status of attrd_updater (0 on success).
lustre_update() {
    lustre_check
    active=$?

    # $attrd_options is deliberately unquoted: it is either '-q' or
    # empty, and an empty value must not become an empty argument.
    # shellcheck disable=SC2086
    attrd_updater -n "$OCF_RESKEY_name" -v "$active" -d "$OCF_RESKEY_dampen" $attrd_options
    rc=$?
    case $rc in
        0) lustre_conditional_log debug "Updated $OCF_RESKEY_name = $active" ;;
        *) ocf_log warn "Could not update $OCF_RESKEY_name = $active: rc=$rc";;
    esac
    return $rc
}

# Defaults for parameters that were not supplied in the environment.
: "${OCF_RESKEY_name:=lustred}"
: "${OCF_RESKEY_dampen:=5s}"
: "${OCF_RESKEY_attempts:=3}"
: "${OCF_RESKEY_debug:=false}"
: "${OCF_RESKEY_CRM_meta_timeout:=20000}"
: "${OCF_RESKEY_CRM_meta_globally_unique:=true}"

# I don't think we need to care about timeout
#integer=`echo ${OCF_RESKEY_timeout} | egrep -o '[0-9]*'`
#case ${OCF_RESKEY_timeout} in
#    *[0-9]ms|*[0-9]msec) OCF_RESKEY_timeout=`expr $integer / 1000`;;
#    *[0-9]m|*[0-9]min) OCF_RESKEY_timeout=`expr $integer \* 60`;;
#    *[0-9]h|*[0-9]hr) OCF_RESKEY_timeout=`expr $integer \* 60 \* 60`;;
#    *) OCF_RESKEY_timeout=$integer;;
#esac

#if [ -z ${OCF_RESKEY_timeout} ]; then
#    if [ x"$OCF_RESKEY_host_list" != x ]; then
#        host_count=`echo $OCF_RESKEY_host_list | awk '{print NF}'`
#        OCF_RESKEY_timeout=`expr $OCF_RESKEY_CRM_meta_timeout / $host_count / $OCF_RESKEY_attempts`
#        OCF_RESKEY_timeout=`expr $OCF_RESKEY_timeout / 1100` # Convert to seconds and finish 10% early
#    else
#        OCF_RESKEY_timeout=5
#    fi
#fi

#if [ ${OCF_RESKEY_timeout} -lt 1 ]; then
#    OCF_RESKEY_timeout=5
#elif [ ${OCF_RESKEY_timeout} -gt 1000 ]; then
#    # ping actually complains if this value is too high, 5 minutes is plenty
#    OCF_RESKEY_timeout=300
#fi

# Default pidfile: keyed on the attribute name when the resource is not
# globally unique, otherwise on the resource instance name.
if [ "${OCF_RESKEY_CRM_meta_globally_unique}" = "false" ]; then
    : "${OCF_RESKEY_pidfile:=$HA_VARRUN/healthLUSTRE-${OCF_RESKEY_name}}"
else
    : "${OCF_RESKEY_pidfile:=$HA_VARRUN/healthLUSTRE-${OCF_RESOURCE_INSTANCE}}"
fi

# Run attrd_updater quietly unless debugging was requested.  This is
# evaluated before the normalisation below, exactly as in the original,
# so any value ocf_is_true accepts switches attrd_updater to verbose.
attrd_options='-q'
if ocf_is_true "${OCF_RESKEY_debug}" ; then
    attrd_options=''
fi

# Check the debug option
case "${OCF_RESKEY_debug}" in
    true|True|TRUE|1)    OCF_RESKEY_debug=true;;
    false|False|FALSE|0) OCF_RESKEY_debug=false;;
    *)
        ocf_log warn "Value for 'debug' is incorrect. Please specify 'true' or 'false' not: ${OCF_RESKEY_debug}"
        OCF_RESKEY_debug=false
        ;;
esac

# Dispatch the requested action.
case "$__OCF_ACTION" in
    meta-data)
        meta_data
        exit $OCF_SUCCESS
        ;;
    start)   lustre_start;;
    stop)    lustre_stop;;
    monitor) lustre_monitor;;
    reload)  lustre_start;;
    validate-all)
        lustre_usage
        exit $OCF_SUCCESS
        ;;
    usage|help)
        lustre_usage
        exit $OCF_SUCCESS
        ;;
    *)
        lustre_usage
        exit $OCF_ERR_UNIMPLEMENTED
        ;;
esac

# start/stop/monitor/reload fall through to here; report their status.
exit $?