blob: 355f06f2ab9c1de2ed128d1f2df698534268eb41 [file] [log] [blame]
#!/bin/bash
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
#set -x
usage() {
printf "Usage: %s [uuid of this host] [timeout in seconds] [interval in seconds]\n" $(basename $0) >&2
}
if [ -z $1 ]; then
usage
exit 2
else
host=$1
fi
if [ -z $2 ]; then
usage
exit 3
else
timeout=$2
fi
if [ ! -z $3 ]; then
interval=$3
else
interval=5
fi
if [ $interval -gt $timeout ]; then
usage
exit 3
fi
file=/opt/cloud/bin/heartbeat
lastdate=$(($(date +%s) + $interval))
while [ $(date +%s) -lt $(($lastdate + $timeout)) ]
do
sleep $interval
if [ ! -f $file ]
then
continue
fi
# test heartbeat file
dirs=$(cat $file | grep "sr-mount\|VG_XenStorage")
if [ ! -n "$dirs" ];then
/usr/bin/logger -t heartbeat "Problem with heartbeat, no iSCSI or NFS mount defined in $file!"
lastdate=$(date +%s)
continue
fi
# for iscsi
dirs=$(cat $file | grep VG_XenStorage)
for dir in $dirs
do
if [ -d $dir ]; then
hb=$dir/hb-$host
date +%s | dd of=$hb count=100 bs=1 2>/dev/null
if [ $? -ne 0 ]; then
/usr/bin/logger -t heartbeat "Potential problem with $hb: not reachable since $(($(date +%s) - $lastdate)) seconds"
else
lastdate=$(date +%s)
fi
else
/usr/bin/logger -t heartbeat "Potential problem with heartbeat, dir not found for $dir"
lastdate=$(date +%s)
sed -i /${dir##/*/}/d $file
fi
done
# for nfs
dirs=$(cat $file | grep sr-mount)
for dir in $dirs
do
mp=`mount | grep $dir`
if [ -n "$mp" ]; then
hb=$dir/hb-$host
date +%s | dd of=$hb count=100 bs=1 2>/dev/null
if [ $? -ne 0 ]; then
/usr/bin/logger -t heartbeat "Potential problem with $hb: not reachable since $(($(date +%s) - $lastdate)) seconds"
else
lastdate=$(date +%s)
fi
else
/usr/bin/logger -t heartbeat "Potential problem with heartbeat, mount not found for $dir"
lastdate=$(date +%s)
sed -i /${dir##/*/}/d $file
fi
done
done
/usr/bin/logger -t heartbeat "Problem with $hb: not reachable for $(($(date +%s) - $lastdate)) seconds, rebooting system!"
echo b > /proc/sysrq-trigger