| #!/usr/bin/env bash |
| # |
| #/** |
| # * Licensed to the Apache Software Foundation (ASF) under one |
| # * or more contributor license agreements. See the NOTICE file |
| # * distributed with this work for additional information |
| # * regarding copyright ownership. The ASF licenses this file |
| # * to you under the Apache License, Version 2.0 (the |
| # * "License"); you may not use this file except in compliance |
| # * with the License. You may obtain a copy of the License at |
| # * |
| # * http://www.apache.org/licenses/LICENSE-2.0 |
| # * |
| # * Unless required by applicable law or agreed to in writing, software |
| # * distributed under the License is distributed on an "AS IS" BASIS, |
| # * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # * See the License for the specific language governing permissions and |
| # * limitations under the License. |
| # */ |
| # |
| # Runs a Hadoop hbase command as a daemon. |
| # |
| # Environment Variables |
| # |
| # HBASE_CONF_DIR Alternate hbase conf dir. Default is ${HBASE_HOME}/conf. |
| # HBASE_LOG_DIR Where log files are stored. PWD by default. |
| # HBASE_PID_DIR The pid files are stored. /tmp by default. |
| # HBASE_IDENT_STRING A string representing this instance of hadoop. $USER by default |
| # HBASE_NICENESS The scheduling priority for daemons. Defaults to 0. |
| # HBASE_STOP_TIMEOUT Time, in seconds, after which we kill -9 the server if it has not stopped. |
| # Default 1200 seconds. |
| # |
| # Modelled after $HADOOP_HOME/bin/hadoop-daemon.sh |
| |
| usage="Usage: hbase-daemon.sh [--config <conf-dir>]\ |
| [--autostart-window-size <window size in hours>]\ |
| [--autostart-window-retry-limit <retry count limit for autostart>]\ |
| (start|stop|restart|autostart|autorestart|foreground_start) <hbase-command> \ |
| <args...>" |
| |
| # if no args specified, show usage |
| if [ $# -le 1 ]; then |
| echo $usage |
| exit 1 |
| fi |
| |
| # default autostart args value indicating infinite window size and no retry limit |
| AUTOSTART_WINDOW_SIZE=0 |
| AUTOSTART_WINDOW_RETRY_LIMIT=0 |
| |
| bin=`dirname "${BASH_SOURCE-$0}"` |
| bin=`cd "$bin">/dev/null; pwd` |
| |
| . "$bin"/hbase-config.sh |
| . "$bin"/hbase-common.sh |
| |
| # get arguments |
| startStop=$1 |
| shift |
| |
| command=$1 |
| shift |
| |
| hbase_rotate_log () |
| { |
| log=$1; |
| num=5; |
| if [ -n "$2" ]; then |
| num=$2 |
| fi |
| if [ -f "$log" ]; then # rotate logs |
| while [ $num -gt 1 ]; do |
| prev=`expr $num - 1` |
| [ -f "$log.$prev" ] && mv -f "$log.$prev" "$log.$num" |
| num=$prev |
| done |
| mv -f "$log" "$log.$num"; |
| fi |
| } |
| |
| cleanAfterRun() { |
| if [ -f ${HBASE_PID} ]; then |
| # If the process is still running time to tear it down. |
| kill -9 `cat ${HBASE_PID}` > /dev/null 2>&1 |
| rm -f ${HBASE_PID} > /dev/null 2>&1 |
| fi |
| |
| if [ -f ${HBASE_ZNODE_FILE} ]; then |
| if [ "$command" = "master" ]; then |
| HBASE_OPTS="$HBASE_OPTS $HBASE_MASTER_OPTS" $bin/hbase master clear > /dev/null 2>&1 |
| else |
| #call ZK to delete the node |
| ZNODE=`cat ${HBASE_ZNODE_FILE}` |
| HBASE_OPTS="$HBASE_OPTS $HBASE_REGIONSERVER_OPTS" $bin/hbase zkcli delete ${ZNODE} > /dev/null 2>&1 |
| fi |
| rm ${HBASE_ZNODE_FILE} |
| fi |
| } |
| |
| check_before_start(){ |
| #ckeck if the process is not running |
| mkdir -p "$HBASE_PID_DIR" |
| if [ -f $HBASE_PID ]; then |
| if kill -0 `cat $HBASE_PID` > /dev/null 2>&1; then |
| echo $command running as process `cat $HBASE_PID`. Stop it first. |
| exit 1 |
| fi |
| fi |
| } |
| |
| wait_until_done () |
| { |
| p=$1 |
| cnt=${HBASE_SLAVE_TIMEOUT:-300} |
| origcnt=$cnt |
| while kill -0 $p > /dev/null 2>&1; do |
| if [ $cnt -gt 1 ]; then |
| cnt=`expr $cnt - 1` |
| sleep 1 |
| else |
| echo "Process did not complete after $origcnt seconds, killing." |
| kill -9 $p |
| exit 1 |
| fi |
| done |
| return 0 |
| } |
| |
| # get log directory |
| if [ "$HBASE_LOG_DIR" = "" ]; then |
| export HBASE_LOG_DIR="$HBASE_HOME/logs" |
| fi |
| mkdir -p "$HBASE_LOG_DIR" |
| |
| if [ "$HBASE_PID_DIR" = "" ]; then |
| HBASE_PID_DIR=/tmp |
| fi |
| |
| if [ "$HBASE_IDENT_STRING" = "" ]; then |
| export HBASE_IDENT_STRING="$USER" |
| fi |
| |
| # Some variables |
| # Work out java location so can print version into log. |
| if [ "$JAVA_HOME" != "" ]; then |
| #echo "run java in $JAVA_HOME" |
| JAVA_HOME=$JAVA_HOME |
| fi |
| if [ "$JAVA_HOME" = "" ]; then |
| echo "Error: JAVA_HOME is not set." |
| exit 1 |
| fi |
| |
| JAVA=$JAVA_HOME/bin/java |
| export HBASE_LOG_PREFIX=hbase-$HBASE_IDENT_STRING-$command-$HOSTNAME |
| export HBASE_LOGFILE=$HBASE_LOG_PREFIX.log |
| |
| if [ -z "${HBASE_ROOT_LOGGER_LEVEL}" ]; then |
| export HBASE_ROOT_LOGGER_LEVEL=${HBASE_ROOT_LOGGER_LEVEL:-"INFO"} |
| fi |
| |
| if [ -z "${HBASE_ROOT_LOGGER_APPENDER}" ]; then |
| export HBASE_ROOT_LOGGER_APPENDER=${HBASE_ROOT_LOGGER_APPENDER:-"RFA"} |
| fi |
| |
| if [ -z "${HBASE_SECURITY_LOGGER_LEVEL}" ]; then |
| export HBASE_SECURITY_LOGGER_LEVEL=${HBASE_SECURITY_LOGGER_LEVEL:-"INFO"} |
| fi |
| |
| if [ -z "${HBASE_SECURITY_LOGGER_APPENDER}" ]; then |
| export HBASE_SECURITY_LOGGER_APPENDER=${HBASE_SECURITY_LOGGER_APPENDER:-"RFAS"} |
| fi |
| |
| HBASE_LOGOUT=${HBASE_LOGOUT:-"$HBASE_LOG_DIR/$HBASE_LOG_PREFIX.out"} |
| HBASE_LOGGC=${HBASE_LOGGC:-"$HBASE_LOG_DIR/$HBASE_LOG_PREFIX.gc"} |
| HBASE_LOGLOG=${HBASE_LOGLOG:-"${HBASE_LOG_DIR}/${HBASE_LOGFILE}"} |
| HBASE_PID=$HBASE_PID_DIR/hbase-$HBASE_IDENT_STRING-$command.pid |
| export HBASE_ZNODE_FILE=$HBASE_PID_DIR/hbase-$HBASE_IDENT_STRING-$command.znode |
| export HBASE_AUTOSTART_FILE=$HBASE_PID_DIR/hbase-$HBASE_IDENT_STRING-$command.autostart |
| |
| if [ -n "$SERVER_GC_OPTS" ]; then |
| export SERVER_GC_OPTS=${SERVER_GC_OPTS/"-Xloggc:<FILE-PATH>"/"-Xloggc:${HBASE_LOGGC}"} |
| fi |
| if [ -n "$CLIENT_GC_OPTS" ]; then |
| export CLIENT_GC_OPTS=${CLIENT_GC_OPTS/"-Xloggc:<FILE-PATH>"/"-Xloggc:${HBASE_LOGGC}"} |
| fi |
| |
| # Set default scheduling priority |
| if [ "$HBASE_NICENESS" = "" ]; then |
| export HBASE_NICENESS=0 |
| fi |
| |
| thiscmd="$bin/$(basename ${BASH_SOURCE-$0})" |
| args=$@ |
| |
| case $startStop in |
| |
| (start) |
| check_before_start |
| hbase_rotate_log $HBASE_LOGOUT |
| hbase_rotate_log $HBASE_LOGGC |
| echo running $command, logging to $HBASE_LOGOUT |
| $thiscmd --config "${HBASE_CONF_DIR}" \ |
| foreground_start $command $args < /dev/null > ${HBASE_LOGOUT} 2>&1 & |
| disown -h -r |
| sleep 1; head "${HBASE_LOGOUT}" |
| ;; |
| |
| (autostart) |
| check_before_start |
| hbase_rotate_log $HBASE_LOGOUT |
| hbase_rotate_log $HBASE_LOGGC |
| echo running $command, logging to $HBASE_LOGOUT |
| nohup $thiscmd --config "${HBASE_CONF_DIR}" --autostart-window-size ${AUTOSTART_WINDOW_SIZE} --autostart-window-retry-limit ${AUTOSTART_WINDOW_RETRY_LIMIT} \ |
| internal_autostart $command $args < /dev/null > ${HBASE_LOGOUT} 2>&1 & |
| ;; |
| |
| (autorestart) |
| echo running $command, logging to $HBASE_LOGOUT |
| # stop the command |
| $thiscmd --config "${HBASE_CONF_DIR}" stop $command $args & |
| wait_until_done $! |
| # wait a user-specified sleep period |
| sp=${HBASE_RESTART_SLEEP:-3} |
| if [ $sp -gt 0 ]; then |
| sleep $sp |
| fi |
| |
| check_before_start |
| hbase_rotate_log $HBASE_LOGOUT |
| nohup $thiscmd --config "${HBASE_CONF_DIR}" --autostart-window-size ${AUTOSTART_WINDOW_SIZE} --autostart-window-retry-limit ${AUTOSTART_WINDOW_RETRY_LIMIT} \ |
| internal_autostart $command $args < /dev/null > ${HBASE_LOGOUT} 2>&1 & |
| ;; |
| |
| (foreground_start) |
| trap cleanAfterRun SIGHUP SIGINT SIGTERM EXIT |
| if [ "$HBASE_NO_REDIRECT_LOG" != "" ]; then |
| # NO REDIRECT |
| echo "`date` Starting $command on `hostname`" |
| echo "`ulimit -a`" |
| # in case the parent shell gets the kill make sure to trap signals. |
| # Only one will get called. Either the trap or the flow will go through. |
| nice -n $HBASE_NICENESS "$HBASE_HOME"/bin/hbase \ |
| --config "${HBASE_CONF_DIR}" \ |
| $command "$@" start & |
| else |
| echo "`date` Starting $command on `hostname`" >> ${HBASE_LOGLOG} |
| echo "`ulimit -a`" >> "$HBASE_LOGLOG" 2>&1 |
| # in case the parent shell gets the kill make sure to trap signals. |
| # Only one will get called. Either the trap or the flow will go through. |
| nice -n $HBASE_NICENESS "$HBASE_HOME"/bin/hbase \ |
| --config "${HBASE_CONF_DIR}" \ |
| $command "$@" start >> ${HBASE_LOGOUT} 2>&1 & |
| fi |
| # Add to the command log file vital stats on our environment. |
| hbase_pid=$! |
| echo $hbase_pid > ${HBASE_PID} |
| wait $hbase_pid |
| ;; |
| |
| (internal_autostart) |
| ONE_HOUR_IN_SECS=3600 |
| autostartWindowStartDate=`date +%s` |
| autostartCount=0 |
| touch "$HBASE_AUTOSTART_FILE" |
| |
| # keep starting the command until asked to stop. Reloop on software crash |
| while true |
| do |
| hbase_rotate_log $HBASE_LOGGC |
| if [ -f $HBASE_PID ] && kill -0 "$(cat "$HBASE_PID")" > /dev/null 2>&1 ; then |
| wait "$(cat "$HBASE_PID")" |
| else |
| #if the file does not exist it means that it was not stopped properly by the stop command |
| if [ ! -f "$HBASE_AUTOSTART_FILE" ]; then |
| echo "`date` HBase might be stopped removing the autostart file. Exiting Autostart process" >> ${HBASE_LOGOUT} |
| exit 1 |
| fi |
| |
| echo "`date` Autostarting hbase $command service. Attempt no: $(( $autostartCount + 1))" >> ${HBASE_LOGLOG} |
| touch "$HBASE_AUTOSTART_FILE" |
| $thiscmd --config "${HBASE_CONF_DIR}" foreground_start $command $args |
| autostartCount=$(( $autostartCount + 1 )) |
| |
| # HBASE-6504 - only take the first line of the output in case verbose gc is on |
| distMode=`$bin/hbase --config "$HBASE_CONF_DIR" org.apache.hadoop.hbase.util.HBaseConfTool hbase.cluster.distributed | head -n 1` |
| |
| if [ "$distMode" != 'false' ]; then |
| #if the cluster is being stopped then do not restart it again. |
| zparent=`$bin/hbase org.apache.hadoop.hbase.util.HBaseConfTool zookeeper.znode.parent` |
| if [ "$zparent" == "null" ]; then zparent="/hbase"; fi |
| zkrunning=`$bin/hbase org.apache.hadoop.hbase.util.HBaseConfTool zookeeper.znode.state` |
| if [ "$zkrunning" == "null" ]; then zkrunning="running"; fi |
| zkFullRunning=$zparent/$zkrunning |
| $bin/hbase zkcli stat $zkFullRunning 2>&1 | grep "Node does not exist" 1>/dev/null 2>&1 |
| |
| #grep returns 0 if it found something, 1 otherwise |
| if [ $? -eq 0 ]; then |
| echo "`date` hbase znode does not exist. Exiting Autostart process" >> ${HBASE_LOGOUT} |
| rm -f "$HBASE_AUTOSTART_FILE" |
| exit 1 |
| fi |
| |
| #If ZooKeeper cannot be found, then do not restart |
| $bin/hbase zkcli stat $zkFullRunning 2>&1 | grep Exception | grep ConnectionLoss 1>/dev/null 2>&1 |
| if [ $? -eq 0 ]; then |
| echo "`date` zookeeper not found. Exiting Autostart process" >> ${HBASE_LOGOUT} |
| rm -f "$HBASE_AUTOSTART_FILE" |
| exit 1 |
| fi |
| fi |
| fi |
| |
| curDate=`date +%s` |
| autostartWindowReset=false |
| |
| # reset the auto start window size if it exceeds |
| if [ $AUTOSTART_WINDOW_SIZE -gt 0 ] && [ $(( $curDate - $autostartWindowStartDate )) -gt $(( $AUTOSTART_WINDOW_SIZE * $ONE_HOUR_IN_SECS )) ]; then |
| echo "Resetting Autorestart window size: $autostartWindowStartDate" >> ${HBASE_LOGOUT} |
| autostartWindowStartDate=$curDate |
| autostartWindowReset=true |
| autostartCount=0 |
| fi |
| |
| # kill autostart if the retry limit is exceeded within the given window size (window size other then 0) |
| if ! $autostartWindowReset && [ $AUTOSTART_WINDOW_RETRY_LIMIT -gt 0 ] && [ $autostartCount -gt $AUTOSTART_WINDOW_RETRY_LIMIT ]; then |
| echo "`date` Autostart window retry limit: $AUTOSTART_WINDOW_RETRY_LIMIT exceeded for given window size: $AUTOSTART_WINDOW_SIZE hours.. Exiting..." >> ${HBASE_LOGLOG} |
| rm -f "$HBASE_AUTOSTART_FILE" |
| exit 1 |
| fi |
| |
| # wait for shutdown hook to complete |
| sleep 20 |
| done |
| ;; |
| |
| (stop) |
| echo running $command, logging to $HBASE_LOGOUT |
| rm -f "$HBASE_AUTOSTART_FILE" |
| if [ -f $HBASE_PID ]; then |
| pidToKill=`cat $HBASE_PID` |
| # kill -0 == see if the PID exists |
| if kill -0 $pidToKill > /dev/null 2>&1; then |
| echo -n stopping $command |
| echo "`date` Terminating $command" >> $HBASE_LOGLOG |
| kill $pidToKill > /dev/null 2>&1 |
| waitForProcessEnd $pidToKill $command |
| else |
| retval=$? |
| echo no $command to stop because kill -0 of pid $pidToKill failed with status $retval |
| fi |
| else |
| echo no $command to stop because no pid file $HBASE_PID |
| fi |
| rm -f $HBASE_PID |
| ;; |
| |
| (restart) |
| echo running $command, logging to $HBASE_LOGOUT |
| # stop the command |
| $thiscmd --config "${HBASE_CONF_DIR}" stop $command $args & |
| wait_until_done $! |
| # wait a user-specified sleep period |
| sp=${HBASE_RESTART_SLEEP:-3} |
| if [ $sp -gt 0 ]; then |
| sleep $sp |
| fi |
| # start the command |
| $thiscmd --config "${HBASE_CONF_DIR}" start $command $args & |
| wait_until_done $! |
| ;; |
| |
| (*) |
| echo $usage |
| exit 1 |
| ;; |
| esac |