blob: de76620da2bf4bf90f9beb97e60e9675d4643fcd [file]
#!/usr/bin/env bash
# Filename:- gp_bash_functions.sh
# Status:- Released
# Author:- G L Coombe (Greenplum)
# Contact:- gcoombe@greenplum.com
# Release date:- March 2006
# Release stat:- Greenplum Internal
# Copyright (c) Metapa 2005. All Rights Reserved.
# Copyright (c) Greenplum 2005. All Rights Reserved
# Brief descn:- Common functions used by various scripts
#***************************************************************
# Location Functions
#******************************************************************************
#Check that SHELL is Bash
if [ -z $BASH ]; then
echo "[FATAL]:-Scripts must be executed using the Bash shell"
exit 1
fi
#CMDPATH is the list of locations to search for commands, in precedence order
declare -a CMDPATH
CMDPATH=(/usr/kerberos/bin /usr/sfw/bin /opt/sfw/bin /usr/local/bin /bin /usr/bin /sbin /usr/sbin /usr/ucb /sw/bin)
if hash brew 2> /dev/null; then
CMDPATH+=("$(brew --prefix)/bin")
fi
#GPPATH is the list of possible locations for the Apache Cloudberry binaries, in precedence order
declare -a GPPATH
GPPATH=( $GPHOME $MPPHOME $BIZHOME )
if [ ${#GPPATH[@]} -eq 0 ];then
echo "[FATAL]:-GPHOME environment variable is required to run GPDB but could not be found."
echo "Please set it by sourcing the cloudberry-env.sh in your GPDB installation directory."
echo "Example: ''. /usr/local/gpdb/cloudberry-env.sh''"
exit 1
fi
#GP_UNIQUE_COMMAND is used to identify the binary directory
GP_UNIQUE_COMMAND=gpstart
findCmdInPath() {
cmdtofind=$1
CMD=`which $cmdtofind`
if [ $? -eq 0 ]; then
echo $CMD
return
fi
for pathel in ${CMDPATH[@]}
do
CMD=$pathel/$cmdtofind
if [ x"$CMD" != x"" ] && [ -f $CMD ]; then
echo $CMD
return
fi
done
echo $cmdtofind
return "Problem in gp_bash_functions, command '$cmdtofind' not found in COMMAND path. You will need to edit the script named gp_bash_functions.sh to properly locate the needed commands for your platform."
}
findMppPath() {
cmdtofind=$GP_UNIQUE_COMMAND
for pathel in ${GPPATH[@]}
do
CMD=`find $pathel -follow -name $cmdtofind | tail -1`
if [ x"$CMD" != x"" ] && [ -f $CMD ]; then
echo $CMD
return
fi
done
}
#******************************************************************************
# OS Command Variables
#******************************************************************************
AWK=`findCmdInPath awk`
BASENAME=`findCmdInPath basename`
CAT=`findCmdInPath cat`
CUT=`findCmdInPath cut`
DATE=`findCmdInPath date`
DIRNAME=`findCmdInPath dirname`
ECHO=`findCmdInPath echo`
FIND=`findCmdInPath find`
GREP=`findCmdInPath grep`
HEAD=`findCmdInPath head`
HOSTNAME=`findCmdInPath hostname`
IP=`findCmdInPath ip`
LESSCMD=`findCmdInPath less`
LOCALE=`findCmdInPath locale`
MV=`findCmdInPath mv`
MKDIR=`findCmdInPath mkdir`
PING=`findCmdInPath ping`
RM=`findCmdInPath rm`
RSYNC=`findCmdInPath rsync`
SED=`findCmdInPath sed`
SLEEP=`findCmdInPath sleep`
SORT=`findCmdInPath sort`
SS=`findCmdInPath ss`
SSH=`findCmdInPath ssh`
TAIL=`findCmdInPath tail`
TEE=`findCmdInPath tee`
TOUCH=`findCmdInPath touch`
TR=`findCmdInPath tr`
WC=`findCmdInPath wc`
ETCD_ACCOUNT_ID="gp_etcd_account_id"
ETCD_CLUSTER_ID="gp_etcd_cluster_id"
ETCD_NAMESPACE="gp_etcd_namespace"
ETCD_ENDPOINTS="gp_etcd_endpoints"
#***************#******************************************************************************
# Script Specific Variables
#******************************************************************************
# By default set error logging level to verbose
VERBOSE=1
USER_NAME=`id|$AWK '{print $1}'|$CUT -d"(" -f2|$TR -d ')'`
PROG_NAME=`echo $0 | $TR -d '-'`
PROG_NAME=`$BASENAME $PROG_NAME`
PROG_PIDNAME=`echo $$ $PROG_NAME | awk '{printf "%06d %s\n", $1, $2}'`
CALL_HOST=`$HOSTNAME|$CUT -d. -f1`
#******************************************************************************
# Locate the postgres routines from the Cloudberry release
#******************************************************************************
PSQLBIN=`findMppPath`
if [ x"$PSQLBIN" = x"" ];then
echo "Problem in gp_bash_functions, command '$GP_UNIQUE_COMMAND' not found in Cloudberry path."
echo "Try setting GPHOME to the location of your Cloudberry distribution."
exit 1
fi
PSQLBIN=`$DIRNAME $PSQLBIN`
SCRIPTDIR="`$DIRNAME $PSQLBIN`/bin"
#******************************************************************************
# Cloudberry Scripts
#******************************************************************************
GPINITSYSTEM=$SCRIPTDIR/gpinitsystem
GPCONFIG=$SCRIPTDIR/gpconfig
GPINITSTANDBY=$SCRIPTDIR/gpinitstandby
GPRECOVERSEG=$SCRIPTDIR/gprecoverseg
GPSTART=$SCRIPTDIR/gpstart
GPSTATE=$SCRIPTDIR/gpstate
GPSTOP=$SCRIPTDIR/gpstop
GPDOCDIR=${GPHOME}/docs/cli_help/
#******************************************************************************
# Cloudberry Command Variables
#******************************************************************************
INITDB=$PSQLBIN/initdb
PG_CTL=$PSQLBIN/pg_ctl
PSQL=$PSQLBIN/psql
#******************************************************************************
# Cloudberry OS Settings
#******************************************************************************
OS_OPENFILES=65535
#******************************************************************************
# General Variables
#******************************************************************************
HOSTFILE=/etc/hosts
PG_PID=postmaster.pid
PG_OPT=postmaster.opts
PG_CONF=postgresql.conf
PG_INTERNAL_CONF=internal.auto.conf
PG_HBA=pg_hba.conf
if [ x"$TRUSTED_SHELL" = x"" ]; then TRUSTED_SHELL="$SSH"; fi
if [ x"$TRUSTED_COPY" = x"" ]; then TRUSTED_COPY="$RSYNC "; fi
PG_CONF_ADD_FILE=$WORKDIR/postgresql_conf_gp_additions
DEFAULTDB=template1
ETCD_CONFIG_TMP_FILE=/tmp/cbdb_etcd.conf
ETCD_HOST_FILE=etcd_host
FTS_HOST_FILE=fts_host
DEFAULT_CHK_PT_SEG=8
DEFAULT_QD_MAX_CONNECT=250
QE_CONNECT_FACTOR=3
# DEFAULT_BUFFERS sets the default shared_buffers unless overridden by '-b'.
# It applies to the coordinator db and segment dbs. Specify either the number of
# buffers (without suffix) or the amount of memory to use for buffers (with
# case-insensitive suffix 'kB', 'MB' or 'GB').
DEFAULT_BUFFERS=128000kB
DEBUG_LEVEL=0
BATCH_DEFAULT=60
WAIT_LIMIT=1800
WARN_MARK="<<<<<"
#******************************************************************************
# Functions
#******************************************************************************
#
# Simplified version of _nl_normalize_codeset from glibc
# https://sourceware.org/git/?p=glibc.git;a=blob;f=intl/l10nflist.c;h=078a450dfec21faf2d26dc5d0cb02158c1f23229;hb=1305edd42c44fee6f8660734d2dfa4911ec755d6#l294
# Input parameter - string with locale define as [language[_territory][.codeset][@modifier]]
NORMALIZE_CODESET_IN_LOCALE () {
local language_and_territory=$(echo $1 | perl -ne 'print for /(^.+?(?=\.|@|$))/s')
local codeset=$(echo $1 | perl -ne 'print for /((?<=\.).+?(?=@|$))/s')
local modifier=$(echo -n $1 | perl -ne 'print for /((?<=@).+)/s' )
local digit_pattern='^[0-9]+$'
if [[ $codeset =~ $digit_pattern ]] ;
then
codeset="iso$codeset"
else
codeset=$(echo $codeset | perl -pe 's/([[:alpha:]])/\L\1/g; s/[^[:alnum:]]//g')
fi
echo "$language_and_territory$([ ! -z $codeset ] && echo ".$codeset")$([ ! -z $modifier ] && echo "@$modifier")"
}
LOCALE_IS_AVAILABLE () {
local locale=$(NORMALIZE_CODESET_IN_LOCALE $1)
local all_available_locales=$(locale -a)
for v in $all_available_locales; do
if [ x"$locale" == x"$v" ] || [ x"$1" == x"$v" ]; then
return 1
fi
done
return 0
}
#
# NOTE: this function is called a lot; try to keep it quick.
#
LOG_MSG () {
TIMESTAMP=`$DATE +%Y%m%d":"%H":"%M":"%S`
DISPLAY_TXT=0
# Check to see if we need to update value of EXIT_STATUS. Strip off
# everything in the message after the first ending bracket ']' and
# compare it to WARN/FATAL.
level=${1%%]*}
case "$level" in
*FATAL*)
EXIT_STATUS=1
;;
esac
if [ x"" == x"$DEBUG_LEVEL" ];then
DEBUG_LEVEL=1
fi
if [ $# -eq 2 ];then
DISPLAY_TXT=1
fi
if [ $VERBOSE ]; then
if [ $DEBUG_LEVEL -eq 1 ] || [ $DISPLAY_TXT -eq 1 ];then
$ECHO "${TIMESTAMP}:${PROG_PIDNAME}:${CALL_HOST}:${USER_NAME}-$1" | $TEE -a $LOG_FILE
else
$ECHO "${TIMESTAMP}:${PROG_PIDNAME}:${CALL_HOST}:${USER_NAME}-$1" >> $LOG_FILE
fi
else
$ECHO "${TIMESTAMP}:${PROG_PIDNAME}:${CALL_HOST}:${USER_NAME}-$1" >> $LOG_FILE
fi
}
#Function Name: REMOTE_EXECUTE_AND_GET_OUTPUT
# Input Parameters: Takes 2 parameters
# Parameter 1 -> Host name to execute the command
# Parameter 2 -> Command/s to be executed
# Return value: String output of command execution on spcified remote host
# Description: This fuction adds a delimeter before executing the commands through ssh.
# this makes sure that in case if a banner set wrongly using .bashrc in then that gets ignored
# and we get the required results by ignoring the banner content
# Limitation: If the token used for separating command output from banner appears in the begining
# of the line in command output/banner output, in that case only partial command output will be returned
REMOTE_EXECUTE_AND_GET_OUTPUT () {
INITIAL_DEBUG_LEVEL=$DEBUG_LEVEL
DEBUG_LEVEL=0
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
HOST="$1"
CMD="echo 'GP_DELIMITER_FOR_IGNORING_BASH_BANNER';$2"
OUTPUT=$( $TRUSTED_SHELL "$HOST" "$CMD" | $AWK '/^GP_DELIMITER_FOR_IGNORING_BASH_BANNER/ {seen = 1} seen {print}' | $TAIL -n +2 )
RETVAL=$?
if [ $RETVAL -ne 0 ]; then
LOG_MSG "[FATAL]:- Command $CMD on $HOST failed with error status $RETVAL" 2
else
LOG_MSG "[INFO]:-Completed $TRUSTED_SHELL $HOST $CMD"
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
DEBUG_LEVEL=$INITIAL_DEBUG_LEVEL
#Return output
echo "$OUTPUT"
}
POSTGRES_VERSION_CHK() {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
HOST=$1;shift
CURRENT_VERSION=`$EXPORT_GPHOME; $EXPORT_LIB_PATH; $GPHOME/bin/postgres --gp-version`
VERSION_MATCH=0
VER=$( REMOTE_EXECUTE_AND_GET_OUTPUT $HOST "$EXPORT_GPHOME; $EXPORT_LIB_PATH; $GPHOME/bin/postgres --gp-version")
if [ $? -ne 0 ] ; then
LOG_MSG "[WARN]:- Failed to obtain postgres version on $HOST" 1
VERSION_MATCH=0
fi
LOG_MSG "[INFO]:- Current postgres version = $CURRENT_VERSION"
LOG_MSG "[INFO]:- postgres version on $HOST = $VER"
if [ x"$VER" != x"$CURRENT_VERSION" ] ; then
LOG_MSG "[WARN]:-Postgres version does not match. [$CURRENT_VERSION != $VER]" 1
VERSION_MATCH=0
else
VERSION_MATCH=1
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
ERROR_EXIT () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
TIME=`$DATE +%H":"%M":"%S`
CUR_DATE=`$DATE +%Y%m%d`
$ECHO "${CUR_DATE}:${TIME}:${PROG_PIDNAME}:${CALL_HOST}:${USER_NAME}-$1 Script Exiting!" >> $LOG_FILE
$ECHO "${CUR_DATE}:${TIME}:${PROG_PIDNAME}:${CALL_HOST}:${USER_NAME}-$1 Script Exiting!"
DEBUG_LEVEL=1
if [ $BACKOUT_FILE ]; then
if [ -s $BACKOUT_FILE ]; then
LOG_MSG "[WARN]:-Script has left Apache Cloudberry in an incomplete state"
LOG_MSG "[WARN]:-Run command bash $BACKOUT_FILE on coordinator to remove these changes"
$ECHO "$RM -f $BACKOUT_FILE" >> $BACKOUT_FILE
fi
fi
exit 1
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
ERROR_CHK () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
if [ $# -ne 3 ];then
LOG_MSG "[WARN]:-Incorrect # parameters supplied to $FUNCNAME" 1
return;
fi
RETVAL=$1;shift
MSG_TXT=$1;shift
ACTION=$1 #1=issue warn, 2=fatal
if [ $RETVAL -eq 0 ];then
LOG_MSG "[INFO]:-Successfully completed $MSG_TXT"
else
if [ $ACTION -eq 1 ];then
LOG_MSG "[WARN]:-Issue with $MSG_TXT" 1
else
LOG_MSG "[INFO]:-End Function $FUNCNAME"
ERROR_EXIT "[FATAL]:-Failed to complete $MSG_TXT "
fi
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
RETRY () {
RETVAL=$?
if [[ "$CURRENT" =~ "ssh" ]]; then
for i in 2 4 8; do
sleep $i
LOG_MSG "[WARN]:-Retrying command -- $CURRENT"
eval "$CURRENT"
if [ $? = 0 ]; then
RETVAL=0
# There seems to be no way of grabbing the return code of a
# trap other than saving it to a variable
return
fi
done
fi
}
SED_PG_CONF () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
APPEND=0
FILENAME=$1;shift
SEARCH_TXT=$1;shift
SUB_TXT="$1";shift
KEEP_PREV=$1;shift
SED_HOST=$1
if [ x"" == x"$SED_HOST" ]; then
if [ `$GREP -c "^[ ]*${SEARCH_TXT}[ ]*=" $FILENAME` -gt 1 ]; then
LOG_MSG "[INFO]:-Found more than 1 instance of $SEARCH_TXT in $FILENAME, will append" 1
APPEND=1
fi
if [ `$GREP -c "^[ ]*${SEARCH_TXT}[ ]*=" $FILENAME` -eq 0 ] || [ $APPEND -eq 1 ]; then
$ECHO $SUB_TXT >> $FILENAME
RETVAL=$?
if [ $RETVAL -ne 0 ]; then
LOG_MSG "[WARN]:-Failed to append line $SUB_TXT to $FILENAME" 1
else
LOG_MSG "[INFO]:-Appended line $SUB_TXT to $FILENAME"
fi
else
if [ $KEEP_PREV -eq 0 ];then
$SED -i'.bak1' -e "s/${SEARCH_TXT}/${SUB_TXT} #${SEARCH_TXT}/" $FILENAME
else
$SED -i'.bak1' -e "s/${SEARCH_TXT}.*/${SUB_TXT}/" $FILENAME
fi
RETVAL=$?
if [ $RETVAL -ne 0 ]; then
ERROR_EXIT "[FATAL]:-Failed to replace $SEARCH_TXT in $FILENAME"
else
LOG_MSG "[INFO]:-Replaced line in $FILENAME"
$RM -f ${FILENAME}.bak1
fi
$SED -i'.bak2' -e "s/^#${SEARCH_TXT}/${SEARCH_TXT}/" $FILENAME
RETVAL=$?
if [ $RETVAL -ne 0 ]; then
ERROR_EXIT "[FATAL]:-Failed to replace #$SEARCH_TXT in $FILENAME"
else
LOG_MSG "[INFO]:-Replaced line in $FILENAME"
$RM -f ${FILENAME}.bak2
fi
fi
else
# trap DEBUG will always be called first, when other traps are triggered.
# We need to make sure that we save the current running command, so
# that the RETRY function re-runs the command
trap 'CURRENT=$BASH_COMMAND' DEBUG
# Call out retry for commands that fail
trap RETRY ERR
RETVAL=0 # RETVAL gets modified in RETRY function whenever the trap is called
if [ $( REMOTE_EXECUTE_AND_GET_OUTPUT $SED_HOST "$GREP -c \"^[ ]*${SEARCH_TXT}[ ]*=\" $FILENAME") -gt 1 ]; then
LOG_MSG "[INFO]:-Found more than 1 instance of $SEARCH_TXT in $FILENAME on $SED_HOST, will append" 1
APPEND=1
fi
if [ $( REMOTE_EXECUTE_AND_GET_OUTPUT $SED_HOST "$GREP -c \"^[ ]*${SEARCH_TXT}[ ]*=\" $FILENAME") -eq 0 ] || [ $APPEND -eq 1 ]; then
$TRUSTED_SHELL $SED_HOST "$ECHO \"$SUB_TXT\" >> $FILENAME"
if [ $RETVAL -ne 0 ]; then
ERROR_EXIT "[FATAL]:-Failed to append line $SUB_TXT to $FILENAME on $SED_HOST"
else
LOG_MSG "[INFO]:-Appended line $SUB_TXT to $FILENAME on $SED_HOST" 1
fi
else
if [ $KEEP_PREV -eq 0 ];then
SED_COMMAND="s/${SEARCH_TXT}/${SUB_TXT} #${SEARCH_TXT}/"
else
SED_COMMAND="s/${SEARCH_TXT}.*/${SUB_TXT}/"
fi
$TRUSTED_SHELL $SED_HOST sed -i'.bak1' -f /dev/stdin "$FILENAME" <<< "$SED_COMMAND" > /dev/null 2>&1
if [ $RETVAL -ne 0 ]; then
ERROR_EXIT "[FATAL]:-Failed to insert $SUB_TXT in $FILENAME on $SED_HOST"
else
LOG_MSG "[INFO]:-Replaced line in $FILENAME on $SED_HOST"
$TRUSTED_SHELL $SED_HOST "$RM -f ${FILENAME}.bak1" > /dev/null 2>&1
fi
SED_COMMAND="s/^#${SEARCH_TXT}/${SEARCH_TXT}/"
$TRUSTED_SHELL $SED_HOST sed -i'.bak2' -f /dev/stdin "$FILENAME" <<< "$SED_COMMAND" > /dev/null 2>&1
if [ $RETVAL -ne 0 ]; then
ERROR_EXIT "[FATAL]:-Failed to substitute #${SEARCH_TXT} in $FILENAME on $SED_HOST"
else
LOG_MSG "[INFO]:-Replaced line in $FILENAME on $SED_HOST"
$TRUSTED_SHELL $SED_HOST "$RM -f ${FILENAME}.bak2" > /dev/null 2>&1
fi
fi
trap - ERR DEBUG # Disable trap
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
POSTGRES_PORT_CHK () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
GET_PG_PID_ACTIVE $1 $2
if [ $PID -ne 0 ];then
ERROR_EXIT "[FATAL]:-Host $2 has an active database process on port = $1"
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
CREATE_SPREAD_MIRROR_ARRAY () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
((MAX_ARRAY=${#QE_PRIMARY_ARRAY[@]}-1))
# Current host and subnet we are working on
CURRENT_HOST=0
CURRENT_SUBNET=0
# Destination host and subnet
DEST_HOST=0
DEST_SUBNET=0
if [ x"$NUM_MHOST_NODE" != x"" ] && [ $NUM_MHOST_NODE -gt 0 ] ; then
((DIRS_PER_SUBNET=$NUM_DATADIR/$NUM_MHOST_NODE))
else
DIRS_PER_SUBNET=$NUM_DATADIR
fi
((MAX_SUBNET=$NUM_DATADIR/$DIRS_PER_SUBNET))
((MAX_HOST=${#QE_PRIMARY_ARRAY[@]}/$NUM_DATADIR))
SEGS_PROCESSED=0
SEGS_PROCESSED_HOST=0
# The following is heavily dependent on sort order of primary array. This sort
# order will be affected by hostnames so something non-standard will cause
# strange behaviour. This isn't new (just recording this fact for future generations)
# and can be worked around with a mapping file to gpinitsystem (-I option).
# The right way to do this would require us to connect to remote hosts, determine
# what subnet we are on for that hostname and then build the array that way. We *will*
# do this once this is in python (or anything other than BASH)
LOG_MSG "[INFO]:-Building spread mirror array type $MULTI_TXT, please wait..." 1
for QE_LINE in ${QE_PRIMARY_ARRAY[@]}
do
if [ $DEBUG_LEVEL -eq 0 ] && [ x"" != x"$VERBOSE" ];then $NOLINE_ECHO ".\c";fi
if [ $(($SEGS_PROCESSED%$NUM_DATADIR)) -eq 0 ] ; then
# A new host group is starting
if [ $SEGS_PROCESSED -ne 0 ] ; then ((CURRENT_HOST=$CURRENT_HOST+1)); fi
# Start the mirroring on the next host
((DEST_HOST=$CURRENT_HOST+1))
# Always subnet "0" to start
CURRENT_SUBNET=0
DEST_SUBNET=1
# Make sure we loop back when needed
if [ $DEST_HOST -ge $MAX_HOST ] ; then DEST_HOST=0; fi
SEGS_PROCESSED_HOST=0
else
# Continue with current host
# move dest host to the next one (This is spread mirroring)
((DEST_HOST=$DEST_HOST+1))
# Make sure we look back when needed
if [ $DEST_HOST -ge $MAX_HOST ] ; then DEST_HOST=0; fi
# Get what subnet we are on, we may have moved to next
((CURRENT_SUBNET=($SEGS_PROCESSED_HOST+1)/$DIRS_PER_SUBNET))
((DEST_SUBNET=$CURRENT_SUBNET+1))
# Handle looping over
if [ $DEST_SUBNET -ge $MAX_SUBNET ] ; then DEST_SUBNET=0; fi
# Increment the number of segments we've processed for this host
((SEGS_PROCESSED_HOST=$SEGS_PROCESSED_HOST+1))
fi
# Handle the case where it's a single hostname (thus a single subnet)
# This case will mainly be for QA testing
if [ $NUM_DATADIR -eq $DIRS_PER_SUBNET ] ; then DEST_SUBNET=0; fi
# Handle possible loop
if [ $DEST_SUBNET -ge $MAX_SUBNET ] ; then DEST_SUBNET=0; fi
# Calculate the index based on host and subnet number
((PRIM_SEG_INDEX=($DEST_HOST*$NUM_DATADIR)+($DEST_SUBNET*$DIRS_PER_SUBNET)))
QE_M_HOST=`$ECHO ${QE_PRIMARY_ARRAY[$PRIM_SEG_INDEX]}|$AWK -F"~" '{print $1}'`
QE_M_NAME=`$ECHO ${QE_PRIMARY_ARRAY[$PRIM_SEG_INDEX]}|$AWK -F"~" '{print $2}'`
GP_M_DIR=${MIRROR_DATA_DIRECTORY[$SEGS_PROCESSED%$NUM_DATADIR]}
P_PORT=`$ECHO $QE_LINE|$AWK -F"~" '{print $3}'`
((GP_M_PORT=$P_PORT+$MIRROR_OFFSET))
M_CONTENT=`$ECHO $QE_LINE|$AWK -F"~" '{print $6}'`
M_SEG=`$ECHO $QE_LINE|$AWK -F"~" '{print $4}'|$AWK -F"/" '{print $NF}'`
QE_MIRROR_ARRAY=(${QE_MIRROR_ARRAY[@]} ${QE_M_HOST}~${QE_M_NAME}~${GP_M_PORT}~${GP_M_DIR}/${M_SEG}~${DBID_COUNT}~${M_CONTENT})
POSTGRES_PORT_CHK $GP_M_PORT $QE_M_NAME
((DBID_COUNT=$DBID_COUNT+1))
((SEGS_PROCESSED=$SEGS_PROCESSED+1))
done
if [ $DEBUG_LEVEL -eq 0 ] && [ x"" != x"$VERBOSE" ];then $ECHO;fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
CREATE_GROUP_MIRROR_ARRAY () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
LOG_MSG "[INFO]:-Building group mirror array type $MULTI_TXT, please wait..." 1
PRI_HOST_COUNT=`$ECHO ${QE_PRIMARY_ARRAY[@]}|$TR ' ' '\n'|$AWK -F"~" '{print $1}'|$SORT -u|$WC -l`
if [ $MULTI_HOME -eq 1 ] && [ $REMOTE_HOST_COUNT -eq 1 ];then
PRI_HOST_COUNT=1
fi
if [ x"$NUM_MHOST_NODE" != x"" ] && [ $NUM_MHOST_NODE -gt 0 ] ; then
((DIRS_PER_SUBNET=$NUM_DATADIR/$NUM_MHOST_NODE))
else
DIRS_PER_SUBNET=$NUM_DATADIR
fi
((MAX_SUBNET=$NUM_DATADIR/$DIRS_PER_SUBNET))
((MAX_HOST=${#QE_PRIMARY_ARRAY[@]}/$NUM_DATADIR))
# Current host we are working on
CURRENT_HOST=0
# Destination host and subnet
DEST_HOST=0
DEST_SUBNET=0
PRIMARY_ARRAY_LENGTH=${#QE_PRIMARY_ARRAY[@]}
PRIMARY_INDEX=0
for QE_LINE in ${QE_PRIMARY_ARRAY[@]}
do
if [ $(($PRIMARY_INDEX%$NUM_DATADIR)) -eq 0 ] ; then
if [ $PRIMARY_INDEX -ne 0 ] ; then ((CURRENT_HOST=$CURRENT_HOST+1)); fi
((DEST_HOST=$CURRENT_HOST+1))
if [ $DEST_HOST -ge $MAX_HOST ] ; then DEST_HOST=0; fi
DEST_SUBNET=1
else
if [ $(($PRIMARY_INDEX%$DIRS_PER_SUBNET)) -eq 0 ] ; then
((DEST_SUBNET=$DEST_SUBNET+1))
fi
fi
# Handle possible loop
if [ $DEST_SUBNET -ge $MAX_SUBNET ] ; then DEST_SUBNET=0; fi
((MIRROR_INDEX=($DEST_HOST*$NUM_DATADIR)+($DEST_SUBNET*$DIRS_PER_SUBNET)))
if [ $DEBUG_LEVEL -eq 0 ] && [ x"" != x"$VERBOSE" ];then $NOLINE_ECHO ".\c";fi
QE_M_HOST=`$ECHO ${QE_PRIMARY_ARRAY[$MIRROR_INDEX]}|$AWK -F"~" '{print $1}'`
QE_M_NAME=`$ECHO ${QE_PRIMARY_ARRAY[$MIRROR_INDEX]}|$AWK -F"~" '{print $2}'`
GP_M_DIR=${MIRROR_DATA_DIRECTORY[$PRIMARY_INDEX%$NUM_DATADIR]}/`$ECHO $QE_LINE|$AWK -F"~" '{print $4}'|$AWK -F"/" '{print $NF}'`
M_CONTENT=`$ECHO $QE_LINE|$AWK -F"~" '{print $6}'`
P_PORT=`$ECHO $QE_LINE|$AWK -F"~" '{print $3}'`
GP_M_PORT=$(($P_PORT+$MIRROR_OFFSET))
QE_MIRROR_ARRAY=(${QE_MIRROR_ARRAY[@]} ${QE_M_HOST}~${QE_M_NAME}~${GP_M_PORT}~${GP_M_DIR}~${DBID_COUNT}~${M_CONTENT})
POSTGRES_PORT_CHK $GP_M_PORT $QE_M_NAME
DBID_COUNT=$(($DBID_COUNT+1))
PRIMARY_INDEX=$((PRIMARY_INDEX+1))
done
if [ $DEBUG_LEVEL -eq 0 ] && [ x"" != x"$VERBOSE" ];then $ECHO;fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
GET_REPLY () {
$ECHO -e "\n$1 Yy|Nn (default=N):"
$ECHO -n "> "
read REPLY
if [ -z $REPLY ]; then
LOG_MSG "[FATAL]:-User abort requested, Script Exits!" 1
exit 1
fi
if [ $REPLY != Y ] && [ $REPLY != y ]; then
LOG_MSG "[FATAL]:-User abort requested, Script Exits!" 1
exit 1
fi
}
CHK_FILE () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
FILENAME=$1
FILE_HOST=$2
if [ x"" == x"$FILE_HOST" ];then
LOG_MSG "[INFO]:-Checking file $FILENAME"
if [ ! -s $FILENAME ] || [ ! -r $FILENAME ]
then
EXISTS=1
else
EXISTS=0
fi
else
EXISTS=$( REMOTE_EXECUTE_AND_GET_OUTPUT $FILE_HOST "if [ ! -s $FILENAME ] || [ ! -r $FILENAME ];then $ECHO 1;else $ECHO 0;fi" )
RETVAL=$?
if [ $RETVAL -ne 0 ];then
LOG_MSG "[WARN]:-Failed to obtain details of $FILENAME on $FILE_HOST"
EXISTS=1
fi
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
CHK_DIR () {
# this function might be called very early, before logfiles are initialized
if [ x"" == x"$3" ];then
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
fi
DIR_NAME=$1
DIR_HOST=$2
if [ x"" == x"$DIR_HOST" ];then
EXISTS=`if [ -d $DIR_NAME ];then $ECHO 0;else $ECHO 1;fi`
else
EXISTS=$( REMOTE_EXECUTE_AND_GET_OUTPUT $DIR_HOST "if [ -d $DIR_NAME ];then $ECHO 0;else $ECHO 1;fi" )
RETVAL=$?
if [ $RETVAL -ne 0 ];then
LOG_MSG "[WARN]:-Failed to obtain details of $DIR_NAME on $DIR_HOST" 1
EXISTS=1
fi
fi
if [ x"" == x"$3" ];then
LOG_MSG "[INFO]:-End Function $FUNCNAME"
fi
}
GET_COORDINATOR_PORT () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
COORDINATOR_DATA_DIRECTORY=$1
if [ x"" == x"$COORDINATOR_DATA_DIRECTORY" ];then
ERROR_EXIT "[FATAL]:-COORDINATOR_DATA_DIRECTORY variable not set";fi
if [ ! -d $COORDINATOR_DATA_DIRECTORY ]; then
ERROR_EXIT "[FATAL]:-No $COORDINATOR_DATA_DIRECTORY directory"
fi
if [ -r $COORDINATOR_DATA_DIRECTORY/$PG_CONF ];then
COORDINATOR_PORT=`$AWK 'split($0,a,"#")>0 && split(a[1],b,"=")>1 {print b[1] " " b[2]}' $COORDINATOR_DATA_DIRECTORY/$PG_CONF | $AWK '$1=="port" {print $2}' | $TAIL -1`
if [ x"" == x"$COORDINATOR_PORT" ] ; then
#look for include files
for INC_FILE in `$AWK '/^[ ]*include /{print $2}' $COORDINATOR_DATA_DIRECTORY/$PG_CONF | $TR -d "'\""` ; do
if [[ $INC_FILE == /* ]] ; then
GET_COORDINATOR_PORT_RECUR "$INC_FILE" 1
else
GET_COORDINATOR_PORT_RECUR "$COORDINATOR_DATA_DIRECTORY/$INC_FILE" 1
fi
done
if [ x"" == x"$COORDINATOR_PORT" ] ; then
ERROR_EXIT "[FATAL]:-Failed to obtain coordinator port number from $COORDINATOR_DATA_DIRECTORY/$PG_CONF"
fi
fi
else
ERROR_EXIT "[FATAL]:-Do not have read access to $COORDINATOR_DATA_DIRECTORY/$PG_CONF"
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
GET_COORDINATOR_PORT_RECUR () {
INCLUDED_FILE=$1
RECUR=$2
if [ $RECUR -le 10 ] ; then
COORDINATOR_PORT=`$AWK 'split($0,a,"#")>0 && split(a[1],b,"=")>1 {print b[1] " " b[2]}' $INCLUDED_FILE | $AWK '$1=="port" {print $2}' | $TAIL -1`
if [ x"" == x"$COORDINATOR_PORT" ] ; then
#look for include files
let CURR_DEPTH=$RECUR+1
for INC_FILE in `$AWK '/^[ ]*include /{print $2}' $INC_FILE | $TR -d "'\""` ; do
if [[ $INC_FILE == /* ]] ; then
GET_COORDINATOR_PORT_RECUR "$INC_FILE" $CURR_DEPTH
else
GET_COORDINATOR_PORT_RECUR "$COORDINATOR_DATA_DIRECTORY/$INC_FILE" $CURR_DEPTH
fi
if [ x"" != x"$COORDINATOR_PORT" ] ; then
break
fi
done
fi
else
ERROR_EXIT "[FATAL]:-Could not open configuration file \"$INCLUDED_FILE\": maximum nesting depth exceeded"
fi
}
GET_CIDRADDR () {
# MPP-15889
# assuming argument is an ip address, return the address
# with a /32 or /128 cidr suffix based on whether or not the
# address contains a :
if [ `echo $1 | grep -c :` -gt 0 ]; then
echo $1/128
else
echo $1/32
fi
}
BUILD_COORDINATOR_PG_HBA_FILE () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
if [ $# -eq 0 ];then ERROR_EXIT "[FATAL]:-Passed zero parameters, expected at least 2";fi
GP_DIR=$1
HBA_HOSTNAMES=${2:-0}
LOG_MSG "[INFO]:-Clearing values in Coordinator $PG_HBA"
$GREP "^#" ${GP_DIR}/$PG_HBA > $TMP_PG_HBA
$MV $TMP_PG_HBA ${GP_DIR}/$PG_HBA
LOG_MSG "[INFO]:-Setting local access"
$ECHO "local all $USER_NAME $PG_METHOD" >> ${GP_DIR}/$PG_HBA
#$ECHO "local all all $PG_METHOD" >> ${GP_DIR}/$PG_HBA
LOG_MSG "[INFO]:-Setting local host access"
if [ $HBA_HOSTNAMES -eq 0 ];then
$ECHO "host all $USER_NAME 127.0.0.1/28 trust" >> ${GP_DIR}/$PG_HBA
for ADDR in "${COORDINATOR_IP_ADDRESS_ALL[@]}"
do
# MPP-15889
CIDRADDR=$(GET_CIDRADDR $ADDR)
$ECHO "host all $USER_NAME $CIDRADDR trust" >> ${GP_DIR}/$PG_HBA
done
for ADDR in "${STANDBY_IP_ADDRESS_ALL[@]}"
do
# MPP-15889
CIDRADDR=$(GET_CIDRADDR $ADDR)
$ECHO "host all $USER_NAME $CIDRADDR trust" >> ${GP_DIR}/$PG_HBA
done
# Add all local IPV6 addresses
for ADDR in "${COORDINATOR_IPV6_LOCAL_ADDRESS_ALL[@]}"
do
# MPP-15889
CIDRADDR=$(GET_CIDRADDR $ADDR)
$ECHO "host all $USER_NAME $CIDRADDR trust" >> ${GP_DIR}/$PG_HBA
done
else
$ECHO "host all $USER_NAME localhost trust" >> ${GP_DIR}/$PG_HBA
$ECHO "host all $USER_NAME $COORDINATOR_HOSTNAME trust" >> ${GP_DIR}/$PG_HBA
fi
# Add replication config
$ECHO "local replication $USER_NAME $PG_METHOD" >> ${GP_DIR}/$PG_HBA
# Add the samehost replication entry to support single-host development
$ECHO "host replication $USER_NAME samehost trust" >> ${GP_DIR}/$PG_HBA
if [ $HBA_HOSTNAMES -eq 0 ];then
local COORDINATOR_IP_ADDRESS_NO_LOOPBACK=($("$GPHOME"/libexec/ifaddrs --no-loopback))
if [ x"" != x"$STANDBY_HOSTNAME" ] && [ "$STANDBY_HOSTNAME" != "$COORDINATOR_HOSTNAME" ];then
local STANDBY_IP_ADDRESS_NO_LOOPBACK=($( REMOTE_EXECUTE_AND_GET_OUTPUT $STANDBY_HOSTNAME "'$GPHOME'/libexec/ifaddrs --no-loopback" ))
fi
for ADDR in "${COORDINATOR_IP_ADDRESS_NO_LOOPBACK[@]}" "${STANDBY_IP_ADDRESS_NO_LOOPBACK[@]}"
do
CIDRADDR=$(GET_CIDRADDR $ADDR)
$ECHO "host replication $USER_NAME $CIDRADDR trust" >> ${GP_DIR}/$PG_HBA
done
else
$ECHO "host replication $USER_NAME $COORDINATOR_HOSTNAME trust" >> ${GP_DIR}/$PG_HBA
if [ x"" != x"$STANDBY_HOSTNAME" ] && [ "$STANDBY_HOSTNAME" != "$COORDINATOR_HOSTNAME" ];then
$ECHO "host replication $USER_NAME $STANDBY_HOSTNAME trust" >> ${GP_DIR}/$PG_HBA
fi
fi
if [ "$CLUSTER_BOOT_MODE" = "PRODUCTION" ] && [ $USE_EXTERNAL_FTS -ne 0 ];then
for fts in ${FTS_HOST_MACHINE_LIST[*]}
do
if [ ! "$FTS_HOST" = "$COORDINATOR_HOSTNAME" ];then
$ECHO "host all $USER_NAME $fts trust" >> ${GP_DIR}/$PG_HBA
$ECHO "hostssl all $USER_NAME $fts trust" >> ${GP_DIR}/$PG_HBA
fi
done
fi
LOG_MSG "[INFO]:-Complete Coordinator $PG_HBA configuration"
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
BUILD_GPSSH_CONF () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
if [ $# -eq 0 ];then ERROR_EXIT "[FATAL]:-Passed zero parameters, expected at least 1";fi
GP_DIR=$1
$CAT <<_EOF_ >> $GP_DIR/gpssh.conf
[gpssh]
# delaybeforesend specifies the time in seconds to wait at the
# beginning of an ssh interaction before doing anything.
# Increasing this value can have a big runtime impact at the
# beginning of gpssh.
delaybeforesend = 0.05
# prompt_validation_timeout specifies a timeout multiplier that
# will be used in validating the ssh prompt. Increasing this
# value will have a small runtime impact at the beginning of
# gpssh.
prompt_validation_timeout = 1.0
# sync_retries specifies how many times to try the pxssh
# connection verification.
# Setting this value to 1 means gpssh will immediately pass
# along pxssh's best effort.
# Increasing this value will allow for slow network connections,
# cpu load, or other slowness on the segment host, but will
# also delay feedback when a connection cannot be established
# for other reasons
sync_retries = 3
_EOF_
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
GET_PG_PID_ACTIVE () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
# Expects port number and hostname for remote checking
PORT=$1;shift
HOST=$1
PG_LOCK_FILE="/tmp/.s.PGSQL.${PORT}.lock"
PG_LOCK_SS=""
if [ x"" == x"$HOST" ];then
#See if we have a ss entry for this local host
PORT_ARRAY=(`$SS -an 2>/dev/null |$AWK '{for (i =1; i<=NF ; i++) if ($i==".s.PGSQL.${PORT}") print $i}'|$AWK -F"." '{print $NF}'|$SORT -u`)
for P_CHK in ${PORT_ARRAY[@]}
do
if [ $P_CHK -eq $PORT ];then PG_LOCK_SS=$PORT;fi
done
#See if we have a lock file in /tmp
if [ -f ${PG_LOCK_FILE} ];then
PG_LOCK_TMP=1
else
PG_LOCK_TMP=0
fi
if [ x"" == x"$PG_LOCK_SS" ] && [ $PG_LOCK_TMP -eq 0 ];then
PID=0
LOG_MSG "[INFO]:-No socket connection or lock file in /tmp found for port=${PORT}"
else
#Now check the failure combinations
if [ $PG_LOCK_TMP -eq 0 ] && [ x"" != x"$PG_LOCK_SS" ];then
#Have a process but no lock file
LOG_MSG "[WARN]:-No lock file $PG_LOCK_FILE but process running on port $PORT" 1
PID=1
fi
if [ $PG_LOCK_TMP -eq 1 ] && [ x"" == x"$PG_LOCK_SS" ];then
#Have a lock file but no process
if [ -r ${PG_LOCK_FILE} ];then
PID=`$CAT ${PG_LOCK_FILE}|$HEAD -1|$AWK '{print $1}'`
else
LOG_MSG "[WARN]:-Unable to access ${PG_LOCK_FILE}" 1
PID=1
fi
LOG_MSG "[WARN]:-Have lock file $PG_LOCK_FILE but no process running on port $PORT" 1
fi
if [ $PG_LOCK_TMP -eq 1 ] && [ x"" != x"$PG_LOCK_SS" ];then
#Have both a lock file and a ss process
if [ -r ${PG_LOCK_FILE} ];then
PID=`$CAT ${PG_LOCK_FILE}|$HEAD -1|$AWK '{print $1}'`
else
LOG_MSG "[WARN]:-Unable to access ${PG_LOCK_FILE}" 1
PID=1
fi
LOG_MSG "[INFO]:-Have lock file $PG_LOCK_FILE and a process running on port $PORT"
fi
fi
else
PING_HOST $HOST 1
if [ $RETVAL -ne 0 ];then
PID=0
else
PORT_ARRAY=($( REMOTE_EXECUTE_AND_GET_OUTPUT $HOST "$SS -an 2>/dev/null" |$AWK '{for (i =1; i<=NF ; i++) if ($i==".s.PGSQL.${PORT}") print $i}'|$AWK -F"." '{print $NF}'|$SORT -u))
for P_CHK in ${PORT_ARRAY[@]}
do
if [ $P_CHK -eq $PORT ];then PG_LOCK_SS=$PORT;fi
done
PG_LOCK_TMP=$( REMOTE_EXECUTE_AND_GET_OUTPUT $HOST "ls ${PG_LOCK_FILE} 2>/dev/null|$WC -l" )
if [ x"" == x"$PG_LOCK_SS" ] && [ $PG_LOCK_TMP -eq 0 ];then
PID=0
LOG_MSG "[INFO]:-No socket connection or lock file $PG_LOCK_FILE found for port=${PORT}"
else
#Now check the failure combinations
if [ $PG_LOCK_TMP -eq 0 ] && [ x"" != x"$PG_LOCK_SS" ];then
#Have a process but no lock file
LOG_MSG "[WARN]:-No lock file $PG_LOCK_FILE but process running on port $PORT on $HOST" 1
PID=1
fi
if [ $PG_LOCK_TMP -eq 1 ] && [ x"" == x"$PG_LOCK_SS" ];then
#Have a lock file but no process
CAN_READ=$( REMOTE_EXECUTE_AND_GET_OUTPUT $HOST "if [ -r ${PG_LOCK_FILE} ];then echo 1;else echo 0;fi" )
if [ $CAN_READ -eq 1 ];then
PID=$( REMOTE_EXECUTE_AND_GET_OUTPUT $HOST "$CAT ${PG_LOCK_FILE}|$HEAD -1 2>/dev/null" | $AWK '{print $1}' )
else
LOG_MSG "[WARN]:-Unable to access ${PG_LOCK_FILE} on $HOST" 1
fi
LOG_MSG "[WARN]:-Have lock file $PG_LOCK_FILE but no process running on port $PORT on $HOST" 1
PID=1
fi
if [ $PG_LOCK_TMP -eq 1 ] && [ x"" != x"$PG_LOCK_SS" ];then
#Have both a lock file and a ss process
CAN_READ=$( REMOTE_EXECUTE_AND_GET_OUTPUT $HOST "if [ -r ${PG_LOCK_FILE} ];then echo 1;else echo 0;fi" )
if [ $CAN_READ -eq 1 ];then
PID=$( REMOTE_EXECUTE_AND_GET_OUTPUT $HOST "$CAT ${PG_LOCK_FILE}|$HEAD -1 2>/dev/null"|$AWK '{print $1}' )
else
LOG_MSG "[WARN]:-Unable to access ${PG_LOCK_FILE} on $HOST" 1
fi
LOG_MSG "[INFO]:-Have lock file $PG_LOCK_FILE and a process running on port $PORT on $HOST"
fi
fi
fi
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
RUN_COMMAND_REMOTE () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
HOST=$1
COMMAND=$2
LOG_MSG "[INFO]:-Commencing remote $TRUSTED_SHELL $HOST $COMMAND"
$TRUSTED_SHELL $HOST $COMMAND >> $LOG_FILE 2>&1
RETVAL=$?
if [ $RETVAL -ne 0 ]; then
LOG_MSG "[FATAL]:- Command $COMMAND on $HOST failed with error status $RETVAL" 2
else
LOG_MSG "[INFO]:-Completed $TRUSTED_SHELL $HOST $COMMAND"
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
return $RETVAL
}
BACKOUT_COMMAND () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
COMMAND=$1
if [ ! -f $BACKOUT_FILE ]; then
$ECHO $COMMAND > $BACKOUT_FILE
else
$CAT $BACKOUT_FILE > /tmp/backout_file.tmp.$$
$ECHO $COMMAND > $BACKOUT_FILE
$CAT /tmp/backout_file.tmp.$$ >> $BACKOUT_FILE
$RM -f /tmp/backout_file.tmp.$$
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
PING_HOST () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
TARGET_HOST=$1;shift
PING_EXIT=$1
if [ x"" == x"$PING_EXIT" ];then PING_EXIT=0;fi
OUTPUT=""
case $OS_TYPE in
darwin )
OUTPUT=$($PING $PING_TIME $TARGET_HOST 2>&1 || $PING6 $PING_TIME $TARGET_HOST 2>&1)
;;
linux )
OUTPUT=$($PING $TARGET_HOST $PING_TIME 2>&1 || $PING6 $TARGET_HOST $PING_TIME 2>&1)
;;
openbsd )
OUTPUT=$($PING $PING_TIME $TARGET_HOST 2>&1 || $PING6 $PING_TIME $TARGET_HOST 2>&1)
;;
* )
OUTPUT=$($PING $TARGET_HOST $PING_TIME 2>&1)
esac
RETVAL=$?
case $RETVAL in
0) LOG_MSG "[INFO]:-$TARGET_HOST contact established"
;;
1) if [ $PING_EXIT -eq 0 ];then
ERROR_EXIT "[FATAL]:-Unable to contact $TARGET_HOST: $OUTPUT"
else
LOG_MSG "[WARN]:-Unable to contact $TARGET_HOST: $OUTPUT" 1
fi
;;
2) if [ $PING_EXIT -eq 0 ];then
ERROR_EXIT "[FATAL]:-Unknown host $TARGET_HOST: $OUTPUT"
else
LOG_MSG "[WARN]:-Unknown host $TARGET_HOST: $OUTPUT" 1
fi
;;
*) if [ $PING_EXIT -eq 0 ];then
ERROR_EXIT "[FATAL]:-Cannot ping host $TARGET_HOST: $OUTPUT"
else
LOG_MSG "[WARN]:-Cannot ping host $TARGET_HOST: $OUTPUT" 1
fi
;;
esac
LOG_MSG "[INFO]:-End Function $FUNCNAME"
return $RETVAL
}
PARALLEL_SETUP () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
PARALLEL_STATUS_FILE=$1
$TOUCH $PARALLEL_STATUS_FILE
export PARALLEL_STATUS_FILE=$PARALLEL_STATUS_FILE
LOG_MSG "[INFO]:-Spawning parallel processes batch [1], please wait..." 1
BATCH_COUNT=0
INST_COUNT=0
BATCH_DONE=1
BATCH_TOTAL=0
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
PARALLEL_COUNT () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
if [ $# -ne 2 ];then ERROR_EXIT "[FATAL]:-Incorrect number of parameters passed to $FUNCNAME";fi
BATCH_LIMIT=$1
BATCH_DEFAULT=$2
((INST_COUNT=$INST_COUNT+1))
((BATCH_COUNT=$BATCH_COUNT+1))
((BATCH_TOTAL=$BATCH_TOTAL+1))
if [ $BATCH_COUNT -eq $BATCH_DEFAULT ] || [ $BATCH_LIMIT -eq $BATCH_TOTAL ];then
if [ $DEBUG_LEVEL -eq 0 ] && [ x"" != x"$VERBOSE" ];then $ECHO;fi
PARALLEL_WAIT
((BATCH_DONE=$BATCH_DONE+1))
BATCH_COUNT=0
if [ $BATCH_LIMIT -ne $BATCH_TOTAL ];then
LOG_MSG "[INFO]:-Spawning parallel processes batch [$BATCH_DONE], please wait..." 1
fi
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
PARALLEL_WAIT () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
LOG_MSG "[INFO]:-Waiting for parallel processes batch [$BATCH_DONE], please wait..." 1
SLEEP_COUNT=0
while [ `$WC -l $PARALLEL_STATUS_FILE|$AWK '{print $1}'` -ne $INST_COUNT ]
do
if [ $DEBUG_LEVEL -eq 0 ] && [ x"" != x"$VERBOSE" ];then $NOLINE_ECHO ".\c";fi
$SLEEP 1
((SLEEP_COUNT=$SLEEP_COUNT+1))
if [ $WAIT_LIMIT -lt $SLEEP_COUNT ];then
if [ $DEBUG_LEVEL -eq 0 ] && [ x"" != x"$VERBOSE" ];then $NOLINE_ECHO ".\c";fi
LOG_MSG "[FATAL]:-Failed to process this batch of segments within $WAIT_LIMIT seconds" 1
LOG_MSG "[INFO]:-Review contents of $LOG_FILE" 1
ERROR_EXIT "[FATAL]:-Process timeout failure"
fi
done
if [ $DEBUG_LEVEL -eq 0 ] && [ x"" != x"$VERBOSE" ];then $ECHO;fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
PARALLEL_SUMMARY_STATUS_REPORT () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
REPORT_FAIL=0
if [ -f $1 ];then
KILLED_COUNT=`$GREP -c "KILLED:" $PARALLEL_STATUS_FILE`
COMPLETED_COUNT=`$GREP -c "COMPLETED:" $PARALLEL_STATUS_FILE`
FAILED_COUNT=`$GREP -c "FAILED:" $PARALLEL_STATUS_FILE`
((TOTAL_FAILED_COUNT=$KILLED_COUNT+$FAILED_COUNT))
LOG_MSG "[INFO]:------------------------------------------------" 1
LOG_MSG "[INFO]:-Parallel process exit status" 1
LOG_MSG "[INFO]:------------------------------------------------" 1
LOG_MSG "[INFO]:-Total processes marked as completed = $COMPLETED_COUNT" 1
if [ $KILLED_COUNT -ne 0 ];then
LOG_MSG "[WARN]:-Total processes marked as killed = $KILLED_COUNT $WARN_MARK" 1
REPORT_FAIL=1
else
LOG_MSG "[INFO]:-Total processes marked as killed = 0" 1
fi
if [ $FAILED_COUNT -ne 0 ];then
LOG_MSG "[WARN]:-Total processes marked as failed = $FAILED_COUNT $WARN_MARK" 1
REPORT_FAIL=1
else
LOG_MSG "[INFO]:-Total processes marked as failed = 0" 1
fi
LOG_MSG "[INFO]:------------------------------------------------" 1
else
LOG_MSG "[WARN]:-Could not locate status file $1" 1
REPORT_FAIL=1
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
CHK_GPDB_ID () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
if [ -f ${INITDB} ];then
PERMISSION=`ls -al ${INITDB}|$AWK '{print $1}'`
COORDINATOR_INITDB_ID=`ls -al ${INITDB}|$AWK '{print $3}'`
INIT_CHAR=`$ECHO $COORDINATOR_INITDB_ID|$TR -d '\n'|$WC -c|$TR -d ' '`
COORDINATOR_INITDB_GROUPID=`ls -al ${INITDB}|$AWK '{print $4}'`
GROUP_INIT_CHAR=`$ECHO $COORDINATOR_INITDB_ID|$TR -d '\n'|$WC -c|$TR -d ' '`
GPDB_ID=`id|$TR '(' ' '|$TR ')' ' '|$AWK '{print $2}'`
GPDB_GROUPID=`id|$TR '(' ' '|$TR ')' ' '|$AWK '{print $4}'`
USER_EXECUTE=`$ECHO $PERMISSION | $SED -e 's/...\(.\).*/\1/g'`
GROUP_EXECUTE=`$ECHO $PERMISSION | $SED -e 's/......\(.\).*/\1/g'`
if [ `$ECHO $GPDB_ID|$TR -d '\n'|$WC -c` -gt $INIT_CHAR ];then
GPDB_ID_CHK=`$ECHO $GPDB_ID|$CUT -c1-$INIT_CHAR`
else
GPDB_ID_CHK=$GPDB_ID
fi
if [ `$ECHO $GPDB_GROUPID|$TR -d '\n'|$WC -c` -gt $GROUP_INIT_CHAR ];then
GPDB_GROUPID_CHK=`$ECHO $GPDB_GROUPID|$CUT -c1-$GROUP_INIT_CHAR`
else
GPDB_GROUPID_CHK=$GPDB_GROUPID
fi
if [ x$GPDB_ID_CHK == x$COORDINATOR_INITDB_ID ] && [ x"x" == x"$USER_EXECUTE" ];then
LOG_MSG "[INFO]:-Current user id of $GPDB_ID, matches initdb id of $COORDINATOR_INITDB_ID"
elif [ x$GPDB_GROUPID_CHK == x$COORDINATOR_INITDB_GROUPID ] && [ x"x" == x"$GROUP_EXECUTE" ] ; then
LOG_MSG "[INFO]:-Current group id of $GPDB_GROUPID, matches initdb group id of $COORDINATOR_INITDB_GROUPID"
else
LOG_MSG "[WARN]:-File permission mismatch. The $GPDB_ID_CHK owns the Apache Cloudberry installation directory."
LOG_MSG "[WARN]:-You are currently logged in as $COORDINATOR_INITDB_ID and may not have sufficient"
LOG_MSG "[WARN]:-permissions to run the Cloudberry binaries and management utilities."
fi
if [ x"" != x"$USER" ];then
if [ `$ECHO $USER|$TR -d '\n'|$WC -c` -gt $INIT_CHAR ];then
USER_CHK=`$ECHO $USER|$CUT -c1-$INIT_CHAR`
else
USER_CHK=$USER
fi
if [ x$GPDB_ID_CHK != x$USER_CHK ];then
LOG_MSG "[WARN]:-\$USER mismatch, id returns $GPDB_ID, \$USER returns $USER" 1
LOG_MSG "[WARN]:-The GPDB superuser account that owns the initdb binary should run these utilities" 1
LOG_MSG "[WARN]:-This may cause problems when these utilities are run as $USER" 1
fi
else
LOG_MSG "[INFO]:-Environment variable \$USER unset, will set to $GPDB_ID" 1
export USER=$GPDB_ID
fi
if [ x"" != x"$LOGNAME" ];then
if [ `$ECHO $LOGNAME|$TR -d '\n'|$WC -c` -gt $INIT_CHAR ];then
LOGNAME_CHK=`$ECHO $LOGNAME|$CUT -c1-$INIT_CHAR`
else
LOGNAME_CHK=$LOGNAME
fi
if [ x$GPDB_ID_CHK != x$LOGNAME_CHK ];then
LOG_MSG "[WARN]:-\$LOGNAME mismatch, id returns $GPDB_ID_CHK, \$LOGNAME returns $LOGNAME_CHK" 1
LOG_MSG "[WARN]:-The GPDB superuser account that owns the initdb binary should run these utilities" 1
LOG_MSG "[WARN]:-This may cause problems when these utilities are run as $LOGNAME" 1
fi
else
LOG_MSG "[INFO]:-Environment variable \$LOGNAME unset, will set to $GPDB_ID" 1
export LOGNAME=$GPDB_ID
fi
else
LOG_MSG "[WARN]:-No initdb file, unable to verify id" 1
fi
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
SET_GP_USER_PW () {
LOG_MSG "[INFO]:-Start Function $FUNCNAME"
local alter_statement="alter user :\"username\" password :'password';"
$PSQL --variable=ON_ERROR_STOP=1 \
-p $COORDINATOR_PORT \
-d "$DEFAULTDB" \
--variable=username="$USER_NAME" \
--variable=password="$GP_PASSWD" <<< "$alter_statement" >> $LOG_FILE 2>&1
ERROR_CHK $? "update Cloudberry superuser password" 1
LOG_MSG "[INFO]:-End Function $FUNCNAME"
}
RESOLVE_HOSTNAME() {
if [ "$#" -ne 1 ]
then
echo "RESOLVE_HOSTNAME invalid params..."
fi
HOSTNAME=$1
HOSTIP=`getent hosts $HOSTNAME | awk '{ print $1 }'`
echo "$HOSTIP"
}
OUTPUT_HOST_TO_FILE() {
if [ "$#" -ne 2 ];then
LOG_MSG "[ERROR]: OUTPUT_CONFIG invalid params..."
fi
CONFIG_FILE=$1
HOST=$2
local config_dir=${COORDINATOR_DIRECTORY}/${SEG_PREFIX}-1/config
local config_file=$config_dir/$CONFIG_FILE
if [ ! -d $config_dir ];then
mkdir -p $config_dir
fi
echo $HOST >> $config_file
}
PRECHECK_CBDB_CONFIG_FILE() {
local config_dir=$COORDINATOR_DATA_DIRECTORY/config
if [ -d $config_dir ];then
rm -rf $config_dir
fi
}
CLEANUP_ETCD() {
if [ "$#" -ne 1 ];then
LOG_MSG "[ERROR]: RETRIVE_ETCD_CONFIG_VAL invalid params..."
fi
local etcd_account_id=`RETRIVE_ETCD_CONFIG_VAL $ETCD_ACCOUNT_ID`
local etcd_cluster_id=`RETRIVE_ETCD_CONFIG_VAL $ETCD_CLUSTER_ID`
local etcd_namespace=`RETRIVE_ETCD_CONFIG_VAL $ETCD_NAMESPACE`
local etcd_endpoints=`RETRIVE_ETCD_CONFIG_VAL $ETCD_ENDPOINTS`
if [ \( ! "$etcd_account_id" = "" \) -a \( ! "$etcd_cluster_id" = "" \) -a \( ! "$etcd_namespace" = "" \) -a \( ! "$etcd_endpoints" = "" \) ];then
local etcd_key="/cbdb/fts/default/$etcd_account_id/$etcd_cluster_id/$etcd_namespace/fts_dump_file_key"
etcd_cleanup_res=`export ETCDCTL_API=3;etcdctl --endpoints=$etcd_endpoints del $etcd_key`
if [ "$etcd_cleanup_res" = "1" ]; then
ERROR_EXIT "[FATAL]: ETCD HOST key cleanup failed with key: $etcd_key, result: $etcd_cleanup_res"
fi
else
LOG_MSG "[WARNING]: CLEANUP_ETCD skipped caused by inproper key."
fi
}
RETRIVE_ETCD_CONFIG_VAL() {
if [ "$#" -ne 1 ];then
LOG_MSG "[ERROR]: RETRIVE_ETCD_CONFIG_VAL invalid params..."
fi
ETCD_CONFIG_VAL=$1
local tmpstr=`cat $ETCD_CONFIG_FILE_PATH | grep $ETCD_CONFIG_VAL | sed "s/['\"]//g"`
ETCD_CONFIG_VAL_RES=${tmpstr#*=}
echo "$ETCD_CONFIG_VAL_RES"
}
SETUP_ETCD () {
if [ "$#" -ne 4 ];then
LOG_MSG "[ERROR]: SETUP_ETCD invalid params..."
fi
ETCD_HOST=$1
ETCD_HOST_LIST=$2
ETCD_HOST_NUM=$3
ETCD_START_MODE=$4
ETCD_IP=`RESOLVE_HOSTNAME $ETCD_HOST`
if [ "$ETCD_START_MODE" = "DEMO" ];then
nohup etcd > /dev/null 2>&1 &
else
ETCD_START_CMD="nohup ${GPHOME}/bin/etcd --name ${ETCD_HOST_NUM} --listen-client-urls http://${ETCD_IP}:2379,http://127.0.0.1:2379 --advertise-client-urls http://${ETCD_IP}:2379 --listen-peer-urls http://${ETCD_IP}:2380 --initial-advertise-peer-urls http://${ETCD_IP}:2380 --initial-cluster-token etcd-cluster-1 --initial-cluster ${ETCD_HOST_LIST} --initial-cluster-state new --enable-pprof &"
gpssh -h $ETCD_HOST -e "${ETCD_START_CMD}"
fi
LOG_MSG "[INFO]: ETCD already installed on host $ETCD_HOST"
}
CHECK_ETCD () {
ret=1
if [ "$#" -ne 2 ];then
LOG_MSG "[ERROR]: CHECK_ETCD invalid params..."
fi
ETCD_HOST=$1
ETCD_START_MODE=$2
if [ "$ETCD_START_MODE" = "DEMO" ];then
ETCD_CHECK_CMD="ps -ef | grep -i 'etcd' | grep -v 'grep'"
else
ETCD_CHECK_CMD="ps -ef | grep -i 'etcd' | grep 'initial-cluster' | grep -v 'grep'"
fi
ETCD_PROCESS_RES=`gpssh -h ${ETCD_HOST} -e "${ETCD_CHECK_CMD}" | wc -l`
if [ ! "$ETCD_PROCESS_RES" -eq "1" ]; then
ret=0
fi
return $ret
}
SETUP_FTS() {
if [ "$#" -ne 3 ];then
LOG_MSG "[ERROR]: SETUP_FTS invalid params..."
fi
FTS_HOST=$1
FTS_LOG_DIR=$2
FTS_START_MODE=$3
if [ "$FTS_START_MODE" = "DEMO" ];then
nohup $GPHOME/bin/gpsync -F $GPHOME/bin/config/cbdb_etcd_default.conf -d ${FTS_LOG_DIR}/log/fts -D -C -a >/dev/null 2>&1 &
else
gpsync -h ${FTS_HOST} $ETCD_CONFIG_FILE_PATH =:${ETCD_CONFIG_TMP_FILE}
FTS_CMD="mkdir -p ${FTS_LOG_DIR}/log/fts;nohup ${GPHOME}/bin/gpfts -F ${ETCD_CONFIG_TMP_FILE} -d ${FTS_LOG_DIR}/log/fts >/dev/null 2>&1 &"
gpssh -h ${FTS_HOST} -e "${FTS_CMD}"
fi
OUTPUT_HOST_TO_FILE $FTS_HOST_FILE $ETCD_HOST
LOG_MSG "[INFO]: FTS already installed on host $FTS_HOST"
}
CHECK_FTS () {
ret=1
if [ "$#" -ne 2 ];then
LOG_MSG "[ERROR]: CHECK_FTS invalid params..."
fi
FTS_HOST=$1
FTS_CHECK_CMD="ps -ef | grep -i 'gpfts' | grep -v grep"
FTS_PROCESS_RES=`gpssh -h ${FTS_HOST} -e "${FTS_CHECK_CMD}" | wc -l`
if [ ! "$FTS_PROCESS_RES" -eq "1" ]; then
ret=0
fi
return $ret
}
SET_VAR () {
#
# MPP-13617: If segment contains a ~, we assume ~ is the field delimiter.
# Otherwise we assume : is the delimiter. This allows us to easily
# handle IPv6 addresses which may contain a : by using a ~ as a delimiter.
#
I=$1
case $I in
*~*)
S="~"
;;
*)
S=":"
;;
esac
GP_HOSTNAME=`$ECHO $I|$CUT -d$S -f1`
GP_HOSTADDRESS=`$ECHO $I|$CUT -d$S -f2`
GP_PORT=`$ECHO $I|$CUT -d$S -f3`
GP_DIR=`$ECHO $I|$CUT -d$S -f4`
GP_DBID=`$ECHO $I|$CUT -d$S -f5`
GP_CONTENT=`$ECHO $I|$CUT -d$S -f6`
}
#******************************************************************************
# Main Section
#******************************************************************************
#******************************************************************************
# Setup logging directory
#******************************************************************************
CUR_DATE=`$DATE +%Y%m%d`
DEFLOGDIR=$HOME/gpAdminLogs
if [ ! -d $DEFLOGDIR ]; then
mkdir $DEFLOGDIR
fi
LOG_FILE=$DEFLOGDIR/${PROG_NAME}_${CUR_DATE}.log
#Set up OS type for scripts to change command lines
OS_TYPE=`uname -s|tr '[A-Z]' '[a-z]'`
case $OS_TYPE in
linux ) IPV4_ADDR_LIST_CMD="$IP -4 address show"
IPV6_ADDR_LIST_CMD="$IP -6 address show"
PS_TXT="ax"
LIB_TYPE="LD_LIBRARY_PATH"
PG_METHOD="ident"
HOST_ARCH_TYPE="uname -i"
NOLINE_ECHO="$ECHO -e"
PING6=`findCmdInPath ping6`
PING_TIME="-c 1"
;;
darwin ) IFCONFIG=`findCmdInPath ifconfig`
IPV4_ADDR_LIST_CMD="$IFCONFIG -a inet"
IPV6_ADDR_LIST_CMD="$IFCONFIG -a inet6"
PS_TXT="ax"
LIB_TYPE="DYLD_LIBRARY_PATH"
# Darwin zcat wants to append ".Z" to the end of the file name; use "gunzip -c" instead
PG_METHOD="ident"
HOST_ARCH_TYPE="uname -m"
NOLINE_ECHO=$ECHO
PING6=`findCmdInPath ping6`
PING_TIME="-c 1"
;;
freebsd ) IFCONFIG=`findCmdInPath ifconfig`
IPV4_ADDR_LIST_CMD="$IFCONFIG -a inet"
IPV6_ADDR_LIST_CMD="$IFCONFIG -a inet6"
LIB_TYPE="LD_LIBRARY_PATH"
PG_METHOD="ident"
HOST_ARCH_TYPE="uname -m"
NOLINE_ECHO="$ECHO -e"
PING_TIME="-c 1"
;;
openbsd ) IPV4_ADDR_LIST_CMD="ifconfig -a inet"
IPV6_ADDR_LIST_CMD="ifconfig -a inet6"
LIB_TYPE="LD_LIBRARY_PATH"
PG_METHOD="ident"
HOST_ARCH_TYPE="uname -m"
NOLINE_ECHO="echo -e"
PING_TIME="-c 1"
DF="df -P"
;;
* ) echo unknown ;;
esac
GP_LIBRARY_PATH=`$DIRNAME \`$DIRNAME $INITDB\``/lib
##
# we setup some EXPORT foo='blah' commands for when we dispatch to segments and standby coordinator
##
EXPORT_GPHOME='export GPHOME='$GPHOME
if [ x"$LIB_TYPE" == x"LD_LIBRARY_PATH" ]; then
EXPORT_LIB_PATH="export LD_LIBRARY_PATH=$LD_LIBRARY_PATH"
else
EXPORT_LIB_PATH="export DYLD_LIBRARY_PATH=$DYLD_LIBRARY_PATH"
fi