#! /bin/ksh
#
#	Copyright 29 Sep 1997 Sun Microsystems, Inc.  All Rights Reserved.
#
# @(#)hasybase_fmon_start.shs	1.22	97/09/29 SMI
#
# hasybase_fmon_start - start an Sybase fault monitor (hasybase_fmon) for the
#			server #1
#
# Environment:
# HA_ENV - file name of HA environment file
# HA_METASETSERVE - list of the logical hosts to run on the local host
# HA_SIBLING_METASETSERVE - list of the logical hosts not on local host
#

# make sure we reread HA_ENV (might have changed)
# setting HA_CLUSTER to "" forces a re-read in sybase_boiler
#HA_ENV=/var/opt/SUNWhadf/hadf/ha_env
HA_CLUSTER=""
#	Copyright 10 Sep 1997 Sun Microsystems, Inc.  All Rights Reserved.
#
# @(#)sybase_boiler	1.24 97/09/10 SMI

# begin of common ha-dbms boilerplate

# remember our name
argv0=`basename $0`

# Get the BASEDIR and PRODUCTDIR settings from the installed pkgs
_basedir=`pkgparam SUNWscsyb BASEDIR 2>/dev/null`
_productdir=`pkgparam SUNWscsyb PRODUCTDIR 2>/dev/null`
_basedir=${_basedir:=""}
_productdir=${_productdir:="SUNWcluster"}

LOGGER=/usr/bin/logger

PATH=${_basedir}/${_productdir}/bin:${_basedir}/${_productdir}/ha/sybase:${PATH}
export PATH
HA_FILES=/etc/${_basedir}/SUNWscsyb; export HA_FILES
HA_VAR=/var/${_basedir}/SUNWscsyb; export HA_VAR

# include HA utilities library
. dbms_utilities
if [ $? -ne 0 ]; then
	$LOGGER -p local7.err -t "$HA_SLOGTAG" "$argv0: Cannot find HA utilities library"
	exit 1
fi

HA_CLUSTER=$CLUSTNAME; export HA_CLUSTER

# some default files and locations
# don't move this up - it depends on HA_FILES, which gets set above
HA_DATABASES=hasybase_databases
HA_DB_SUPPORT=${HA_FILES}/hasybase_support
ds="sybase"

PREFIX="SUNWcluster.ha.${ds}"
HA_FM_NAME="fault_mon"

# verify that we have the hasybase_support file
if [ ! -r $HA_DB_SUPPORT ] ; then
  logerr "4000" \
	"file ${HA_DB_SUPPORT} does not exist or is not readable!"
  exit 2
fi


# talk_start ... - echo the args, run them, and evaluate return value
talk_start() {
  	logprint "$$: $*"
  	if $* ; then
    		return 0
  	else
    		logprint "$$: $* ... failed"
    		return 1
  	fi
}


# talk_start_bg ... - print the args, then run them in the background
talk_start_bg() {
  	logprint "$$: $*"
  	$* &
  	}


# get_pid [ -u userid ] pattern - find the process id of a running program
# if called with "-u userid", only process for that user will be considered
get_pid() {
	if [ "$1" = "-u" ] ; then
		ps_args="-f -u $2"
		shift
		shift
	else
		ps_args="-ef"
	fi
	PID=`/usr/bin/ps $ps_args | grep "\<$*\>" | nawk -v pat="$*" '
 BEGIN { 
   search_pat = substr(pat, 0, 79)
   }
 { if ( match($0, search_pat) )
     if ( ! match($0, "nawk -v pat=") )
    	print $2
  }
'`
}

	
# kill_proc pattern - find and terminate a process
kill_proc() {
  	logprint "Killing $*..." 
  	get_pid $*
  	if [ "$PID" ] ; then
    		for p in ${PID} ; do
      			logprint "Killing process id $p"
      			kill -KILL $p
    		done
  	else
    		logprint "process \"$*\" could not be located..." 
  	fi
}

#get_server_pid <server name>  - check that the SQL dataserver is running or 
#                      not on the system
get_server_pid () {

servername="RUN_$*"
SPID=`/usr/bin/ps -fe | grep "\<$servername\>$" | 
			grep -v "grep" | nawk -v pat="$servername" '
 BEGIN { 
   search_pat = substr(pat,0,79)
   }
 { if ( match($0, search_pat) )
     if ( ! match($0, "nawk -v pat=") )
       		print $2
  }
'`
}

# get_pgid pattern - get the process group id of a running server
get_pgid() {

PGID=`/usr/bin/ps -o pgid -p $1 | grep -v "PGID" | nawk '{print $1}'`

}

# kill_server - kill server processes if it cannot be shutdown normally
kill_server() {

	get_server_pid $*
	if [ "${SPID}" != "" ]; then

		for gpid in $SPID ; do
			get_pgid $gpid
				if [ "${PGID}" != "" ]; then
					kill -KILL -${PGID}
 
				fi
		done
	fi

}

 

# read_ha_databases server - find an entry in the HA_DATABASES file,
# 	parse it apart, and return in variables. Assumes that sybase_home
#	is set!
read_ha_databases() {
#	conf_line=`grep "^o[nf][f]*	$1	" $HA_DATABASES`
        set_inst_name $1
	conf_line=$(get_instance "${ds}" "$1")
	if [ "$conf_line" = "" ] ; then
		logerr "4010" "$1 missing from HA SYBASE CCD!"
		return 1
	fi

        on_off_mode=`echo "$conf_line" | cut -s -f 1`
# The following 'server_name' is and extra line for sybase
	server_name=`echo "$conf_line" | cut -s -f 2`
	logical_host=`echo "$conf_line" | cut -s -f 3`
	poll_cycle=`echo "$conf_line" | cut -s -f 4`
	connect_cycle=`echo "$conf_line" | cut -s -f 5`
	timeout=`echo "$conf_line" | cut -s -f 6`
	restart_delay=`echo "$conf_line" | cut -s -f 7`
	db_login=`echo "$conf_line" | cut -s -f 8`
	runserver_file=`echo "$conf_line" | cut -s -f 9`
	if [ "`echo $conf_line | wc -w`" -eq 11 ] ; then
		backup_server=`echo "$conf_line" | cut -s -f 10`
		runbackup_file=`echo "$conf_line" | cut -s -f 11`
	fi

        set_logical_host $logical_host
	return 0
}

# find_sybase server - finds and sets various Sybase related variables:
#	SYBASE ISQL RUN_FILE
# in case of a problem, it returns with an empty SYBASE variable
find_sybase() {
  	SYBTAB=/var/opt/sybase/sybtab

  	SYBASE=""
	ISQL=""
	if sybtab_line=`grep "^[	 ]*$1:" $SYBTAB` ; then
		sybase_home=`echo $sybtab_line | awk -F: '{print $2}' -`
		if [ -d $sybase_home ] && [ -n "`disk_mounted $1`" ] ; then
			if [ -x ${sybase_home}/bin/isql ] ; then
				read_ha_databases $1
				SYBASE="$sybase_home"
				ISQL="${SYBASE}/bin/isql"
				RUN_FILE="$runserver_file"
			else
				logerr "4030" \
				"No isql executable in ${sybase_home}/bin!"
			fi
		fi
	else
		logerr "4040" \
			"Database '$1' not found in ${SYBTAB}"
	fi
    	export SYBASE ISQL RUN_FILE
}


make_rpc_call() {
  	logprint "Calling $3 for server $2 on host $1..."
  	ha_dbms_call $1 $2 $3 
  	}

get_remote_host(){
	get_diskgroups $1 $2
	RSHHOST=""
	for X in `haget  -f private_links -h $HA_REMOTEHOST` ; do
	  net_pinghost $X > /dev/null 2>&1
	  if [ $? -eq 0 ] ; then
		RSHHOST=$X
		export RSHHOST
		return 0
	  fi
	done
	return 1
	}

#end of common ha-dbms boiler plate
#include_boiler

prog="${HA_FM_NAME}"

. $HA_VAR/ha_env


# process_parm_file - process an Sybase parameter file $1, follow ifile
#    references, and echo the value for background_dump_dest
#    Only lines of the format 
#      variable = value
#    will be recognized
process_parm_file() {
	if [ -r "$1" ] ; then
		grep -v '^#' $1 | \
		while read var assign value ; do
			if [ "$assign" = "=" ] ; then
				case "$var" in
					ifile) 	if [ -r $value ] ; then
							process_parm_file $value
						else
							logerr "${prog}.4037" \
				"Sybase parameter file $1 includes $value - does not exist, or is not readable"
						fi ;;
					background_dump_dest) echo $value ;;
					*) ;;
				esac
			fi
		done
	else
		logerr "${prog}.4047" \
			"Sybase parameter file $1 does not exist or is not readable!"
	fi
	}

# Retrieve error log file name from RUN_FILE
get_error_log_name() {

# check '-e' in the begin of the error log name in the RUN_ file 
count=`egrep -c '^-e/' $RUN_FILE`
count1=`egrep -c ' -e/' $RUN_FILE`
total_cnt=`expr $count + $count1`

# if more than one '-e' were found, return error           
if [ "$total_cnt" -ne 1 ]; then
	return 1
fi

# If the -e/<error_log_name> is placed in the beginning of a line in RUN_ file
# we assume that we got the error log file name
if [ "$count" -eq 1 ] ; then
        error_log=`egrep '^-e/' $RUN_FILE | nawk '{print $1}' | cut -c 3-`
fi
 
# If the -e/<error_log_name> is placed in the middle of a line in RUN_ file 
if [ "$count1" -eq 1 ]; then
        buf=`egrep ' -e/' $RUN_FILE`
        for name in $buf ; do
                tmp=`echo $name | cut -b0-2`
                if [ "$tmp" = "-e" ] ; then
                        error_log=`echo $name | cut -c 3-`
                else
                        if [ "$name" = "" ] ; then
				return 1
                        fi
                fi
        done
fi
 
if [ -f "$error_log" ] ; then
	return 0
else
	return 1
fi

} 
# ############# Main ########################## Main ##########################
if [ $# -ne 1 ] ; then
	logerr "${prog}.4000" "usage: $argv0 server"
	exit 2
fi

DSQUERY=$1
read_ha_databases $DSQUERY
DB_LOGIN=$db_login
export DB_LOGIN
LOCALHOST=`uname -n`

find_logical_host=`haget -f all_logical_hosts | grep $logical_host`
if [ "$find_logical_host" = "" ] ; then
	logerr "${prog}.4001" \
		"logical host $logical_host is not in the cluster configuration"
	logerr "${prog}.4060" \
		"Monitors for Sybase database \"${DSQUERY}\" NOT started"
	exit 1
fi 

remote_args=""
#matches=`expr " $HA_METASETSERVE " : ".* $logical_host "`
#if [ "$matches" -eq 0 ] ; then

MASTERED_LOGICAL_HOSTS="`echo $HA_METASETSERVE | tr ',' ' '`"
is_member $logical_host "$MASTERED_LOGICAL_HOSTS"
if [ $? -ne 0 ] ; then
    	remote_args="-r $logical_host"
                
        # Don't start probe if diskset is in maintenance mode.
        # If this instance's logical host is in maint mode, exit now.
        MAINT=`haget -f is_maint -h ${logical_host}`
        if [ "$MAINT" = "1" ]; then
            exit 0
        fi

        need_to_run_probe ${logical_host} ${LOCALHOST}

        if [ $? -ne 0 ]; then
           exit 0
        fi

fi

current_mode=$(get_instance_dynamic "${ds}" "$DSQUERY" | awk '{print $1}')
if [ "$current_mode" != "on" ] ; then
         logerr "${prog}.4062"\
                  "on/off mode for \"$DSQUERY\" is not on. Fault monitor not started"
	 exit 0
fi

# Set environment variable HA_REMOTEHOST for this instance before starting
# starting fault monitor.

my_node=`uname -n`
res=$(haget -f physical_hosts -h $logical_host | tr '\012' ' ')
HA_REMOTEHOST=""
for next in ${res}; do
        if [ "$next" != "$my_node" ]; then
                HA_REMOTEHOST="${HA_REMOTEHOST} ${next}"
        fi
done
export HA_REMOTEHOST

binaries_on_logical=

if [ "$remote_args" != "" ] ; then
        SYBTAB=/var/opt/sybase/sybtab
        if sybtab_line=`grep "^[	 ]*$1:" $SYBTAB` ; then
                sybase_home=`echo $sybtab_line | awk -F: '{print $2}' -`
        fi
	if [ ! -d $sybase_home ] || [ -z "`disk_mounted $1`" ] ; then
        	binaries_on_logical="$sybase_home"
	fi		
fi


# starting up remote fault monitor when the Sybase binaries are
# installed on the logical host then the remote server does not
# have access to version and error log, thus, we hard coded here
# The remote fmon will be started and exit from here
if [ "$remote_args" != ""  -a "$binaries_on_logical" != "" ] ; then
        error_log="none"
        SYBASE="/var/opt/sybase"
        export SYBASE
	open_client_dir="$SYBASE/locales/us_english/iso_1"
	if [ ! -d $open_client_dir ] ; then
		mkdir -p $SYBASE/locales/us_english
	fi
	if [ ! -d $SYBASE/charsets ] ; then
		mkdir -p $SYBASE/charsets 
	fi

        ha_executable="hasybase_fmon"
        action_file="hasybase_config_V1"
        talk_start ${ha_executable} $remote_args $DSQUERY $poll_cycle $connect_cycle $timeout $restart_delay $HA_FILES/$action_file $error_log
        exit 0
fi

find_sybase $1

 
if [ -f $SYBASE/bin/dataserver ] ; then
	#  Lets figure out the Sybase version number
        syb_version=`$SYBASE/bin/dataserver -v | awk  -F/ '/SQL Server/ {print $2}'`
      	grep -v "^#" ${HA_DB_SUPPORT} | \
      	while read support_line ; do
        	pattern="\("`echo "$support_line" | cut -f 1`"\)"
        	result=`expr "$syb_version" : ${pattern}`
        	if [ "$result" != "" -a "$result" = "$syb_version" ] ; then
	  		ha_executable=`echo "$support_line" | cut -f 2`
	  		action_file=`echo "$support_line" | cut -f 3`
	  		if [ "$ha_executable" = "" ] ; then
				logerr "${prog}.4050" \
"server ${DSQUERY}: executable file name missing in line '$support_line' in file $HA_DB_SUPPORT"
				exit 1
			fi
	  		if [ "$action_file" = "" ] ; then
				logerr "${prog}.4061" \
"server ${DSQUERY}: action file name missing in line '$support_line' in file $HA_DB_SUPPORT"
				exit 1
			fi
      			if [ "$remote_args" = "" ] ; then
				get_error_log_name 
				if [ $? -ne 0 ]; then
					logerr "${prog}.4070" "Could not locate errorlog file"
					exit 1
				fi
          		else
            			error_log="none"
          		fi
      
	  		talk_start ${ha_executable} $remote_args $DSQUERY $poll_cycle $connect_cycle $timeout $restart_delay $HA_FILES/$action_file $error_log 
          		exit 3
        	fi
      	done
        case $? in
                1) ;;
                3) exit 0 ;;
                *) logerr "${prog}.4080" "Sybase ${syb_version} not supported!" ;;
        esac

fi

# if we reach here, then a fault monitor did not get started
# the reason did already get logged in the various logerr calls above
# Note: The "exit" statements in the while statement above do not
#       cause an exit of the entire script, but just the subshell that
#	executes the while command as part of a pipe!
logerr "${prog}.4060" "Monitors for Sybase database \"${DSQUERY}\" NOT started"
exit 1





