- 论坛徽章:
- 0
|
#
# Destroy any remaining processes with refs to $ORACLE_HOME
#
force_cleanup()
{
declare pids
declare pid
pids=`ps ax | grep $ORACLE_HOME | grep -v grep | awk '{print $1}'`
initlog -n $SCRIPT -s "<err> Not all Oracle processes exited cleanly, killing"
for pid in $pids; do
kill -9 $pid
if [ $? -eq 0 ]; then
initlog -n $SCRIPT -s "Killed $pid"
fi
done
return 0
}
#
# Wait for oracle processes to exit. Time out after 60 seconds
#
exit_idle()
{
declare -i n=0
while ps ax | grep $ORACLE_HOME | grep -q -v grep; do
if [ $n -ge 90 ]; then
force_cleanup
return 0
fi
sleep 1
((n++))
done
return 0
}
#
# Get database background process status. Restart it if it failed and
# we have seen the lock file.
#
get_db_status()
{
declare -i subsys_lock=$1
declare -i i=0
declare -i rv=0
declare ora_procname
for procname in $DB_PROCNAMES ; do
ora_procname="ora_${procname}_${ORACLE_SID}"
status $ora_procname
if [ $? -eq 0 ] ; then
# This one's okay; go to the next one.
continue
fi
#
# We're not supposed to be running, and we are,
# in fact, not running...
# XXX only works when monitoring one db process; consider
# extending in future.
#
if [ $subsys_lock -ne 0 ]; then
return 3
fi
for (( i=$RESTART_RETRIES ; i; i-- )) ; do
# this db process is down - stop and
# (re)start all ora_XXXX_$ORACLE_SID processes
initlog -q -n $SCRIPT -s "Restarting Oracle Database..."
stop_db
if [ $? != 0 ] ; then
# stop failed - return 1
return 1
fi
start_db
if [ $? == 0 ] ; then
# ora_XXXX_$ORACLE_SID processes started
# successfully, so break out of the
# stop/start # 'for' loop
break
fi
done
if [ $i -eq 0 ]; then
# stop/start's failed - return 1 (failure)
return 1
fi
done
return 0
}
#
# Get the status of the Oracle listener process
#
get_lsnr_status()
{
declare -i subsys_lock=$1
declare -i rv
status $LSNR_PROCNAME
rv=$?
if [ $rv == 0 ] ; then
return 0 # Listener is running fine
fi
#
# We're not supposed to be running, and we are,
# in fact, not running. Return 3
#
if [ $subsys_lock -ne 0 ]; then
return 3
fi
#
# Listener is NOT running (but should be) - try to restart
#
for (( i=$RESTART_RETRIES ; i; i-- )) ; do
action "Restarting Oracle listener:" lsnrctl start
lsnrctl status >& /dev/null
if [ $? == 0 ] ; then
break # Listener was (re)started and is running fine
fi
done
if [ $i -eq 0 ]; then
# stop/start's failed - return 1 (failure)
return 1
fi
status $LSNR_PROCNAME
if [ $? != 0 ] ; then
return 1 # Problem restarting the Listener
fi
return 0 # Success restarting the Listener
}
#
# usage: get_opmn_proc_status <ias-component> [process-type]
#
# Get the status of a specific OPMN-managed process. If process-type
# is not specified, assume the process-type is the same as the ias-component.
# If the lock-file exists (or no lock file is specified), try to restart
# the given process-type if it is not running.
#
get_opmn_proc_status()
{
declare comp=$1
declare opmntype=$2
declare type_pretty
declare _pid _status
[ -n "$comp" ] || return 1
if [ -z "$opmntype" ]; then
opmntype=$comp
else
type_pretty=" [$opmntype]"
fi
for (( i=$RESTART_RETRIES ; i; i-- )) ; do
_status=`opmnctl status | grep "^$comp " | grep " $opmntype " | cut -d '|' -f3,4 | sed -e 's/ //g' -e 's/|/ /g'`
_pid=`echo $_status | cut -f1 -d' '`
_status=`echo $_status | cut -f2 -d' '`
if [ "${_status}" == "Alive" ] || [ "${_status}" == "Init" ]; then
if [ $i -lt $RESTART_RETRIES ] ; then
echo " $comp$type_pretty restarted"
fi
echo " $comp$type_pretty (pid $_pid) is running..."
break
else
echo " $comp$type_pretty is stopped"
#
# Try to restart it, but don't worry if we fail. OPMN
# is supposed to handle restarting these anyway.
#
# If it's running and you tell OPMN to "start" it,
# you will get an error.
#
# If it's NOT running and you tell OPMN to "restart"
# it, you will also get an error.
#
opmnctl startproc process-type=$opmntype &> /dev/null
fi
done
if [ $i -eq 0 ]; then
# restarts failed - return 1 (failure)
return 1
fi
return 0
}
#
# Get the status of the OPMN-managed processes.
#
get_opmn_status()
{
declare -i subsys_lock=$1
declare -i ct_errors=0
opmnctl status &> /dev/null
if [ $? -eq 2 ]; then
#
# OPMN not running??
#
echo "opmn is stopped"
if [ $subsys_lock -eq 0 ]; then
#
# Don't handle full opmn-restart. XXX
#
return 1
fi
# That's okay, it's not supposed to be!
return 3
fi
#
# Print out the PIDs for everyone.
#
echo "opmn is running..."
echo "opmn components:"
#
# Check the OPMN-managed processes
#
get_opmn_proc_status OID || ((ct_errors++))
get_opmn_proc_status HTTP_Server || ((ct_errors++))
get_opmn_proc_status OC4J OC4J_SECURITY || ((ct_errors++))
#
# One or more OPMN-managed processes failed and could not be
# restarted.
#
if [ $ct_errors -ne 0 ]; then
return 1
fi
return 0
}
#
# Oracle needs the system's hostname to match the VIP. RHCS needs to not be
# tinkering with the hostname. Thus, we trick Oracle into believing that the
# hostname is the vhost by overloading gethostname().
#
hostname_hackery()
{
if [ "`hostname`" = "$ORACLE_HOSTNAME" ]; then
return 0
fi
PRELOADDIR=$ORACLE_HOME
cat > $PRELOADDIR/hostname.c <<EOT
/*
Hack to make Oracle 10g work in failover environments
without adjusting the hostname.
*/
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
#include <errno.h>
#include <string.h>
#ifndef ORACLE_HOSTNAME
#define ORACLE_HOSTNAME "$ORACLE_HOSTNAME"
#endif
int
gethostname(char *buf, size_t len)
{
char *val = ORACLE_HOSTNAME;
if (!buf || len <= 0) {
errno = EINVAL;
return -1;
}
memset(buf,0,len);
if (!strlen(val))
return 0;
if (snprintf(buf, len, "%s", val) == len) {
errno = ENAMETOOLONG;
return -1;
}
return 0;
}
EOT
if [ -e $PRELOADDIR/hostname.so ]; then
export LD_PRELOAD=$PRELOADDIR/hostname.so
return 0
fi
action "Creating hostname preload library:" gcc -o $PRELOADDIR/hostname.so $PRELOADDIR/hostname.c -shared -Wall -fPIC || return 1
rm $PRELOADDIR/hostname.c
export LD_PRELOAD=$PRELOADDIR/hostname.so
return 0
}
#
# Helps us keep a running status so we know what our ultimate return
# code will be. Returns 1 if the $1 and $2 are not equivalent, otherwise
# returns $1. The return code is meant to be the next $1 when this is
# called, so, for example:
#
# update_status 0 <-- returns 0
# update_status $? 0 <-- returns 0
# update_status $? 3 <-- returns 1 (values different - error condition)
# update_status $? 1 <-- returns 1 (same, but happen to be error state!)
#
# update_status 3
# update_status $? 3 <-- returns 3
#
# (and so forth...)
#
update_status()
{
declare -i old_status=$1
declare -i new_status=$2
if [ -z "$2" ]; then
return $old_status
fi
if [ $old_status -ne $new_status ]; then
return 1
fi
return $old_status
}
#
# Print an error message to the user and exit.
#
oops()
{
echo "Please configure this script ($0) to"
echo "match your installation."
echo
echo " $1 failed validation checks."
exit 1
}
#
# Do some validation on the user-configurable stuff at the beginning of the
# script.
#
validation_checks()
{
#
# If the oracle user doesn't exist, we're done.
#
[ -n "$ORACLE_USER" ] || oops ORACLE_USER
id -u $ORACLE_USER > /dev/null || oops ORACLE_USER
id -g $ORACLE_USER > /dev/null || oops ORACLE_USER
#
# If the oracle home isn't a directory, we're done
#
[ -n "$ORACLE_HOME" ] || oops ORACLE_HOME
#[ -d "$ORACLE_HOME" ] || oops ORACLE_HOME
#
# If the oracle SID is NULL, we're done
#
[ -n "$ORACLE_SID" ] || oops ORACLE_SID
#
# If we don't know the type, we're done
#
[ "$ORACLE_TYPE" = "10g" ] || [ "$ORACLE_TYPE" = "10g-ias" ] || oops ORACLE_TYPE
#
# If the hostname is zero-length, fix it
#
[ -n "$ORACLE_HOSTNAME" ] || ORACLE_HOSTNAME=`hostname`
#
# Super user? Automatically change UID and exec as oracle user.
# Oracle needs to be run as the Oracle user, not root!
#
if [ "`id -u`" = "0" ]; then
echo "Restarting $0 as $ORACLE_USER."
exec sudo -u $ORACLE_USER $0 $*
fi
#
# If we're not root and not the Oracle user, we're done.
#
[ "`id -u`" = "`id -u $ORACLE_USER`" ] || exit 1
[ "`id -g`" = "`id -g $ORACLE_USER`" ] || exit 1
#
# Go home.
#
cd $ORACLE_HOME
pwd
return 0
}
#
# Start Oracle9i Application Server Infrastructure
#
start_oracle()
{
faction "Starting Oracle Database:" start_db || return 1
action "Starting Oracle Listener:" lsnrctl start || return 1
if [ -n "$LOCKFILE" ]; then
touch $LOCKFILE
fi
return 0
}
#
# Stop Oracle9i Application Server Infrastructure
#
stop_oracle()
{
if ! [ -e "$ORACLE_HOME/bin/lsnrctl" ]; then
echo "Oracle Listener Control is not available"
echo " ($ORACLE_HOME not mounted?)"
return 0
fi
faction "Stopping Oracle Database:" stop_db || return 1
action "Stopping Oracle Listener:" lsnrctl stop
faction "Waiting for all Oracle processes to exit:" exit_idle
if [ $? -ne 0 ]; then
echo "WARNING: Not all Oracle processes exited cleanly"
fi
if [ -n "$LOCKFILE" ]; then
rm -f $LOCKFILE
fi
return 0
}
#
# Find and display the status of iAS infrastructure.
#
# This has three parts:
# (1) Oracle database itself
# (2) Oracle listener process
# (3) OPMN and OPMN-managed processes
#
# - If all are (cleanly) down, we return 3. In order for this to happen,
# $LOCKFILE must not exist. In this case, we try and restart certain parts
# of the service - as this may be running in a clustered environment.
#
# - If some but not all are running (and, if $LOCKFILE exists, we could not
# restart the failed portions), we return 1 (ERROR)
#
# - If all are running, return 0. In the "all-running" case, we recreate
# $LOCKFILE if it does not exist.
#
status_oracle()
{
declare -i subsys_lock=1
declare -i last
declare -i depth=$1
#
# Check for lock file. Crude and rudimentary, but it works
#
if [ -z "$LOCKFILE" ] || [ -f $LOCKFILE ]; then
subsys_lock=0
fi
# Check database status
get_db_status $subsys_lock $depth
update_status $? # Start
last=$?
# Check & report listener status
get_lsnr_status $subsys_lock $depth
update_status $? $last
last=$?
if [ "$ORACLE_TYPE" = "10g" ]; then
# XXX Add isqlplus status check?!
emctl status dbconsole 2>&1 | grep "is running"
update_status $? $last
last=$?
elif [ "$ORACLE_TYPE" = "10g-ias" ]; then
# Check & report opmn / opmn-managed process status
get_opmn_status $subsys_lock $depth
update_status $? $last
last=$?
fi
#
# No lock file, but everything's running. Put the lock
# file back. XXX - this kosher?
#
if [ $last -eq 0 ] && [ $subsys_lock -ne 0 ]; then
touch $LOCKFILE
fi
return $last
}
########################
# Do some real work... #
########################
if [ "$1" = "meta-data" ]; then
meta_data
exit 0
fi
validation_checks $*
hostname_hackery || exit 1
case $1 in
start)
start_oracle
exit $?
;;
stop)
stop_oracle
exit $?
;;
status|monitor)
status_oracle $OCF_CHECK_LEVEL
exit $?
;;
restart)
$0 stop || exit $?
$0 start || exit $?
exit 0
;;
*)
echo "usage: $SCRIPT {start|stop|status|restart|meta-data}"
exit 1
;;
esac
exit 0 |
|