#!/bin/sh # # latigid010@yahoo.com # 01/06/2000 # # This Nagios plugin was created to check Oracle status # PROGNAME=`basename $0` PROGPATH=`echo $0 | sed -e 's,[\\/][^\\/][^\\/]*$,,'` REVISION=`echo '$Revision: 1.14 $' | sed -e 's/[^0-9.]//g'` . $PROGPATH/utils.sh print_usage() { echo "Usage:" echo " $PROGNAME --tns " echo " $PROGNAME --db " echo " $PROGNAME --login " echo " $PROGNAME --cache " echo " $PROGNAME --tablespace " echo " $PROGNAME --oranames " echo " $PROGNAME --help" echo " $PROGNAME --version" } print_help() { print_revision $PROGNAME $REVISION echo "" print_usage echo "" echo "Check Oracle status" echo "" echo "--tns SID/IP Address" echo " Check remote TNS server" echo "--db SID" echo " Check local database (search /bin/ps for PMON process) and check" echo " filesystem for sgadefORACLE_SID.dbf" echo "--login SID" echo " Attempt a dummy login and alert if not ORA-01017: invalid username/password" echo "--cache" echo " Check local database for library and buffer cache hit ratios" echo " ---> Requires Oracle user/password and SID specified." echo " ---> Requires select on v_$sysstat and v_$librarycache" echo "--tablespace" echo " Check local database for tablespace capacity in ORACLE_SID" echo " ---> Requires Oracle user/password specified." echo " ---> Requires select on dba_data_files and dba_free_space" echo "--oranames Hostname" echo " Check remote Oracle Names server" echo "--help" echo " Print this help screen" echo "--version" echo " Print version and license information" echo "" echo "If the plugin doesn't work, check that the ORACLE_HOME environment" echo "variable is set, that ORACLE_HOME/bin is in your PATH, and the" echo "tnsnames.ora file is locatable and is properly configured." echo "" echo "When checking local database status your ORACLE_SID is case sensitive." echo "" echo "If you want to use a default Oracle home, add in your oratab file:" echo "*:/opt/app/oracle/product/7.3.4:N" echo "" support } case "$1" in 1) cmd='--tns' ;; 2) cmd='--db' ;; *) cmd="$1" ;; esac # Information options case "$cmd" in --help) print_help exit $STATE_OK ;; -h) print_help exit $STATE_OK ;; --version) print_revision $PLUGIN $REVISION exit $STATE_OK ;; -V) print_revision $PLUGIN $REVISION exit $STATE_OK ;; esac # Hunt down a reasonable ORACLE_HOME if [ -z "$ORACLE_HOME" ] ; then # Adjust to taste for oratab in /var/opt/oracle/oratab /etc/oratab do [ ! -f $oratab ] && continue ORACLE_HOME=`IFS=: while read SID ORACLE_HOME junk; do if [ "$SID" = "$2" -o "$SID" = "*" ] ; then echo $ORACLE_HOME; exit; fi; done < $oratab` [ -n "$ORACLE_HOME" ] && break done fi # Last resort [ -z "$ORACLE_HOME" -a -d $PROGPATH/oracle ] && ORACLE_HOME=$PROGPATH/oracle if [ -z "$ORACLE_HOME" -o ! -d "$ORACLE_HOME" ] ; then echo "Cannot determine ORACLE_HOME for sid $2" exit $STATE_UNKNOWN fi PATH=$PATH:$ORACLE_HOME/bin LD_LIBRARY_PATH=$LD_LIBRARY_PATH:$ORACLE_HOME/lib export ORACLE_HOME PATH LD_LIBRARY_PATH case "$cmd" in --tns) tnschk=` tnsping $2` tnschk2=` echo $tnschk | grep -c OK` if [ ${tnschk2} -eq 1 ] ; then tnschk3=` echo $tnschk | sed -e 's/.*(//' -e 's/).*//'` echo "OK - reply time ${tnschk3} from $2" exit $STATE_OK else echo "No TNS Listener on $2" exit $STATE_CRITICAL fi ;; --oranames) namesctl status $2 | awk ' /Server has been running for:/ { msg = "OK: Up" for (i = 6; i <= NF; i++) { msg = msg " " $i } status = '$STATE_OK' } /error/ { msg = "CRITICAL: " $0 status = '$STATE_CRITICAL' } END { print msg exit status }' ;; --db) pmonchk=`ps -ef | grep -v grep | grep -c "ora_pmon_${2}$"` if [ ${pmonchk} -ge 1 ] ; then echo "${2} OK - ${pmonchk} PMON process(es) running" exit $STATE_OK #if [ -f $ORACLE_HOME/dbs/sga*${2}* ] ; then #if [ ${pmonchk} -eq 1 ] ; then #utime=`ls -la $ORACLE_HOME/dbs/sga*$2* | cut -c 43-55` #echo "${2} OK - running since ${utime}" #exit $STATE_OK #fi else echo "${2} Database is DOWN" exit $STATE_CRITICAL fi ;; --login) loginchk=`sqlplus dummy/user@$2 < /dev/null` loginchk2=` echo $loginchk | grep -c ORA-01017` if [ ${loginchk2} -eq 1 ] ; then echo "OK - dummy login connected" exit $STATE_OK else loginchk3=` echo "$loginchk" | grep "ORA-" | head -1` echo "CRITICAL - $loginchk3" exit $STATE_CRITICAL fi ;; --cache) if [ ${5} -gt ${6} ] ; then echo "UNKNOWN - Warning level is less then Crit" exit $STATE_UNKNOWN fi result=`sqlplus -s ${3}/${4}@${2} << EOF set pagesize 0 set numf '9999999.99' select (1-(pr.value/(dbg.value+cg.value)))*100 from v\\$sysstat pr, v\\$sysstat dbg, v\\$sysstat cg where pr.name='physical reads' and dbg.name='db block gets' and cg.name='consistent gets'; EOF` if [ -n "`echo $result | grep ORA-`" ] ; then error=` echo "$result" | grep "ORA-" | head -1` echo "CRITICAL - $error" exit $STATE_CRITICAL fi buf_hr=`echo "$result" | awk '/^[0-9\. \t]+$/ {print int($1)}'` buf_hrx=`echo "$result" | awk '/^[0-9\. \t]+$/ {print $1}'` result=`sqlplus -s ${3}/${4}@${2} << EOF set pagesize 0 set numf '9999999.99' select sum(lc.pins)/(sum(lc.pins)+sum(lc.reloads))*100 from v\\$librarycache lc; EOF` if [ -n "`echo $result | grep ORA-`" ] ; then error=` echo "$result" | grep "ORA-" | head -1` echo "CRITICAL - $error" exit $STATE_CRITICAL fi lib_hr=`echo "$result" | awk '/^[0-9\. \t]+$/ {print int($1)}'` lib_hrx=`echo "$result" | awk '/^[0-9\. \t]+$/ {print $1}'` if [ $buf_hr -le ${5} -o $lib_hr -le ${5} ] ; then echo "${2} CRITICAL - Cache Hit Rates: $lib_hrx% Lib -- $buf_hrx% Buff|lib=$lib_hrx%;${6};${5};0;100 buffer=$buf_hrx%;${6};${5};0;100" exit $STATE_CRITICAL fi if [ $buf_hr -le ${6} -o $lib_hr -le ${6} ] ; then echo "${2} WARNING - Cache Hit Rates: $lib_hrx% Lib -- $buf_hrx% Buff|lib=$lib_hrx%;${6};${5};0;100 buffer=$buf_hrx%;${6};${5};0;100" exit $STATE_WARNING fi echo "${2} OK - Cache Hit Rates: $lib_hrx% Lib -- $buf_hrx% Buff|lib=$lib_hrx%;${6};${5};0;100 buffer=$buf_hrx%;${6};${5};0;100" exit $STATE_OK ;; --tablespace) if [ ${6} -lt ${7} ] ; then echo "UNKNOWN - Warning level is more then Crit" exit $STATE_UNKNOWN fi result=`sqlplus -s ${3}/${4}@${2} << EOF set pagesize 0 set numf '9999999.99' select b.free,a.total,100 - trunc(b.free/a.total * 1000) / 10 prc from ( select tablespace_name,sum(bytes)/1024/1024 total from dba_data_files group by tablespace_name) A, ( select tablespace_name,sum(bytes)/1024/1024 free from dba_free_space group by tablespace_name) B where a.tablespace_name=b.tablespace_name and a.tablespace_name='${5}'; EOF` if [ -n "`echo $result | grep ORA-`" ] ; then error=` echo "$result" | grep "ORA-" | head -1` echo "CRITICAL - $error" exit $STATE_CRITICAL fi ts_free=`echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print int($1)}'` ts_total=`echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print int($2)}'` ts_pct=`echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print int($3)}'` ts_pctx=`echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print $3}'` if [ "$ts_free" -eq 0 -a "$ts_total" -eq 0 -a "$ts_pct" -eq 0 ] ; then echo "No data returned by Oracle - tablespace $5 not found?" exit $STATE_UNKNOWN fi if [ "$ts_pct" -ge ${6} ] ; then echo "${2} : ${5} CRITICAL - $ts_pctx% used [ $ts_free / $ts_total MB available ]|${5}=$ts_pctx%;${7};${6};0;100" exit $STATE_CRITICAL fi if [ "$ts_pct" -ge ${7} ] ; then echo "${2} : ${5} WARNING - $ts_pctx% used [ $ts_free / $ts_total MB available ]|${5}=$ts_pctx%;${7};${6};0;100" exit $STATE_WARNING fi echo "${2} : ${5} OK - $ts_pctx% used [ $ts_free / $ts_total MB available ]|${5}=$ts_pctx%;${7};${6};0;100" exit $STATE_OK ;; *) print_usage exit $STATE_UNKNOWN esac