check_oracle.sh 8.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304
  1. #!/bin/sh
  2. #
  3. # latigid010@yahoo.com
  4. # 01/06/2000
  5. #
  6. # This Nagios plugin was created to check Oracle status
  7. #
  # Restrict PATH to the build-time trusted value (the @...@ tokens are
  # placeholders, presumably substituted when the plugin is installed).
  PATH="@TRUSTED_PATH@"
  export PATH
  # $0 is quoted everywhere so that an installation path containing whitespace
  # does not get split into several words.
  PROGNAME=$(basename "$0")
  # Strip the final path component (after either "/" or "\") to obtain the
  # directory this script was invoked from.
  PROGPATH=$(printf '%s\n' "$0" | sed -e 's,[\\/][^\\/][^\\/]*$,,')
  REVISION="@NP_VERSION@"
  # Load the shared helpers shipped next to this script.
  . "$PROGPATH/utils.sh"
  # Print the usage synopsis: a "Usage:" header followed by one line per
  # supported invocation, each prefixed with the program name.
  # Globals: PROGNAME (read)
  # Outputs: the synopsis on stdout
  print_usage() {
    # Positional parameters are local to the function, so they double as a
    # throw-away list of synopsis lines.
    set -- \
      '--tns <Oracle Sid or Hostname/IP address>' \
      '--db <ORACLE_SID>' \
      '--login <ORACLE_SID>' \
      '--connect <ORACLE_SID>' \
      '--cache <ORACLE_SID> <USER> <PASS> <CRITICAL> <WARNING>' \
      '--tablespace <ORACLE_SID> <USER> <PASS> <TABLESPACE> <CRITICAL> <WARNING>' \
      '--oranames <Hostname>' \
      '--help' \
      '--version'
    echo "Usage:"
    while [ "$#" -gt 0 ]; do
      echo " $PROGNAME $1"
      shift
    done
  }
  # Print the full help screen: revision banner, usage synopsis, a description
  # of every check mode, troubleshooting hints and the support footer.
  # Globals: PROGNAME, REVISION (read)
  # Calls:   print_usage (this file); print_revision and support, which are
  #          not defined in this file (presumably provided by utils.sh).
  # Outputs: the help text on stdout
  print_help() {
    print_revision "$PROGNAME" "$REVISION"
    echo ""
    print_usage
    echo ""
    echo "Check Oracle status"
    echo ""
    echo "--tns SID/IP Address"
    echo " Check remote TNS server"
    echo "--db SID"
    echo " Check local database (search /bin/ps for PMON process) and check"
    echo " filesystem for sgadefORACLE_SID.dbf"
    echo "--login SID"
    echo " Attempt a dummy login and alert if not ORA-01017: invalid username/password"
    echo "--connect SID"
    echo " Attempt a login and alert if an ORA- error is returned"
    echo "--cache"
    echo " Check local database for library and buffer cache hit ratios"
    echo " ---> Requires Oracle user/password and SID specified."
    # The dollar signs are escaped: unescaped, "$sysstat" and "$librarycache"
    # would be expanded as (unset) shell variables and vanish from the output.
    echo " ---> Requires select on v_\$sysstat and v_\$librarycache"
    echo "--tablespace"
    echo " Check local database for tablespace capacity in ORACLE_SID"
    echo " ---> Requires Oracle user/password specified."
    echo " ---> Requires select on dba_data_files and dba_free_space"
    echo "--oranames Hostname"
    echo " Check remote Oracle Names server"
    echo "--help"
    echo " Print this help screen"
    echo "--version"
    echo " Print version and license information"
    echo ""
    echo "If the plugin doesn't work, check that the ORACLE_HOME environment"
    echo "variable is set, that ORACLE_HOME/bin is in your PATH, and the"
    echo "tnsnames.ora file is locatable and is properly configured."
    echo ""
    echo "When checking local database status your ORACLE_SID is case sensitive."
    echo ""
    echo "If you want to use a default Oracle home, add in your oratab file:"
    echo "*:/opt/app/oracle/product/7.3.4:N"
    echo ""
    support
  }
  # Take the first argument as the command, translating the numeric
  # selectors "1" and "2" into their long-option equivalents.
  cmd="$1"
  if [ "$cmd" = "1" ]; then
    cmd='--tns'
  elif [ "$cmd" = "2" ]; then
    cmd='--db'
  fi
  # Information options
  # Help and version requests are answered straight away, before any
  # ORACLE_HOME lookup is attempted; both exit with STATE_OK.
  case "$cmd" in
    --help | -h)
      print_help
      exit $STATE_OK
      ;;
    --version | -V)
      print_revision $PROGNAME $REVISION
      exit $STATE_OK
      ;;
  esac
  # Hunt down a reasonable ORACLE_HOME
  # Order of precedence: the inherited environment, the first oratab entry
  # whose SID equals $2 or is the "*" wildcard, then an "oracle" directory
  # next to this script.
  if [ -z "$ORACLE_HOME" ]; then
    # Adjust to taste
    for oratab in /var/opt/oracle/oratab /etc/oratab; do
      [ -f "$oratab" ] || continue
      # The command substitution runs in a subshell, so the IFS change, the
      # loop variables and the early "exit" do not affect the main script.
      ORACLE_HOME=$(
        IFS=:
        while read -r SID ORACLE_HOME junk; do
          if [ "$SID" = "$2" ] || [ "$SID" = "*" ]; then
            printf '%s\n' "$ORACLE_HOME"
            exit
          fi
        done < "$oratab"
      )
      [ -n "$ORACLE_HOME" ] && break
    done
  fi
  # Last resort
  if [ -z "$ORACLE_HOME" ] && [ -d "$PROGPATH/oracle" ]; then
    ORACLE_HOME=$PROGPATH/oracle
  fi
  # Every check except --db needs the Oracle client tools, so a missing or
  # non-existent ORACLE_HOME is fatal for them.
  if [ "$cmd" != "--db" ]; then
    if [ -z "$ORACLE_HOME" ] || [ ! -d "$ORACLE_HOME" ]; then
      echo "Cannot determine ORACLE_HOME for sid $2"
      exit $STATE_UNKNOWN
    fi
  fi
  PATH=$PATH:$ORACLE_HOME/bin
  # Only insert the ":" separator when LD_LIBRARY_PATH already has content.
  # A leading empty entry would make the dynamic loader search the current
  # working directory for shared libraries.
  LD_LIBRARY_PATH=${LD_LIBRARY_PATH:+$LD_LIBRARY_PATH:}$ORACLE_HOME/lib
  export ORACLE_HOME PATH LD_LIBRARY_PATH
  # Print the first line of the text in $1 that mentions an ORA- error.
  ora_first_error() {
    printf '%s\n' "$1" | grep 'ORA-' | head -1
  }

  # Succeed only when $1 is a non-empty string of decimal digits.
  ora_is_uint() {
    case "$1" in
      '' | *[!0-9]*) return 1 ;;
    esac
    return 0
  }

  # Print the first line of the text in $1 that consists solely of digits,
  # dots and blanks and carries at least $2 whitespace-separated fields.
  # Prints nothing when no such line exists.
  ora_numeric_row() {
    printf '%s\n' "$1" |
      awk -v want="$2" '/^[0-9. \t]+$/ && NF >= want { print; exit }'
  }

  # Run the SQL read from stdin in a silent sqlplus session.
  # Arguments: $1 - SID, $2 - user, $3 - password
  # NOTE(review): the credentials travel on the sqlplus command line (as in
  # the original code) and are therefore visible in the process list.
  ora_run_sql() {
    sqlplus -s "${2}/${3}@${1}"
  }

  # Dispatch on the requested check. Each arm prints one status line and
  # exits with a STATE_* code (not defined in this file; presumably set by
  # the sourced utils.sh).
  case "$cmd" in
    --tns)
      tnschk=$(tnsping "$2")
      case "$tnschk" in
        *OK*)
          # The reply time is the text between the last "(" and the last ")".
          tnschk3=${tnschk##*\(}
          tnschk3=${tnschk3%\)*}
          echo "OK - reply time ${tnschk3} from $2"
          exit $STATE_OK
          ;;
        *)
          echo "No TNS Listener on $2"
          exit $STATE_CRITICAL
          ;;
      esac
      ;;
    --oranames)
      # Start from UNKNOWN so that output matching neither pattern is no
      # longer reported as a blank line with exit status 0.
      namesctl status "$2" |
        awk -v ok="$STATE_OK" -v crit="$STATE_CRITICAL" -v unknown="$STATE_UNKNOWN" '
          BEGIN {
            msg = "UNKNOWN: no recognisable status in namesctl output"
            status = unknown
          }
          /Server has been running for:/ {
            msg = "OK: Up"
            for (i = 6; i <= NF; i++) {
              msg = msg " " $i
            }
            status = ok
          }
          /error/ {
            msg = "CRITICAL: " $0
            status = crit
          }
          END {
            print msg
            exit status
          }'
      # The pipeline status is awk's exit status, i.e. the plugin state.
      exit $?
      ;;
    --db)
      pmonchk=$(ps -ef | grep -v grep | grep -E -c "(asm|ora)_pmon_${2}$")
      if [ "${pmonchk:-0}" -ge 1 ]; then
        echo "${2} OK - ${pmonchk} PMON process(es) running"
        exit $STATE_OK
        # Disabled legacy check, kept for reference:
        #if [ -f $ORACLE_HOME/dbs/sga*${2}* ] ; then
        #if [ ${pmonchk} -eq 1 ] ; then
        #utime=`ls -la $ORACLE_HOME/dbs/sga*$2* | cut -c 43-55`
        #echo "${2} OK - running since ${utime}"
        #exit $STATE_OK
        #fi
      else
        echo "${2} Database is DOWN"
        exit $STATE_CRITICAL
      fi
      ;;
    --login)
      # A listener that rejects the dummy credentials with ORA-01017 is up
      # and accepting logins; any other outcome is treated as critical.
      loginchk=$(sqlplus "dummy/user@$2" < /dev/null)
      case "$loginchk" in
        *ORA-01017*)
          echo "OK - dummy login connected"
          exit $STATE_OK
          ;;
        *)
          loginchk3=$(ora_first_error "$loginchk")
          echo "CRITICAL - $loginchk3"
          exit $STATE_CRITICAL
          ;;
      esac
      ;;
    --connect)
      # $2 is deliberately left unquoted, as in the original, so a logon
      # string made of several words is still passed as separate arguments.
      connectchk=$(sqlplus $2 < /dev/null)
      case "$connectchk" in
        *ORA-*)
          connectchk3=$(ora_first_error "$connectchk")
          echo "CRITICAL - $connectchk3"
          exit $STATE_CRITICAL
          ;;
        *)
          echo "OK - login successful"
          exit $STATE_OK
          ;;
      esac
      ;;
    --cache)
      # Arguments: $2 SID, $3 user, $4 password, $5 critical, $6 warning.
      # Hit ratios are "higher is better", so critical must not exceed warning.
      if [ "$#" -lt 6 ] || ! ora_is_uint "$5" || ! ora_is_uint "$6"; then
        echo "UNKNOWN - --cache requires <ORACLE_SID> <USER> <PASS> <CRITICAL> <WARNING> with integer thresholds"
        exit $STATE_UNKNOWN
      fi
      if [ "$5" -gt "$6" ]; then
        echo "UNKNOWN - Warning level is less then Crit"
        exit $STATE_UNKNOWN
      fi

      # Buffer cache hit ratio.
      result=$(printf '%s\n' \
        'set pagesize 0' \
        "set numf '9999999.99'" \
        'select (1-(pr.value/(dbg.value+cg.value)))*100' \
        'from v$sysstat pr, v$sysstat dbg, v$sysstat cg' \
        "where pr.name='physical reads'" \
        "and dbg.name='db block gets'" \
        "and cg.name='consistent gets';" |
        ora_run_sql "$2" "$3" "$4")
      case "$result" in
        *ORA-*)
          error=$(ora_first_error "$result")
          echo "CRITICAL - $error"
          exit $STATE_CRITICAL
          ;;
      esac
      buf_row=$(ora_numeric_row "$result" 1)
      if [ -z "$buf_row" ]; then
        # Without this guard the numeric tests below fail with a syntax
        # error and the check falls through to a false OK.
        echo "UNKNOWN - Unable to parse buffer cache hit ratio from sqlplus output"
        exit $STATE_UNKNOWN
      fi
      buf_hr=$(printf '%s\n' "$buf_row" | awk '{print int($1)}')
      buf_hrx=$(printf '%s\n' "$buf_row" | awk '{print $1}')

      # Library cache hit ratio.
      result=$(printf '%s\n' \
        'set pagesize 0' \
        "set numf '9999999.99'" \
        'select sum(lc.pins)/(sum(lc.pins)+sum(lc.reloads))*100' \
        'from v$librarycache lc;' |
        ora_run_sql "$2" "$3" "$4")
      case "$result" in
        *ORA-*)
          error=$(ora_first_error "$result")
          echo "CRITICAL - $error"
          exit $STATE_CRITICAL
          ;;
      esac
      lib_row=$(ora_numeric_row "$result" 1)
      if [ -z "$lib_row" ]; then
        echo "UNKNOWN - Unable to parse library cache hit ratio from sqlplus output"
        exit $STATE_UNKNOWN
      fi
      lib_hr=$(printf '%s\n' "$lib_row" | awk '{print int($1)}')
      lib_hrx=$(printf '%s\n' "$lib_row" | awk '{print $1}')

      # Shared text: human-readable part, then "|" and the performance data.
      cache_detail="Cache Hit Rates: $lib_hrx% Lib -- $buf_hrx% Buff|lib=$lib_hrx%;${6};${5};0;100 buffer=$buf_hrx%;${6};${5};0;100"
      if [ "$buf_hr" -le "$5" ] || [ "$lib_hr" -le "$5" ]; then
        echo "${2} CRITICAL - $cache_detail"
        exit $STATE_CRITICAL
      fi
      if [ "$buf_hr" -le "$6" ] || [ "$lib_hr" -le "$6" ]; then
        echo "${2} WARNING - $cache_detail"
        exit $STATE_WARNING
      fi
      echo "${2} OK - $cache_detail"
      exit $STATE_OK
      ;;
    --tablespace)
      # Arguments: $2 SID, $3 user, $4 password, $5 tablespace,
      # $6 critical, $7 warning. Usage is "higher is worse", so critical
      # must not be below warning.
      if [ "$#" -lt 7 ] || ! ora_is_uint "$6" || ! ora_is_uint "$7"; then
        echo "UNKNOWN - --tablespace requires <ORACLE_SID> <USER> <PASS> <TABLESPACE> <CRITICAL> <WARNING> with integer thresholds"
        exit $STATE_UNKNOWN
      fi
      case "$5" in
        *"'"*)
          # The name is embedded in a quoted SQL literal below; a single
          # quote would terminate that literal early.
          echo "UNKNOWN - Invalid tablespace name"
          exit $STATE_UNKNOWN
          ;;
      esac
      if [ "$6" -lt "$7" ]; then
        echo "UNKNOWN - Warning level is more then Crit"
        exit $STATE_UNKNOWN
      fi
      result=$(printf '%s\n' \
        'set pagesize 0' \
        "set numf '9999999.99'" \
        'select NVL(b.free,0.0),a.total,100 - trunc(NVL(b.free,0.0)/a.total * 1000) / 10 prc' \
        'from (' \
        'select tablespace_name,sum(bytes)/1024/1024 total' \
        'from dba_data_files group by tablespace_name) A' \
        'LEFT OUTER JOIN' \
        '( select tablespace_name,sum(bytes)/1024/1024 free' \
        'from dba_free_space group by tablespace_name) B' \
        "ON a.tablespace_name=b.tablespace_name WHERE a.tablespace_name='${5}';" |
        ora_run_sql "$2" "$3" "$4")
      case "$result" in
        *ORA-*)
          error=$(ora_first_error "$result")
          echo "CRITICAL - $error"
          exit $STATE_CRITICAL
          ;;
      esac
      # Expected row: free MB, total MB, percent used.
      ts_row=$(ora_numeric_row "$result" 3)
      if [ -z "$ts_row" ]; then
        # An empty result previously slipped through the numeric tests and
        # was reported as OK.
        echo "No data returned by Oracle - tablespace $5 not found?"
        exit $STATE_UNKNOWN
      fi
      ts_free=$(printf '%s\n' "$ts_row" | awk '{print int($1)}')
      ts_total=$(printf '%s\n' "$ts_row" | awk '{print int($2)}')
      ts_pct=$(printf '%s\n' "$ts_row" | awk '{print int($3)}')
      ts_pctx=$(printf '%s\n' "$ts_row" | awk '{print $3}')
      if [ "$ts_free" -eq 0 ] && [ "$ts_total" -eq 0 ] && [ "$ts_pct" -eq 0 ]; then
        echo "No data returned by Oracle - tablespace $5 not found?"
        exit $STATE_UNKNOWN
      fi

      # Shared text: human-readable part, then "|" and the performance data.
      ts_detail="$ts_pctx% used [ $ts_free / $ts_total MB available ]|${5}=$ts_pctx%;${7};${6};0;100"
      if [ "$ts_pct" -ge "$6" ]; then
        echo "${2} : ${5} CRITICAL - $ts_detail"
        exit $STATE_CRITICAL
      fi
      if [ "$ts_pct" -ge "$7" ]; then
        echo "${2} : ${5} WARNING - $ts_detail"
        exit $STATE_WARNING
      fi
      echo "${2} : ${5} OK - $ts_detail"
      exit $STATE_OK
      ;;
    *)
      print_usage
      exit $STATE_UNKNOWN
      ;;
  esac