#!/bin/sh
#
# check_oracle.sh
#
# latigid010@yahoo.com
# 01/06/2000
#
# This Nagios plugin was created to check Oracle status
#

# Script name and the directory it lives in, both derived from $0 with
# parameter expansion only, so no external command is looked up through the
# caller's PATH before the trusted PATH below is in place.
PROGNAME=${0##*/}
case "$0" in
  */*) PROGPATH=${0%/*} ;;
  # Invoked without any slash (found through PATH or run from its own
  # directory): the helper library is looked up relative to ".".
  *) PROGPATH=. ;;
esac
# "/check_oracle" strips down to an empty string, which means the root.
[ -n "$PROGPATH" ] || PROGPATH=/

# NOTE(review): the @...@ values look like build-time placeholders that are
# substituted when the plugin is installed -- confirm against the build.
REVISION="@NP_VERSION@"
PATH="@TRUSTED_PATH@"

# Shared helper library. The rest of this script uses STATE_OK,
# STATE_WARNING, STATE_CRITICAL, STATE_UNKNOWN, print_revision and support
# without defining them, so they are presumably provided here.
. "$PROGPATH/utils.sh"
  13. print_usage() {
  14. echo "Usage:"
  15. echo " $PROGNAME --tns <Oracle Sid or Hostname/IP address>"
  16. echo " $PROGNAME --db <ORACLE_SID>"
  17. echo " $PROGNAME --login <ORACLE_SID>"
  18. echo " $PROGNAME --connect <ORACLE_SID>"
  19. echo " $PROGNAME --cache <ORACLE_SID> <USER> <PASS> <CRITICAL> <WARNING>"
  20. echo " $PROGNAME --tablespace <ORACLE_SID> <USER> <PASS> <TABLESPACE> <CRITICAL> <WARNING>"
  21. echo " $PROGNAME --oranames <Hostname>"
  22. echo " $PROGNAME --help"
  23. echo " $PROGNAME --version"
  24. }
  25. print_help() {
  26. print_revision $PROGNAME $REVISION
  27. echo ""
  28. print_usage
  29. echo ""
  30. echo "Check Oracle status"
  31. echo ""
  32. echo "--tns SID/IP Address"
  33. echo " Check remote TNS server"
  34. echo "--db SID"
  35. echo " Check local database (search /bin/ps for PMON process) and check"
  36. echo " filesystem for sgadefORACLE_SID.dbf"
  37. echo "--login SID"
  38. echo " Attempt a dummy login and alert if not ORA-01017: invalid username/password"
  39. echo "--connect SID"
  40. echo " Attempt a login and alert if an ORA- error is returned"
  41. echo "--cache"
  42. echo " Check local database for library and buffer cache hit ratios"
  43. echo " ---> Requires Oracle user/password and SID specified."
  44. echo " ---> Requires select on v_$sysstat and v_$librarycache"
  45. echo "--tablespace"
  46. echo " Check local database for tablespace capacity in ORACLE_SID"
  47. echo " ---> Requires Oracle user/password specified."
  48. echo " ---> Requires select on dba_data_files and dba_free_space"
  49. echo "--oranames Hostname"
  50. echo " Check remote Oracle Names server"
  51. echo "--help"
  52. echo " Print this help screen"
  53. echo "--version"
  54. echo " Print version and license information"
  55. echo ""
  56. echo "If the plugin doesn't work, check that the ORACLE_HOME environment"
  57. echo "variable is set, that ORACLE_HOME/bin is in your PATH, and the"
  58. echo "tnsnames.ora file is locatable and is properly configured."
  59. echo ""
  60. echo "When checking local database status your ORACLE_SID is case sensitive."
  61. echo ""
  62. echo "If you want to use a default Oracle home, add in your oratab file:"
  63. echo "*:/opt/app/oracle/product/7.3.4:N"
  64. echo ""
  65. support
  66. }
  67. case "$1" in
  68. 1)
  69. cmd='--tns'
  70. ;;
  71. 2)
  72. cmd='--db'
  73. ;;
  74. *)
  75. cmd="$1"
  76. ;;
  77. esac
  78. # Information options
  79. case "$cmd" in
  80. --help)
  81. print_help
  82. exit $STATE_OK
  83. ;;
  84. -h)
  85. print_help
  86. exit $STATE_OK
  87. ;;
  88. --version)
  89. print_revision $PROGNAME $REVISION
  90. exit $STATE_OK
  91. ;;
  92. -V)
  93. print_revision $PROGNAME $REVISION
  94. exit $STATE_OK
  95. ;;
  96. esac
  97. # Hunt down a reasonable ORACLE_HOME
  98. if [ -z "$ORACLE_HOME" ] ; then
  99. # Adjust to taste
  100. for oratab in /var/opt/oracle/oratab /etc/oratab
  101. do
  102. [ ! -f $oratab ] && continue
  103. ORACLE_HOME=`IFS=:
  104. while read SID ORACLE_HOME junk;
  105. do
  106. if [ "$SID" = "$2" -o "$SID" = "*" ] ; then
  107. echo $ORACLE_HOME;
  108. exit;
  109. fi;
  110. done < $oratab`
  111. [ -n "$ORACLE_HOME" ] && break
  112. done
  113. fi
  114. # Last resort
  115. [ -z "$ORACLE_HOME" -a -d $PROGPATH/oracle ] && ORACLE_HOME=$PROGPATH/oracle
  116. if [ "$cmd" != "--db" ]; then
  117. if [ -z "$ORACLE_HOME" -o ! -d "$ORACLE_HOME" ] ; then
  118. echo "Cannot determine ORACLE_HOME for sid $2"
  119. exit $STATE_UNKNOWN
  120. fi
  121. fi
  122. PATH=$PATH:$ORACLE_HOME/bin
  123. LD_LIBRARY_PATH=$LD_LIBRARY_PATH:$ORACLE_HOME/lib
  124. export ORACLE_HOME PATH LD_LIBRARY_PATH
  125. case "$cmd" in
  126. --tns)
  127. tnschk=` tnsping $2`
  128. tnschk2=` echo $tnschk | grep -c OK`
  129. if [ ${tnschk2} -eq 1 ] ; then
  130. tnschk3=${tnschk##*(}; tnschk3=${tnschk3%)*}
  131. echo "OK - reply time ${tnschk3} from $2"
  132. exit $STATE_OK
  133. else
  134. echo "No TNS Listener on $2"
  135. exit $STATE_CRITICAL
  136. fi
  137. ;;
  138. --oranames)
  139. namesctl status $2 | awk '
  140. /Server has been running for:/ {
  141. msg = "OK: Up"
  142. for (i = 6; i <= NF; i++) {
  143. msg = msg " " $i
  144. }
  145. status = '$STATE_OK'
  146. }
  147. /error/ {
  148. msg = "CRITICAL: " $0
  149. status = '$STATE_CRITICAL'
  150. }
  151. END {
  152. print msg
  153. exit status
  154. }'
  155. ;;
  156. --db)
  157. pmonchk=`ps -ef | grep -v grep | grep -E -c "(asm|ora)_pmon_${2}$"`
  158. if [ ${pmonchk} -ge 1 ] ; then
  159. echo "${2} OK - ${pmonchk} PMON process(es) running"
  160. exit $STATE_OK
  161. #if [ -f $ORACLE_HOME/dbs/sga*${2}* ] ; then
  162. #if [ ${pmonchk} -eq 1 ] ; then
  163. #utime=`ls -la $ORACLE_HOME/dbs/sga*$2* | cut -c 43-55`
  164. #echo "${2} OK - running since ${utime}"
  165. #exit $STATE_OK
  166. #fi
  167. else
  168. echo "${2} Database is DOWN"
  169. exit $STATE_CRITICAL
  170. fi
  171. ;;
  172. --login)
  173. loginchk=`sqlplus dummy/user@$2 < /dev/null`
  174. loginchk2=` echo $loginchk | grep -c ORA-01017`
  175. if [ ${loginchk2} -eq 1 ] ; then
  176. echo "OK - dummy login connected"
  177. exit $STATE_OK
  178. else
  179. loginchk3=` echo "$loginchk" | grep "ORA-" | head -1`
  180. echo "CRITICAL - $loginchk3"
  181. exit $STATE_CRITICAL
  182. fi
  183. ;;
  184. --connect)
  185. connectchk=`sqlplus $2 < /dev/null`
  186. connectchk2=` echo $connectchk | grep -c ORA-`
  187. if [ ${connectchk2} -eq 0 ] ; then
  188. echo "OK - login successful"
  189. exit $STATE_OK
  190. else
  191. connectchk3=` echo "$connectchk" | grep "ORA-" | head -1`
  192. echo "CRITICAL - $connectchk3"
  193. exit $STATE_CRITICAL
  194. fi
  195. ;;
  196. --cache)
  197. if [ ${5} -gt ${6} ] ; then
  198. echo "UNKNOWN - Warning level is less then Crit"
  199. exit $STATE_UNKNOWN
  200. fi
  201. result=`sqlplus -s ${3}/${4}@${2} << EOF
  202. set pagesize 0
  203. set numf '9999999.99'
  204. select (1-(pr.value/(dbg.value+cg.value)))*100
  205. from v\\$sysstat pr, v\\$sysstat dbg, v\\$sysstat cg
  206. where pr.name='physical reads'
  207. and dbg.name='db block gets'
  208. and cg.name='consistent gets';
  209. EOF`
  210. if [ -n "`echo $result | grep ORA-`" ] ; then
  211. error=` echo "$result" | grep "ORA-" | head -1`
  212. echo "CRITICAL - $error"
  213. exit $STATE_CRITICAL
  214. fi
  215. buf_hr=`echo "$result" | awk '/^[0-9\. \t]+$/ {print int($1)}'`
  216. buf_hrx=`echo "$result" | awk '/^[0-9\. \t]+$/ {print $1}'`
  217. result=`sqlplus -s ${3}/${4}@${2} << EOF
  218. set pagesize 0
  219. set numf '9999999.99'
  220. select sum(lc.pins)/(sum(lc.pins)+sum(lc.reloads))*100
  221. from v\\$librarycache lc;
  222. EOF`
  223. if [ -n "`echo $result | grep ORA-`" ] ; then
  224. error=` echo "$result" | grep "ORA-" | head -1`
  225. echo "CRITICAL - $error"
  226. exit $STATE_CRITICAL
  227. fi
  228. lib_hr=`echo "$result" | awk '/^[0-9\. \t]+$/ {print int($1)}'`
  229. lib_hrx=`echo "$result" | awk '/^[0-9\. \t]+$/ {print $1}'`
  230. if [ $buf_hr -le ${5} -o $lib_hr -le ${5} ] ; then
  231. echo "${2} CRITICAL - Cache Hit Rates: $lib_hrx% Lib -- $buf_hrx% Buff|lib=$lib_hrx%;${6};${5};0;100 buffer=$buf_hrx%;${6};${5};0;100"
  232. exit $STATE_CRITICAL
  233. fi
  234. if [ $buf_hr -le ${6} -o $lib_hr -le ${6} ] ; then
  235. echo "${2} WARNING - Cache Hit Rates: $lib_hrx% Lib -- $buf_hrx% Buff|lib=$lib_hrx%;${6};${5};0;100 buffer=$buf_hrx%;${6};${5};0;100"
  236. exit $STATE_WARNING
  237. fi
  238. echo "${2} OK - Cache Hit Rates: $lib_hrx% Lib -- $buf_hrx% Buff|lib=$lib_hrx%;${6};${5};0;100 buffer=$buf_hrx%;${6};${5};0;100"
  239. exit $STATE_OK
  240. ;;
  241. --tablespace)
  242. if [ ${6} -lt ${7} ] ; then
  243. echo "UNKNOWN - Warning level is more then Crit"
  244. exit $STATE_UNKNOWN
  245. fi
  246. result=`sqlplus -s ${3}/${4}@${2} << EOF
  247. set pagesize 0
  248. set numf '9999999.99'
  249. select NVL(b.free,0.0),a.total,100 - trunc(NVL(b.free,0.0)/a.total * 1000) / 10 prc
  250. from (
  251. select tablespace_name,sum(bytes)/1024/1024 total
  252. from dba_data_files group by tablespace_name) A
  253. LEFT OUTER JOIN
  254. ( select tablespace_name,sum(bytes)/1024/1024 free
  255. from dba_free_space group by tablespace_name) B
  256. ON a.tablespace_name=b.tablespace_name WHERE a.tablespace_name='${5}';
  257. EOF`
  258. if [ -n "`echo $result | grep ORA-`" ] ; then
  259. error=` echo "$result" | grep "ORA-" | head -1`
  260. echo "CRITICAL - $error"
  261. exit $STATE_CRITICAL
  262. fi
  263. ts_free=`echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print int($1)}'`
  264. ts_total=`echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print int($2)}'`
  265. ts_pct=`echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print int($3)}'`
  266. ts_pctx=`echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print $3}'`
  267. if [ "$ts_free" -eq 0 -a "$ts_total" -eq 0 -a "$ts_pct" -eq 0 ] ; then
  268. echo "No data returned by Oracle - tablespace $5 not found?"
  269. exit $STATE_UNKNOWN
  270. fi
  271. if [ "$ts_pct" -ge ${6} ] ; then
  272. echo "${2} : ${5} CRITICAL - $ts_pctx% used [ $ts_free / $ts_total MB available ]|${5}=$ts_pctx%;${7};${6};0;100"
  273. exit $STATE_CRITICAL
  274. fi
  275. if [ "$ts_pct" -ge ${7} ] ; then
  276. echo "${2} : ${5} WARNING - $ts_pctx% used [ $ts_free / $ts_total MB available ]|${5}=$ts_pctx%;${7};${6};0;100"
  277. exit $STATE_WARNING
  278. fi
  279. echo "${2} : ${5} OK - $ts_pctx% used [ $ts_free / $ts_total MB available ]|${5}=$ts_pctx%;${7};${6};0;100"
  280. exit $STATE_OK
  281. ;;
  282. *)
  283. print_usage
  284. exit $STATE_UNKNOWN
  285. esac