#!/bin/sh
#
# check_oracle.sh
#
# latigid010@yahoo.com
# 01/06/2000
#
# This Nagios plugin was created to check Oracle status
#

# "@TRUSTED_PATH@" and "@NP_VERSION@" look like build-time placeholders.
# NOTE(review): presumably substituted when the plugin is installed - confirm.
PATH="@TRUSTED_PATH@"
export PATH

PROGNAME=$(basename "$0")

# Directory part of $0: drop the last path component, accepting either "/" or
# "\" as the separator.
PROGPATH=$(echo "$0" | sed -e 's,[\\/][^\\/][^\\/]*$,,')
# sed leaves $0 untouched when it contains no separator at all (for example
# when run as "sh check_oracle"). Fall back to the current directory so that
# utils.sh is not looked up beneath the script's own file name.
if [ "$PROGPATH" = "$0" ]; then
  PROGPATH=.
fi

REVISION="@NP_VERSION@"

# The rest of this script uses the STATE_* exit codes, print_revision and
# support without defining them; presumably they are provided by utils.sh.
. "$PROGPATH"/utils.sh
  # Write the invocation syntax of every supported mode to stdout, one per
  # line. Reads the global PROGNAME.
  print_usage() {
    printf '%s\n' \
      "Usage:" \
      " $PROGNAME --tns <Oracle Sid or Hostname/IP address>" \
      " $PROGNAME --db <ORACLE_SID>" \
      " $PROGNAME --login <ORACLE_SID>" \
      " $PROGNAME --connect <ORACLE_SID>" \
      " $PROGNAME --cache <ORACLE_SID> <USER> <PASS> <CRITICAL> <WARNING>" \
      " $PROGNAME --tablespace <ORACLE_SID> <USER> <PASS> <TABLESPACE> <CRITICAL> <WARNING>" \
      " $PROGNAME --oranames <Hostname>" \
      " $PROGNAME --help" \
      " $PROGNAME --version"
  }
  # Print the full help screen to stdout: revision banner, usage summary, a
  # description of every mode, and troubleshooting hints.
  # Reads the globals PROGNAME and REVISION; calls print_revision, print_usage
  # and support.
  print_help() {
    print_revision "$PROGNAME" "$REVISION"
    echo ""
    print_usage
    echo ""
    echo "Check Oracle status"
    echo ""
    echo "--tns SID/IP Address"
    echo " Check remote TNS server"
    echo "--db SID"
    echo " Check local database (search /bin/ps for PMON process) and check"
    echo " filesystem for sgadefORACLE_SID.dbf"
    echo "--login SID"
    echo " Attempt a dummy login and alert if not ORA-01017: invalid username/password"
    echo "--connect SID"
    echo " Attempt a login and alert if an ORA- error is returned"
    echo "--cache"
    echo " Check local database for library and buffer cache hit ratios"
    echo " ---> Requires Oracle user/password and SID specified."
    # Single quotes: the view names contain a literal "$" that must not be
    # expanded as a shell variable.
    echo ' ---> Requires select on v_$sysstat and v_$librarycache'
    echo "--tablespace"
    echo " Check local database for tablespace capacity in ORACLE_SID"
    echo " ---> Requires Oracle user/password specified."
    echo " ---> Requires select on dba_data_files and dba_free_space"
    echo "--oranames Hostname"
    echo " Check remote Oracle Names server"
    echo "--help"
    echo " Print this help screen"
    echo "--version"
    echo " Print version and license information"
    echo ""
    echo "If the plugin doesn't work, check that the ORACLE_HOME environment"
    echo "variable is set, that ORACLE_HOME/bin is in your PATH, and the"
    echo "tnsnames.ora file is locatable and is properly configured."
    echo ""
    echo "When checking local database status your ORACLE_SID is case sensitive."
    echo ""
    echo "If you want to use a default Oracle home, add in your oratab file:"
    echo "*:/opt/app/oracle/product/7.3.4:N"
    echo ""
    support
  }
  # Translate the numeric shorthand for the first argument into its long
  # option: "1" selects --tns and "2" selects --db. Anything else is taken
  # verbatim as the command.
  if [ "$1" = "1" ]; then
    cmd='--tns'
  elif [ "$1" = "2" ]; then
    cmd='--db'
  else
    cmd="$1"
  fi
  # Information options: these are answered immediately, before any attempt
  # is made to locate an Oracle installation.
  case "$cmd" in
    --help | -h)
      print_help
      exit "$STATE_OK"
      ;;
    --version | -V)
      print_revision "$PROGNAME" $REVISION
      exit "$STATE_OK"
      ;;
  esac
  # Hunt down a reasonable ORACLE_HOME
  #
  # Precedence: an ORACLE_HOME already present in the environment, then the
  # first oratab entry whose SID field equals $2 or is the wildcard "*", then
  # an "oracle" directory next to this script.
  if [ -z "$ORACLE_HOME" ]; then
    # Adjust to taste
    for oratab in /var/opt/oracle/oratab /etc/oratab; do
      [ -f "$oratab" ] || continue
      # The command substitution is a subshell, so the IFS change and the
      # "exit" after the first match stay confined to it.
      ORACLE_HOME=$(
        IFS=:
        while read -r sid home junk; do
          if [ "$sid" = "$2" ] || [ "$sid" = "*" ]; then
            echo "$home"
            exit
          fi
        done < "$oratab"
      )
      [ -n "$ORACLE_HOME" ] && break
    done
  fi

  # Last resort
  if [ -z "$ORACLE_HOME" ] && [ -d "$PROGPATH"/oracle ]; then
    ORACLE_HOME=$PROGPATH/oracle
  fi

  # --db is exempt from this check: that mode only looks at the process list.
  if [ "$cmd" != "--db" ]; then
    if [ -z "$ORACLE_HOME" ] || [ ! -d "$ORACLE_HOME" ]; then
      echo "Cannot determine ORACLE_HOME for sid $2"
      exit "$STATE_UNKNOWN"
    fi
  fi

  PATH=$PATH:$ORACLE_HOME/bin
  # Add the separator only when LD_LIBRARY_PATH already has content: a leading
  # ":" is an empty entry, which the dynamic loader treats as the current
  # directory.
  LD_LIBRARY_PATH=${LD_LIBRARY_PATH:+$LD_LIBRARY_PATH:}$ORACLE_HOME/lib
  export ORACLE_HOME PATH LD_LIBRARY_PATH
  # Succeed only when $1 is a non-empty string made of decimal digits.
  # Used to validate thresholds and parsed query results before they reach
  # the numeric operators of "[", which merely print an error on bad input.
  is_whole_number() {
    case "$1" in
      '' | *[!0-9]*) return 1 ;;
      *) return 0 ;;
    esac
  }

  # Run the selected check and exit with the matching STATE_* code.
  # Positional parameters by mode:
  #   --tns        $2 = SID or host
  #   --oranames   $2 = host
  #   --db         $2 = SID
  #   --login      $2 = SID
  #   --connect    $2 = SID
  #   --cache      $2 = SID, $3 = user, $4 = password, $5 = critical, $6 = warning
  #   --tablespace $2 = SID, $3 = user, $4 = password, $5 = tablespace,
  #                $6 = critical, $7 = warning
  case "$cmd" in
    --tns)
      tnschk=$(tnsping "$2")
      tnschk2=$(echo "$tnschk" | grep -c OK)
      if [ "${tnschk2}" -eq 1 ]; then
        # Keep only the text between the last "(" and the last ")" of the
        # tnsping output.
        tnschk3=${tnschk##*(}
        tnschk3=${tnschk3%)*}
        echo "OK - reply time ${tnschk3} from $2"
        exit "$STATE_OK"
      else
        echo "No TNS Listener on $2"
        exit "$STATE_CRITICAL"
      fi
      ;;
    --oranames)
      # awk produces both the message and the exit status. The BEGIN defaults
      # make unrecognised or empty namesctl output report UNKNOWN instead of
      # printing a blank line and exiting 0.
      namesctl status "$2" | awk \
        -v ok="$STATE_OK" \
        -v crit="$STATE_CRITICAL" \
        -v unknown="$STATE_UNKNOWN" '
        BEGIN {
          msg = "UNKNOWN: no status reported by namesctl"
          status = unknown
        }
        /Server has been running for:/ {
          msg = "OK: Up"
          for (i = 6; i <= NF; i++) {
            msg = msg " " $i
          }
          status = ok
        }
        /error/ {
          msg = "CRITICAL: " $0
          status = crit
        }
        END {
          print msg
          exit status
        }'
      # $? is the status of awk, the last command of the pipeline.
      exit "$?"
      ;;
    --db)
      pmonchk=$(ps -ef | grep -v grep | grep -E -c "(asm|ora)_pmon_${2}$")
      if [ "${pmonchk}" -ge 1 ]; then
        echo "${2} OK - ${pmonchk} PMON process(es) running"
        exit "$STATE_OK"
        #if [ -f $ORACLE_HOME/dbs/sga*${2}* ] ; then
        #if [ ${pmonchk} -eq 1 ] ; then
        #utime=`ls -la $ORACLE_HOME/dbs/sga*$2* | cut -c 43-55`
        #echo "${2} OK - running since ${utime}"
        #exit $STATE_OK
        #fi
      else
        echo "${2} Database is DOWN"
        exit "$STATE_CRITICAL"
      fi
      ;;
    --login)
      # The listener is considered healthy when the bogus credentials are
      # rejected with ORA-01017.
      loginchk=$(sqlplus dummy/user@"$2" < /dev/null)
      loginchk2=$(echo "$loginchk" | grep -c ORA-01017)
      if [ "${loginchk2}" -eq 1 ]; then
        echo "OK - dummy login connected"
        exit "$STATE_OK"
      else
        loginchk3=$(echo "$loginchk" | grep "ORA-" | head -1)
        echo "CRITICAL - $loginchk3"
        exit "$STATE_CRITICAL"
      fi
      ;;
    --connect)
      connectchk=$(sqlplus "$2" < /dev/null)
      connectchk2=$(echo "$connectchk" | grep -c ORA-)
      if [ "${connectchk2}" -eq 0 ]; then
        echo "OK - login successful"
        exit "$STATE_OK"
      else
        connectchk3=$(echo "$connectchk" | grep "ORA-" | head -1)
        echo "CRITICAL - $connectchk3"
        exit "$STATE_CRITICAL"
      fi
      ;;
    --cache)
      # Without this check a missing or non-numeric threshold only makes "["
      # print an error, and the check then falls through to OK.
      if ! is_whole_number "${5}" || ! is_whole_number "${6}"; then
        echo "UNKNOWN - Critical and warning thresholds must be whole numbers"
        exit "$STATE_UNKNOWN"
      fi
      if [ "${5}" -gt "${6}" ]; then
        echo "UNKNOWN - Warning level is less then Crit"
        exit "$STATE_UNKNOWN"
      fi
      # NOTE(review): the credentials are passed on the sqlplus command line
      # and are therefore visible in the process list while the query runs.
      # "\$" keeps the "$" of the view name literal inside the here-document.
      result=$(sqlplus -s "${3}"/"${4}"@"${2}" << EOF
set pagesize 0
set numf '9999999.99'
select (1-(pr.value/(dbg.value+cg.value)))*100
from v\$sysstat pr, v\$sysstat dbg, v\$sysstat cg
where pr.name='physical reads'
and dbg.name='db block gets'
and cg.name='consistent gets';
EOF
)
      if echo "$result" | grep -q 'ORA-'; then
        error=$(echo "$result" | grep "ORA-" | head -1)
        echo "CRITICAL - $error"
        exit "$STATE_CRITICAL"
      fi
      # buf_hr is the integer part used for comparisons; buf_hrx is the value
      # exactly as printed by sqlplus, used for display.
      buf_hr=$(echo "$result" | awk '/^[0-9\. \t]+$/ {print int($1)}')
      buf_hrx=$(echo "$result" | awk '/^[0-9\. \t]+$/ {print $1}')
      result=$(sqlplus -s "${3}"/"${4}"@"${2}" << EOF
set pagesize 0
set numf '9999999.99'
select sum(lc.pins)/(sum(lc.pins)+sum(lc.reloads))*100
from v\$librarycache lc;
EOF
)
      if echo "$result" | grep -q 'ORA-'; then
        error=$(echo "$result" | grep "ORA-" | head -1)
        echo "CRITICAL - $error"
        exit "$STATE_CRITICAL"
      fi
      lib_hr=$(echo "$result" | awk '/^[0-9\. \t]+$/ {print int($1)}')
      lib_hrx=$(echo "$result" | awk '/^[0-9\. \t]+$/ {print $1}')
      # No numeric line in either answer means there is nothing to compare;
      # report that instead of falling through to OK.
      if ! is_whole_number "$buf_hr" || ! is_whole_number "$lib_hr"; then
        echo "UNKNOWN - No cache hit ratio returned by Oracle"
        exit "$STATE_UNKNOWN"
      fi
      # Shared tail of the status line: human-readable text, then perfdata.
      cache_detail="Cache Hit Rates: $lib_hrx% Lib -- $buf_hrx% Buff|lib=$lib_hrx%;${6};${5};0;100 buffer=$buf_hrx%;${6};${5};0;100"
      if [ "$buf_hr" -le "${5}" ] || [ "$lib_hr" -le "${5}" ]; then
        echo "${2} CRITICAL - $cache_detail"
        exit "$STATE_CRITICAL"
      fi
      if [ "$buf_hr" -le "${6}" ] || [ "$lib_hr" -le "${6}" ]; then
        echo "${2} WARNING - $cache_detail"
        exit "$STATE_WARNING"
      fi
      echo "${2} OK - $cache_detail"
      exit "$STATE_OK"
      ;;
    --tablespace)
      if ! is_whole_number "${6}" || ! is_whole_number "${7}"; then
        echo "UNKNOWN - Critical and warning thresholds must be whole numbers"
        exit "$STATE_UNKNOWN"
      fi
      if [ "${6}" -lt "${7}" ]; then
        echo "UNKNOWN - Warning level is more then Crit"
        exit "$STATE_UNKNOWN"
      fi
      # Double any single quote so the name cannot terminate the SQL string
      # literal it is spliced into.
      ts_name_sql=$(printf '%s' "${5}" | sed "s/'/''/g")
      # NOTE(review): the credentials are passed on the sqlplus command line
      # and are therefore visible in the process list while the query runs.
      result=$(sqlplus -s "${3}"/"${4}"@"${2}" << EOF
set pagesize 0
set numf '9999999.99'
select NVL(b.free,0.0),a.total,100 - trunc(NVL(b.free,0.0)/a.total * 1000) / 10 prc
from (
select tablespace_name,sum(bytes)/1024/1024 total
from dba_data_files group by tablespace_name) A
LEFT OUTER JOIN
( select tablespace_name,sum(bytes)/1024/1024 free
from dba_free_space group by tablespace_name) B
ON a.tablespace_name=b.tablespace_name WHERE a.tablespace_name='${ts_name_sql}';
EOF
)
      if echo "$result" | grep -q 'ORA-'; then
        error=$(echo "$result" | grep 'ORA-' | head -1)
        echo "CRITICAL - $error"
        exit "$STATE_CRITICAL"
      fi
      # Columns of the single result row: free MB, total MB, percent used.
      ts_free=$(echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print int($1)}')
      ts_total=$(echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print int($2)}')
      ts_pct=$(echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print int($3)}')
      ts_pctx=$(echo "$result" | awk '/^[ 0-9\.\t ]+$/ {print $3}')
      # When no row comes back the fields are empty strings rather than
      # zeros, so test for that first: "[ '' -eq 0 ]" is an error, not a
      # match.
      if ! is_whole_number "$ts_free" ||
        ! is_whole_number "$ts_total" ||
        ! is_whole_number "$ts_pct"; then
        echo "No data returned by Oracle - tablespace $5 not found?"
        exit "$STATE_UNKNOWN"
      fi
      if [ "$ts_free" -eq 0 ] && [ "$ts_total" -eq 0 ] && [ "$ts_pct" -eq 0 ]; then
        echo "No data returned by Oracle - tablespace $5 not found?"
        exit "$STATE_UNKNOWN"
      fi
      # Shared tail of the status line: human-readable text, then perfdata.
      ts_detail="$ts_pctx% used [ $ts_free / $ts_total MB available ]|${5}=$ts_pctx%;${7};${6};0;100"
      if [ "$ts_pct" -ge "${6}" ]; then
        echo "${2} : ${5} CRITICAL - $ts_detail"
        exit "$STATE_CRITICAL"
      fi
      if [ "$ts_pct" -ge "${7}" ]; then
        echo "${2} : ${5} WARNING - $ts_detail"
        exit "$STATE_WARNING"
      fi
      echo "${2} : ${5} OK - $ts_detail"
      exit "$STATE_OK"
      ;;
    *)
      print_usage
      exit "$STATE_UNKNOWN"
      ;;
  esac