#!/bin/sh
  2. #
  3. # Log file pattern detector plugin for Nagios
  4. # Written by Ethan Galstad (nagios@nagios.org)
  5. #
# Usage: ./check_log -F <log_file> -O <old_log_file> -q <pattern> [-w <max_warning>]
  7. #
  8. # Description:
  9. #
  10. # This plugin will scan a log file (specified by the <log_file> option)
  11. # for a specific pattern (specified by the <pattern> option). Successive
  12. # calls to the plugin script will only report *new* pattern matches in the
# log file, since a copy of the log file from the previous run is saved
  14. # to <old_log_file>.
  15. #
  16. # Output:
  17. #
  18. # On the first run of the plugin, it will return an OK state with a message
  19. # of "Log check data initialized". On successive runs, it will return an OK
  20. # state if *no* pattern matches have been found in the *difference* between the
  21. # log file and the older copy of the log file. If the plugin detects any
  22. # pattern matches in the log diff, it will return a CRITICAL state and print
# out a message in the following format: "(x) last_match", where "x" is the
  24. # total number of pattern matches found in the file and "last_match" is the
  25. # last entry in the log file which matches the pattern.
  26. #
  27. # Notes:
  28. #
  29. # If you use this plugin make sure to keep the following in mind:
  30. #
  31. # 1. The "max_attempts" value for the service should be 1, as this
  32. # will prevent Nagios from retrying the service check (the
  33. # next time the check is run it will not produce the same results).
  34. #
  35. # 2. The "notify_recovery" value for the service should be 0, so that
  36. # Nagios does not notify you of "recoveries" for the check. Since
  37. # pattern matches in the log file will only be reported once and not
  38. # the next time, there will always be "recoveries" for the service, even
  39. # though recoveries really don't apply to this type of check.
  40. #
# 3. You *must* supply a different <old_log_file> for each service that
  42. # you define to use this plugin script - even if the different services
  43. # check the same <log_file> for pattern matches. This is necessary
  44. # because of the way the script operates.
  45. #
  46. # Examples:
  47. #
  48. # Check for login failures in the syslog...
  49. #
# check_log -F /var/log/messages -O ./check_log.badlogins.old -q "LOGIN FAILURE"
  51. #
  52. # Check for port scan alerts generated by Psionic's PortSentry software...
  53. #
# check_log -F /var/log/messages -O ./check_log.portscan.old -q "attackalert"
  55. #
  56. # Paths to commands used in this script. These
  57. # may have to be modified to match your system setup.
  58. PATH="@TRUSTED_PATH@"
  59. export PATH
  60. PROGNAME=$(basename "$0")
  61. PROGPATH=$(echo "$0" | sed -e 's,[\\/][^\\/][^\\/]*$,,')
  62. REVISION="@NP_VERSION@"
  63. PATH="@TRUSTED_PATH@"
  64. export PATH
  65. . "$PROGPATH"/utils.sh
  66. print_usage() {
  67. echo "Usage: $PROGNAME -F logfile -O oldlog -q query"
  68. echo "Usage: $PROGNAME --help"
  69. echo "Usage: $PROGNAME --version"
  70. echo " Additional parameter:"
  71. echo " -w (--max_warning) If used, determines the maximum matching value to return as warning, when finding more matching lines than this parameter will return as critical. If not used, will consider as default 0 (any matching will consider as critical)"
  72. echo "Usage: $PROGNAME -F logfile -O oldlog -q query -w <number>"
  73. }
  74. print_help() {
  75. print_revision "$PROGNAME" $REVISION
  76. echo ""
  77. print_usage
  78. echo ""
  79. echo "Log file pattern detector plugin for Nagios"
  80. echo ""
  81. support
  82. }
  83. # Make sure the correct number of command line
  84. # arguments have been supplied
  85. if [ $# -lt 1 ]; then
  86. print_usage
  87. exit "$STATE_UNKNOWN"
  88. fi
  89. # Grab the command line arguments
  90. #logfile=$1
  91. #oldlog=$2
  92. #query=$3
  93. exitstatus=$STATE_WARNING #default
  94. while test -n "$1"; do
  95. case "$1" in
  96. --help)
  97. print_help
  98. exit "$STATE_OK"
  99. ;;
  100. -h)
  101. print_help
  102. exit "$STATE_OK"
  103. ;;
  104. --version)
  105. print_revision "$PROGNAME" $REVISION
  106. exit "$STATE_OK"
  107. ;;
  108. -V)
  109. print_revision "$PROGNAME" $REVISION
  110. exit "$STATE_OK"
  111. ;;
  112. --filename)
  113. logfile=$2
  114. shift
  115. ;;
  116. -F)
  117. logfile=$2
  118. shift
  119. ;;
  120. --oldlog)
  121. oldlog=$2
  122. shift
  123. ;;
  124. -O)
  125. oldlog=$2
  126. shift
  127. ;;
  128. --max_warning)
  129. MAX_WARNING=$2
  130. shift
  131. ;;
  132. -w)
  133. MAX_WARNING=$2
  134. shift
  135. ;;
  136. --query)
  137. query=$2
  138. shift
  139. ;;
  140. -q)
  141. query=$2
  142. shift
  143. ;;
  144. -x)
  145. exitstatus=$2
  146. shift
  147. ;;
  148. --exitstatus)
  149. exitstatus=$2
  150. shift
  151. ;;
  152. *)
  153. echo "Unknown argument: $1"
  154. print_usage
  155. exit "$STATE_UNKNOWN"
  156. ;;
  157. esac
  158. shift
  159. done
  160. if [ "$oldlog" = "" ]; then
  161. echo "Log check error: You must supply an Old Log File name using '-O'!"
  162. exit "$STATE_UNKNOWN"
  163. fi
  164. rc=`echo "$oldlog" | grep -q -- "^-"; echo $?`
  165. if [ $rc -eq 0 ]; then
  166. echo "Log check error: You must supply an Old Log File name using '-O'!"
  167. exit "$STATE_UNKNOWN"
  168. fi
  169. # If the source log file doesn't exist, exit
  170. if [ ! -e "$logfile" ]; then
  171. echo "Log check error: Log file $logfile does not exist!"
  172. exit "$STATE_UNKNOWN"
  173. elif [ ! -r "$logfile" ] ; then
  174. echo "Log check error: Log file $logfile is not readable!"
  175. exit "$STATE_UNKNOWN"
  176. fi
  177. # If the old log file doesn't exist, this must be the first time
  178. # we're running this test, so copy the original log file over to
  179. # the old diff file and exit
  180. if [ ! -e "$oldlog" ]; then
  181. cat "$logfile" > "$oldlog"
  182. echo "Log check data initialized..."
  183. exit "$STATE_OK"
  184. fi
  185. # The old log file exists, so compare it to the original log now
  186. # The temporary file that the script should use while
  187. # processing the log file.
  188. if [ -x /bin/mktemp ]; then
  189. tempdiff=$(/bin/mktemp /tmp/check_log.XXXXXXXXXX)
  190. else
  191. tempdiff=$(/bin/date '+%H%M%S')
  192. tempdiff="/tmp/check_log.${tempdiff}"
  193. touch "$tempdiff"
  194. chmod 600 "$tempdiff"
  195. fi
  196. diff "$logfile" "$oldlog" | grep -v "^>" > "$tempdiff"
  197. # Count the number of matching log entries we have and handle errors when grep fails
  198. count=$(grep -c "$query" "$tempdiff" 2>&1)
  199. if [ $? -gt 1 ];then
  200. echo "Log check error: $count"
  201. exit "$STATE_UNKNOWN"
  202. fi
  203. # Get the last matching entry in the diff file
  204. lastentry=$(egrep "$query" "$tempdiff" | tail -1)
  205. rm -f "$tempdiff"
  206. cat "$logfile" > "$oldlog"
  207. if [ "$count" = "0" ]; then # no matches, exit with no error
  208. echo "Log check ok - 0 pattern matches found|match=$count;;;0"
  209. exitstatus=$STATE_OK
  210. else # Print total matche count and the last entry we found
  211. echo "($count) $lastentry|match=$count;;;0"
  212. if [ "$MAX_WARNING" ] && [ "$count" -le "$MAX_WARNING" ] ; then
  213. exitstatus=$STATE_WARNING
  214. else
  215. exitstatus=$STATE_CRITICAL
  216. fi
  217. fi
  218. exit "$exitstatus"