#!/bin/sh
# Source: /lib64/nagios/plugins/check_log
#
# Log file pattern detector plugin for Nagios
# Written by Ethan Galstad (nagios@nagios.org)
#
# Usage: ./check_log -F <log_file> -O <old_log_file> -q <pattern> [-w <max_warning>] [-t <tmpdir>]
#
# Description:
#
# This plugin will scan a log file (specified by the <log_file> option)
# for a specific pattern (specified by the <pattern> option). Successive
# calls to the plugin script will only report *new* pattern matches in the
# log file, since a copy of the log file from the previous run is saved
# to <old_log_file>.
#
# Output:
#
# On the first run of the plugin, it will return an OK state with a message
# of "Log check data initialized". On successive runs, it will return an OK
# state if *no* pattern matches have been found in the *difference* between the
# log file and the older copy of the log file. If the plugin detects any
# pattern matches in the log diff, it will return a CRITICAL state and print
# out a message in the following format: "(x) last_match", where "x" is the
# total number of pattern matches found in the file and "last_match" is the
# last entry in the log file which matches the pattern.
#
# Notes:
#
# If you use this plugin make sure to keep the following in mind:
#
# 1. The "max_attempts" value for the service should be 1, as this
# will prevent Nagios from retrying the service check (the
# next time the check is run it will not produce the same results).
#
# 2. The "notify_recovery" value for the service should be 0, so that
# Nagios does not notify you of "recoveries" for the check. Since
# pattern matches in the log file will only be reported once and not
# the next time, there will always be "recoveries" for the service, even
# though recoveries really don't apply to this type of check.
#
# 3. You *must* supply a different <old_log_file> for each service that
# you define to use this plugin script - even if the different services
# check the same <log_file> for pattern matches. This is necessary
# because of the way the script operates.
#
# Examples:
#
# Check for login failures in the syslog...
#
# check_log -F /var/log/messages -O ./check_log.badlogins.old -q "LOGIN FAILURE"
#
# Check for port scan alerts generated by Psionic's PortSentry software...
#
# check_log -F /var/log/messages -O ./check_log.portscan.old -q "attackalert"
#
# Paths to commands used in this script. These
# may have to be modified to match your system setup.
PATH="/usr/local/sbin:/usr/local/bin:/sbin:/bin:/usr/sbin:/usr/bin"
export PATH

# Name the plugin was invoked as; shown in the usage and revision output.
PROGNAME=$(basename "$0")

# Directory containing this plugin: $0 with its last path component removed.
# When $0 has no directory part at all (for example "sh check_log"), the sed
# expression would leave the bare script name behind, so fall back to the
# current directory in that case.
case "$0" in
  */* | *\\*) PROGPATH=$(echo "$0" | sed -e 's,[\\/][^\\/][^\\/]*$,,') ;;
  *) PROGPATH="." ;;
esac
REVISION="2.4.9"

# Load the shared plugin helpers. print_revision, support and the STATE_*
# exit codes used below are not defined in this file, so they are presumably
# provided by utils.sh.
. "$PROGPATH"/utils.sh
# Print the command line synopsis, followed by the description of the
# optional -w (--max_warning) parameter, to stdout.
print_usage() {
  printf '%s\n' \
    "Usage: $PROGNAME -F logfile -O oldlog -q query" \
    "Usage: $PROGNAME --help" \
    "Usage: $PROGNAME --version" \
    " Additional parameter:" \
    " -w (--max_warning) If used, determines the maximum matching value to return" \
    " as warning, when finding more matching lines than this parameter will" \
    " return as critical. If not used, will consider as default 0 (any matching" \
    " will consider as critical)" \
    "Usage: $PROGNAME -F logfile -O oldlog -q query -w <number>"
}
# Print the full help text to stdout: the revision line, the usage synopsis,
# a one-line description of the plugin and the output of the support helper.
print_help() {
  print_revision "$PROGNAME" $REVISION
  printf '\n'
  print_usage
  printf '\n%s\n\n' "Log file pattern detector plugin for Nagios"
  support
}
# Refuse to run without any command line arguments: show the usage
# text and leave with the UNKNOWN state.
if [ "$#" -eq 0 ]; then
  print_usage
  exit "$STATE_UNKNOWN"
fi
# Grab the command line arguments

# Default exit status.
# NOTE(review): -x/--exitstatus can override this value here, but the
# reporting code at the end of the script assigns exitstatus again before
# exiting, so the value parsed here appears to have no effect on the result.
exitstatus=$STATE_WARNING

# need_value OPTION [VALUE ...]
#
# Called with the remaining command line words, starting at the option being
# processed. Exits with the UNKNOWN state unless the option is followed by at
# least one more word; without this guard the extra "shift" for the missing
# value fails, which some shells treat as a fatal error.
need_value() {
  if [ "$#" -lt 2 ]; then
    echo "Log check error: Option '$1' requires an argument!"
    exit "$STATE_UNKNOWN"
  fi
}

# parse_args ARG...
#
# Walks the command line and stores the option values in the global
# variables logfile, oldlog, query, MAX_WARNING, exitstatus and TMPDIR.
# --help/-h and --version/-V print their text and exit with the OK state;
# any unrecognised word prints the usage and exits with the UNKNOWN state.
# Parsing stops at the first empty word, so empty arguments are ignored
# rather than rejected.
parse_args() {
  while test -n "$1"; do
    case "$1" in
      --help | -h)
        print_help
        exit "$STATE_OK"
        ;;
      --version | -V)
        print_revision "$PROGNAME" $REVISION
        exit "$STATE_OK"
        ;;
      --filename | -F)
        need_value "$@"
        logfile=$2
        shift
        ;;
      --oldlog | -O)
        need_value "$@"
        oldlog=$2
        shift
        ;;
      --max_warning | -w)
        need_value "$@"
        MAX_WARNING=$2
        shift
        ;;
      --query | -q)
        need_value "$@"
        query=$2
        shift
        ;;
      --exitstatus | -x)
        need_value "$@"
        exitstatus=$2
        shift
        ;;
      -t)
        need_value "$@"
        TMPDIR=$2
        shift
        ;;
      *)
        echo "Unknown argument: $1"
        print_usage
        exit "$STATE_UNKNOWN"
        ;;
    esac
    shift
  done
}

parse_args "$@"
# An old-log file name is mandatory. A value starting with "-" is rejected
# as well, since that is what ends up in $oldlog when -O is directly followed
# by another option instead of a file name.
#
# A case pattern is used instead of piping the value through echo and grep:
# echo may treat values such as "-n" or "-e" as its own options and print
# nothing, which would let them slip through the check.
case "$oldlog" in
  "" | -*)
    echo "Log check error: You must supply an Old Log File name using '-O'!"
    exit "$STATE_UNKNOWN"
    ;;
esac
# Stop with the UNKNOWN state unless the source log file exists and can
# actually be opened for reading.
#
# Readability is probed with "dd" on purpose rather than with
# "[ -r $logfile ]": the latter can return false-negatives on Linux when
# the check_log plugin is run via nrpe with additional capabilities
# (e.g., CAP_DAC_READ_SEARCH). "dd" really attempts to open the file,
# which is a true test of whether the file is readable.
if ! [ -e "$logfile" ]; then
  echo "Log check error: Log file $logfile does not exist!"
  exit "$STATE_UNKNOWN"
fi
if ! dd if="$logfile" count=0 >/dev/null 2>&1; then
  echo "Log check error: Log file $logfile is not readable!"
  exit "$STATE_UNKNOWN"
fi
# Only use /tmp as a fallback if $TMPDIR doesn't exist
if [ ! -d "$TMPDIR" ]; then
  TMPDIR="/tmp"
fi

# Copy the logfile to a temporary file, to prevent diff from
# never finishing when $logfile continues to be written to
# during the diff
if command -v mktemp >/dev/null 2>&1; then
  templog=$(mktemp "${TMPDIR}/temp_check_log.XXXXXXXXXX")
else
  # No mktemp available: build the name from the time of day and the shell's
  # PID, and create the file with noclobber and a restrictive umask so that
  # an already existing file (or symlink) of that name is never written to.
  templog="${TMPDIR}/temp_check_log.$(date '+%H%M%S').$$"
  (umask 077; set -C; : > "$templog") 2>/dev/null || templog=""
fi
if [ -z "$templog" ]; then
  echo "Log check error: Unable to create a temporary file in $TMPDIR!"
  exit "$STATE_UNKNOWN"
fi

# Remove the snapshot on every exit path of the script.
trap 'rm -f "$templog"' EXIT

# A failed copy must stop the check here: continuing would compare against
# an empty or partial snapshot and later overwrite the old log file with it.
if ! cp "$logfile" "$templog"; then
  echo "Log check error: Unable to copy $logfile to $templog!"
  exit "$STATE_UNKNOWN"
fi

# From here on, $logfile refers to the snapshot, not the live log file.
logfile=$templog
# If the old log file doesn't exist, this must be the first time
# we're running this test, so copy the original log file over to
# the old diff file and exit
if [ ! -e "$oldlog" ]; then
  cat "$logfile" > "$oldlog"
  init_rc=$?
  # The temporary copy of the log is no longer needed on this path; remove
  # it so that first runs do not leave files behind in the temp directory.
  rm -f "$templog"
  if [ "$init_rc" -ne 0 ]; then
    # Without a usable old log file every run would look like a first run
    # and no match would ever be reported, so do not claim success.
    echo "Log check error: Unable to write old log file $oldlog!"
    exit "$STATE_UNKNOWN"
  fi
  echo "Log check data initialized..."
  exit "$STATE_OK"
fi
# The old log file exists, so compare it to the original log now.
# $tempdiff is the temporary file that receives the lines present in the
# current log but not in the old copy.
if command -v mktemp >/dev/null 2>&1; then
  tempdiff=$(mktemp "${TMPDIR}/check_log.XXXXXXXXXX")
else
  # No mktemp available: build the name from the time of day and the shell's
  # PID, and create the file with noclobber and a restrictive umask so that
  # an already existing file (or symlink) of that name is never written to.
  tempdiff="${TMPDIR}/check_log.$(date '+%H%M%S').$$"
  (umask 077; set -C; : > "$tempdiff") 2>/dev/null || tempdiff=""
fi
if [ -z "$tempdiff" ]; then
  rm -f "$templog"
  echo "Log check error: Unable to create a temporary file in $TMPDIR!"
  exit "$STATE_UNKNOWN"
fi

# Keep only the "<" lines of the diff, i.e. the lines that exist in the
# current log but not in the old one. Filtering on "^<" (instead of merely
# dropping "^>") also discards diff's own control lines such as "3,4d2" and
# "---", which the search pattern could otherwise match by accident.
diff "$logfile" "$oldlog" | grep "^<" > "$tempdiff"
# Count the number of matching log entries we have and handle errors when grep fails.
# The pattern is passed with -e so that a query starting with "-" is not
# mistaken for a grep option.
count=$(grep -c -e "$query" "$tempdiff" 2>&1)
grep_rc=$?
if [ "$grep_rc" -gt 1 ]; then
  # grep itself failed (e.g. invalid pattern); $count holds its error text.
  # Clean up both temporary files before leaving.
  rm -f "$tempdiff" "$templog"
  echo "Log check error: $count"
  exit "$STATE_UNKNOWN"
fi

# Get the last matching entry in the diff file. This uses the same matcher
# as the count above, so the reported entry is always one of the counted
# lines.
lastentry=$(grep -e "$query" "$tempdiff" | tail -n 1)
rm -f "$tempdiff"

# Remember the current state of the log for the next run.
cat "$logfile" > "$oldlog"

# Need to remove the temp file otherwise it just fills up the temp directory
rm -f "$templog"
# Report the outcome and pick the exit state:
#   - no matches: OK
#   - matches, MAX_WARNING set and the count does not exceed it: WARNING
#   - matches otherwise: CRITICAL
if [ "$count" != "0" ]; then
  # Print the total match count and the last entry we found
  echo "($count) $lastentry|match=$count;;;0"
  exitstatus=$STATE_CRITICAL
  if [ "$MAX_WARNING" ] && [ "$count" -le "$MAX_WARNING" ]; then
    exitstatus=$STATE_WARNING
  fi
else
  # no matches, exit with no error
  echo "Log check ok - 0 pattern matches found|match=$count;;;0"
  exitstatus=$STATE_OK
fi
exit "$exitstatus"