Compare commits

...

16 Commits

Author SHA1 Message Date
8822bfad31 Ignore recently-created temporary files (in the event that Ansible is doing shenanigans or something 2022-04-27 17:44:04 -05:00
edf1588c27 Fix a myriad of issues with that last script 2022-04-27 17:39:20 -05:00
815044fca0 Add a check for executables in /tmp
Yaknow, case we get owned
2022-04-27 17:25:04 -05:00
2d6a52f439 Make executable 2022-01-10 23:56:27 -06:00
9f8f59ecd3 Add check_temp 2022-01-10 21:58:49 -06:00
6e74d5d992 Use python2, not python for check_minecraft 2021-12-24 14:45:58 -06:00
4e7c418b04 Add a Minecraft checker script 2021-12-24 14:31:59 -06:00
c7f1097948 Revert "Revert "Add a quick little script to check a file's age""
This reverts commit 822c5193b8.
2021-12-11 15:58:58 -06:00
822c5193b8 Revert "Add a quick little script to check a file's age"
This reverts commit 6f85b4e493.
2021-12-09 16:45:23 -06:00
e7c70934f6 Revert "Add a readability check to that file"
This reverts commit dc4b522ef5.
2021-12-09 16:45:02 -06:00
dd66a4c03d Add justintime's edit of check_mem for ZFS compatibility 2021-12-09 16:39:23 -06:00
dc4b522ef5 Add a readability check to that file 2021-11-25 16:40:45 -06:00
6f85b4e493 Add a quick little script to check a file's age 2021-11-25 16:38:37 -06:00
ebfd7fbc3a Add check_ping_by_hostname 2021-10-15 19:17:13 -05:00
85de49d8ec Add check_cpu_stats plugin 2021-10-03 15:45:46 -05:00
98ab2f8f30 Fix typo in check_apt_pending 2021-10-03 15:35:12 -05:00
8 changed files with 1306 additions and 1 deletions

View File

@@ -16,7 +16,7 @@ if [ -n "$pending" ]; then
if (( pending >= threshold_crit )); then
echo "CRITICAL - $pending package updates pending"
exit 2
elif (( pending >= thresold_warn )); then
elif (( pending >= threshold_warn )); then
echo "WARNING - $pending package updates pending"
exit 1
elif (( pending > 0 )); then

192
check_cpu_stats Executable file
View File

@@ -0,0 +1,192 @@
#!/bin/bash
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
PROGNAME=`basename $0`
VERSION="Version 1.0,"
AUTHOR="2009, Mike Adolphs (http://www.matejunkie.com/)"
ST_OK=0
ST_WR=1
ST_CR=2
ST_UK=3
interval=1
print_version() {
echo "$VERSION $AUTHOR"
}
print_help() {
print_version $PROGNAME $VERSION
echo ""
echo "$PROGNAME is a Nagios plugin to monitor CPU utilization. It makes"
echo "use of /proc/stat and calculates it through Jiffies rather than"
echo "using another frontend tool like iostat or top."
echo "When using optional warning/critical thresholds all values except"
echo "idle are aggregated and compared to the thresholds. There's"
echo "currently no support for warning/critical thresholds for specific"
echo "usage parameters."
echo ""
echo "$PROGNAME [-i/--interval] [-w/--warning] [-c/--critical]"
echo ""
echo "Options:"
echo " --interval|-i)"
echo " Defines the pause between the two times /proc/stat is being"
echo " parsed. Higher values could lead to more accurate result."
echo " Default is: 1 second"
echo " --warning|-w)"
echo " Sets a warning level for CPU user. Default is: off"
echo " --critical|-c)"
echo " Sets a critical level for CPU user. Default is: off"
exit $ST_UK
}
while test -n "$1"; do
case "$1" in
--help|-h)
print_help
exit $ST_UK
;;
--version|-v)
print_version $PROGNAME $VERSION
exit $ST_UK
;;
--interval|-i)
interval=$2
shift
;;
--warning|-w)
warn=$2
shift
;;
--critical|-c)
crit=$2
shift
;;
*)
echo "Unknown argument: $1"
print_help
exit $ST_UK
;;
esac
shift
done
val_wcdiff() {
if [ ${warn} -gt ${crit} ]
then
wcdiff=1
fi
}
get_cpuvals() {
tmp1_cpu_user=`grep -m1 '^cpu' /proc/stat|awk '{print $2}'`
tmp1_cpu_nice=`grep -m1 '^cpu' /proc/stat|awk '{print $3}'`
tmp1_cpu_sys=`grep -m1 '^cpu' /proc/stat|awk '{print $4}'`
tmp1_cpu_idle=`grep -m1 '^cpu' /proc/stat|awk '{print $5}'`
tmp1_cpu_iowait=`grep -m1 '^cpu' /proc/stat|awk '{print $6}'`
tmp1_cpu_irq=`grep -m1 '^cpu' /proc/stat|awk '{print $7}'`
tmp1_cpu_softirq=`grep -m1 '^cpu' /proc/stat|awk '{print $8}'`
tmp1_cpu_total=`expr $tmp1_cpu_user + $tmp1_cpu_nice + $tmp1_cpu_sys + \
$tmp1_cpu_idle + $tmp1_cpu_iowait + $tmp1_cpu_irq + $tmp1_cpu_softirq`
sleep $interval
tmp2_cpu_user=`grep -m1 '^cpu' /proc/stat|awk '{print $2}'`
tmp2_cpu_nice=`grep -m1 '^cpu' /proc/stat|awk '{print $3}'`
tmp2_cpu_sys=`grep -m1 '^cpu' /proc/stat|awk '{print $4}'`
tmp2_cpu_idle=`grep -m1 '^cpu' /proc/stat|awk '{print $5}'`
tmp2_cpu_iowait=`grep -m1 '^cpu' /proc/stat|awk '{print $6}'`
tmp2_cpu_irq=`grep -m1 '^cpu' /proc/stat|awk '{print $7}'`
tmp2_cpu_softirq=`grep -m1 '^cpu' /proc/stat|awk '{print $8}'`
tmp2_cpu_total=`expr $tmp2_cpu_user + $tmp2_cpu_nice + $tmp2_cpu_sys + \
$tmp2_cpu_idle + $tmp2_cpu_iowait + $tmp2_cpu_irq + $tmp2_cpu_softirq`
diff_cpu_user=`echo "${tmp2_cpu_user} - ${tmp1_cpu_user}" | bc -l`
diff_cpu_nice=`echo "${tmp2_cpu_nice} - ${tmp1_cpu_nice}" | bc -l`
diff_cpu_sys=`echo "${tmp2_cpu_sys} - ${tmp1_cpu_sys}" | bc -l`
diff_cpu_idle=`echo "${tmp2_cpu_idle} - ${tmp1_cpu_idle}" | bc -l`
diff_cpu_iowait=`echo "${tmp2_cpu_iowait} - ${tmp1_cpu_iowait}" | bc -l`
diff_cpu_irq=`echo "${tmp2_cpu_irq} - ${tmp1_cpu_irq}" | bc -l`
diff_cpu_softirq=`echo "${tmp2_cpu_softirq} - ${tmp1_cpu_softirq}" \
| bc -l`
diff_cpu_total=`echo "${tmp2_cpu_total} - ${tmp1_cpu_total}" | bc -l`
cpu_user=`echo "scale=2; (1000*${diff_cpu_user}/${diff_cpu_total}+5)/10" \
| bc -l | sed 's/^\./0./'`
cpu_nice=`echo "scale=2; (1000*${diff_cpu_nice}/${diff_cpu_total}+5)/10" \
| bc -l | sed 's/^\./0./'`
cpu_sys=`echo "scale=2; (1000*${diff_cpu_sys}/${diff_cpu_total}+5)/10" \
| bc -l | sed 's/^\./0./'`
cpu_idle=`echo "scale=2; (1000*${diff_cpu_idle}/${diff_cpu_total}+5)/10" \
| bc -l | sed 's/^\./0./'`
cpu_iowait=`echo "scale=2; (1000*${diff_cpu_iowait}/${diff_cpu_total}+5)\\
/10" | bc -l | sed 's/^\./0./'`
cpu_irq=`echo "scale=2; (1000*${diff_cpu_irq}/${diff_cpu_total}+5)/10" \
| bc -l | sed 's/^\./0./'`
cpu_softirq=`echo "scale=2; (1000*${diff_cpu_softirq}/${diff_cpu_total}\\
+5)/10" | bc -l | sed 's/^\./0./'`
cpu_total=`echo "scale=2; (1000*${diff_cpu_total}/${diff_cpu_total}+5)\\
/10" | bc -l | sed 's/^\./0./'`
cpu_usage=`echo "(${cpu_user}+${cpu_nice}+${cpu_sys}+${cpu_iowait}+\\
${cpu_irq}+${cpu_softirq})/1" | bc`
}
do_output() {
output="user: ${cpu_user}, nice: ${cpu_nice}, sys: ${cpu_sys}, \
iowait: ${cpu_iowait}, irq: ${cpu_irq}, softirq: ${cpu_softirq} \
idle: ${cpu_idle}"
}
do_perfdata() {
perfdata="'user'=${cpu_user} 'nice'=${cpu_nice} 'sys'=${cpu_sys} \
'softirq'=${cpu_softirq} 'iowait'=${cpu_iowait} 'irq'=${cpu_irq} \
'idle'=${cpu_idle}"
}
if [ -n "$warn" -a -n "$crit" ]
then
val_wcdiff
if [ "$wcdiff" = 1 ]
then
echo "Please adjust your warning/critical thresholds. The warning\\
must be lower than the critical level!"
exit $ST_UK
fi
fi
get_cpuvals
do_output
do_perfdata
if [ -n "$warn" -a -n "$crit" ]
then
if [ "$cpu_usage" -ge "$warn" -a "$cpu_usage" -lt "$crit" ]
then
echo "WARNING - ${output} | ${perfdata}"
exit $ST_WR
elif [ "$cpu_usage" -ge "$crit" ]
then
echo "CRITICAL - ${output} | ${perfdata}"
exit $ST_CR
else
echo "OK - ${output} | ${perfdata}"
exit $ST_OK
fi
else
echo "OK - ${output} | ${perfdata}"
exit $ST_OK
fi

51
check_executables_in_tmp Executable file
View File

@@ -0,0 +1,51 @@
#! /bin/bash
#
# check_executables_in_tmpdir
# Check a directory for executables and become angry if we find them
#
# Copyright (C) 2022 Jacob Babor <jacob@babor.tech>
#
# Distributed under terms of the MIT license.
#
set -e
tmpdir="/tmp"
minfileage="3600"
#
# Compile a list of executables found in /tmp
#
# Note that we deliberately use the -perm flag instead of the -executable flag
#
# This is by design, as -executable will fail on systems with noexec on the
# filesystem we're checking. This runs counter to our goal here, which is just
# to see if some skid has dumped a cryptominer on the machine.
#
executables=""
while read line; do
# Ignore recently-created files
# This is so things like Ansible plays don't trigger us
filetimestamp="$(stat -c %Y -- "$line")"
now="$(date +%s)"
age="$(( now - filetimestamp ))"
if (( age <= minfileage )); then
continue
fi
# Add it to the list
if [ -z "$executables" ]; then
executables="$line"
else
executables="$executables, $line"
fi
done < <(find "$tmpdir" -type f -perm /u=x,g=x,o=x 2>/dev/null || true )
# If we found any, become angry
if [ -n "$executables" ]; then
echo "CRITICAL: Found executables in $tmpdir: $executables"
exit 2
else
echo "OK: No executables in $tmpdir older than ${minfileage}s"
exit 0
fi

170
check_file_age Executable file
View File

@@ -0,0 +1,170 @@
#! /bin/bash
#
# check_file_age
# Alerts if a file's age is beyond a specific threshold
# Copyright (C) 2021 Vintage Salt <rehashedsalt@cock.li>
#
# Distributed under terms of the MIT license.
#
set -e
# Read-only set-once variables
declare -r _name="$(basename -- "$0")"
# Options
declare -i _optcritthresh
declare -i _optwarnthresh
declare -i _opthelp
declare -i _optverbose
# Working variables
declare -a _args
declare _return
# Helper functions
log() {
# Print a line to the terminal if _optverbose is greater than $2
# $2 defaults to 0
# loglevel 0: Daily-use messages
# loglevel 1: Detailed but not quite debugging
# loglevel 2: Definitely debugging
[ -z "$1" ] && return 1
if (( _optverbose >= ${2:-0} )); then
printf "%s\\n" "$1"
fi
}
warn() {
# Print a yellow line to the terminal, respecting _optverbose
[ -z "$1" ] && return 1
if (( _optverbose >= ${2:-0} )); then
if [ -t 1 ]; then
printf "\\e[33m%s\\e[0m\\n" "$1"
else
printf "WARN: %s\\n" "$1"
fi
fi
}
error() {
# Print a red line to the terminal, exit if $2 is specified
[ -z "$1" ] && return 1
if [ -t 2 ]; then
printf "\\e[31m%s\\e[0m\\n" "$1" 1>&2
else
printf "ERROR: %s\\n" "$1" 1>&2
fi
[ -z "$2" ] && return
exit "${2:-1}"
}
has() {
# Parse out all arguments and try to find them in path
# If an argument cannot be found, set _return and fail
for prog in "$@"; do
if ! command -v "$prog" > /dev/null 2>&1; then
_return="$prog"
return 1
fi
done
return 0
}
# Core program functions
checkage() {
# Check a file's age against the values of _optwarnthres and _optcritthresh
file="${_args[0]}"
log "Checking file $file" 1
# Get some times
filetimestamp="$(stat -c %Y -- "$file")"
now="$(date +%s)"
# Get our age
age="$(( now - filetimestamp ))"
log "File is $age seconds old" 1
# Throw out warns and crits as necessary
if (( age >= _optcritthresh )); then
echo "CRITICAL: $file is $age seconds old (max $_optcritthresh)"
exit 2
elif (( age >= _optwarnthresh)); then
echo "WARNING: $file is $age seconds old (max $_optwarnthresh)"
exit 1
else
echo "OK: $file"
exit 0
fi
}
printhelp() {
cat << EOF
Usage: $_name <FILE> [OPTION]...
A Nagios monitoring plugin for checking a file's age
Arguments:
FILE The file to monitor
Flags:
-c The maximum age of the file in seconds before a CRITICAL status is
returned
-h Print this help text
-v Print more status messages. Stacks
-w The maximum age of the file in seconds before a WARNING status is
returned
Copyright (c) 2021 rehashedsalt@cock.li
Licensed under the MIT license
EOF
}
# Main
main() {
# Parse out arguments
while [ -n "$1" ]; do
# Parse out flags
while getopts ":c:hvw:" opt; do
case $opt in
c)
_optcritthresh="$OPTARG"
;;
h)
_opthelp=1
;;
v)
_optverbose+=1
;;
w)
_optwarnthresh="$OPTARG"
;;
:)
error "Option requires argument: -$OPTARG" 2
;;
*)
error "Invalid option: -$OPTARG" 2
;;
esac
done
# Store arguments
shift $((OPTIND - 1))
if [ -n "$1" ]; then
_args+=("$1")
shift
fi
unset OPTIND
done
# Early hook for help
[ -n "$_opthelp" ] && printhelp && exit 0
# Validate critical options
if [ -z "${_args[0]}" ]; then
error "Must specify a file" 50
fi
if ! (( _optcritthresh > 0 )) 2>/dev/null; then
error "Critical threshold must be an integer greater than 0" 50
fi
if ! (( _optwarnthresh > 0 )) 2>/dev/null; then
error "Warning threshold must be an integer greater than 0" 50
fi
# Validate core program dependencies
log "Validating dependencies" 2
if ! has basename; then
error "Failed to find program: $_return" 50
fi
# Do the do
checkage
}
main "$@"

409
check_mem_justintime Executable file
View File

@@ -0,0 +1,409 @@
#!/usr/bin/perl -w
# Heavily based on the script from:
# check_mem.pl Copyright (C) 2000 Dan Larsson <dl@tyfon.net>
# heavily modified by
# Justin Ellison <justin@techadvise.com>
#
# The MIT License (MIT)
# Copyright (c) 2011 justin@techadvise.com
# Permission is hereby granted, free of charge, to any person obtaining a copy of this
# software and associated documentation files (the "Software"), to deal in the Software
# without restriction, including without limitation the rights to use, copy, modify,
# merge, publish, distribute, sublicense, and/or sell copies of the Software, and to
# permit persons to whom the Software is furnished to do so, subject to the following conditions:
# The above copyright notice and this permission notice shall be included in all copies
# or substantial portions of the Software.
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
# INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
# PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE
# FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT
# OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
# OTHER DEALINGS IN THE SOFTWARE.
# Tell Perl what we need to use
use strict;
use Getopt::Std;
#TODO - Convert to Nagios::Plugin
#TODO - Use an alarm
# Predefined exit codes for Nagios
use vars qw($opt_c $opt_f $opt_u $opt_w $opt_C $opt_v $opt_h %exit_codes);
%exit_codes = ('UNKNOWN' , 3,
'OK' , 0,
'WARNING' , 1,
'CRITICAL', 2,
);
# Get our variables, do our checking:
init();
# Get the numbers:
my ($free_memory_kb,$used_memory_kb,$caches_kb,$hugepages_kb) = get_memory_info();
print "$free_memory_kb Free\n$used_memory_kb Used\n$caches_kb Cache\n" if ($opt_v);
print "$hugepages_kb Hugepages\n" if ($opt_v and $opt_h);
if ($opt_C) { #Do we count caches as free?
$used_memory_kb -= $caches_kb;
$free_memory_kb += $caches_kb;
}
if ($opt_h) {
$used_memory_kb -= $hugepages_kb;
}
print "$used_memory_kb Used (after Hugepages)\n" if ($opt_v);
# Round to the nearest KB
$free_memory_kb = sprintf('%.0f',$free_memory_kb);
$used_memory_kb = sprintf('%.0f',$used_memory_kb);
$caches_kb = sprintf('%.0f',$caches_kb);
# Tell Nagios what we came up with
tell_nagios($used_memory_kb,$free_memory_kb,$caches_kb,$hugepages_kb);
sub tell_nagios {
my ($used,$free,$caches,$hugepages) = @_;
# Calculate Total Memory
my $total = $free + $used;
print "$total Total\n" if ($opt_v);
my $perf_warn;
my $perf_crit;
if ( $opt_u ) {
$perf_warn = int(${total} * $opt_w / 100);
$perf_crit = int(${total} * $opt_c / 100);
} else {
$perf_warn = int(${total} * ( 100 - $opt_w ) / 100);
$perf_crit = int(${total} * ( 100 - $opt_c ) / 100);
}
my $perfdata = "|TOTAL=${total}KB;;;; USED=${used}KB;${perf_warn};${perf_crit};; FREE=${free}KB;;;; CACHES=${caches}KB;;;;";
$perfdata .= " HUGEPAGES=${hugepages}KB;;;;" if ($opt_h);
if ($opt_f) {
my $percent = sprintf "%.1f", ($free / $total * 100);
if ($percent <= $opt_c) {
finish("CRITICAL - $percent% ($free kB) free!$perfdata",$exit_codes{'CRITICAL'});
}
elsif ($percent <= $opt_w) {
finish("WARNING - $percent% ($free kB) free!$perfdata",$exit_codes{'WARNING'});
}
else {
finish("OK - $percent% ($free kB) free.$perfdata",$exit_codes{'OK'});
}
}
elsif ($opt_u) {
my $percent = sprintf "%.1f", ($used / $total * 100);
if ($percent >= $opt_c) {
finish("CRITICAL - $percent% ($used kB) used!$perfdata",$exit_codes{'CRITICAL'});
}
elsif ($percent >= $opt_w) {
finish("WARNING - $percent% ($used kB) used!$perfdata",$exit_codes{'WARNING'});
}
else {
finish("OK - $percent% ($used kB) used.$perfdata",$exit_codes{'OK'});
}
}
}
# Show usage
sub usage() {
print "\ncheck_mem.pl v1.0 - Nagios Plugin\n\n";
print "usage:\n";
print " check_mem.pl -<f|u> -w <warnlevel> -c <critlevel>\n\n";
print "options:\n";
print " -f Check FREE memory\n";
print " -u Check USED memory\n";
print " -C Count OS caches as FREE memory\n";
print " -h Remove hugepages from the total memory count\n";
print " -w PERCENT Percent free/used when to warn\n";
print " -c PERCENT Percent free/used when critical\n";
print "\nCopyright (C) 2000 Dan Larsson <dl\@tyfon.net>\n";
print "check_mem.pl comes with absolutely NO WARRANTY either implied or explicit\n";
print "This program is licensed under the terms of the\n";
print "MIT License (check source code for details)\n";
exit $exit_codes{'UNKNOWN'};
}
sub get_memory_info {
my $used_memory_kb = 0;
my $free_memory_kb = 0;
my $total_memory_kb = 0;
my $caches_kb = 0;
my $hugepages_nr = 0;
my $hugepages_size = 0;
my $hugepages_kb = 0;
my $uname;
if ( -e '/usr/bin/uname') {
$uname = `/usr/bin/uname -a`;
}
elsif ( -e '/bin/uname') {
$uname = `/bin/uname -a`;
}
else {
die "Unable to find uname in /usr/bin or /bin!\n";
}
print "uname returns $uname" if ($opt_v);
if ( $uname =~ /Linux/ ) {
my @meminfo = `/bin/cat /proc/meminfo`;
foreach (@meminfo) {
chomp;
if (/^Mem(Total|Free):\s+(\d+) kB/) {
my $counter_name = $1;
if ($counter_name eq 'Free') {
$free_memory_kb = $2;
}
elsif ($counter_name eq 'Total') {
$total_memory_kb = $2;
}
}
elsif (/^(Buffers|Cached|SReclaimable):\s+(\d+) kB/) {
$caches_kb += $2;
}
elsif (/^Shmem:\s+(\d+) kB/) {
$caches_kb -= $1;
}
# These variables will most likely be overwritten once we look into
# /sys/kernel/mm/hugepages, unless we are running on linux <2.6.27
# and have to rely on them
elsif (/^HugePages_Total:\s+(\d+)/) {
$hugepages_nr = $1;
}
elsif (/^Hugepagesize:\s+(\d+) kB/) {
$hugepages_size = $1;
}
}
$hugepages_kb = $hugepages_nr * $hugepages_size;
$used_memory_kb = $total_memory_kb - $free_memory_kb;
# Read hugepages info from the newer sysfs interface if available
my $hugepages_sysfs_dir = '/sys/kernel/mm/hugepages';
if ( -d $hugepages_sysfs_dir ) {
# Reset what we read from /proc/meminfo
$hugepages_kb = 0;
opendir(my $dh, $hugepages_sysfs_dir)
|| die "Can't open $hugepages_sysfs_dir: $!";
while (my $entry = readdir $dh) {
if ($entry =~ /^hugepages-(\d+)kB/) {
$hugepages_size = $1;
my $hugepages_nr_file = "$hugepages_sysfs_dir/$entry/nr_hugepages";
open(my $fh, '<', $hugepages_nr_file)
|| die "Can't open $hugepages_nr_file for reading: $!";
$hugepages_nr = <$fh>;
close($fh);
$hugepages_kb += $hugepages_nr * $hugepages_size;
}
}
closedir($dh);
}
}
elsif ( $uname =~ /HP-UX/ ) {
# HP-UX, thanks to Christoph Fürstaller
my @meminfo = `/usr/bin/sudo /usr/local/bin/kmeminfo`;
foreach (@meminfo) {
chomp;
if (/^Physical memory\s\s+=\s+(\d+)\s+(\d+.\d)g/) {
$total_memory_kb = ($2 * 1024 * 1024);
}
elsif (/^Free memory\s\s+=\s+(\d+)\s+(\d+.\d)g/) {
$free_memory_kb = ($2 * 1024 * 1024);
}
}
$used_memory_kb = $total_memory_kb - $free_memory_kb;
}
elsif ( $uname =~ /FreeBSD/ ) {
# The FreeBSD case. 2013-03-19 www.claudiokuenzler.com
# free mem = Inactive*Page Size + Cache*Page Size + Free*Page Size
my $pagesize = `sysctl vm.stats.vm.v_page_size`;
$pagesize =~ s/[^0-9]//g;
my $mem_inactive = 0;
my $mem_cache = 0;
my $mem_free = 0;
my $mem_total = 0;
my $free_memory = 0;
my @meminfo = `/sbin/sysctl vm.stats.vm`;
foreach (@meminfo) {
chomp;
if (/^vm.stats.vm.v_inactive_count:\s+(\d+)/) {
$mem_inactive = ($1 * $pagesize);
}
elsif (/^vm.stats.vm.v_cache_count:\s+(\d+)/) {
$mem_cache = ($1 * $pagesize);
}
elsif (/^vm.stats.vm.v_free_count:\s+(\d+)/) {
$mem_free = ($1 * $pagesize);
}
elsif (/^vm.stats.vm.v_page_count:\s+(\d+)/) {
$mem_total = ($1 * $pagesize);
}
}
$free_memory = $mem_inactive + $mem_cache + $mem_free;
$free_memory_kb = ( $free_memory / 1024);
$total_memory_kb = ( $mem_total / 1024);
$used_memory_kb = $total_memory_kb - $free_memory_kb;
$caches_kb = ($mem_cache / 1024);
}
elsif ( $uname =~ /joyent/ ) {
# The SmartOS case. 2014-01-10 www.claudiokuenzler.com
# free mem = pagesfree * pagesize
my $pagesize = `pagesize`;
my $phys_pages = `kstat -p unix:0:system_pages:pagestotal | awk '{print \$NF}'`;
my $free_pages = `kstat -p unix:0:system_pages:pagesfree | awk '{print \$NF}'`;
my $arc_size = `kstat -p zfs:0:arcstats:size | awk '{print \$NF}'`;
my $arc_size_kb = $arc_size / 1024;
print "Pagesize is $pagesize" if ($opt_v);
print "Total pages is $phys_pages" if ($opt_v);
print "Free pages is $free_pages" if ($opt_v);
print "Arc size is $arc_size" if ($opt_v);
$caches_kb += $arc_size_kb;
$total_memory_kb = $phys_pages * $pagesize / 1024;
$free_memory_kb = $free_pages * $pagesize / 1024;
$used_memory_kb = $total_memory_kb - $free_memory_kb;
}
elsif ( $uname =~ /SunOS/ ) {
eval "use Sun::Solaris::Kstat";
if ($@) { #Kstat not available
if ($opt_C) {
print "You can't report on Solaris caches without Sun::Solaris::Kstat available!\n";
exit $exit_codes{UNKNOWN};
}
my @vmstat = `/usr/bin/vmstat 1 2`;
my $line;
foreach (@vmstat) {
chomp;
$line = $_;
}
$free_memory_kb = (split(/ /,$line))[5] / 1024;
my @prtconf = `/usr/sbin/prtconf`;
foreach (@prtconf) {
if (/^Memory size: (\d+) Megabytes/) {
$total_memory_kb = $1 * 1024;
}
}
$used_memory_kb = $total_memory_kb - $free_memory_kb;
}
else { # We have kstat
my $kstat = Sun::Solaris::Kstat->new();
my $phys_pages = ${kstat}->{unix}->{0}->{system_pages}->{physmem};
my $free_pages = ${kstat}->{unix}->{0}->{system_pages}->{freemem};
# We probably should account for UFS caching here, but it's unclear
# to me how to determine UFS's cache size. There's inode_cache,
# and maybe the physmem variable in the system_pages module??
# In the real world, it looks to be so small as not to really matter,
# so we don't grab it. If someone can give me code that does this,
# I'd be glad to put it in.
my $arc_size = (exists ${kstat}->{zfs} && ${kstat}->{zfs}->{0}->{arcstats}->{size}) ?
${kstat}->{zfs}->{0}->{arcstats}->{size} / 1024
: 0;
$caches_kb += $arc_size;
my $pagesize = `pagesize`;
$total_memory_kb = $phys_pages * $pagesize / 1024;
$free_memory_kb = $free_pages * $pagesize / 1024;
$used_memory_kb = $total_memory_kb - $free_memory_kb;
}
}
elsif ( $uname =~ /Darwin/ ) {
$total_memory_kb = (split(/ /,`/usr/sbin/sysctl hw.memsize`))[1]/1024;
my $pagesize = (split(/ /,`/usr/sbin/sysctl hw.pagesize`))[1];
$caches_kb = 0;
my @vm_stat = `/usr/bin/vm_stat`;
foreach (@vm_stat) {
chomp;
if (/^(Pages free):\s+(\d+)\.$/) {
$free_memory_kb = $2*$pagesize/1024;
}
# 'caching' concept works different on MACH
# this should be a reasonable approximation
elsif (/^Pages (inactive|purgable):\s+(\d+).$/) {
$caches_kb += $2*$pagesize/1024;
}
}
$used_memory_kb = $total_memory_kb - $free_memory_kb;
}
elsif ( $uname =~ /AIX/ ) {
my @meminfo = `/usr/bin/vmstat -vh`;
foreach (@meminfo) {
chomp;
if (/^\s*([0-9.]+)\s+(.*)/) {
my $counter_name = $2;
if ($counter_name eq 'memory pages') {
$total_memory_kb = $1*4;
}
if ($counter_name eq 'free pages') {
$free_memory_kb = $1*4;
}
if ($counter_name eq 'file pages') {
$caches_kb = $1*4;
}
if ($counter_name eq 'Number of 4k page frames loaned') {
$free_memory_kb += $1*4;
}
}
}
$used_memory_kb = $total_memory_kb - $free_memory_kb;
}
else {
if ($opt_C) {
print "You can't report on $uname caches!\n";
exit $exit_codes{UNKNOWN};
}
my $command_line = `vmstat | tail -1 | awk '{print \$4,\$5}'`;
chomp $command_line;
my @memlist = split(/ /, $command_line);
# Define the calculating scalars
$used_memory_kb = $memlist[0]/1024;
$free_memory_kb = $memlist[1]/1024;
$total_memory_kb = $used_memory_kb + $free_memory_kb;
}
return ($free_memory_kb,$used_memory_kb,$caches_kb,$hugepages_kb);
}
sub init {
# Get the options
if ($#ARGV le 0) {
&usage;
}
else {
getopts('c:fuChvw:');
}
# Shortcircuit the switches
if (!$opt_w or $opt_w == 0 or !$opt_c or $opt_c == 0) {
print "*** You must define WARN and CRITICAL levels!\n";
&usage;
}
elsif (!$opt_f and !$opt_u) {
print "*** You must select to monitor either USED or FREE memory!\n";
&usage;
}
# Check if levels are sane
if ($opt_w <= $opt_c and $opt_f) {
print "*** WARN level must not be less than CRITICAL when checking FREE memory!\n";
&usage;
}
elsif ($opt_w >= $opt_c and $opt_u) {
print "*** WARN level must not be greater than CRITICAL when checking USED memory!\n";
&usage;
}
}
sub finish {
my ($msg,$state) = @_;
print "$msg\n";
exit $state;
}

150
check_minecraft Executable file
View File

@@ -0,0 +1,150 @@
#!/usr/bin/env python2
# coding=utf8
from datetime import datetime, timedelta
import sys, string, socket, time, argparse
# Exit statuses recognized by Nagios.
STATE_OK = 0
STATE_WARNING = 1
STATE_CRITICAL = 2
STATE_UNKNOWN = 3
# Output formatting string.
OUTPUT_OK = "MINECRAFT OK: {0} - {1} bytes in {2:.3} second response time|time={2}s;{3};{4};0.0;{5}"
OUTPUT_WARNING = "MINECRAFT WARNING: {0} - {1} bytes in {2:.3} second response time|time={2}s;{3};{4};0.0;{5}"
OUTPUT_CRITICAL = "MINECRAFT CRITICAL: {0} - {1} bytes in {2:.3} second response time|time={2}s;{3};{4};0.0;{5}"
OUTPUT_EXCEPTION = "MINECRAFT CRITICAL: {0}"
OUTPUT_UNKNOWN = "MINECRAFT UNKNOWN: Invalid arguments"
# Minecraft packet ID:s, delimiters and encoding.
MC_SERVER_LIST_PING = "\xfe"
MC_DISCONNECT = "\xff"
MC_DELIMITER = u"\xa7"
MC_ENCODING = "utf-16be"
def log(start, message):
print("{0}: {1}".format(datetime.now() - start, message))
def get_server_info(host, port, num_checks, timeout, verbose):
start_time = datetime.now()
total_delta = timedelta()
byte_count = len(MC_SERVER_LIST_PING) * num_checks
# Contact the server multiple times to get a stable average response time.
for i in range(0, num_checks):
if (verbose): iteration = "Iteration {0}/{1}: ".format(i + 1, num_checks)
# Save start time and connect to server.
if (verbose): log(start_time, "{0}Connecting to {1} on port {2}.".format(iteration, host, port))
net_start_time = datetime.now()
s = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
s.settimeout(timeout)
s.connect((host, port))
# Send Minecraft Server List Ping packet.
if (verbose): log(start_time, "{0}Sending Server List Ping.".format(iteration))
s.send(MC_SERVER_LIST_PING)
# Receive answer from server. The largest answer returned by the server that also works with the Minecraft client
# seems to be around 520 bytes (259 unicode character at 2 bytes each plus one start byte and one length byte).
if (verbose): log(start_time, "{0}Receiving data...".format(iteration))
data = s.recv(550)
data_len = len(data)
byte_count += data_len
if (verbose): log(start_time, "{0}Received {1} bytes".format(iteration, data_len))
s.close()
# Check if returned data seems valid. If not, throw AssertionError exception.
if (verbose):
if (data[0] == MC_DISCONNECT):
log(start_time, "Returned data seems valid.")
else:
log(start_time, "Returned data is invalid. First byte is {0:#x}.".format(ord(data[0])))
assert data[0] == MC_DISCONNECT
# Save response time for later average calculation.
delta = datetime.now() - net_start_time
total_delta += delta
time.sleep(0.1)
# Calculate the average response time in seconds
total_response = total_delta.seconds + total_delta.microseconds / 1000000.0
average_response = total_response / num_checks
# Decode and split returned skipping the first two bytes.
info = data[3:].decode(MC_ENCODING).split(MC_DELIMITER)
motd = info[:]
del motd[-1] # removing max_players
del motd[-1] # removing players
motd = ''.join(motd).replace("\n","") # removing newlines
return {'motd': motd,
'players': int(info[-2]),
'max_players': int(info[-1]),
'byte_count': byte_count,
'response_time': average_response}
def main():
parser = argparse.ArgumentParser(description="This plugin will try to connect to a Minecraft server.");
parser.add_argument('-H', '--hostname', dest='hostname', metavar='ADDRESS', required=True, help="host name or IP address")
parser.add_argument('-p', '--port', dest='port', type=int, default=25565, metavar='INTEGER', help="port number (default: 25565)")
parser.add_argument('-n', '--number-of-checks', dest='num_checks', type=int, default=5, metavar='INTEGER', help="number of checks to get stable average response time (default: 5)")
parser.add_argument('-m', '--motd', dest='motd', default='A Minecraft Server', metavar='STRING', help="expected motd in server response (default: A Minecraft Server)")
parser.add_argument('-f', '--warn-on-full', dest='full', action='store_true', help="generate warning if server is full")
parser.add_argument('-w', '--warning', dest='warning', type=float, default=0.0, metavar='DOUBLE', help="response time to result in warning status (seconds)")
parser.add_argument('-c', '--critical', dest='critical', type=float, default=0.0, metavar='DOUBLE', help="response time to result in critical status (seconds)")
parser.add_argument('-t', '--timeout', dest='timeout', type=float, default=10.0, metavar='DOUBLE', help="seconds before connection times out (default: 10)")
parser.add_argument('-v', '--verbose', dest='verbose', action='store_true', help="show details for command-line debugging (Nagios may truncate output)")
# Parse the arguments. If it failes, exit overriding exit code.
try:
args = parser.parse_args()
except SystemExit:
print(OUTPUT_UNKNOWN)
sys.exit(STATE_UNKNOWN)
try:
info = get_server_info(args.hostname, args.port, args.num_checks, args.timeout, args.verbose)
if string.find(info['motd'], args.motd) > -1:
# Check if response time is above critical level.
if args.critical and info['response_time'] > args.critical:
print(OUTPUT_CRITICAL.format("{0} second response time".format(info['response_time']), info['byte_count'], info['response_time'], args.warning, args.critical, args.timeout))
sys.exit(STATE_CRITICAL)
# Check if response time is above warning level.
if args.warning and info['response_time'] > args.warning:
print(OUTPUT_WARNING.format("{0} second response time".format(info['response_time']), info['byte_count'], info['response_time'], args.warning, args.critical, args.timeout))
sys.exit(STATE_WARNING)
# Check if server is full.
if args.full and info['players'] == info['max_players']:
print(OUTPUT_WARNING.format("Server full! {0} players online".format(info['players']), info['byte_count'], info['response_time'], args.warning, args.critical, args.timeout))
sys.exit(STATE_WARNING)
print(OUTPUT_OK.format("{0}/{1} players online".format(info['players'], info['max_players']), info['byte_count'], info['response_time'], args.warning, args.critical, args.timeout))
sys.exit(STATE_OK)
else:
print(OUTPUT_WARNING.format("Unexpected MOTD, {0}".format(info['motd']), info['byte_count'], info['response_time'], args.warning, args.critical, args.timeout))
sys.exit(STATE_WARNING)
except socket.error as msg:
print(OUTPUT_EXCEPTION.format(msg))
sys.exit(STATE_CRITICAL)
except AssertionError:
print(OUTPUT_EXCEPTION.format("Invalid data returned by server"))
sys.exit(STATE_CRITICAL)
except UnicodeDecodeError:
print(OUTPUT_EXCEPTION.format("Unable to decode server response"))
sys.exit(STATE_CRITICAL)
if __name__ == "__main__":
main()

38
check_ping_by_hostname Executable file
View File

@@ -0,0 +1,38 @@
#!/bin/bash
#
# check_ping_by_hostname
#
# Attempts to resolve the name for and ping ourselves based on the device's
# hostname.
#
name="$HOSTNAME"
# Ensure $name is available
if [ -z "$name" ]; then
echo "CRITICAL: No hostname(?!)"
exit 2
fi
# Ensure we have the tools we need
for cmd in dig ping; do
if ! command -v "$cmd" > /dev/null 2>&1; then
echo "UNKNOWN: Missing command for check: $cmd"
exit 3
fi
done
# Ensure we can dig ourselves
if [ -z "$(dig +short "$name")" ]; then
echo "CRITICAL: Could not resolve hostname or found empty record: $name"
exit 2
fi
# Ping ourselves
if ! ping "$name" -c 1 > /dev/null 2>&1; then
echo "CRITICAL: Could not ping self"
exit 2
else
echo "OK"
exit 0
fi

295
check_temp Executable file
View File

@@ -0,0 +1,295 @@
#!/bin/bash
################################################################################
# #
# Copyright (C) 2011 Jack-Benny Persson <jake@cyberinfo.se> #
# #
# This program is free software; you can redistribute it and/or modify #
# it under the terms of the GNU General Public License as published by #
# the Free Software Foundation; either version 2 of the License, or #
# (at your option) any later version. #
# #
# This program is distributed in the hope that it will be useful, #
# but WITHOUT ANY WARRANTY; without even the implied warranty of #
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the #
# GNU General Public License for more details. #
# #
# You should have received a copy of the GNU General Public License #
# along with this program; if not, write to the Free Software #
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA #
# #
################################################################################
###############################################################################
# #
# Nagios plugin to monitor CPU and M/B temperature with sensors. #
# Written in Bash (and uses sed & awk). #
# Latest version of check_temp can be found at the below URL: #
# https://github.com/jackbenny/check_temp #
# #
# If you are having problems getting it to work, check the instructions in #
# the README first. It walks you though install lm-sensors and getting it to #
# display sensor data. #
# #
###############################################################################
VERSION="Version 1.2"
AUTHOR="(c) 2011 Jack-Benny Persson (jack-benny@cyberinfo.se), (c) 2020 Onkobu Tanaake (oss@onkobutanaake.de)"
# Sensor program
SENSORPROG=$(whereis -b -B /{bin,sbin,usr} /{bin,sbin,usr}/* -f sensors | awk '{print $2}')
# Ryan's note: utils.sh is installed with nagios-plugins in with the plugins
# Check if utils.sh exists. This lets you use check_domain in a testing environment
# or outside of Nagios.
if [ -e "$PROGPATH/utils.sh" ]; then
. "$PROGPATH/utils.sh"
else
STATE_OK=0
STATE_WARNING=1
STATE_CRITICAL=2
STATE_UNKNOWN=3
# STATE_DEPENDENT=4 (Commented because it's unused.)
fi
shopt -s extglob
#### Functions ####
# Print version information
print_version()
{
echo "$0 - $VERSION"
}
#Print help information
print_help()
{
print_version
echo "$AUTHOR"
echo "Monitor temperature with the use of sensors"
/bin/cat <<EOT
Options:
-h, --help
Print detailed help screen
-V, --version
Print version information
-v, --verbose
Verbose output
-s, --sensor <WORD[,DISPLAY_NAME]>
Set what to monitor, for example CPU or MB (or M/B). Check sensors for the
correct word. Default is CPU. A different display name can be used in output,
by adding it next to sensor with a comma.
It can be used more than once, with different warning/critical thresholds optionally.
-w, --warning <INTEGER>
Exit with WARNING status if above INTEGER degrees
-c, --critical <INTEGER>
Exit with CRITICAL status if above INTEGER degrees
Warning and critical thresholds must be provided before the corresponding --sensor option.
-n
Use the new sed based filter in case classic filter yields no temperature.
Examples:
./check_temp.sh [-n] -w 65 -c 75 --sensor CPU
./check_temp.sh [-n] -w 65 -c 75 --sensor CPU --sensor temp1
./check_temp.sh [-n] -w 65 -c 75 --sensor CPU -w 75 -c 85 --sensor temp1,GPU
EOT
}
###### MAIN ########
# Warning threshold
thresh_warn=
# Critical threshold
thresh_crit=
# Hardware to monitor
default_sensor="CPU"
sensor_declared=false
STATE=$STATE_OK
# See if we have sensors program installed and can execute it
if [[ ! -x "$SENSORPROG" ]]; then
echo "It appears you don't have lm-sensors installed. You may find help in the readme for this script."
exit $STATE_UNKNOWN
fi
function set_state {
[[ "$STATE" -lt "$1" ]] && STATE=$1
}
function process_sensor {
sensor=$(echo $1 | cut -d, -f1)
sensor_display=$(echo $1 | cut -d, -f2)
# Check if a sensor were specified
if [[ -z "$sensor" ]]; then
# No sensor to monitor were specified
echo "No sensor specified"
print_help
exit $STATE_UNKNOWN
fi
# Check if the thresholds have been set correctly
if [[ -z "$thresh_warn" || -z "$thresh_crit" ]]; then
# One or both thresholds were not specified
echo "Threshold not set"
print_help
exit $STATE_UNKNOWN
elif [[ "$thresh_crit" -lt "$thresh_warn" ]]; then
# The warning threshold must be lower than the critical threshold
echo "Warning temperature should be lower than critical"
print_help
exit $STATE_UNKNOWN
fi
# Get the temperature
# Grep the first float with a plus sign and keep only the integer
if [ $CLASSIC_FILTER -eq 1 ]; then
WHOLE_TEMP=$(${SENSORPROG} | grep "$sensor" | head -n1 | grep -o "+[0-9]\+\(\.[0-9]\+\)\?[^ \t,()]*" | head -n1)
else
WHOLE_TEMP=$(${SENSORPROG} -A "$sensor" | sed -n '2 p' | grep -o "+[0-9]\+\(\.[0-9]\+\)\?[^ \t,()]*" | head -n1)
fi
TEMPF=$(echo "$WHOLE_TEMP" | grep -o "[0-9]\+\(\.[0-9]\+\)\?")
TEMP=$(echo "$TEMPF" | cut -d. -f1)
# Verbose output
if [[ "$verbosity" -ge 1 ]]; then
/bin/cat <<__EOT
Debugging information:
Warning threshold: $thresh_warn
Critical threshold: $thresh_crit
Verbosity level: $verbosity
Current $sensor temperature: $TEMP
__EOT
echo "Temperature lines directly from sensors:"
${SENSORPROG}
fi
# Get performance data for Nagios "Performance Data" field
PERFDATA="$PERFDATA $sensor_display=$TEMP;$thresh_warn;$thresh_crit"
# And finally check the temperature against our thresholds
if [[ "$TEMP" != +([0-9]) ]]; then
# Temperature not found for that sensor
OUTPUT_TEXT="$OUTPUT_TEXT, No data found for sensor ($sensor)"
set_state $STATE_UNKNOWN
elif [[ "$TEMP" -gt "$thresh_crit" ]]; then
# Temperature is above critical threshold
OUTPUT_TEXT="$OUTPUT_TEXT, $sensor_display has temperature: $WHOLE_TEMP"
set_state $STATE_CRITICAL
elif [[ "$TEMP" -gt "$thresh_warn" ]]; then
# Temperature is above warning threshold
OUTPUT_TEXT="$OUTPUT_TEXT, $sensor_display has temperature: $WHOLE_TEMP"
set_state $STATE_WARNING
else
# Temperature is ok
OUTPUT_TEXT="$OUTPUT_TEXT, $sensor_display has temperature: $WHOLE_TEMP"
set_state $STATE_OK
fi
}
CLASSIC_FILTER=1
# Parse command line options
while [[ -n "$1" ]]; do
case "$1" in
-h | --help)
print_help
exit $STATE_OK
;;
-V | --version)
print_version
exit $STATE_OK
;;
-v | --verbose)
: $(( verbosity++ ))
shift
;;
-w | --warning)
if [[ -z "$2" ]]; then
# Threshold not provided
echo "Option $1 requires an argument"
print_help
exit $STATE_UNKNOWN
elif [[ "$2" = +([0-9]) ]]; then
# Threshold is an integer
thresh=$2
else
# Threshold is not an integer
echo "Threshold must be an integer"
print_help
exit $STATE_UNKNOWN
fi
thresh_warn=$thresh
shift 2
;;
-c | --critical)
if [[ -z "$2" ]]; then
# Threshold not provided
echo "Option '$1' requires an argument"
print_help
exit $STATE_UNKNOWN
elif [[ "$2" = +([0-9]) ]]; then
# Threshold is an integer
thresh=$2
else
# Threshold is not an integer
echo "Threshold must be an integer"
print_help
exit $STATE_UNKNOWN
fi
thresh_crit=$thresh
shift 2
;;
-s | --sensor)
if [[ -z "$2" ]]; then
echo "Option $1 requires an argument"
print_help
exit $STATE_UNKNOWN
fi
sensor_declared=true
sensors_to_check="$2"
shift 2
;;
-n | --new-filter)
CLASSIC_FILTER=0
shift 1
;;
*)
echo "Invalid option '$1'"
print_help
exit $STATE_UNKNOWN
;;
esac
# argument order is irrelevant, Icinga2 gives no guarantees
# as soon as there are enough output is generated
if [ ! -z "$thresh_warn" ] && [ ! -z "$thresh_crit" ] && [ ! -z "$sensors_to_check" -o $# -eq 0 ]; then
if [ "$sensor_declared" = false ]; then
process_sensor "$default_sensor"
else
process_sensor "$sensors_to_check"
fi
fi
done
case "$STATE" in
"$STATE_OK") STATE_TEXT="OK" ;;
"$STATE_WARNING") STATE_TEXT="WARNING" ;;
"$STATE_CRITICAL") STATE_TEXT="CRITICAL" ;;
"$STATE_UNKNOWN") STATE_TEXT="UNKNOWN" ;;
esac
OUTPUT_TEXT=$(echo $OUTPUT_TEXT | sed -e 's/, //')
echo "TEMPERATURE $STATE_TEXT - $OUTPUT_TEXT |$PERFDATA"
exit $STATE