version 1.1, 2006/05/01 19:11:23 |
version 1.30, 2009/11/09 23:13:04 |
|
|
#!/usr/bin/perl
|
#!/usr/bin/perl -T |
# $RedRiver$
|
# $RedRiver: check_hw_sensors,v 1.29 2009/11/09 23:06:26 andrew Exp $ |
########################################################################
|
######################################################################## |
# check_sensors *** A nagios check for OpenBSD sensors
|
# check_hw_sensors *** A nagios check for OpenBSD sysctl hw.sensors |
#
|
# |
# 2006.05.01 #*#*# andrew fresh <andrew@mad-techies.org>
|
# 2006.05.01 #*#*# andrew fresh <andrew@mad-techies.org> |
########################################################################
|
######################################################################## |
use strict;
|
use strict; |
use warnings;
|
use warnings; |
|
|
|
%ENV = (); |
|
|
|
use constant NAGIOS_OUTPUT => 1; |
|
|
|
my $License = <<'EOL'; |
|
Copyright (c) 2009 Andrew Fresh <andrew@afresh1.com> |
|
Permission to use, copy, modify, and distribute this software for any |
|
purpose with or without fee is hereby granted, provided that the above |
|
copyright notice and this permission notice appear in all copies. |
|
|
|
THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES |
|
WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF |
|
MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR |
|
ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES |
|
WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN |
|
ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
|
OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
|
EOL |
|
|
|
use POSIX; |
|
use Config; |
|
use lib "/usr/local/libexec/nagios"; |
|
use utils qw($TIMEOUT %ERRORS &support); |
|
|
|
use Getopt::Long; |
|
Getopt::Long::Configure('bundling'); |
|
|
|
my $PROGNAME = "check_hw_sensors"; |
|
|
|
my $SYSCTL = '/sbin/sysctl'; |
|
my $GETCAP = '/usr/bin/getcap'; |
|
my $BASE = 'hw.sensors'; |
|
my $DEFAULT_CONFIG = '/etc/sensorsd.conf'; |
|
my $OSVer = $Config{'osvers'} || 0; |
|
|
|
my $state = 'UNKNOWN'; # tells whether the it is warning, critical, or OK |
|
my %states; # This stores the count of states; |
|
my $opt_V; |
|
my $opt_h; |
|
my $ignore_status; |
|
my $filename; |
|
my $sensor; |
|
my $warning; |
|
my $critical; |
|
|
|
my $CHECK_SENSOR = $BASE; |
|
my %CHECKS; |
|
my %SENSORS; |
|
|
|
#Option checking |
|
my $status = GetOptions( |
|
"version|V" => \$opt_V, |
|
"help|h" => \$opt_h, |
|
"ignore-status|i" => \$ignore_status, |
|
"filename|f:s" => \$filename, |
|
"sensor|s=s" => \$sensor, |
|
"warning|w=s" => \$warning, |
|
"critical|c=s" => \$critical, |
|
); |
|
|
|
# set the default this way so it only happens if someone typed -f or --filename |
|
$filename = $DEFAULT_CONFIG if ( defined $filename && $filename eq '' ); |
|
|
|
# Stuff is output in this file by print_sensor() |
|
# http://www.openbsd.org/cgi-bin/cvsweb/src/sbin/sysctl/sysctl.c |
|
my @Type_Map = ( |
|
{ type => 'temp', |
|
regex => qr/\sdegC$/, |
|
}, |
|
{ type => 'fanrpm', |
|
regex => qr/\sRPM$/, |
|
}, |
|
{ type => 'volts_dc', |
|
regex => qr/\sV\sDC$/, |
|
}, |
|
{ type => 'amps', |
|
regex => qr/\sA$/, |
|
}, |
|
{ type => 'watthour', |
|
regex => qr/\sWh$/, |
|
}, |
|
{ type => 'amphour', |
|
regex => qr/\sAh$/, |
|
}, |
|
{ type => 'indicator', |
|
regex => qr/^(On|Off)$/, |
|
}, |
|
{ type => 'integer', |
|
regex => qr/\sraw$/, |
|
}, |
|
{ type => 'percent', |
|
regex => qr/\s\%$/, |
|
}, |
|
{ type => 'lux', |
|
regex => qr/\slx$/, |
|
}, |
|
{ type => 'drive', |
|
regex => qr/^drive\s/, |
|
}, |
|
{ type => 'timedelta', |
|
regex => qr/\ssecs$/, |
|
}, |
|
); |
|
|
|
if ( $status == 0 ) { |
|
print_help(); |
|
exit $ERRORS{'OK'}; |
|
} |
|
|
|
if ($opt_V) { |
|
print_revision( $PROGNAME, '$Revision$ ' ); |
|
exit $ERRORS{'OK'}; |
|
} |
|
|
|
if ($opt_h) { |
|
print_help(); |
|
exit $ERRORS{'OK'}; |
|
} |
|
|
|
if ( defined $sensor ) { |
|
if ( $sensor !~ /^$BASE/ ) { |
|
$sensor = $BASE . '.' . $sensor; |
|
} |
|
$CHECK_SENSOR = $sensor; |
|
|
|
$CHECKS{$sensor}{'warn'} = $warning if defined $warning; |
|
$CHECKS{$sensor}{'crit'} = $critical if defined $critical; |
|
|
|
} |
|
elsif ( defined $filename ) { |
|
%CHECKS = parse_file($filename); |
|
} |
|
|
|
open my $sysctl, "-|", $SYSCTL, $CHECK_SENSOR |
|
or die "Couldn't open sysctl: $!"; |
|
while (<$sysctl>) { |
|
|
|
#while (<>) { |
|
chomp; |
|
my ( $id, $output ) = split /=/; |
|
my @s = split /\./, $id; |
|
my @o = split /,\s*/, $output; |
|
|
|
my ( $type, $source, $descr, $data, $status ); |
|
|
|
$source = $o[0]; |
|
$descr = $o[1]; |
|
|
|
if ( $OSVer >= 4.1 ) { |
|
$data = $o[0]; |
|
if ( $data =~ s/\s+\((.*)\).*$// ) { |
|
$descr = $1; |
|
} |
|
$status = $o[1]; |
|
( $source, $type ) = $id =~ /([^\.]+)\.([^\.]+?)\d+$/; |
|
} |
|
elsif ( $OSVer >= 4.0 ) { |
|
$data = $o[2]; |
|
$status = $o[3]; |
|
foreach my $t (@Type_Map) { |
|
if ( $data =~ /$t->{'regex'}/ ) { |
|
$type = $t->{'type'}; |
|
last; |
|
} |
|
} |
|
} |
|
else { |
|
$data = $o[-1]; |
|
$status = $o[2] if @o == 5; |
|
$type = $o[-2]; |
|
} |
|
|
|
$type ||= 'unknown'; |
|
|
|
$SENSORS{$id} = { |
|
id => $id, |
|
output => $output, |
|
source => $source, |
|
description => $descr, |
|
status => $status, |
|
type => $type, |
|
data => $data, |
|
}; |
|
|
|
} |
|
close $sysctl; |
|
|
|
sub as_if_numeric { |
|
my $_a = $a; |
|
my $_b = $b; |
|
$_a =~ s/\D//g; |
|
$_b =~ s/\D//g; |
|
$_a <=> $_b; |
|
} |
|
|
|
foreach my $s ( sort as_if_numeric keys %SENSORS ) { |
|
my ( $r, $data ); |
|
if ( exists $CHECKS{$s} ) { |
|
$r = check_sensor( $SENSORS{$s}, $CHECKS{$s} ); |
|
$data = $s . '=' . $SENSORS{$s}{'output'}; |
|
} |
|
elsif ( !$ignore_status ) { |
|
$r = check_sensor( $SENSORS{$s} ); |
|
$data = $s . '=' . $SENSORS{$s}{'output'}; |
|
} |
|
else { |
|
|
|
# ignore this sensor |
|
} |
|
next unless defined $r; |
|
push @{ $states{$r} }, $data; |
|
} |
|
|
|
$state = 'OK'; |
|
my $have_results = 0; |
|
foreach my $error ( sort { $ERRORS{$a} <=> $ERRORS{$b} } keys %ERRORS ) { |
|
if ( exists $states{$error} ) { |
|
$have_results++; |
|
$state = $error; |
|
} |
|
} |
|
foreach my $error ( sort { $ERRORS{$b} <=> $ERRORS{$a} } keys %ERRORS ) { |
|
if ( exists $states{$error} ) { |
|
if (NAGIOS_OUTPUT) { |
|
print "$error (" . scalar( @{ $states{$error} } ) . ")"; |
|
if ( $error ne 'OK' ) { |
|
print '<br>'; |
|
print map {" - $_<br>"} @{ $states{$error} }; |
|
} |
|
} |
|
else { |
|
print "$error (" . scalar( @{ $states{$error} } ) . "):\n"; |
|
foreach ( @{ $states{$error} } ) { |
|
print " $_\n"; |
|
} |
|
} |
|
} |
|
} |
|
if ( $have_results == 0 ) { |
|
print "No results found\n"; |
|
} |
|
exit $ERRORS{$state}; |
|
|
|
sub parse_file { |
|
my $filename = shift; |
|
my %contents; |
|
|
|
die "file '$filename' does not exist." unless -e $filename; |
|
|
|
open my $fh, '-|', $GETCAP, '-a', '-f', $filename |
|
or die "Couldn't open FILE '$GETCAP -a -f $filename': $!"; |
|
while (<$fh>) { |
|
chomp; |
|
my ( $key, @c ) = split /\:/; |
|
foreach (@c) { |
|
my ( $k, $v ) = split /\=/; |
|
if ( lc($k) eq 'ignore' ) { |
|
$contents{$key}{'IGNORE'} = 1; |
|
} |
|
elsif ( lc($k) eq 'status' ) { |
|
$contents{$key}{'STATUS'} = 1; |
|
} |
|
else { |
|
$contents{$key}{$k} = $v; |
|
} |
|
} |
|
} |
|
close $fh; |
|
|
|
return %contents; |
|
} |
|
|
|
sub parse_check { |
|
my $check = shift; |
|
|
|
return unless $check; |
|
return if $check->{'STATUS'}; |
|
return 'IGNORE' if $check->{'IGNORE'}; |
|
|
|
foreach my $code ( 'crit', 'warn' ) { |
|
if ( defined $check->{$code} && $check->{$code} =~ /:/ ) { |
|
if ( my ( $low, $high ) = split /:/, $check->{$code} ) { |
|
$check->{ $code . '.low' } = $low if length $low; |
|
$check->{ $code . '.high' } = $high if length $high; |
|
} |
|
delete $check->{$code}; |
|
} |
|
|
|
foreach my $severity ( 'low', 'high' ) { |
|
if ( defined $check->{$severity} ) { |
|
$check->{ $code . '.' . $severity } = $check->{$severity} |
|
if !defined $check->{ $code . '.' . $severity }; |
|
} |
|
} |
|
no warnings 'uninitialized'; |
|
$check->{$code} = [ split /,\s*/, $check->{$code} ]; |
|
} |
|
|
|
return $check; |
|
} |
|
|
|
sub check_sensor { |
|
my $sensor = shift; |
|
my $check = shift; |
|
my $result = 'UNKNOWN'; |
|
my %errors = ( |
|
'warn' => 'WARNING', |
|
'crit' => 'CRITICAL', |
|
); |
|
|
|
return $result unless ref $sensor eq 'HASH'; |
|
$check = parse_check($check) if $check; |
|
|
|
if ( !$check ) { |
|
|
|
# It looks like doing this should be safe, from |
|
# src/sbin/sysctl/sysctl.c |
|
return $sensor->{'status'} if $sensor->{'status'}; |
|
|
|
return; |
|
} |
|
elsif ( $check eq 'IGNORE' ) { |
|
return; |
|
} |
|
|
|
$result = 'OK'; |
|
foreach my $code ( 'warn', 'crit' ) { |
|
if ( $sensor->{'type'} eq 'fan' |
|
|| $sensor->{'type'} eq 'fanrpm' |
|
|| $sensor->{'type'} eq 'volt' |
|
|| $sensor->{'type'} eq 'volts_dc' |
|
|| $sensor->{'type'} eq 'amps' |
|
|| $sensor->{'type'} eq 'watthour' |
|
|| $sensor->{'type'} eq 'amphour' |
|
|| $sensor->{'type'} eq 'integer' |
|
|| $sensor->{'type'} eq 'raw' |
|
|| $sensor->{'type'} eq 'percent' |
|
|| $sensor->{'type'} eq 'lux' |
|
|| $sensor->{'type'} eq 'timedelta' ) |
|
{ |
|
my $data = $sensor->{'data'}; |
|
$data =~ s/[^\d\.]//g; |
|
if ( !length $data ) { |
|
warn |
|
"INVALID DATA ($sensor->{'data'}) for '$sensor->{'id'}'\n"; |
|
next; |
|
} |
|
|
|
if ( defined $check->{ $code . ".low" } |
|
|| defined $check->{ $code . ".high" } ) |
|
{ |
|
if ( defined $check->{ $code . ".low" } ) { |
|
my $c = $check->{ $code . ".low" }; |
|
$c =~ s/[^\d\.]//g; |
|
|
|
if ( !length $c ) { |
|
warn "INVALID CHECK (" |
|
. $check->{ $code . ".low" } |
|
. ") for '$sensor->{'id'}:$code.low'\n"; |
|
next; |
|
} |
|
|
|
$result = $errors{$code} |
|
if ( $c >= $data ); |
|
} |
|
if ( defined $check->{ $code . ".high" } ) { |
|
my $c = $check->{ $code . ".high" }; |
|
$c =~ s/[^\d\.]//g; |
|
if ( !length $c ) { |
|
warn "INVALID CHECK (" |
|
. $check->{ $code . ".high" } |
|
. ") for '$sensor->{'id'}:$code.high'\n"; |
|
next; |
|
} |
|
|
|
$result = $errors{$code} |
|
if ( $c <= $data ); |
|
} |
|
} |
|
elsif ( @{ $check->{$code} } ) { |
|
my $matched = 0; |
|
foreach ( @{ $check->{$code} } ) { |
|
my $c = $_; |
|
$c =~ s/[^\d\.]//g; |
|
if ( !length $c ) { |
|
warn "INVALID CHECK (" . $_ |
|
. ") for '$sensor->{'id'}:$code'\n"; |
|
next; |
|
} |
|
|
|
if ( $c eq $data ) { |
|
$matched = 1; |
|
last; |
|
} |
|
} |
|
$result = $errors{$code} unless $matched; |
|
} |
|
|
|
} |
|
elsif ( $sensor->{'type'} eq 'temp' ) { |
|
my ( $degC, $degF ) = split /\//, $sensor->{'data'}; |
|
$degC =~ s/[^\d\.]//g; |
|
$degF ||= $degC * 9 / 5 + 32; |
|
$degF =~ s/[^\d\.]//g; |
|
if ( defined $check->{ $code . ".low" } |
|
|| defined $check->{ $code . ".high" } ) |
|
{ |
|
if ( defined $check->{ $code . ".low" } ) { |
|
my $c = $check->{ $code . ".low" }; |
|
my $data = $degC; |
|
|
|
$data = $degF if ( $c =~ /F/i ); |
|
if ( !length $data ) { |
|
warn "INVALID DATA (" |
|
. $sensor->{'data'} |
|
. ") for '$sensor->{'id'}'\n"; |
|
next; |
|
} |
|
|
|
$c =~ s/[^\d\.]//g; |
|
if ( !length $c ) { |
|
warn "INVALID CHECK (" |
|
. $check->{ $code . ".low" } |
|
. ") for '$sensor->{'id'}':$code.low\n"; |
|
next; |
|
} |
|
|
|
$result = $errors{$code} |
|
if ( $c >= $data ); |
|
} |
|
if ( defined $check->{ $code . ".high" } ) { |
|
my $c = $check->{ $code . ".high" }; |
|
|
|
my $data = $degC; |
|
$data = $degF if ( $c =~ /F/i ); |
|
if ( !length $data ) { |
|
warn "INVALID DATA (" |
|
. $sensor->{'data'} |
|
. ") for '$sensor->{'id'}'\n"; |
|
next; |
|
} |
|
|
|
$c =~ s/[^\d\.]//g; |
|
if ( !length $c ) { |
|
warn "INVALID CHECK (" |
|
. $check->{ $code . ".high" } |
|
. ") for '$sensor->{'id'}:$code.high'\n"; |
|
next; |
|
} |
|
|
|
$result = $errors{$code} |
|
if ( $c <= $data ); |
|
} |
|
} |
|
elsif ( @{ $check->{$code} } ) { |
|
|
|
my $matched = 0; |
|
foreach ( @{ $check->{$code} } ) { |
|
my $c = $_; |
|
my $data = $degC; |
|
|
|
$data = $degF if ( $c =~ /F/i ); |
|
if ( !length $data ) { |
|
warn "INVALID DATA (" |
|
. $sensor->{'data'} |
|
. ") for '$sensor->{'id'}'\n"; |
|
next; |
|
} |
|
|
|
$c =~ s/[^\d\.]//g; |
|
if ( !length $c ) { |
|
warn "INVALID CHECK (" . $_ |
|
. ") for '$sensor->{'id'}':$code\n"; |
|
next; |
|
} |
|
|
|
if ( $c eq $data ) { |
|
$matched = 1; |
|
last; |
|
} |
|
} |
|
$result = $errors{$code} unless $matched; |
|
} |
|
} |
|
elsif ($sensor->{'type'} eq 'drive' |
|
|| $sensor->{'type'} eq 'indicator' ) |
|
{ |
|
$sensor->{'data'} =~ s/^drive\s+//; |
|
if ( @{ $check->{$code} } ) { |
|
my $matched = 0; |
|
foreach ( @{ $check->{$code} } ) { |
|
if ( $_ eq $sensor->{'data'} ) { |
|
$matched = 1; |
|
last; |
|
} |
|
} |
|
$result = $errors{$code} unless $matched; |
|
} |
|
|
|
} |
|
else { |
|
warn 'Unknown Sensor Type: ', |
|
$sensor->{'id'}, |
|
'=', |
|
$sensor->{'type'}, |
|
"\n"; |
|
$result = 'UNKNOWN'; |
|
} |
|
|
|
} |
|
|
|
return $result; |
|
} |
|
|
|
sub print_help { |
|
print <<"EOL"; |
|
$PROGNAME - monitors sysctl hw.sensors on OpenBSD |
|
$PROGNAME [-i] [-f [<FILENAME>]|(-s <hw.sensors id> [-w limit] [-c limit])] |
|
|
|
Usage: |
|
-i, --ignore-status |
|
Don't automatically check the status of sensors that report it. |
|
-f, --filename=FILE |
|
FILE to load checks from (defaults to /etc/sensorsd.conf) |
|
-s, --sensor=ID |
|
ID of a single sensor. "-s kate0.temp0" means hw.sensors.kate0.temp0 |
|
Overrides --filename. |
|
-w, --warning=RANGE or single ENTRY |
|
Exit with WARNING status if outside of RANGE or if != ENTRY |
|
-c, --critical=RANGE or single ENTRY |
|
Exit with CRITICAL status if outside of RANGE or if != ENTRY |
|
|
|
FILE is in the same format as sensorsd.conf(5) plus some additional |
|
entries. These additional entries in the file are ignored by |
|
sensorsd(8) this means you can use the same config file for $PROGNAME |
|
as well as sensorsd(8). |
|
|
|
$PROGNAME understands the following entries: |
|
|
|
low, high, crit, warn, crit.low, crit.high, warn.low, warn.high, |
|
ignore, status |
|
|
|
An ENTRY depends on the type. The descriptions in sensorsd.conf(5) |
|
can be used when appropriate, or you can use the following: |
|
|
|
fanrpm, volts_dc, amps, watthour, amphour, integer (raw), percent, |
|
lux or timedelta - Anything that includes digits. Both the value of |
|
the check and the value of the sensor response that are not either a |
|
digit or period are stripped and then the two resultant values are |
|
compared. |
|
|
|
temp - Can be as above, but if the entry has an F in it, |
|
it compares farenheit, otherwise it uses celcius. |
|
|
|
indicator or drive - does a case sensitive match of each |
|
entry in the comma separated list and if it does not match |
|
any of the entries, it sets the status. |
|
|
|
The entries 'crit' or 'warn' (or the -c or -w on the command line) |
|
may be a RANGE or a comma separated list of acceptable values. |
|
The comma separated list of values contains a list of things that |
|
will NOT cause the status. This is possibly counterintuitive, but |
|
you are more likely to know good values than bad values. |
|
|
|
A RANGE is a low ENTRY and a high ENTRY separated by a colon (:). |
|
It can also be low: or :high with the other side left blank to only |
|
make the single check. |
|
|
|
An entry marked "ignore" will cause that sensor to be skipped. |
|
Generally used with state checking of all sensors to ignore sensors you |
|
don't care about or that report incorrectly. |
|
|
|
If you are using --ignore-status, you can still check the status of |
|
individual sensors with a status entry. |
|
|
|
EOL |
|
|
|
print_revision( $PROGNAME, '$Revision$' ); |
|
|
|
print $License; |
|
} |
|
|
|
sub print_revision { |
|
my ( $prog, $rev ) = @_; |
|
$rev =~ s/^\D+([\d\.]+)\D+$/v$1/xms; |
|
|
|
print "$prog $rev\n"; |
|
} |
|
|