Skip to content

HTTPS clone URL

Subversion checkout URL

You can clone with
or
.
Download ZIP
Branch: master
Fetching contributors…

Cannot retrieve contributors at this time

executable file 5420 lines (4862 sloc) 187.366 kB
#!/usr/local/groundwork/perl/bin/perl
#
# Nagios plugin
#
# Monitor Dell server hardware status using Dell OpenManage Server
# Administrator, either locally via NRPE, or remotely via SNMP.
#
# $Id: check_openmanage 21113 2011-10-05 12:53:25Z trondham $
#
# Copyright (C) 2008-2011 Trond H. Amundsen
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
require 5.006; # Perl v5.6.0 or newer is required
use strict;
use warnings;
use POSIX qw(isatty ceil);
use Getopt::Long qw(:config no_ignore_case);
# Global (package) variables used throughout the code
use vars qw( $NAME $VERSION $AUTHOR $CONTACT $E_OK $E_WARNING $E_CRITICAL
$E_UNKNOWN $FW_LOCK $USAGE $HELP $LICENSE
$snmp_session $snmp_error $omreport $globalstatus $global
$linebreak $omopt_chassis $omopt_system $blade
$exit_code $snmp
%check %opt %reverse_exitcode %status2nagios
%snmp_status %snmp_probestatus %probestatus2nagios %sysinfo
%blacklist %nagios_alert_count %count %snmp_enclosure %snmp_controller
@perl_warnings @controllers @enclosures @perfdata
@report_storage @report_chassis @report_other
);
#---------------------------------------------------------------------
# Initialization and global variables
#---------------------------------------------------------------------
# Route every Perl warning into @perl_warnings (one array ref holding
# the warning's arguments per entry) via a __WARN__ handler.
$SIG{__WARN__} = sub { push @perl_warnings, [@_]; };
# Plugin identity
$NAME = 'check_openmanage';
$VERSION = '3.7.3';
$AUTHOR = 'Trond H. Amundsen';
$CONTACT = 't.h.amundsen@usit.uio.no';
# Nagios exit codes
$E_OK = 0;
$E_WARNING = 1;
$E_CRITICAL = 2;
$E_UNKNOWN = 3;
# Firmware update lock file [FIXME: location on Windows?]
$FW_LOCK = '/var/lock/.spsetup'; # default on Linux
# Usage text (interpolates $NAME)
$USAGE = <<"END_USAGE";
Usage: $NAME [OPTION]...
END_USAGE
# Help text (not interpolated). The long name of -o is spelled
# "--ok-info" here because that is the name registered with
# GetOptions; "--okinfo" is not a prefix of it and is rejected.
$HELP = <<'END_HELP';
GENERAL OPTIONS:
-f, --config Specify configuration file
-p, --perfdata Output performance data [default=no]
-t, --timeout Plugin timeout in seconds [default=30]
-c, --critical Custom temperature critical limits
-w, --warning Custom temperature warning limits
-F, --fahrenheit Use Fahrenheit as temperature unit
-d, --debug Debug output, reports everything
-h, --help Display this help text
-V, --version Display version info
SNMP OPTIONS:
-H, --hostname Hostname or IP (required for SNMP)
-C, --community SNMP community string [default=public]
-P, --protocol SNMP protocol version [default=2]
--port SNMP port number [default=161]
-6, --ipv6 Use IPv6 instead of IPv4 [default=no]
--tcp Use TCP instead of UDP [default=no]
OUTPUT OPTIONS:
-i, --info Prefix any alerts with the service tag
-e, --extinfo Append system info to alerts
-s, --state Prefix alerts with alert state
-S, --short-state Prefix alerts with alert state abbreviated
-o, --ok-info Verbosity when check result is OK
-B, --show-blacklist Show blacklistings in OK output
-I, --htmlinfo HTML output with clickable links
CHECK CONTROL AND BLACKLISTING:
-a, --all Check everything, even log content
-b, --blacklist Blacklist missing and/or failed components
--only Only check a certain component or alert type
--check Fine-tune which components are checked
--no-storage Don't check storage
For more information and advanced options, see the manual page or URL:
http://folk.uio.no/trondham/software/check_openmanage.html
END_HELP
# Version and license text (interpolates $NAME, $VERSION, $AUTHOR, $CONTACT)
$LICENSE = <<"END_LICENSE";
$NAME $VERSION
Copyright (C) 2008-2011 $AUTHOR
License GPLv3+: GNU GPL version 3 or later <http://gnu.org/licenses/gpl.html>
This is free software: you are free to change and redistribute it.
There is NO WARRANTY, to the extent permitted by law.
Written by $AUTHOR <$CONTACT>
END_LICENSE
# Options with default values. The keys are the same ones GetOptions
# (below) and the config file parser write to.
%opt = (
    'blacklist'       => [],       # blacklisting
    'check'           => [],       # check control
    'critical'        => [],       # temperature critical limits
    'warning'         => [],       # temperature warning limits
    'tempunit'        => 'C',      # temperature unit
    'fahrenheit'      => 0,        # Use fahrenheit
    'configfile'      => undef,    # configuration file
    'timeout'         => 30,       # default timeout is 30 seconds
    'debug'           => 0,        # debugging / verbose output
    'help'            => 0,        # display help output
    'perfdata'        => undef,    # output performance data
    'legacy_perfdata' => 0,        # legacy performance data output
    'info'            => 0,        # display servicetag
    'extinfo'         => 0,        # display extra info
    'htmlinfo'        => undef,    # html tags in output
    'postmsg'         => undef,    # post message
    'state'           => 0,        # display alert type
    # This key used to be spelled 'short-state', which neither
    # GetOptions nor the config parser ever reads or writes.
    'shortstate'      => 0,        # display alert type (short)
    'okinfo'          => 0,        # default "ok" output level
    'show_blacklist'  => 0,        # show blacklisted components
    'linebreak'       => undef,    # specify linebreak
    'version'         => 0,        # plugin version info
    'all'             => 0,        # check everything
    'only'            => undef,    # only one component
    'no_storage'      => 0,        # don't check storage
    'omreport'        => undef,    # omreport path
    'port'            => 161,      # default SNMP port
    'hostname'        => undef,    # hostname or IP
    'community'       => 'public', # SNMP v1 or v2c
    'protocol'        => 2,        # default SNMP protocol 2c
    'ipv6'            => 0,        # default is IPv4
    'tcp'             => 0,        # default is UDP
    'username'        => undef,    # SNMP v3
    'authpassword'    => undef,    # SNMP v3
    'authkey'         => undef,    # SNMP v3
    'authprotocol'    => undef,    # SNMP v3
    'privpassword'    => undef,    # SNMP v3
    'privkey'         => undef,    # SNMP v3
    'privprotocol'    => undef,    # SNMP v3
    'use_get_table'   => 0,        # hack for SNMPv3 on Windows with net-snmp
    'hide_servicetag' => 0,        # hidden servicetag
);
# Parse the command line into %opt. On a parse error, print the usage
# text and exit with status UNKNOWN.
GetOptions(
    'b|blacklist=s'   => \@{ $opt{blacklist} },
    'check=s'         => \@{ $opt{check} },
    'c|critical=s'    => \@{ $opt{critical} },
    'w|warning=s'     => \@{ $opt{warning} },
    'tempunit=s'      => \$opt{tempunit},
    'F|fahrenheit'    => \$opt{fahrenheit},
    'f|configfile=s'  => \$opt{configfile},
    't|timeout=i'     => \$opt{timeout},
    'd|debug'         => \$opt{debug},
    'h|help'          => \$opt{help},
    'V|version'       => \$opt{version},
    'p|perfdata:s'    => \$opt{perfdata},
    'legacy-perfdata' => \$opt{legacy_perfdata},
    'i|info'          => \$opt{info},
    'e|extinfo'       => \$opt{extinfo},
    'I|htmlinfo:s'    => \$opt{htmlinfo},
    'postmsg=s'       => \$opt{postmsg},
    's|state'         => \$opt{state},
    'S|short-state'   => \$opt{shortstate},
    'o|ok-info=i'     => \$opt{okinfo},
    'B|show-blacklist' => \$opt{show_blacklist},
    'linebreak=s'     => \$opt{linebreak},
    'a|all'           => \$opt{all},
    'only=s'          => \$opt{only},
    'no-storage'      => \$opt{no_storage},
    'omreport=s'      => \$opt{omreport},
    'port=i'          => \$opt{port},
    'H|hostname=s'    => \$opt{hostname},
    'C|community=s'   => \$opt{community},
    'P|protocol=i'    => \$opt{protocol},
    '6|ipv6'          => \$opt{ipv6},
    'tcp'             => \$opt{tcp},
    'U|username=s'    => \$opt{username},
    'authpassword=s'  => \$opt{authpassword},
    'authkey=s'       => \$opt{authkey},
    'authprotocol=s'  => \$opt{authprotocol},
    'privpassword=s'  => \$opt{privpassword},
    'privkey=s'       => \$opt{privkey},
    'privprotocol=s'  => \$opt{privprotocol},
    'use-get_table'   => \$opt{use_get_table},
    'hide-servicetag' => \$opt{hide_servicetag},
) or do { print $USAGE; exit $E_UNKNOWN };
# If user requested help
if ($opt{help}) {
    print $USAGE, $HELP;
    exit $E_UNKNOWN;
}
# If user requested version info
if ($opt{version}) {
    print $LICENSE;
    exit $E_UNKNOWN;
}
# Start out with nothing blacklisted
%blacklist = ();
# Which component groups get checked (1) or skipped (0). These are the
# defaults; the --check option and the config file can override them.
%check = (
    'storage'   => 1,    # storage subsystem
    'memory'    => 1,    # memory (dimms)
    'fans'      => 1,    # fan status
    'power'     => 1,    # power supplies
    'temp'      => 1,    # temperature
    'cpu'       => 1,    # processors
    'voltage'   => 1,    # voltage
    'batteries' => 1,    # battery probes
    'amperage'  => 1,    # power consumption
    'intrusion' => 1,    # intrusion detection
    'sdcard'    => 1,    # removable flash media (SD cards)
    'alertlog'  => 0,    # the alert log
    'esmlog'    => 0,    # the ESM log (hardware log)
    'esmhealth' => 1,    # the ESM log overall health
);
# Message queues; report() pushes [message, nagios level, id] onto these
@report_storage = ();    # storage
@report_chassis = ();    # chassis
@report_other   = ();    # everything else
# The config file is read before the alarm is armed, so a timeout set
# in the file is the one that takes effect.
if (defined $opt{configfile}) {
    parse_configfile();
}
# Plugin timeout: print a message and exit UNKNOWN when the alarm fires
$SIG{ALRM} = sub {
    print "PLUGIN TIMEOUT: $NAME timed out after $opt{timeout} seconds\n";
    exit $E_UNKNOWN;
};
alarm $opt{timeout};
# SNMP mode is selected by giving a hostname
$snmp = defined $opt{hostname} ? 1 : 0;
# SNMP session variables
$snmp_session = undef;
$snmp_error   = undef;
# The omreport command
$omreport = undef;
# Default line break: newline on a terminal, HTML break otherwise
$linebreak = "\n";
$linebreak = '<br/>' if !isatty(*STDOUT);
# Line break from option: 'REG' and 'HTML' are symbolic names, any
# other value is used literally
if (defined $opt{linebreak}) {
    my %named_linebreak = (
        'REG'  => "\n",
        'HTML' => '<br/>',
    );
    $linebreak
      = exists $named_linebreak{ $opt{linebreak} }
      ? $named_linebreak{ $opt{linebreak} }
      : $opt{linebreak};
}
# In local (non-SNMP) mode, exit with status UNKNOWN while the
# firmware update lock file exists
unless ($snmp) {
    if (-f $FW_LOCK) {
        print "MONITORING DISABLED - Firmware update in progress ($FW_LOCK exists)\n";
        exit $E_UNKNOWN;
    }
}
# Storage controllers and enclosures found so far
@controllers    = ();
@enclosures     = ();
%snmp_enclosure = ();
# Counters for everything. 'esm' and 'alert' hold one counter per log
# severity.
%count = (
    'pdisk' => 0,    # number of physical disks
    'vdisk' => 0,    # number of logical drives (virtual disks)
    'temp'  => 0,    # number of temperature probes
    'volt'  => 0,    # number of voltage probes
    'amp'   => 0,    # number of amperage probes
    'intr'  => 0,    # number of intrusion probes
    'dimm'  => 0,    # number of memory modules
    'mem'   => 0,    # total memory
    'fan'   => 0,    # number of fan probes
    'cpu'   => 0,    # number of CPUs
    'bat'   => 0,    # number of batteries
    'power' => 0,    # number of power supplies
    'sd'    => 0,    # number of SD cards
    # critical / warning / ok entries in the ESM log
    'esm'   => { 'Critical' => 0, 'Non-Critical' => 0, 'Ok' => 0 },
    # critical / warning / ok entries in the alert log
    'alert' => { 'Critical' => 0, 'Non-Critical' => 0, 'Ok' => 0 },
);
# Performance data
@perfdata = ();
# Global health status
$global       = 1;        # default is to check global status
$globalstatus = $E_OK;    # default global health status is "OK"
# Nagios exit code => textual level
%reverse_exitcode = (
    $E_OK       => 'OK',
    $E_WARNING  => 'WARNING',
    $E_CRITICAL => 'CRITICAL',
    $E_UNKNOWN  => 'UNKNOWN',
);
# OpenManage (omreport) and SNMP status text => Nagios level
%status2nagios = (
    'Unknown'         => $E_CRITICAL,
    'Critical'        => $E_CRITICAL,
    'Non-Critical'    => $E_WARNING,
    'Ok'              => $E_OK,
    'Non-Recoverable' => $E_CRITICAL,
    'Other'           => $E_CRITICAL,
);
# Numeric status via SNMP (1..6) => status text
%snmp_status = ();
@snmp_status{ 1 .. 6 } = (
    'Other',
    'Unknown',
    'Ok',
    'Non-Critical',
    'Critical',
    'Non-Recoverable',
);
# Numeric probe status via SNMP (1..10) => probe status text
%snmp_probestatus = ();
@snmp_probestatus{ 1 .. 10 } = (
    'Other',                  # probe status is not one of the following:
    'Unknown',                # probe status is unknown (not known or monitored)
    'Ok',                     # probe is reporting a value within the thresholds
    'nonCriticalUpper',       # probe has crossed upper noncritical threshold
    'criticalUpper',          # probe has crossed upper critical threshold
    'nonRecoverableUpper',    # probe has crossed upper non-recoverable threshold
    'nonCriticalLower',       # probe has crossed lower noncritical threshold
    'criticalLower',          # probe has crossed lower critical threshold
    'nonRecoverableLower',    # probe has crossed lower non-recoverable threshold
    'failed',                 # probe is not functional
);
# Probe status text => Nagios level
%probestatus2nagios = (
    'Other'               => $E_CRITICAL,
    'Unknown'             => $E_CRITICAL,
    'Ok'                  => $E_OK,
    'nonCriticalUpper'    => $E_WARNING,
    'criticalUpper'       => $E_CRITICAL,
    'nonRecoverableUpper' => $E_CRITICAL,
    'nonCriticalLower'    => $E_WARNING,
    'criticalLower'       => $E_CRITICAL,
    'nonRecoverableLower' => $E_CRITICAL,
    'failed'              => $E_CRITICAL,
);
# System information gathered; these are the placeholder values
%sysinfo = (
    'bios'     => 'N/A',    # BIOS version
    'biosdate' => 'N/A',    # BIOS release date
    'serial'   => 'N/A',    # serial number (service tag)
    'model'    => 'N/A',    # system model
    'rev'      => q{},      # system revision
    'osname'   => 'N/A',    # OS name
    'osver'    => 'N/A',    # OS version
    'om'       => 'N/A',    # OMSA version
    'bmc'      => 0,        # HAS baseboard management controller (BMC)
    'rac'      => 0,        # HAS remote access controller (RAC)
    'rac_name' => 'N/A',    # remote access controller (RAC)
    'bmc_fw'   => 'N/A',    # BMC firmware
    'rac_fw'   => 'N/A',    # RAC firmware
);
# Adjust which checks to perform
adjust_checks() if defined $opt{check};
# Blacklisted components
set_blacklist($opt{blacklist}) if defined $opt{blacklist};
# If blacklisting is in effect, don't check global health status
if (scalar keys %blacklist > 0) {
    $global = 0;
}
# Take into account new hardware and blades
$omopt_chassis = 'chassis';    # default "chassis" option to omreport
$omopt_system  = 'system';     # default "system" option to omreport
$blade         = 0;            # if this is a blade system
# Some initializations and checking before we begin
if ($snmp) {
    snmp_initialize();      # initialize SNMP
    snmp_check();           # check that SNMP works
    snmp_detect_blade();    # detect blade via SNMP
}
else {
    # Find the omreport binary
    find_omreport();
    # Check help output from omreport, see which options are available.
    # Also detecting blade via omreport.
    check_omreport_options();
}
# Temperature unit: --fahrenheit overrides --tempunit
if ($opt{fahrenheit}) {
    $opt{tempunit} = 'F';
}
# Check tempunit syntax. The alternation has to be grouped: without
# the group, \A binds only to "C" and \z only to "R", so values such
# as "Celsius" or "xFx" were accepted.
if ($opt{tempunit} !~ m{\A (?:C|F|K|R) \z}xms) {
    print "ERROR: Unknown temperature unit '$opt{tempunit}'\n";
    exit $E_UNKNOWN;
}
#---------------------------------------------------------------------
# Helper functions
#---------------------------------------------------------------------
# Translate a shell-style glob into the source text of an anchored
# regular expression (technique from Perl Cookbook, recipe 6.9).
#   arg1: glob string
# Returns the regex as a string beginning with \A and ending with \z.
sub glob2regex {
    my ($globstr) = @_;
    # Glob metacharacters and what they become in the regex
    my %glob_to_re = (
        '*' => '.*',
        '?' => '.',
        '[' => '[',
        ']' => ']',
    );
    # Metacharacters are translated, every other character is escaped
    my $translate = sub {
        my $char = shift;
        return $glob_to_re{$char} || quotemeta $char;
    };
    (my $body = $globstr) =~ s{(.)}{ $translate->($1) }ge;
    return join q{}, '\A', $body, '\z';
}
#
# Read the configuration file named by $opt{configfile} and apply its
# statements to %opt, %check and the blacklist.
#
# Sections are applied in this order, later ones overriding earlier
# ones: the global section ('_'), then (only if a hostname is given)
# every section whose name matches the hostname as a glob pattern, in
# sorted order, and finally the section named exactly as the hostname.
#
# Syntax and value errors are queued with report() at level UNKNOWN.
# Exits with status UNKNOWN if the Config::Tiny module is missing.
# Takes no arguments and returns nothing.
#
sub parse_configfile {
    # These are package variables ("our") rather than lexicals because
    # the named helper subs declared further down need to see them.
    our $tiny = undef;
    # Regexp for boolean values
    our $off = qr{\A (0|off|false) \s* \z}ixms;
    our $on = qr{\A (1|on|true) \s* \z}ixms;
    # Mapping between command line options and the corresponding
    # config file options
    our %opt2config
      = ( 'info'            => 'output_servicetag',
          'extinfo'         => 'output_sysinfo',
          'postmsg'         => 'output_post_message',
          'state'           => 'output_servicestate',
          'shortstate'      => 'output_servicestate_abbr',
          'show_blacklist'  => 'output_blacklist',
          'hide_servicetag' => 'output_hide_servicetag',
          'htmlinfo'        => 'output_html',
          'okinfo'          => 'output_ok_verbosity',
          'protocol'        => 'snmp_version',
          'community'       => 'snmp_community',
          'port'            => 'snmp_port',
          'ipv6'            => 'snmp_use_ipv6',
          'tcp'             => 'snmp_use_tcp',
          'warning'         => 'temp_threshold_warning',
          'critical'        => 'temp_threshold_critical',
          'all'             => 'check_everything',
          'perfdata'        => 'performance_data',
          'tempunit'        => 'temperature_unit',
          'timeout'         => 'timeout',
          'blacklist'       => 'blacklist',
          'legacy_perfdata' => 'legacy_performance_data',
        );

    # Load the perl module
    if ( eval { require Config::Tiny; 1 } ) {
        $tiny = Config::Tiny->new();
    }
    else {
        print "ERROR: Required perl module 'Config::Tiny' not found\n";
        exit $E_UNKNOWN;
    }

    # Read the config file
    $tiny = Config::Tiny->read($opt{configfile})
      or do { report('other', (sprintf q{Couldn't read configuration file: %s}, Config::Tiny->errstr()), $E_UNKNOWN);
              return; };

    # Syntax check: every keyword must be 'check_everything',
    # 'check_<name>' for a <name> in %check, or one of the config
    # names in %opt2config.
    my %legal_keyword = map { $_ => 1 } values %opt2config;
    foreach my $section (keys %{ $tiny }) {
      KEYWORD:
        foreach my $keyword (keys %{ $tiny->{$section} }) {
            next KEYWORD if $keyword eq 'check_everything';
            if ($keyword =~ m{\A check_(.+)}xms) {
                next KEYWORD if exists $check{$1};
            }
            else {
                next KEYWORD if $legal_keyword{$keyword};
            }
            if ($section eq '_') {
                report('other', qq{CONFIG ERROR: In the global section: Unknown statement "$keyword"}, $E_UNKNOWN);
            }
            else {
                report('other', qq{CONFIG ERROR: Unknown statement "$keyword" in section "$section"}, $E_UNKNOWN);
            }
        }
    }

    # Adjust checks according to statements in the configuration file
    sub configfile_adjust_checks {
        my $keyword = shift;
      CHECK_CONFIG:
        foreach my $key (keys %check) {
            my $copt = join '_', 'check', $key;
            my $value = $tiny->{$keyword}->{$copt};
            next CHECK_CONFIG if !defined $value or $value eq q{};
            if ($value =~ m{$on}ixms) {
                $check{$key} = 1;
            }
            elsif ($value =~ m{$off}ixms) {
                $check{$key} = 0;
            }
            else {
                report('other', "CONFIG ERROR: Rvalue for '$copt' must be boolean (True/False)", $E_UNKNOWN);
            }
        }
        return;
    }

    # Set blacklist according to statements in the configuration file
    sub configfile_set_blacklist {
        my $keyword = shift;
        my $value = $tiny->{$keyword}->{blacklist};
        if (defined $value and $value ne q{}) {
            # set_blacklist() takes an array ref
            set_blacklist([$value]);
        }
        return;
    }

    # Set timeout according to statements in the configuration file
    sub configfile_set_timeout {
        my $keyword = shift;
        my $value = $tiny->{$keyword}->{timeout};
        return if !defined $value or $value eq q{};
        if ($value =~ m{\A \d+ \z}xms) {    # integer
            $opt{timeout} = $value;
        }
        else {
            report('other', "CONFIG ERROR: Rvalue for 'timeout' must be a positive integer", $E_UNKNOWN);
        }
        return;
    }

    # Set a boolean option
    sub configfile_set_boolean {
        my ($keyword, $bool) = @_;
        my $cbool = $opt2config{$bool};
        my $value = $tiny->{$keyword}->{$cbool};
        return if !defined $value or $value eq q{};
        if ($value =~ m{$on}ixms) {
            $opt{$bool} = 1;
        }
        elsif ($value =~ m{$off}ixms) {
            $opt{$bool} = 0;
        }
        else {
            report('other', "CONFIG ERROR: Rvalue for '$cbool' must be boolean (True/False)", $E_UNKNOWN);
        }
        return;
    }

    # Set htmlinfo option from config file: boolean on => 1, boolean
    # off => undef, anything else is stored as given
    sub configfile_set_htmlinfo {
        my $keyword = shift;
        my $conf = $opt2config{htmlinfo};
        my $value = $tiny->{$keyword}->{$conf};
        return if !defined $value or $value eq q{};
        if ($value =~ m{$on}ixms) {
            $opt{htmlinfo} = 1;
        }
        elsif ($value =~ m{$off}ixms) {
            $opt{htmlinfo} = undef;
        }
        else {
            $opt{htmlinfo} = $value;
        }
        return;
    }

    # Set OK output verbosity
    sub configfile_set_ok_verbosity {
        my $keyword = shift;
        my $conf = $opt2config{okinfo};
        my $value = $tiny->{$keyword}->{$conf};
        return if !defined $value or $value eq q{};
        if ($value =~ m{\A \d+ \z}xms) {
            $opt{okinfo} = $value;
        }
        else {
            report('other', "CONFIG ERROR: Rvalue for '$conf' must be a positive integer", $E_UNKNOWN);
        }
        return;
    }

    # Set SNMP protocol version from config file
    sub configfile_set_snmp_version {
        my $keyword = shift;
        my $conf = $opt2config{protocol};
        my $value = $tiny->{$keyword}->{$conf};
        return if !defined $value or $value eq q{};
        # The alternation is grouped so that both anchors apply to
        # every alternative; ungrouped, values like "10" or "2c"
        # slipped through.
        if ($value =~ m{\A (?:1|2|3) \z}xms) {
            $opt{protocol} = $value;
        }
        else {
            report('other', "CONFIG ERROR: Rvalue for '$conf' must be '1', '2' or '3'", $E_UNKNOWN);
        }
        return;
    }

    # Set SNMP community name from config file
    sub configfile_set_snmp_community {
        my $keyword = shift;
        my $conf = $opt2config{community};
        my $value = $tiny->{$keyword}->{$conf};
        if (defined $value and $value ne q{}) {
            $opt{community} = $value;
        }
        return;
    }

    # Set SNMP port number from config file
    sub configfile_set_snmp_port {
        my $keyword = shift;
        my $conf = $opt2config{port};
        my $value = $tiny->{$keyword}->{$conf};
        return if !defined $value or $value eq q{};
        if ($value =~ m{\A \d+ \z}xms) {    # integer
            $opt{port} = $value;
        }
        else {
            report('other', "CONFIG ERROR: Rvalue for '$conf' must be a positive integer", $E_UNKNOWN);
        }
        return;
    }

    # Set temperature threshold from config file.
    # $level is 'warning' or 'critical'.
    sub configfile_set_temp_threshold {
        my $keyword = shift;
        my $level = shift;
        my $conf = $opt2config{$level};
        my $value = $tiny->{$keyword}->{$conf};
        if (defined $value and $value ne q{}) {
            $opt{$level} = [$value];    # array ref
        }
        return;
    }

    # Set perfdata from config file: boolean on => 1, boolean off =>
    # undef, 'minimal' / 'multiline' stored as given
    sub configfile_set_perfdata {
        my $keyword = shift;
        my $conf = $opt2config{perfdata};
        my $value = $tiny->{$keyword}->{$conf};
        return if !defined $value or $value eq q{};
        if ($value =~ m{$on}ixms) {
            $opt{perfdata} = 1;
        }
        elsif ($value =~ m{$off}ixms) {
            $opt{perfdata} = undef;
        }
        # grouped alternation, so only the two exact words match
        elsif ($value =~ m{\A (?:minimal|multiline) \z}xms) {
            $opt{perfdata} = $value;
        }
        else {
            report('other', "CONFIG ERROR: Rvalue for '$conf' must be either boolean, 'minimal' or 'multiline'", $E_UNKNOWN);
        }
        return;
    }

    # Set temp unit from config file
    sub configfile_set_tempunit {
        my $keyword = shift;
        my $conf = $opt2config{tempunit};
        my $value = $tiny->{$keyword}->{$conf};
        return if !defined $value or $value eq q{};
        # Grouped alternation; the match is case-insensitive, so the
        # value is upper-cased before it is stored.
        if ($value =~ m{\A (?:C|F|K|R) \z}ixms) {
            $opt{tempunit} = uc $value;
        }
        else {
            report('other', "CONFIG ERROR: Rvalue for '$conf' must one of C/F/K/R", $E_UNKNOWN);
        }
        return;
    }

    # Set postmsg string from config file
    sub configfile_set_postmsg {
        my $keyword = shift;
        my $conf = $opt2config{postmsg};
        my $value = $tiny->{$keyword}->{$conf};
        if (defined $value and $value ne q{}) {
            $opt{postmsg} = $value;    # plain string
        }
        return;
    }

    # Sections in the config file to check for statements.
    # First: the global section
    my @sections = ('_');

    # Last two steps only if hostname is defined
    if (defined $opt{hostname}) {
        # Second: sections whose name, taken as a glob pattern,
        # matches the hostname (but not the exact match)
      PATTERN:
        foreach my $glob (sort keys %{ $tiny }) {
            next PATTERN if $glob eq '_';               # global section
            next PATTERN if $glob eq $opt{hostname};    # exact match
            my $regex = glob2regex($glob);              # make regexp
            if ($opt{hostname} =~ m{$regex}) {
                push @sections, $glob;
            }
        }

        # Third: the section named exactly as the hostname
        if (defined $tiny->{$opt{hostname}}) {
            push @sections, $opt{hostname};
        }
    }

    # Loop through the sections array and get options
    foreach my $sect (@sections) {
        configfile_adjust_checks($sect);
        configfile_set_blacklist($sect);
        configfile_set_timeout($sect);
        configfile_set_htmlinfo($sect);
        configfile_set_ok_verbosity($sect);
        foreach my $bool (qw(all info extinfo state shortstate show_blacklist
                             ipv6 tcp legacy_perfdata hide_servicetag)) {
            configfile_set_boolean($sect, $bool);
        }
        configfile_set_snmp_version($sect);
        configfile_set_snmp_community($sect);
        configfile_set_snmp_port($sect);
        configfile_set_temp_threshold($sect, 'warning');
        configfile_set_temp_threshold($sect, 'critical');
        configfile_set_perfdata($sect);
        configfile_set_tempunit($sect);
        configfile_set_postmsg($sect);
    }
    return;
}
#
# Queue a message on one of the report arrays.
#   arg1: which queue: 'storage', 'chassis' or 'other'
#   arg2: message text
#   arg3: nagios level for the message
#   arg4: component id (optional, stored as empty string if undefined)
# Returns whatever push() returns, i.e. the new length of the queue.
#
sub report {
    my ($type, $msg, $exval, $id) = @_;
    my %queue_for = (
        'storage' => \@report_storage,
        'chassis' => \@report_chassis,
        'other'   => \@report_other,
    );
    my $entry = [ $msg, $exval, defined $id ? $id : q{} ];
    return push @{ $queue_for{$type} }, $entry;
}
#
# Run a command through a pipe and collect its output lines.
#   arg1: command string
# Returns a reference to the array of output lines. If the command
# can't be started, an UNKNOWN message is queued and a reference to
# an empty array is returned. If closing the pipe fails, an UNKNOWN
# message is queued and the lines read so far are still returned.
#
sub run_command {
    my ($command) = @_;
    my $CMD;
    if (!open $CMD, '-|', $command) {
        report('other', "Couldn't run command '$command': $!", $E_UNKNOWN);
        return [];
    }
    my @lines = <$CMD>;
    if (!close $CMD) {
        report('other', "Couldn't close filehandle for command '$command': $!", $E_UNKNOWN);
    }
    return \@lines;
}
#
# Run a command through a pipe and return all of its output as one
# string.
#   arg1: command string
# Returns the output, or nothing (after queueing an UNKNOWN message)
# if the command can't be started.
#
sub slurp_command {
    my ($command) = @_;
    my $CMD;
    if (!open $CMD, '-|', $command) {
        report('other', "Couldn't run command '$command': $!", $E_UNKNOWN);
        return;
    }
    # Undefined input record separator: one read returns everything
    local $/ = undef;
    my $rawtext = <$CMD>;
    # NOTE: The return value of close() is deliberately not checked,
    # since omreport does something weird sometimes.
    close $CMD;
    return $rawtext;
}
#
# Initialize SNMP: build the parameter list for Net::SNMP->session()
# from %opt and open the session, storing it in $snmp_session (and
# any error text in $snmp_error).
#
# Prints an error and exits with status UNKNOWN if the SNMP version is
# unknown, if SNMPv3 is requested without a username, if an SNMPv3
# protocol name is not recognised, if Net::SNMP can't be loaded, or if
# the session can't be created. Takes no arguments, returns nothing.
#
sub snmp_initialize {
    # Legal SNMP v3 protocols. The alternations are grouped so that
    # \A and \z apply to every alternative; ungrouped, any string that
    # merely contained e.g. "aes" or "sha" was accepted. "3desede"
    # replaces the misspelled "3desde".
    # NOTE(review): "3desede" is believed to be the spelling Net::SNMP
    # accepts -- confirm against the Net::SNMP documentation.
    my $snmp_v3_privprotocol = qr{\A (?:des|aes|aes128|3des|3desede) \z}xms;
    my $snmp_v3_authprotocol = qr{\A (?:md5|sha) \z}xms;

    # Parameters to Net::SNMP->session()
    my %param
      = (
         '-port'     => $opt{port},
         '-hostname' => $opt{hostname},
         '-version'  => $opt{protocol},
        );

    # Setting the domain (IP version and transport protocol)
    my $transport = $opt{tcp} ? 'tcp' : 'udp';
    my $ipversion = $opt{ipv6} ? 'ipv6' : 'ipv4';
    $param{'-domain'} = "$transport/$ipversion";

    # Parameters for SNMP v3
    if ($opt{protocol} == 3) {

        # Username is mandatory
        if (defined $opt{username}) {
            $param{'-username'} = $opt{username};
        }
        else {
            print "SNMP ERROR: With SNMPv3 the username must be specified\n";
            exit $E_UNKNOWN;
        }

        # Authpassword, authkey, privpassword and privkey are optional
        # and passed through unchanged when given
        foreach my $name (qw(authpassword authkey privpassword privkey)) {
            if (defined $opt{$name}) {
                $param{"-$name"} = $opt{$name};
            }
        }

        # Privprotocol is optional
        if (defined $opt{privprotocol}) {
            if ($opt{privprotocol} =~ m/$snmp_v3_privprotocol/xms) {
                $param{'-privprotocol'} = $opt{privprotocol};
            }
            else {
                print "SNMP ERROR: Unknown privprotocol '$opt{privprotocol}', "
                  . "must be one of [des|aes|aes128|3des|3desede]\n";
                exit $E_UNKNOWN;
            }
        }

        # Authprotocol is optional
        if (defined $opt{authprotocol}) {
            if ($opt{authprotocol} =~ m/$snmp_v3_authprotocol/xms) {
                $param{'-authprotocol'} = $opt{authprotocol};
            }
            else {
                print "SNMP ERROR: Unknown authprotocol '$opt{authprotocol}', "
                  . "must be one of [md5|sha]\n";
                exit $E_UNKNOWN;
            }
        }
    }
    # Parameters for SNMP v2c or v1
    elsif ($opt{protocol} == 2 or $opt{protocol} == 1) {
        $param{'-community'} = $opt{community};
    }
    else {
        print "SNMP ERROR: Unknown SNMP version '$opt{protocol}'\n";
        exit $E_UNKNOWN;
    }

    # Try to initialize the SNMP session. Net::SNMP is loaded here, at
    # run time, so the module is only needed in SNMP mode.
    if ( eval { require Net::SNMP; 1 } ) {
        ($snmp_session, $snmp_error) = Net::SNMP->session( %param );
        if (!defined $snmp_session) {
            printf "SNMP: %s\n", $snmp_error;
            exit $E_UNKNOWN;
        }
    }
    else {
        print "ERROR: You need perl module Net::SNMP to run $NAME in SNMP mode\n";
        exit $E_UNKNOWN;
    }
    return;
}
#
# Verify that SNMP works by requesting the "chassisModelName" OID,
# which all servers should have. Exits with status CRITICAL if the
# request gets no result, and with status UNKNOWN if the answer is
# noSuchInstance/noSuchObject. Returns nothing otherwise.
#
sub snmp_check {
    my $model_oid = '1.3.6.1.4.1.674.10892.1.300.10.1.9.1';    # chassisModelName
    my $reply = $snmp_session->get_request(-varbindlist => [$model_oid]);

    # Typically if remote host isn't responding
    unless (defined $reply) {
        printf "SNMP CRITICAL: %s\n", $snmp_session->error;
        exit $E_CRITICAL;
    }

    # If OpenManage isn't installed or is not working
    my $model = $reply->{$model_oid};
    if ($model =~ m{\A noSuch (Instance|Object) \z}xms) {
        print "ERROR: (SNMP) OpenManage is not installed or is not working correctly\n";
        exit $E_UNKNOWN;
    }
    return;
}
#
# Detect a blade system via SNMP. Sets $blade to 1 if either of the
# two baseboard type OIDs answers '3'; otherwise $blade is left
# untouched. Returns nothing.
#
sub snmp_detect_blade {
    # In some setups, the IDs for the blade and interconnect
    # board are mixed up, so both are queried.
    my @board_type_oids = (
        '1.3.6.1.4.1.674.10892.1.300.80.1.7.1.1',    # DellBaseBoardType1
        '1.3.6.1.4.1.674.10892.1.300.80.1.7.1.2',    # DellBaseBoardType2
    );

    # Both requests are sent before any answer is looked at
    my @answers
      = map { [ $_, scalar $snmp_session->get_request(-varbindlist => [$_]) ] }
        @board_type_oids;

    # Identify blade. Older models (4th and 5th gen models) and/or old
    # OMSA (4.x) don't have this OID. If we get "noSuchInstance" or
    # similar, we assume that this isn't a blade
    foreach my $answer (@answers) {
        my ($oid, $result) = @{ $answer };
        next if !exists $result->{$oid};
        next if $result->{$oid} ne '3';
        $blade = 1;
        return;
    }
    return;
}
#
# Locate the omreport binary and store its double-quoted path in
# $omreport. A path given with --omreport wins if it is executable;
# otherwise the first executable entry of a list of known locations
# is used. Exits with status UNKNOWN if $omreport is still undefined
# afterwards. Returns nothing.
#
sub find_omreport {
    # If user has specified path to omreport
    my $user_path = $opt{omreport};
    if (defined $user_path and -x $user_path) {
        $omreport = qq{"$user_path"};
        return;
    }

    # Possible full paths for omreport, in order of preference
    my @candidates = (
        '/opt/dell/srvadmin/bin/omreport',           # default on Linux with OMSA >= 6.2.0
        '/usr/bin/omreport',                         # default on Linux with OMSA < 6.2.0
        '/opt/dell/srvadmin/oma/bin/omreport.sh',    # alternate on Linux
        '/opt/dell/srvadmin/oma/bin/omreport',       # alternate on Linux
        'C:\Program Files (x86)\Dell\SysMgt\oma\bin\omreport.exe',    # default on Windows x64
        'C:\Program Files\Dell\SysMgt\oma\bin\omreport.exe',          # default on Windows x32
        'c:\progra~1\dell\sysmgt\oma\bin\omreport.exe',    # 8bit legacy default on Windows x32
        'c:\progra~2\dell\sysmgt\oma\bin\omreport.exe',    # 8bit legacy default on Windows x64
    );

    # Take the first one that is executable
    foreach my $candidate (@candidates) {
        next if !-x $candidate;
        $omreport = qq{"$candidate"};
        last;
    }

    # Exit with status=UNKNOWN if OM is not installed, or we don't
    # have permission to execute the binary
    unless (defined $omreport) {
        print "ERROR: Dell OpenManage Server Administrator (OMSA) is not installed\n";
        exit $E_UNKNOWN;
    }
    return;
}
#
# Inspect the output of 'omreport -?' for the arguments omreport
# supports, to accommodate deprecated options "chassis" and "system"
# (on newer hardware), as well as blade servers. Updates
# $omopt_system, $omopt_chassis and $blade. Returns nothing.
#
sub check_omreport_options {
    # Each rule: pattern for the start of a line, and what to do when
    # it matches. At most one rule fires per line, first match wins.
    my @rules = (
        # If "servermodule" argument to omreport exists, use it
        # instead of argument "system"
        [ qr/\A servermodule /xms, sub { $omopt_system = 'servermodule'; } ],
        # If "mainsystem" argument to omreport exists, use it
        # instead of argument "chassis"
        [ qr/\A mainsystem /xms, sub { $omopt_chassis = 'mainsystem'; } ],
        # If "modularenclosure" argument to omreport exists, assume
        # that this is a blade
        [ qr/\A modularenclosure /xms, sub { $blade = 1; } ],
    );

  HELP_LINE:
    foreach my $line (@{ run_command("$omreport -? 2>&1") }) {
        foreach my $rule (@rules) {
            my ($pattern, $action) = @{ $rule };
            if ($line =~ $pattern) {
                $action->();
                next HELP_LINE;
            }
        }
    }
    return;
}
#
# Read the blacklist option and add the blacklisted components to the
# global hash %blacklist (component name => array ref of ids).
#   arg1: array ref of blacklist specifications. Each element is
#         either a specification string or the name of an existing
#         file whose first line holds one.
# A specification is a '/'-separated list of "name=id1,id2,..."
# entries. Entries without '=' or without any id are ignored.
#
# Returns an empty hash ref when there was nothing to parse or a file
# could not be opened (an UNKNOWN message is queued in that case), and
# nothing otherwise; the result itself is always in %blacklist.
#
sub set_blacklist {
    my $foo = shift;
    my @bl = ();

    foreach my $black (@{ $foo }) {
        my $tmp = $black;
        if (-f $black) {
            open my $BL, '<', $black
              or do { report('other', "Couldn't open blacklist file $black: $!", $E_UNKNOWN);
                      return {}; };
            $tmp = <$BL>;
            close $BL;
            # An empty file yields undef; there is nothing to parse
            # then, and chomp/split on undef would only raise warnings
            next if !defined $tmp;
            chomp $tmp;
        }
        push @bl, $tmp;
    }
    return {} if !@bl;

    # Parse blacklist string, put in hash
    foreach my $black (@bl) {
        foreach my $c (split m{/}xms, $black) {
            next if $c !~ m/=/xms;
            my ($key, $val) = split /=/xms, $c;
            # "name=" (no ids) and "=" (no name) carry no information
            next if !defined $key or !defined $val;
            push @{ $blacklist{$key} }, split /,/xms, $val;
        }
    }
    return;
}
#
# Adjust the global hash %check (which component groups are checked)
# according to the options --no-storage, --all, --only and --check,
# and clear $global if --check turned off something that is part of
# the global health status.
#
# Prints an error and exits with status UNKNOWN on conflicting option
# usage or an unknown --only keyword. Takes no arguments, returns
# nothing.
#
sub adjust_checks {
    my @cl = ();

    # "--only critical" and "--only warning" select an alert type, not
    # a component. The alternation is grouped so that both anchors
    # apply to each word; ungrouped, anything starting with "critical"
    # or ending with "warning" was taken for an alert type.
    my $alert_type = qr{\A (?:critical|warning) \z}xms;

    # First, take the '--no-storage' option
    if ($opt{no_storage}) {
        $check{storage} = 0;
    }

    # Adjust checking based on the '--all' option
    if ($opt{all}) {
        # Check option usage
        if (defined $opt{only} and $opt{only} !~ $alert_type) {
            print qq{ERROR: Wrong simultaneous usage of the "--all" and "--only" options\n};
            exit $E_UNKNOWN;
        }
        if (scalar @{ $opt{check} } > 0) {
            print qq{ERROR: Wrong simultaneous usage of the "--all" and "--check" options\n};
            exit $E_UNKNOWN;
        }

        # set the check hash to check everything
        $check{$_} = 1 for keys %check;
        return;
    }

    # Adjust checking based on the '--only' option
    if (defined $opt{only} and $opt{only} !~ $alert_type) {
        # Check option usage
        if (scalar @{ $opt{check} } > 0) {
            print qq{ERROR: Wrong simultaneous usage of the "--only" and "--check" options\n};
            exit $E_UNKNOWN;
        }
        if (! exists $check{$opt{only}} && $opt{only} ne 'chassis') {
            print qq{ERROR: "$opt{only}" is not a known keyword for the "--only" option\n};
            exit $E_UNKNOWN;
        }

        # reset the check hash
        $check{$_} = 0 for keys %check;

        # adjust the check hash
        if ($opt{only} eq 'chassis') {
            $check{$_} = 1 for qw(memory fans power temp cpu voltage sdcard
                                  batteries amperage intrusion esmhealth);
        }
        else {
            $check{$opt{only}} = 1;
        }
        return;
    }

    # Adjust checking based on the '--check' option. Each element is
    # either a check string or the name of an existing file whose
    # first line holds one.
    foreach my $check (@{ $opt{check} }) {
        my $tmp = $check;
        if (-f $check) {
            open my $CL, '<', $check
              or do { report('other', "Couldn't open check file $check: $!", $E_UNKNOWN);
                      return; };
            $tmp = <$CL>;
            close $CL;
            # An empty file yields undef; nothing to parse then
            next if !defined $tmp;
            chomp $tmp;
        }
        push @cl, $tmp;
    }
    return if !@cl;

    # Parse checklist string ("name=value,name=value,..."), put in hash
    foreach my $check (@cl) {
        foreach my $c (split /,/xms, $check) {
            next if $c !~ m/=/xms;
            my ($key, $val) = split /=/xms, $c;
            $check{$key} = $val;
        }
    }

    # Check if we should check global health status
  CHECK_KEY:
    foreach my $key (keys %check) {
        next CHECK_KEY if $key eq 'esmlog';      # not part of global status
        next CHECK_KEY if $key eq 'alertlog';    # not part of global status
        if ($check{$key} == 0) {    # found something with checking turned off
            $global = 0;
            last CHECK_KEY;
        }
    }
    return;
}
#
# Run omreport with "-fmt ssv" and parse the semicolon separated
# output.
#   arg1: string containing parameters to omreport
# Returns a reference to an array of hashes, one per data line, keyed
# by the fields of the most recent header line. Returns a reference to
# an empty array if the command produced no result at all. Error lines
# that are not on the whitelists below are queued with level UNKNOWN.
#
sub run_omreport {
    my ($command) = @_;
    my @records = ();    # parsed data lines
    my @fields  = ();    # field names from the latest header line

    # Errors that are OK. Some low-end poweredge (and blades) models
    # don't have RAID controllers, intrusion detection sensor, or
    # redundant/instrumented power supplies etc.
    # (The /x pattern bodies below are kept exactly as they were.)
    my $ok_errors
      = qr{
Intrusion\sinformation\sis\snot\sfound\sfor\sthis\ssystem # No intrusion probe
| No\sinstrumented\spower\ssupplies\sfound\son\sthis\ssystem # No instrumented PS (blades/low-end)
| No\sbattery\sprobes\sfound\son\sthis\ssystem # No battery probes
| Invalid\scommand:\spwrmonitoring # Old hardware
| Hardware\sor\sfeature\snot\spresent\. # SD cards
| Invalid\scommand:\sremovableflashmedia # SD cards with old OMSA
| Error\sCorrection; # Memory stuff. Not really an error (new in OMSA 6.4)
# | Current\sprobes\snot\sfound # OMSA + RHEL5.4 bug
# | No\scontrollers\sfound # No RAID controller
}xms;

    # Errors that are OK on blade servers
    my $ok_blade_errors
      = qr{
No\sfan\sprobes\sfound\son\sthis\ssystem # No fan probes
}xms;

    # Run omreport and fetch output
    my $rawtext = slurp_command("$omreport $command -fmt ssv 2>&1");
    if (!defined $rawtext) {
        return [];
    }

    my $is_controller_cmd = $command eq 'storage controller';

    # Workaround for Openmanage BUG introduced in OMSA 5.5.0
    if ($is_controller_cmd) {
        $rawtext =~ s{\n;}{;}gxms;
    }

    # Workaround for logical connectors where there are extra
    # information that isn't possible to parse consistently. Remove
    # everything after and including "Path Health"
    if ($command =~ m{\A storage\sconnector}xms) {
        $rawtext =~ s{Path\sHealth.*}{}xms;
    }

    # Report if no controllers found
    if ($is_controller_cmd and $rawtext =~ m{No\scontrollers\sfound}xms) {
        report('storage', 'Storage Error! No controllers found', $E_UNKNOWN);
    }

    # Openmanage sometimes puts a linebreak between "Error" and the
    # actual error text
    $rawtext =~ s{^Error\s*\n}{Error: }xms;

    # Parse output, store in array
  LINE:
    foreach my $line (split m{\n}xms, $rawtext) {
        if ($line =~ m{\AError}xms) {
            next LINE if $line =~ m{$ok_errors}xms;
            next LINE if ($blade and $line =~ m{$ok_blade_errors}xms);
            report('other', "Problem running 'omreport $command': $line", $E_UNKNOWN);
        }

        # ignore lines with less than 3 fields
        next LINE if $line !~ m/(.*?;){2}/xms;

        my @vals = split /;/xms, $line;
        if ($vals[0] =~ m/\A (Index|ID|Severity|Processor|Current\sSpeed|Connector\sName) \z/xms) {
            # header line: remember the field names
            @fields = @vals;
            next LINE;
        }

        # data line: pair each field name with the value in the same
        # position
        my %record = ();
        @record{@fields} = @vals[ 0 .. $#fields ];
        push @records, \%record;
    }

    # Finally, return the collected information
    return \@records;
}
#
# Tells whether a component has been blacklisted by the user.
#   arg1: component name (key into %blacklist)
#   arg2: component id or index
# Returns 1 when the id is defined and the blacklist for that
# component name contains either the id itself or the keyword "all"
# (in any letter case). Returns 0 otherwise.
#
sub blacklisted {
    my ($name, $id) = @_;

    # Nothing is blacklisted for this component type
    return 0 if !defined $blacklist{$name};

    # Count the blacklist entries that apply to this id
    my $matches = grep {
        defined $id and ($_ eq $id or uc($_) eq 'ALL')
    } @{ $blacklist{$name} };

    return $matches ? 1 : 0;
}
# Translates a NexusID as delivered via SNMP (backslash separated,
# with an optional leading backslash) into the colon separated form
# used by this plugin, e.g. "\0\1\2" becomes "0:1:2"
sub convert_nexus {
    my ($nexus) = @_;
    $nexus =~ s{\A \\}{}xms;    # drop the leading backslash, if any
    $nexus =~ tr{\\}{:};        # every remaining backslash becomes a colon
    return $nexus;
}
# Builds custom temperature thresholds from the user supplied options.
#   arg1: threshold type; 'w' selects $opt{warning}, anything else
#         selects $opt{critical}
# Each option value is either a threshold string, or the name of an
# existing plain file whose first line holds such a string. A
# threshold string is a comma separated list of "key=max" or
# "key=max/min" items; items without a "=" are ignored.
# Returns a hash reference of the form
#   { key => { max => ..., min => ... }, ... }
# where "min" is only present for items given as "max/min". If a
# threshold file can't be opened, the problem is reported with
# $E_UNKNOWN and an empty hash reference is returned.
sub custom_temperature_thresholds {
    my $type   = shift;  # type of threshold, either w (warning) or c (critical)
    my %thres  = ();     # will contain the thresholds
    my @limits = ();     # holds the input
    my @opt    = $type eq 'w' ? @{ $opt{warning} } : @{ $opt{critical} };

    foreach my $t (@opt) {
        my $tmp = $t;
        if (-f $t) {
            # Return unconditionally on failure; reading from a handle
            # that was never opened makes no sense
            open my $F, '<', $t or do {
                report('other', "Couldn't open temperature threshold file $t: $!",
                       $E_UNKNOWN);
                return {};
            };
            $tmp = <$F>;    # only the first line of the file is used
            close $F;

            # An empty file contains no thresholds
            next if !defined $tmp;

            # Strip the line ending, otherwise it ends up as part of
            # the last threshold value
            $tmp =~ s{[\r\n]+\z}{}xms;
        }
        push @limits, $tmp;
    }

    # Parse checklist string, put in hash
    foreach my $th (@limits) {
        foreach my $t (split m{,}xms, $th) {
            next if $t !~ m{=}xms;
            my ($key, $val) = split m{=}xms, $t;

            # $val is undefined for items like "0=" (nothing after
            # the equals sign)
            if (defined $val and $val =~ m{/}xms) {
                my ($max, $min) = split m{/}xms, $val;
                $thres{$key}{max} = $max;
                $thres{$key}{min} = $min;
            }
            else {
                $thres{$key}{max} = $val;
            }
        }
    }
    return \%thres;
}
# Converts a flat SNMP result into a list of per-row hashes.
#   arg1: hash reference, OID => value, as returned from an SNMP query
#   arg2: hash reference, column OID => field name
# For each OID in the result the last number is taken as the row
# index and the rest as the column OID. Columns that are not listed in
# arg2 are ignored, as are OIDs that don't end in ".<number>".
# Returns a reference to an array with one hash (field name => value)
# per row index, in ascending order of index.
sub get_snmp_output {
    my ($result, $oidref) = @_;
    my %row_for = ();    # row index => { field name => value }

  OID:
    foreach my $oid (keys %{ $result }) {
        (my $stripped = $oid) =~ s{\s}{}gxms;    # remove whitespace

        # Split into column OID and row index. Skip OIDs that don't
        # have that form instead of relying on a stale capture
        my ($short, $id) = $stripped =~ m{\A (.+) \. (\d+) \z}xms
          or next OID;

        next OID if !exists $oidref->{$short};
        $row_for{$id}{ $oidref->{$short} } = $result->{$oid};
    }

    # A hash keyed on the index avoids allocating a huge sparse array
    # when the indexes are large; sort numerically to keep row order
    my @output = map { $row_for{$_} } sort { $a <=> $b } keys %row_for;
    return \@output;
}
# Adds a key/value pair in-place to every hash in a list that doesn't
# already have that key (used to tag items with e.g. their controller).
#   arg1: key to add
#   arg2: value to store under that key
#   arg3: reference to an array of hash references
# Existing values are never overwritten. Returns nothing.
sub map_item {
    my ($key, $val, $list) = @_;
    for my $item (grep { !exists $_->{$key} } @{ $list }) {
        $item->{$key} = $val;
    }
    return;
}
# Builds the URL to Dell's documentation pages for a PowerEdge server.
#   arg1: model name, e.g. "PowerEdge R710"
# Returns the URL as a string.
sub documentation_url {
    my ($model) = @_;

    # Reduce the model to its lowercase short form, e.g. "r710"
    if ($model =~ m{\A PowerEdge \s (.+?) \z}xms) {
        $model = lc $1;
    }

    # Blades (e.g. M600, M710) share common documentation
    if ($model =~ m{\A m\d+ \z}xms) {
        $model = 'm';
    }

    return "http://support.dell.com/support/edocs/systems/pe$model/";
}
# Builds the URL to Dell's warranty information for a server.
#   arg1: serial number (servicetag) of the server
# The country code in $opt{htmlinfo} selects the regional support
# site and language. Unknown country codes fall back to the global
# site. Returns the URL as a string.
sub warranty_url {
    my ($tag) = @_;

    # Dell support sites for different parts of the world
    my $emea = 'http://support.euro.dell.com/support/topics/topic.aspx/emea/shared/support/my_systems_info/';
    my $ap   = 'http://supportapj.dell.com/support/topics/topic.aspx/ap/shared/support/my_systems_info/en/details?';
    my $glob = 'http://support.dell.com/support/topics/global.aspx/support/my_systems_info/details?';

    # EMEA: country code => [ language in the path, language parameter ]
    my %emea_lang
      = (
         'at' => [ 'de', 'de' ],  # Austria
         'be' => [ 'nl', 'nl' ],  # Belgium
         'cz' => [ 'cs', 'cs' ],  # Czech Republic
         'de' => [ 'de', 'de' ],  # Germany
         'dk' => [ 'da', 'da' ],  # Denmark
         'es' => [ 'es', 'es' ],  # Spain
         'fi' => [ 'fi', 'fi' ],  # Finland
         'fr' => [ 'fr', 'fr' ],  # France
         'gr' => [ 'en', 'el' ],  # Greece
         'it' => [ 'it', 'it' ],  # Italy
         'il' => [ 'en', 'en' ],  # Israel
         'me' => [ 'en', 'en' ],  # Middle East
         'no' => [ 'no', 'no' ],  # Norway
         'nl' => [ 'nl', 'nl' ],  # The Netherlands
         'pl' => [ 'pl', 'pl' ],  # Poland
         'pt' => [ 'en', 'pt' ],  # Portugal
         'ru' => [ 'ru', 'ru' ],  # Russia
         'se' => [ 'sv', 'sv' ],  # Sweden
         'uk' => [ 'en', 'en' ],  # United Kingdom
         'za' => [ 'en', 'en' ],  # South Africa
        );

    # America (global site): country code => language parameter
    my %glob_lang
      = (
         'br' => 'pt',  # Brazil
         'ca' => 'en',  # Canada
         'mx' => 'es',  # Mexico
         'us' => 'en',  # USA
        );

    # Asia/Pacific: country code => language parameter
    my %ap_lang
      = (
         'au' => 'en',  # Australia
         'cn' => 'zh',  # China
         'in' => 'en',  # India
        );

    # Assemble the warranty URLs, starting with the default fallback
    my %url = ( 'XX' => $glob . 'ServiceTag=' );
    foreach my $cc (keys %emea_lang) {
        my ($path, $lang) = @{ $emea_lang{$cc} };
        $url{$cc} = $emea . "$path/details?c=$cc&l=$lang&ServiceTag=";
    }
    foreach my $cc (keys %glob_lang) {
        $url{$cc} = $glob . "c=$cc&l=$glob_lang{$cc}&ServiceTag=";
    }
    foreach my $cc (keys %ap_lang) {
        $url{$cc} = $ap . "c=$cc&l=$ap_lang{$cc}&ServiceTag=";
    }

    my $base = exists $url{$opt{htmlinfo}} ? $url{$opt{htmlinfo}} : $url{XX};
    return $base . $tag;
}
# Looks up a key in a hash, allowing for the key not being there.
#   arg1: the key
#   arg2: reference to the hash
# Returns nothing (undef in scalar context) if the key is false,
# i.e. undefined, empty or 0. Otherwise returns the hash value, or
# the string "Undefined value <key>" if the hash has no defined
# value for the key.
sub get_hashval {
    my ($key, $hash) = @_;
    return if !$key;
    return $hash->{$key} if defined $hash->{$key};
    return "Undefined value $key";
}
# Translates a component status value into its name via %snmp_status.
#   arg1: the status value
# Returns 'Unknown' if the value is false or not found in the hash.
sub get_snmp_status {
    my ($key) = @_;
    return 'Unknown' if !$key;
    return 'Unknown' if !exists $snmp_status{$key};
    return $snmp_status{$key};
}
# Translates a probe status value into its name via %snmp_probestatus.
#   arg1: the probe status value
# Returns 'Unknown' if the value is false or not found in the hash.
sub get_snmp_probestatus {
    my ($key) = @_;
    return 'Unknown' if !$key;
    return 'Unknown' if !exists $snmp_probestatus{$key};
    return $snmp_probestatus{$key};
}
# Fetches a hash value, substituting a fallback when there is nothing
# useful to return.
#   arg1: key to look up
#   arg2: reference to the hash where the key belongs
#   arg3: alternate return value
# Returns the hash value if it is defined and not the empty string,
# otherwise the alternate value.
sub get_nonempty_string {
    my ($key, $hash, $alt) = @_;
    my $val = $hash->{$key};
    return $alt if !defined $val;
    return $alt if $val eq q{};
    return $val;
}
# Converts a temperature from Celsius to another unit.
#   arg1: temperature in degrees Celsius
#   arg2: target unit: 'F' (Fahrenheit), 'K' (Kelvin) or 'R' (Rankine)
# Returns the converted temperature formatted with one decimal. For
# any other target unit the input is returned unchanged.
sub temp_from_celsius {
    my ($x, $to) = @_;
    return sprintf('%.1f', $x * 9/5 + 32)          if $to eq 'F';
    return sprintf('%.1f', $x + 273.15)            if $to eq 'K';
    return sprintf('%.1f', $x * 9/5 + 32 + 459.67) if $to eq 'R';
    return $x;
}
#---------------------------------------------------------------------
# Check functions
#---------------------------------------------------------------------
#-----------------------------------------
# Check global health status
#-----------------------------------------
# Fetches the global health status of the system.
# With SNMP the global system status OID is queried, which covers
# both storage and chassis. Without SNMP the output of omreport is
# scanned for the "Main System" / "Main System Chassis" line, which
# covers the chassis only.
# Takes no arguments. Returns the status translated via
# %status2nagios; the initial value $E_OK is returned if omreport
# gives no matching line. Prints an error and exits with $E_UNKNOWN
# if the SNMP request fails.
sub check_global {
    my $health = $E_OK;

    if ($snmp) {
        #
        # Checks global status, i.e. both storage and chassis
        #
        my $systemStateGlobalSystemStatus = '1.3.6.1.4.1.674.10892.1.200.10.1.2.1';
        my $result = $snmp_session->get_request(-varbindlist => [$systemStateGlobalSystemStatus]);
        if (!defined $result) {
            # Ask the session for the error of the failed request and
            # close the session before exiting, like the other SNMP
            # checks do
            printf "SNMP ERROR [global]: %s\n", $snmp_session->error;
            $snmp_session->close;
            exit $E_UNKNOWN;
        }
        $health = $status2nagios{get_snmp_status($result->{$systemStateGlobalSystemStatus})};
    }
    else {
        #
        # NB! This does not check storage, only chassis...
        #
      LINE:
        foreach my $line (@{ run_command("$omreport $omopt_system -fmt ssv") }) {
            next LINE if $line !~ m/;/xms;                    # not a data line
            next LINE if $line =~ m/\A SEVERITY;COMPONENT/xms;  # header line
            if ($line =~ m/\A (.+?);Main\sSystem(\sChassis)? /xms) {
                $health = $status2nagios{$1};
                last LINE;
            }
        }
    }

    # Return the status
    return $health;
}
#-----------------------------------------
# STORAGE: Check controllers
#-----------------------------------------
# Checks all storage controllers and reports their state in the
# 'storage' category. Data comes from SNMP when $snmp is set,
# otherwise from "omreport storage controller".
# Takes no arguments and returns nothing. As a side effect, every
# controller id is pushed onto @controllers (blacklisted ones
# included), controller info is stored in $sysinfo{controller}, and
# with SNMP the controller number => id mapping is stored in
# %snmp_controller.
sub check_controllers {
    my $nexus    = undef;
    my $name     = undef;
    my $state    = undef;
    my $status   = undef;
    my $minfw    = undef;
    my $mindr    = undef;
    my $firmware = undef;
    my $driver   = undef;
    my $minstdr  = undef;  # Minimum required Storport driver version
    my $stdr     = undef;  # Storport driver version
    my @output   = ();

    if ($snmp) {
        my %ctrl_oid
          = (
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.1'  => 'controllerNumber',
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.2'  => 'controllerName',
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.5'  => 'controllerState',
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.8'  => 'controllerFWVersion',
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.38' => 'controllerComponentStatus',
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.39' => 'controllerNexusID',
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.41' => 'controllerDriverVersion',
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.44' => 'controllerMinFWVersion',
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.45' => 'controllerMinDriverVersion',
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.55' => 'controllerStorportDriverVersion',
             '1.3.6.1.4.1.674.10893.1.20.130.1.1.56' => 'controllerMinRequiredStorportVer',
            );

        # We use get_table() here for the odd case where a server has
        # two or more controllers, and where some OIDs are missing on
        # one of the controllers.
        my $controllerTable = '1.3.6.1.4.1.674.10893.1.20.130.1';
        my $result = $snmp_session->get_table(-baseoid => $controllerTable);
        if (!defined $result) {
            report('storage', 'Storage Error! No controllers found', $E_UNKNOWN);
            return;
        }
        @output = @{ get_snmp_output($result, \%ctrl_oid) };
    }
    else {
        @output = @{ run_omreport('storage controller') };
    }

    my %ctrl_state
      = (
         0 => 'Unknown',
         1 => 'Ready',
         2 => 'Failed',
         3 => 'Online',
         4 => 'Offline',
         6 => 'Degraded',
        );

  CTRL:
    foreach my $out (@output) {
        if ($snmp) {
            $name     = $out->{controllerName} || 'Unknown controller';
            $state    = get_hashval($out->{controllerState}, \%ctrl_state) || 'Unknown state';
            $status   = get_snmp_status($out->{controllerComponentStatus});
            $minfw    = $out->{controllerMinFWVersion} || undef;
            $mindr    = $out->{controllerMinDriverVersion} || undef;
            $firmware = $out->{controllerFWVersion} || 'N/A';
            $driver   = $out->{controllerDriverVersion} || 'N/A';
            $minstdr  = $out->{'controllerMinRequiredStorportVer'} || undef;
            $stdr     = $out->{controllerStorportDriverVersion} || undef;
            $nexus    = convert_nexus(($out->{controllerNexusID} || 9999));
        }
        else {
            # Value of an omreport column, or the given default if the
            # column is missing or reads 'Not Applicable'. Not every
            # column is guaranteed to be present in the output.
            my $field = sub {
                my ($key, $default) = @_;
                my $val = $out->{$key};
                return (defined $val and $val ne 'Not Applicable') ? $val : $default;
            };

            $nexus    = get_nonempty_string('ID', $out, '9999');
            $name     = get_nonempty_string('Name', $out, 'Unknown controller');
            $state    = get_nonempty_string('State', $out, 'Unknown state');
            $status   = get_nonempty_string('Status', $out, 'Unknown');
            $minfw    = $field->('Minimum Required Firmware Version', undef);
            $mindr    = $field->('Minimum Required Driver Version', undef);
            $firmware = $field->('Firmware Version', 'N/A');
            $driver   = $field->('Driver Version', 'N/A');
            $minstdr  = $field->('Minimum Required Storport Driver Version', undef);
            $stdr     = $field->('Storport Driver Version', undef);
        }

        $name =~ s{\s+\z}{}xms; # remove trailing whitespace
        push @controllers, $nexus;

        # Collecting some storage info
        $sysinfo{'controller'}{$nexus}{'id'}       = $nexus;
        $sysinfo{'controller'}{$nexus}{'name'}     = $name;
        $sysinfo{'controller'}{$nexus}{'driver'}   = $driver;
        $sysinfo{'controller'}{$nexus}{'firmware'} = $firmware;
        $sysinfo{'controller'}{$nexus}{'storport'} = $stdr;

        # Store controller info for future use (SNMP)
        if ($snmp and defined $out->{controllerNumber}) {
            $snmp_controller{$out->{controllerNumber}} = $nexus;
        }

        next CTRL if blacklisted('ctrl', $nexus);

        # Special case: old firmware. A minimum required version is
        # taken to mean that the installed version is too old.
        if (!blacklisted('ctrl_fw', $nexus) && defined $minfw) {
            chomp $firmware;
            my $msg = sprintf q{Controller %d [%s]: Firmware '%s' is out of date},
              $nexus, $name, $firmware;
            report('storage', $msg, $E_WARNING, $nexus);
        }

        # Special case: old driver
        if (!blacklisted('ctrl_driver', $nexus) && defined $mindr) {
            chomp $driver;
            my $msg = sprintf q{Controller %d [%s]: Driver '%s' is out of date},
              $nexus, $name, $driver;
            report('storage', $msg, $E_WARNING, $nexus);
        }

        # Special case: old storport driver
        if (!blacklisted('ctrl_stdr', $nexus) && defined $minstdr) {
            # The installed version may be unknown even though a
            # minimum version is given
            my $stdr_text = defined $stdr ? $stdr : 'N/A';
            chomp $stdr_text;
            my $msg = sprintf q{Controller %d [%s]: Storport driver '%s' is out of date},
              $nexus, $name, $stdr_text;
            report('storage', $msg, $E_WARNING, $nexus);
        }

        # Ok. A Non-Critical status caused by old firmware or drivers
        # has already been reported above.
        if ($status eq 'Ok' or ($status eq 'Non-Critical'
                                and (defined $minfw or defined $mindr or defined $minstdr))) {
            my $msg = sprintf 'Controller %d [%s] is %s',
              $nexus, $name, $state;
            report('storage', $msg, $E_OK, $nexus);
        }
        # Default
        else {
            my $msg = sprintf 'Controller %d [%s] needs attention: %s',
              $nexus, $name, $state;
            report('storage', $msg, $status2nagios{$status}, $nexus);
        }
    }
    return;
}
#-----------------------------------------
# STORAGE: Check physical drives
#-----------------------------------------
# Checks all physical disks and reports their state in the 'storage'
# category. Does nothing if @controllers is empty. Data comes from
# SNMP when $snmp is set, otherwise from "omreport storage pdisk" for
# each controller in @controllers that isn't blacklisted with
# 'ctrl_pdisk'.
# Takes no arguments and returns nothing. Every disk seen, including
# blacklisted ones, is counted in $count{pdisk}. Prints an error and
# exits with $E_UNKNOWN if the SNMP query fails.
sub check_physical_disks {
    return if $#controllers == -1;

    my $nexus    = undef;
    my $name     = undef;
    my $state    = undef;
    my $status   = undef;
    my $fpred    = undef;
    my $progr    = undef;
    my $ctrl     = undef;
    my $vendor   = undef;  # disk vendor
    my $product  = undef;  # product ID
    my $capacity = undef;  # disk length (size) in bytes
    my $media    = undef;  # media type (e.g. HDD, SSD)
    my $bus      = undef;  # bus protocol (e.g. SAS, SATA)
    my $spare    = undef;  # spare state (e.g. global hotspare)
    my $cert     = undef;  # if drive is certified or not
    my @output   = ();

    if ($snmp) {
        my %pdisk_oid
          = (
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.2'  => 'arrayDiskName',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.3'  => 'arrayDiskVendor',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.4'  => 'arrayDiskState',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.6'  => 'arrayDiskProductID',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.9'  => 'arrayDiskEnclosureID',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.10' => 'arrayDiskChannel',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.11' => 'arrayDiskLengthInMB',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.15' => 'arrayDiskTargetID',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.21' => 'arrayDiskBusType',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.22' => 'arrayDiskSpareState',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.24' => 'arrayDiskComponentStatus',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.26' => 'arrayDiskNexusID',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.31' => 'arrayDiskSmartAlertIndication',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.35' => 'arrayDiskMediaType',
             '1.3.6.1.4.1.674.10893.1.20.130.4.1.36' => 'arrayDiskDellCertified',
             '1.3.6.1.4.1.674.10893.1.20.130.5.1.7'  => 'arrayDiskEnclosureConnectionControllerNumber',
             '1.3.6.1.4.1.674.10893.1.20.130.6.1.7'  => 'arrayDiskChannelConnectionControllerNumber',
            );
        my $result = undef;
        if ($opt{use_get_table}) {
            my $arrayDiskTable = '1.3.6.1.4.1.674.10893.1.20.130.4';
            my $arrayDiskEnclosureConnectionControllerNumber = '1.3.6.1.4.1.674.10893.1.20.130.5.1.7';
            my $arrayDiskChannelConnectionControllerNumber = '1.3.6.1.4.1.674.10893.1.20.130.6.1.7';

            $result  = $snmp_session->get_table(-baseoid => $arrayDiskTable);
            my $ext1 = $snmp_session->get_table(-baseoid => $arrayDiskEnclosureConnectionControllerNumber);
            my $ext2 = $snmp_session->get_table(-baseoid => $arrayDiskChannelConnectionControllerNumber);

            # Merge the connection tables into the main result. They
            # are optional, a failed query is simply left out.
            if (defined $result) {
                foreach my $ext (grep { defined } $ext1, $ext2) {
                    foreach my $oid (keys %{ $ext }) {
                        $result->{$oid} = $ext->{$oid};
                    }
                }
            }
        }
        else {
            $result = $snmp_session->get_entries(-columns => [keys %pdisk_oid]);
        }

        if (!defined $result) {
            printf "SNMP ERROR [storage / pdisk]: %s.\n", $snmp_session->error;
            $snmp_session->close;
            exit $E_UNKNOWN;
        }

        @output = @{ get_snmp_output($result, \%pdisk_oid) };
    }
    else {
        foreach my $c (@controllers) {
            # This blacklists disks with broken firmware, which includes
            # illegal XML characters that makes openmanage choke on itself
            next if blacklisted('ctrl_pdisk', $c);

            push @output, @{ run_omreport("storage pdisk controller=$c") };
            # Tag the disks just added with their controller; disks
            # from earlier controllers already have the key
            map_item('ctrl', $c, \@output);
        }
    }

    my %spare_state
      = (
         1  => 'VD member',    # disk is a member of a virtual disk
         2  => 'DG member',    # disk is a member of a disk group
         3  => 'Global HS',    # disk is a global hot spare
         4  => 'Dedicated HS', # disk is a dedicated hot spare
         5  => 'no',           # not a spare
         99 => 'n/a',          # not applicable
        );

    my %media_type
      = (
         1 => 'unknown',
         2 => 'HDD',
         3 => 'SSD',
        );

    my %bus_type
      = (
         1 => 'SCSI',
         2 => 'IDE',
         3 => 'Fibre Channel',
         4 => 'SSA',
         6 => 'USB',
         7 => 'SATA',
         8 => 'SAS',
        );

    my %pdisk_state
      = (
         0  => 'Unknown',
         1  => 'Ready',
         2  => 'Failed',
         3  => 'Online',
         4  => 'Offline',
         6  => 'Degraded',
         7  => 'Recovering',
         11 => 'Removed',
         15 => 'Resynching',
         22 => 'Replacing', # FIXME: this one is not defined in the OMSA MIBs
         24 => 'Rebuilding',
         25 => 'No Media',
         26 => 'Formatting',
         28 => 'Diagnostics',
         34 => 'Predictive failure',
         35 => 'Initializing',
         39 => 'Foreign',
         40 => 'Clear',
         41 => 'Unsupported',
         53 => 'Incompatible',
        );

    # Check physical disks on each of the controllers
  PDISK:
    foreach my $out (@output) {
        if ($snmp) {
            $name   = $out->{arrayDiskName} || 'Unknown disk';
            $state  = get_hashval($out->{arrayDiskState}, \%pdisk_state) || 'Unknown state';
            $status = get_snmp_status($out->{arrayDiskComponentStatus});
            $fpred  = defined $out->{arrayDiskSmartAlertIndication}
              && $out->{arrayDiskSmartAlertIndication} == 2 ? 1 : 0;
            $progr  = q{};
            $nexus  = convert_nexus(($out->{arrayDiskNexusID} || 9999));
            $vendor = $out->{arrayDiskVendor} || 'Unknown vendor';
            $product = $out->{arrayDiskProductID} || 'Unknown product ID';
            $spare  = get_hashval($out->{arrayDiskSpareState}, \%spare_state) || q{};
            $bus    = get_hashval($out->{arrayDiskBusType}, \%bus_type);
            $media  = get_hashval($out->{arrayDiskMediaType}, \%media_type);
            $cert   = defined $out->{arrayDiskDellCertified} ? $out->{arrayDiskDellCertified} : 1;
            $capacity = exists $out->{arrayDiskLengthInMB}
              ? $out->{arrayDiskLengthInMB} * 1024**2 : -1;

            # try to find the controller where the disk belongs
            if (exists $out->{arrayDiskEnclosureConnectionControllerNumber}) {
                # for disks that are attached to an enclosure
                $ctrl = $snmp_controller{$out->{arrayDiskEnclosureConnectionControllerNumber}};
            }
            elsif (exists $out->{arrayDiskChannelConnectionControllerNumber}) {
                # for disks that are not attached to an enclosure
                $ctrl = $snmp_controller{$out->{arrayDiskChannelConnectionControllerNumber}};
            }
            else {
                # last resort... use the nexus id (old/broken hardware)
                $ctrl = $nexus;
                $ctrl =~ s{\A (\d+) : .* \z}{$1}xms;
            }
        }
        else {
            $name    = get_nonempty_string('Name', $out, 'Unknown disk');
            $state   = get_nonempty_string('State', $out, 'Unknown state');
            $status  = get_nonempty_string('Status', $out, 'Unknown');
            $fpred   = lc(get_nonempty_string('Failure Predicted', $out, q{})) eq 'yes' ? 1 : 0;
            $progr   = ' [' . get_nonempty_string('Progress', $out, q{}) . ']';
            $nexus   = join q{:}, $out->{ctrl}, $out->{'ID'};
            $vendor  = get_nonempty_string('Vendor ID', $out, 'Unknown Vendor');
            $product = get_nonempty_string('Product ID', $out, 'Unknown Product ID');
            $media   = get_nonempty_string('Media', $out, undef);
            $bus     = get_nonempty_string('Bus Protocol', $out, undef);
            $spare   = get_nonempty_string('Hot Spare', $out, q{});
            $cert    = get_nonempty_string('Certified', $out, 1);
            $ctrl    = $out->{ctrl};

            # Extract the byte count from e.g. "136.13 GB (146163105792 bytes)"
            $capacity = get_nonempty_string('Capacity', $out, q{});
            $capacity =~ s{\A .*? \((\d+) \s bytes\) \z}{$1}xms;

            # Anything that didn't yield a byte count ('Unavailable',
            # a missing column, an unexpected format) means that the
            # capacity is unknown. It must not reach the numeric
            # comparison below as a non-numeric string.
            if ($capacity !~ m{\A \d+ \z}xms) {
                $capacity = -1;
            }

            if ($cert eq 'Yes' or $cert eq 'Not Applicable') {
                $cert = 1;
            }
            else {
                $cert = 0;
            }
        }

        # Blacklisted disks are included in the count
        $count{pdisk}++;
        next PDISK if blacklisted('pdisk', $nexus);

        $vendor  =~ s{\s+\z}{}xms; # remove trailing whitespace
        $product =~ s{\s+\z}{}xms; # remove trailing whitespace

        # If the disk is bad, the vendor field may be empty
        if ($vendor eq q{}) { $vendor = 'Unknown Vendor'; }

        # Hot spare stuff. Anything that isn't a global or dedicated
        # hot spare is not worth mentioning.
        if ($spare eq 'Global') { $spare = 'Global HS'; }
        elsif ($spare eq 'Dedicated') { $spare = 'Dedicated HS'; }
        elsif ($spare !~ m{\A (?:Global|Dedicated)}xms) { $spare = undef; }

        # Calculate human readable capacity
        if ($capacity == -1) {
            # capacity is unknown
            $capacity = 'Unknown Size';
        }
        else {
            $capacity = ceil($capacity / 1000**3) >= 1000
              ? sprintf '%.1fTB', ($capacity / 1000**4)
              : sprintf '%.0fGB', ($capacity / 1000**3);
            $capacity = '450GB' if $capacity eq '449GB';  # quick fix for 450GB disks
            $capacity = '300GB' if $capacity eq '299GB';  # quick fix for 300GB disks
            $capacity = '146GB' if $capacity eq '147GB';  # quick fix for 146GB disks
            $capacity = '100GB' if $capacity eq '99GB';   # quick fix for 100GB disks
        }

        # Lowercase everything but the first letter of the vendor name
        $vendor = (substr $vendor, 0, 1) . lc (substr $vendor, 1, length $vendor);

        # Remove unnecessary trademark rubbish from vendor name
        $vendor =~ s{\(tm\)\z}{}xms;

        # bus and media aren't always defined
        my $busmedia = q{};
        if (defined $bus && defined $media)     { $busmedia = "$bus-$media "; }
        elsif (defined $bus && ! defined $media) { $busmedia = "$bus "; }
        elsif (! defined $bus && defined $media) { $busmedia = "$media "; }

        # Special case: Failure predicted
        if ($fpred) {
            my $msg = sprintf '%s [%s %s, %s] on ctrl %d needs attention: Failure Predicted',
              $name, $vendor, $product, $capacity, $ctrl;
            $msg .= " ($state)" if $state ne 'Predictive failure';
            report('storage', $msg,
                   ($status2nagios{$status} == $E_CRITICAL ? $E_CRITICAL : $E_WARNING), $nexus);
        }
        # Special case: Rebuilding / Replacing. The alternation is
        # grouped so that both anchors apply to both alternatives.
        elsif ($state =~ m{\A (?:Rebuilding|Replacing) \z}xms) {
            my $msg = sprintf '%s [%s %s, %s] on ctrl %d is %s%s',
              $name, $vendor, $product, $capacity, $ctrl, $state, $progr;
            report('storage', $msg, $E_WARNING, $nexus);
        }
        # Special case: Uncertified disk
        elsif ($status eq 'Non-Critical' and !$cert) {
            if (blacklisted('pdisk_cert', $nexus)) {
                my $msg = sprintf '%s [%s %s, %s] on ctrl %d is %s, Not Certified',
                  $name, $vendor, $product, $capacity, $ctrl, $state;
                report('storage', $msg, $E_OK, $nexus);
            }
            else {
                my $msg = sprintf '%s [%s %s, %s] on ctrl %d is Not Certified',
                  $name, $vendor, $product, $capacity, $ctrl;
                report('storage', $msg, $E_WARNING, $nexus);
            }
        }
        # Special case: Foreign disk
        elsif ($status eq 'Non-Critical' and $state eq 'Foreign'
               and blacklisted('pdisk_foreign', $nexus)) {
            my $msg = sprintf '%s [%s %s, %s] on ctrl %d is %s',
              $name, $vendor, $product, $capacity, $ctrl, $state;
            report('storage', $msg, $E_OK, $nexus);
        }
        # Default
        elsif ($status ne 'Ok') {
            my $msg = sprintf '%s [%s %s, %s] on ctrl %d needs attention: %s',
              $name, $vendor, $product, $capacity, $ctrl, $state;
            report('storage', $msg, $status2nagios{$status}, $nexus);
        }
        # Ok
        else {
            my $msg = sprintf '%s [%s%s] on ctrl %d is %s',
              $name, $busmedia, $capacity, $ctrl, $state;
            if (defined $spare) { $msg .= " ($spare)"; }
            report('storage', $msg, $E_OK, $nexus);
        }
    }
    return;
}
#-----------------------------------------
# STORAGE: Check logical drives
#-----------------------------------------
# Checks all virtual (logical) disks and reports their state in the
# 'storage' category. Does nothing if @controllers is empty. Data
# comes from SNMP when $snmp is set, otherwise from "omreport storage
# vdisk" for each controller in @controllers.
# Takes no arguments and returns nothing. Every virtual disk seen,
# including blacklisted ones, is counted in $count{vdisk}.
sub check_virtual_disks {
# Nothing to check without controllers
return if $#controllers == -1;
# NOTE(review): $name is declared but never used in this sub
my $name = undef;
my $nexus = undef;
my $dev = undef;
my $state = undef;
my $status = undef;
my $layout = undef;
my $size = undef;
my $progr = undef;
my $ctrl = undef;
my @output = ();
if ($snmp) {
# Column OIDs to fetch, and the field names they are stored under
my %vdisk_oid
= (
'1.3.6.1.4.1.674.10893.1.20.140.1.1.3' => 'virtualDiskDeviceName',
'1.3.6.1.4.1.674.10893.1.20.140.1.1.4' => 'virtualDiskState',
'1.3.6.1.4.1.674.10893.1.20.140.1.1.6' => 'virtualDiskLengthInMB',
'1.3.6.1.4.1.674.10893.1.20.140.1.1.13' => 'virtualDiskLayout',
'1.3.6.1.4.1.674.10893.1.20.140.1.1.20' => 'virtualDiskComponentStatus',
'1.3.6.1.4.1.674.10893.1.20.140.1.1.21' => 'virtualDiskNexusID',
);
my $result = undef;
# Either fetch the whole table, or only the columns listed above
if ($opt{use_get_table}) {
my $virtualDiskTable = '1.3.6.1.4.1.674.10893.1.20.140.1';
$result = $snmp_session->get_table(-baseoid => $virtualDiskTable);
}
else {
$result = $snmp_session->get_entries(-columns => [keys %vdisk_oid]);
}
# No logical drives is OK
return if !defined $result;
@output = @{ get_snmp_output($result, \%vdisk_oid) };
}
else {
foreach my $c (@controllers) {
push @output, @{ run_omreport("storage vdisk controller=$c") };
# Tag the entries just added with their controller; entries from
# earlier controllers already have the key and are left alone
map_item('ctrl', $c, \@output);
}
}
# Names for the virtualDiskState values (SNMP)
my %vdisk_state
= (
0 => 'Unknown',
1 => 'Ready',
2 => 'Failed',
3 => 'Online',
4 => 'Offline',
6 => 'Degraded',
15 => 'Resynching',
16 => 'Regenerating',
24 => 'Rebuilding',
26 => 'Formatting',
32 => 'Reconstructing',
35 => 'Initializing',
36 => 'Background Initialization',
38 => 'Resynching Paused',
52 => 'Permanently Degraded',
54 => 'Degraded Redundancy',
);
# Names for the virtualDiskLayout values (SNMP)
my %vdisk_layout
= (
1 => 'Concatenated',
2 => 'RAID-0',
3 => 'RAID-1',
4 => 'UNSUPPORTED:raid-2',
5 => 'UNSUPPORTED:raid-3',
6 => 'UNSUPPORTED:raid-4',
7 => 'RAID-5',
8 => 'RAID-6',
9 => 'UNSUPPORTED:raid-7',
10 => 'RAID-10',
11 => 'UNSUPPORTED:raid-30',
12 => 'RAID-50',
13 => 'UNSUPPORTED:addSpares',
14 => 'UNSUPPORTED:deleteLogical',
15 => 'UNSUPPORTED:transformLogical',
18 => 'UNSUPPORTED:raid-0-plus-1',
19 => 'Concatenated RAID-1',
20 => 'UNSUPPORTED:concatRaid-5',
21 => 'UNSUPPORTED:noRaid',
22 => 'UNSUPPORTED:volume',
23 => 'UNSUPPORTED:raidMorph',
24 => 'RAID-60',
25 => 'CacheCade',
);
# Check virtual disks on each of the controllers
VDISK:
foreach my $out (@output) {
if ($snmp) {
$dev = $out->{virtualDiskDeviceName} || 'Unknown device';
$state = get_hashval($out->{virtualDiskState}, \%vdisk_state) || 'Unknown state';
$layout = get_hashval($out->{virtualDiskLayout}, \%vdisk_layout) || 'Unknown layout';
$status = get_snmp_status($out->{virtualDiskComponentStatus});
# The length in MB divided by 1024; a missing length gives "0.00 GB"
$size = sprintf '%.2f GB', ($out->{virtualDiskLengthInMB} || 0) / 1024;
$progr = q{}; # not available via SNMP
$nexus = convert_nexus(($out->{virtualDiskNexusID} || 9999));
}
else {
$dev = get_nonempty_string('Device Name', $out, 'Unknown device');
$state = get_nonempty_string('State', $out, 'Unknown state');
$status = get_nonempty_string('Status', $out, 'Unknown');
$layout = get_nonempty_string('Layout', $out, 'Unknown layout');
$size = get_nonempty_string('Size', $out, 'Unavailable');
# Cut off whatever follows the last "GB" in the size
$size =~ s{\A (.*GB).* \z}{$1}xms;
$progr = ' [' . get_nonempty_string('Progress', $out, q{}) . ']';
$ctrl = $out->{ctrl};
# The nexus is "<controller>:<virtual disk id>"
$nexus = join q{:}, $ctrl, get_nonempty_string('ID', $out, '9999');
}
# Counted before the blacklist check, so blacklisted disks count too
$count{vdisk}++;
next VDISK if blacklisted('vdisk', $nexus);
# The device name is undefined sometimes
$dev = q{} if !defined $dev;
# Special case: Regenerating
if ($state eq 'Regenerating') {
my $msg = sprintf q{Logical Drive '%s' [%s, %s] is %s%s},
$dev, $layout, $size, $state, $progr;
report('storage', $msg, $E_WARNING, $nexus);
}
# Default
elsif ($status ne 'Ok') {
my $msg = sprintf q{Logical Drive '%s' [%s, %s] needs attention: %s},
$dev, $layout, $size, $state;
report('storage', $msg, $status2nagios{$status}, $nexus);
}
# Ok
else {
my $msg = sprintf q{Logical Drive '%s' [%s, %s] is %s},
$dev, $layout, $size, $state;
report('storage', $msg, $E_OK, $nexus);
}
}
return;
}
#-----------------------------------------
# STORAGE: Check cache batteries
#-----------------------------------------
# Checks the controller cache batteries and reports their state in
# the 'storage' category. Does nothing if @controllers is empty. Data
# comes from SNMP when $snmp is set, otherwise from "omreport storage
# battery" for each controller in @controllers.
# Takes no arguments and returns nothing.
sub check_cache_battery {
# Nothing to check without controllers
return if $#controllers == -1;
my $id = undef;
my $nexus = undef;
my $state = undef;
my $status = undef;
my $ctrl = undef;
my $learn = undef; # learn state
my $pred = undef; # battery's ability to be charged
my @output = ();
if ($snmp) {
# Column OIDs to fetch, and the field names they are stored under
my %bat_oid
= (
'1.3.6.1.4.1.674.10893.1.20.130.15.1.4' => 'batteryState',
'1.3.6.1.4.1.674.10893.1.20.130.15.1.6' => 'batteryComponentStatus',
'1.3.6.1.4.1.674.10893.1.20.130.15.1.9' => 'batteryNexusID',
'1.3.6.1.4.1.674.10893.1.20.130.15.1.10' => 'batteryPredictedCapacity',
'1.3.6.1.4.1.674.10893.1.20.130.15.1.12' => 'batteryLearnState',
'1.3.6.1.4.1.674.10893.1.20.130.16.1.5' => 'batteryConnectionControllerNumber',
);
my $result = undef;
if ($opt{use_get_table}) {
my $batteryTable = '1.3.6.1.4.1.674.10893.1.20.130.15';
my $batteryConnectionTable = '1.3.6.1.4.1.674.10893.1.20.130.16';
$result = $snmp_session->get_table(-baseoid => $batteryTable);
my $ext = $snmp_session->get_table(-baseoid => $batteryConnectionTable);
# Merge the connection table into the battery table, if both
# queries gave a result
if (defined $result) {
defined $ext && map { $$result{$_} = $$ext{$_} } keys %{ $ext };
}
}
else {
$result = $snmp_session->get_entries(-columns => [keys %bat_oid]);
}
# No cache battery is OK
return if !defined $result;
@output = @{ get_snmp_output($result, \%bat_oid) };
}
else {
foreach my $c (@controllers) {
push @output, @{ run_omreport("storage battery controller=$c") };
# Tag the entries just added with their controller; entries from
# earlier controllers already have the key and are left alone
map_item('ctrl', $c, \@output);
}
}
# Names for the batteryState values (SNMP)
my %bat_state
= (
0 => 'Unknown',
1 => 'Ready',
2 => 'Failed',
6 => 'Degraded',
7 => 'Reconditioning',
9 => 'High',
10 => 'Power Low',
12 => 'Charging',
21 => 'Missing',
36 => 'Learning',
);
# Specifies the learn state activity of the battery
my %bat_learn_state
= (
1 => 'Failed',
2 => 'Active',
4 => 'Timed out',
8 => 'Requested',
16 => 'Idle',
);
# This property displays the battery's ability to be charged
my %bat_pred_cap
= (
1 => 'Failed', # The battery cannot be charged and needs to be replaced
2 => 'Ready', # The battery can be charged to full capacity
4 => 'Unknown', # The battery is completing a Learn cycle. The charge capacity of the
# battery cannot be determined until the Learn cycle is complete
);
# Check battery on each of the controllers
BATTERY:
foreach my $out (@output) {
if ($snmp) {
$status = get_snmp_status($out->{batteryComponentStatus});
$state = get_hashval($out->{batteryState}, \%bat_state) || 'Unknown state';
$learn = get_hashval($out->{batteryLearnState}, \%bat_learn_state) || 'Unknown learn state';
$pred = get_hashval($out->{batteryPredictedCapacity}, \%bat_pred_cap) || 'Unknown predicted capacity status';
# Map the controller number to the controller id via %snmp_controller
$ctrl = $snmp_controller{$out->{batteryConnectionControllerNumber}};
$nexus = convert_nexus(($out->{batteryNexusID} || 9999));
# For a nexus of the form "<number>:<number>" the battery id is the
# second number, otherwise the id is the whole nexus
$id = $nexus;
$id =~ s{\A \d+:(\d+) \z}{$1}xms;
}
else {
$id = get_nonempty_string('ID', $out, 9999);
$state = get_nonempty_string('State', $out, 'Unknown state');
$status = get_nonempty_string('Status', $out, 'Unknown');
$learn = get_nonempty_string('Learn State', $out, 'Unknown learn state');
$pred = get_nonempty_string('Predicted Capacity Status', $out, 'Unknown predicted capacity status');
$ctrl = $out->{'ctrl'};
# The nexus is "<controller>:<battery id>"
$nexus = join q{:}, $out->{ctrl}, $id;
}
next BATTERY if blacklisted('bat', $nexus);
# Special case: Charging
if ($state eq 'Charging') {
# A battery that can't be charged is critical, and is reported
# regardless of the 'bat_charge' blacklist
if ($pred eq 'Failed') {
my $msg = sprintf 'Cache Battery %d in controller %d is %s (%s) [replace battery]',
$id, $ctrl, $state, $pred;
report('storage', $msg, $E_CRITICAL, $nexus);
}
else {
next BATTERY if blacklisted('bat_charge', $nexus);
my $msg = sprintf 'Cache Battery %d in controller %d is %s (%s) [probably harmless]',
$id, $ctrl, $state, $pred;
report('storage', $msg, $E_WARNING, $nexus);
}
}
# Special case: Learning (battery learns its capacity)
elsif ($state eq 'Learning') {
# A failed learn cycle is critical, and is reported regardless of
# the 'bat_charge' blacklist
if ($learn eq 'Failed') {
my $msg = sprintf 'Cache Battery %d in controller %d is %s (%s)',
$id, $ctrl, $state, $learn;
report('storage', $msg, $E_CRITICAL, $nexus);
}
else {
next BATTERY if blacklisted('bat_charge', $nexus);
my $msg = sprintf 'Cache Battery %d in controller %d is %s (%s) [probably harmless]',
$id, $ctrl, $state, $learn;
report('storage', $msg, $E_WARNING, $nexus);
}
}
# Special case: Power Low (first part of recharge cycle)
elsif ($state eq 'Power Low') {
next BATTERY if blacklisted('bat_charge', $nexus);
my $msg = sprintf 'Cache Battery %d in controller %d is %s [probably harmless]',
$id, $ctrl, $state;
report('storage', $msg, $E_WARNING, $nexus);
}
# Special case: Degraded and Non-Critical (usually part of recharge cycle)
elsif ($state eq 'Degraded' && $status eq 'Non-Critical') {
next BATTERY if blacklisted('bat_charge', $nexus);
my $msg = sprintf 'Cache Battery %d in controller %d is %s (%s) [probably harmless]',
$id, $ctrl, $state, $status;
report('storage', $msg, $E_WARNING, $nexus);
}
# Default
else {
# The severity follows the component status, via %status2nagios
my $msg = sprintf 'Cache Battery %d in controller %d is %s',
$id, $ctrl, $state;
report('storage', $msg, $status2nagios{$status}, $nexus);
}
}
return;
}
#-----------------------------------------
# STORAGE: Check connectors (channels)
#-----------------------------------------
# Checks the controller connectors (channels) and reports their state
# in the 'storage' category. Does nothing if @controllers is empty.
# Data comes from SNMP when $snmp is set, otherwise from "omreport
# storage connector" for each controller in @controllers.
# Takes no arguments and returns nothing. Prints an error and exits
# with $E_UNKNOWN if the SNMP query fails.
sub check_connectors {
# Nothing to check without controllers
return if $#controllers == -1;
my $nexus = undef;
my $name = undef;
my $state = undef;
my $status = undef;
my $type = undef;
my $ctrl = undef;
my @output = ();
if ($snmp) {
# Column OIDs to fetch, and the field names they are stored under
my %conn_oid
= (
'1.3.6.1.4.1.674.10893.1.20.130.2.1.2' => 'channelName',
'1.3.6.1.4.1.674.10893.1.20.130.2.1.3' => 'channelState',
'1.3.6.1.4.1.674.10893.1.20.130.2.1.8' => 'channelComponentStatus',
'1.3.6.1.4.1.674.10893.1.20.130.2.1.9' => 'channelNexusID',
'1.3.6.1.4.1.674.10893.1.20.130.2.1.11' => 'channelBusType',
);
my $result = undef;
# Either fetch the whole table, or only the columns listed above
if ($opt{use_get_table}) {
my $channelTable = '1.3.6.1.4.1.674.10893.1.20.130.2';
$result = $snmp_session->get_table(-baseoid => $channelTable);
}
else {
$result = $snmp_session->get_entries(-columns => [keys %conn_oid]);
}
# Unlike virtual disks and batteries, a missing result is an error here
if (!defined $result) {
printf "SNMP ERROR [storage / channel]: %s.\n", $snmp_session->error;
$snmp_session->close;
exit $E_UNKNOWN;
}
@output = @{ get_snmp_output($result, \%conn_oid) };
}
else {
foreach my $c (@controllers) {
push @output, @{ run_omreport("storage connector controller=$c") };
# Tag the entries just added with their controller; entries from
# earlier controllers already have the key and are left alone
map_item('ctrl', $c, \@output);
}
}
# Names for the channelState values (SNMP)
my %conn_state
= (
0 => 'Unknown',
1 => 'Ready',
2 => 'Failed',
3 => 'Online',
4 => 'Offline',
6 => 'Degraded',
);
# Names for the channelBusType values (SNMP)
my %conn_bustype
= (
1 => 'SCSI',
2 => 'IDE',
3 => 'Fibre Channel',
4 => 'SSA',
6 => 'USB',
7 => 'SATA',
8 => 'SAS',
);
# Check connectors on each of the controllers
CHANNEL:
foreach my $out (@output) {
if ($snmp) {
$name = $out->{channelName} || 'Unknown channel';
$status = get_snmp_status($out->{channelComponentStatus});
$state = get_hashval($out->{channelState}, \%conn_state) || 'Unknown state';
$type = get_hashval($out->{channelBusType}, \%conn_bustype) || 'Unknown type';
$nexus = convert_nexus(($out->{channelNexusID} || 9999));
# The controller is the first number of the "<number>:<number>"
# part of the nexus
$ctrl = $nexus;
$ctrl =~ s{(\d+):\d+}{$1}xms;
}
else {
$name = get_nonempty_string('Name', $out, 'Unknown channel');
$state = get_nonempty_string('State', $out, 'Unknown state');
$status = get_nonempty_string('Status', $out, 'Unknown');
$type = get_nonempty_string('Connector Type', $out, 'Unknown type');
$ctrl = $out->{ctrl};
# The nexus is "<controller>:<connector id>"
$nexus = join q{:}, $out->{ctrl}, $out->{'ID'};
}
next CHANNEL if blacklisted('conn', $nexus);
# The severity follows the component status, via %status2nagios
my $msg = sprintf '%s [%s] on controller %d is %s',
$name, $type, $ctrl, $state;
report('storage', $msg, $status2nagios{$status}, $nexus);
}
return;
}
#-----------------------------------------
# STORAGE: Check enclosures
#-----------------------------------------
sub check_enclosures {
    # Reports the state of every storage enclosure and records what
    # was found: %snmp_enclosure (SNMP) or @enclosures (omreport) get
    # one entry per enclosure, and %sysinfo gets id, name and firmware.
    # Each enclosure that is not blacklisted yields one 'storage'
    # report entry.

    my @output = ();

    if ($snmp) {
        # Columns of the enclosure table that are used below
        my %encl_oid
          = (
             '1.3.6.1.4.1.674.10893.1.20.130.3.1.1'  => 'enclosureNumber',
             '1.3.6.1.4.1.674.10893.1.20.130.3.1.2'  => 'enclosureName',
             '1.3.6.1.4.1.674.10893.1.20.130.3.1.4'  => 'enclosureState',
             '1.3.6.1.4.1.674.10893.1.20.130.3.1.19' => 'enclosureChannelNumber',
             '1.3.6.1.4.1.674.10893.1.20.130.3.1.24' => 'enclosureComponentStatus',
             '1.3.6.1.4.1.674.10893.1.20.130.3.1.25' => 'enclosureNexusID',
             '1.3.6.1.4.1.674.10893.1.20.130.3.1.26' => 'enclosureFirmwareVersion',
             '1.3.6.1.4.1.674.10893.1.20.130.3.1.31' => 'enclosureOccupiedSlotCount', # new in OMSA 6.3.0
             '1.3.6.1.4.1.674.10893.1.20.130.3.1.32' => 'enclosureTotalSlots',        # new in OMSA 6.3.0
            );

        # Fetch either the whole enclosure table or just the wanted columns
        my $result
          = $opt{use_get_table}
          ? $snmp_session->get_table(-baseoid => '1.3.6.1.4.1.674.10893.1.20.130.3')
          : $snmp_session->get_entries(-columns => [keys %encl_oid]);

        # No enclosures is OK
        return if !defined $result;

        @output = @{ get_snmp_output($result, \%encl_oid) };
    }
    else {
        # One omreport call per controller; tag the output with the
        # controller it belongs to
        foreach my $c (@controllers) {
            push @output, @{ run_omreport("storage enclosure controller=$c") };
            map_item('ctrl', $c, \@output);
        }
    }

    # Text for the numeric enclosureState values (SNMP)
    my %state_name
      = (
         0 => 'Unknown',
         1 => 'Ready',
         2 => 'Failed',
         3 => 'Online',
         4 => 'Offline',
         6 => 'Degraded',
        );

  ENCLOSURE:
    foreach my $out (@output) {
        my ($id, $name, $state, $status, $firmware, $nexus, $ctrl);

        # Slot counts are only available via SNMP; they stay undefined
        # otherwise
        my ($occupied_slots, $total_slots);

        if ($snmp) {
            $id       = ($out->{enclosureNumber} || 10000) - 1;
            $name     = $out->{enclosureName} || 'Unknown enclosure';
            $state    = get_hashval($out->{enclosureState}, \%state_name) || 'Unknown state';
            $status   = get_snmp_status($out->{enclosureComponentStatus});
            $firmware = $out->{enclosureFirmwareVersion} || 'N/A';
            $nexus    = convert_nexus($out->{enclosureNexusID} || 9999);

            # Keep only the part of the nexus before the first colon
            ($ctrl = $nexus) =~ s{\A (\d+):.* \z}{$1}xms;

            # for the next two, a value of 9999 means feature not available
            my $occupied = $out->{enclosureOccupiedSlotCount};
            my $total    = $out->{enclosureTotalSlots};
            if (defined $occupied && $occupied != 9999) {
                $occupied_slots = $occupied;
            }
            if (defined $total && $total != 9999) {
                $total_slots = $total;
            }
        }
        else {
            $id       = get_nonempty_string('ID', $out, 9999);
            $name     = get_nonempty_string('Name', $out, 'Unknown enclosure');
            $state    = get_nonempty_string('State', $out, 'Unknown state');
            $status   = get_nonempty_string('Status', $out, 'Unknown');
            $firmware = get_nonempty_string('Firmware Version', $out, 'N/A');
            $firmware =~ s{Not\sApplicable}{N/A}xms;
            $nexus    = join q{:}, $out->{ctrl}, $id;
            $ctrl     = $out->{ctrl};
        }

        # remove trailing whitespace from both strings
        foreach my $string ($name, $firmware) {
            $string =~ s{\s+\z}{}xms;
        }

        # store enclosure data for future use
        if ($snmp) {
            my $number = $out->{enclosureNumber};
            $snmp_enclosure{$number}{id}    = $id;
            $snmp_enclosure{$number}{name}  = $name;
            $snmp_enclosure{$number}{nexus} = $nexus;
        }
        else {
            push @enclosures, {
                               'id'   => $id,
                               'ctrl' => $out->{ctrl},
                               'name' => $name,
                              };
        }

        # Collecting some storage info
        $sysinfo{'enclosure'}{$nexus}{'id'}       = $nexus;
        $sysinfo{'enclosure'}{$nexus}{'name'}     = $name;
        $sysinfo{'enclosure'}{$nexus}{'firmware'} = $firmware;

        next ENCLOSURE if blacklisted('encl', $nexus);

        # Include the slot usage in the message when it is known
        my $msg
          = (defined $occupied_slots && defined $total_slots)
          ? sprintf('Enclosure %s [%s, %d/%d slots occupied] on ctrl %d is %s',
                    $nexus, $name, $occupied_slots, $total_slots, $ctrl, $state)
          : sprintf('Enclosure %s [%s] on controller %d is %s',
                    $nexus, $name, $ctrl, $state);

        report('storage', $msg, $status2nagios{$status}, $nexus);
    }

    return;
}
#-----------------------------------------
# STORAGE: Check enclosure fans
#-----------------------------------------
sub check_enclosure_fans {
    # Reports the state of the fans in every storage enclosure. Data
    # is fetched via SNMP when $snmp is set, otherwise via omreport
    # for each entry in @enclosures. Each fan that is not blacklisted
    # yields one 'storage' report entry.

    # Nothing to do without controllers
    return if !@controllers;

    my @output = ();

    if ($snmp) {
        # Columns from the fan table (130.7) and the fan connection
        # table (130.8) that are used below
        my %fan_oid
          = (
             '1.3.6.1.4.1.674.10893.1.20.130.7.1.2'  => 'fanName',
             '1.3.6.1.4.1.674.10893.1.20.130.7.1.4'  => 'fanState',
             '1.3.6.1.4.1.674.10893.1.20.130.7.1.11' => 'fanProbeCurrValue',
             '1.3.6.1.4.1.674.10893.1.20.130.7.1.15' => 'fanComponentStatus',
             '1.3.6.1.4.1.674.10893.1.20.130.7.1.16' => 'fanNexusID',
             '1.3.6.1.4.1.674.10893.1.20.130.8.1.4'  => 'fanConnectionEnclosureName',
             '1.3.6.1.4.1.674.10893.1.20.130.8.1.5'  => 'fanConnectionEnclosureNumber',
            );

        my $result = undef;
        if ($opt{use_get_table}) {
            $result = $snmp_session->get_table(-baseoid => '1.3.6.1.4.1.674.10893.1.20.130.7');
            my $ext = $snmp_session->get_table(-baseoid => '1.3.6.1.4.1.674.10893.1.20.130.8');

            # Fold the connection table into the fan table result
            if (defined $result && defined $ext) {
                foreach my $oid (keys %{ $ext }) {
                    $result->{$oid} = $ext->{$oid};
                }
            }
        }
        else {
            $result = $snmp_session->get_entries(-columns => [keys %fan_oid]);
        }

        # No enclosure fans is OK
        return if !defined $result;

        @output = @{ get_snmp_output($result, \%fan_oid) };
    }
    else {
        # One omreport call per known enclosure; tag the output with
        # the controller and enclosure it belongs to
        foreach my $enc (@enclosures) {
            push @output, @{ run_omreport("storage enclosure controller=$enc->{ctrl} enclosure=$enc->{id} info=fans") };
            map_item('ctrl', $enc->{ctrl}, \@output);
            map_item('encl_id', $enc->{id}, \@output);
            map_item('encl_name', $enc->{name}, \@output);
        }
    }

    # Text for the numeric fanState values (SNMP)
    my %state_name
      = (
         0  => 'Unknown',
         1  => 'Ready',
         2  => 'Failed',
         3  => 'Online',
         4  => 'Offline',
         6  => 'Degraded',
         21 => 'Missing',
        );

    # Check fans on each of the enclosures
  ENCL_FAN:
    foreach my $out (@output) {
        my ($name, $state, $status, $speed, $encl_id, $encl_name, $nexus);

        if ($snmp) {
            $name      = $out->{fanName} || 'Unknown fan';
            $state     = get_hashval($out->{fanState}, \%state_name) || 'Unknown state';
            $status    = get_snmp_status($out->{fanComponentStatus});
            $speed     = $out->{fanProbeCurrValue} || 'N/A';
            $encl_name = $out->{fanConnectionEnclosureName} || 'Unknown enclosure';
            # The enclosure nexus was stored in %snmp_enclosure, keyed
            # by enclosure number
            $encl_id   = $snmp_enclosure{$out->{fanConnectionEnclosureNumber}}{nexus};
            $nexus     = convert_nexus($out->{fanNexusID} || 9999);
        }
        else {
            $name      = get_nonempty_string('Name', $out, 'Unknown fan');
            $state     = get_nonempty_string('State', $out, 'Unknown state');
            $status    = get_nonempty_string('Status', $out, 'Unknown');
            $speed     = get_nonempty_string('Speed', $out, 'N/A');
            $encl_id   = join q{:}, $out->{ctrl}, $out->{'encl_id'};
            $encl_name = $out->{encl_name};
            $nexus     = join q{:}, $out->{ctrl}, $out->{'encl_id'}, get_nonempty_string('ID', $out, '9999');
        }

        next ENCL_FAN if blacklisted('encl_fan', $nexus);

        if ($status eq 'Ok') {
            # Healthy fan: include the speed in the message
            report('storage',
                   sprintf('%s in enclosure %s [%s] is %s (speed=%s)',
                           $name, $encl_id, $encl_name, $state, $speed),
                   $E_OK,
                   $nexus);
        }
        else {
            # Anything else is reported with the mapped nagios status
            report('storage',
                   sprintf('%s in enclosure %s [%s] needs attention: %s',
                           $name, $encl_id, $encl_name, $state),
                   $status2nagios{$status},
                   $nexus);
        }
    }

    return;
}
#-----------------------------------------
# STORAGE: Check enclosure power supplies
#-----------------------------------------
sub check_enclosure_pwr {
    # Reports the state of the power supplies in every storage
    # enclosure. Data is fetched via SNMP when $snmp is set, otherwise
    # via omreport for each entry in @enclosures. Each power supply
    # that is not blacklisted yields one 'storage' report entry.

    # Nothing to do without controllers
    return if !@controllers;

    my @output = ();

    if ($snmp) {
        # Columns from the power supply table (130.9) and the power
        # supply connection table (130.10) that are used below
        my %ps_oid
          = (
             '1.3.6.1.4.1.674.10893.1.20.130.9.1.2'  => 'powerSupplyName',
             '1.3.6.1.4.1.674.10893.1.20.130.9.1.4'  => 'powerSupplyState',
             '1.3.6.1.4.1.674.10893.1.20.130.9.1.9'  => 'powerSupplyComponentStatus',
             '1.3.6.1.4.1.674.10893.1.20.130.9.1.10' => 'powerSupplyNexusID',
             '1.3.6.1.4.1.674.10893.1.20.130.10.1.4' => 'powerSupplyConnectionEnclosureName',
             '1.3.6.1.4.1.674.10893.1.20.130.10.1.5' => 'powerSupplyConnectionEnclosureNumber',
            );

        my $result = undef;
        if ($opt{use_get_table}) {
            $result = $snmp_session->get_table(-baseoid => '1.3.6.1.4.1.674.10893.1.20.130.9');
            my $ext = $snmp_session->get_table(-baseoid => '1.3.6.1.4.1.674.10893.1.20.130.10');

            # Fold the connection table into the power supply table result
            if (defined $result && defined $ext) {
                foreach my $oid (keys %{ $ext }) {
                    $result->{$oid} = $ext->{$oid};
                }
            }
        }
        else {
            $result = $snmp_session->get_entries(-columns => [keys %ps_oid]);
        }

        # No enclosure power supplies is OK
        return if !defined $result;

        @output = @{ get_snmp_output($result, \%ps_oid) };
    }
    else {
        # One omreport call per known enclosure; tag the output with
        # the controller and enclosure it belongs to
        foreach my $enc (@enclosures) {
            push @output, @{ run_omreport("storage enclosure controller=$enc->{ctrl} enclosure=$enc->{id} info=pwrsupplies") };
            map_item('ctrl', $enc->{ctrl}, \@output);
            map_item('encl_id', $enc->{id}, \@output);
            map_item('encl_name', $enc->{name}, \@output);
        }
    }

    # Text for the numeric powerSupplyState values (SNMP)
    my %state_name
      = (
         0  => 'Unknown',
         1  => 'Ready',
         2  => 'Failed',
         5  => 'Not Installed',
         6  => 'Degraded',
         11 => 'Removed',
         21 => 'Missing',
        );

    # Check power supplies on each of the enclosures
  ENCL_PS:
    foreach my $out (@output) {
        my ($name, $state, $status, $encl_id, $encl_name, $nexus);

        if ($snmp) {
            $name      = $out->{powerSupplyName} || 'Unknown PSU';
            $state     = get_hashval($out->{powerSupplyState}, \%state_name) || 'Unknown state';
            $status    = get_snmp_status($out->{powerSupplyComponentStatus});
            # The enclosure nexus was stored in %snmp_enclosure, keyed
            # by enclosure number
            $encl_id   = $snmp_enclosure{$out->{powerSupplyConnectionEnclosureNumber}}{nexus};
            $encl_name = $out->{powerSupplyConnectionEnclosureName} || 'Unknown enclosure';
            $nexus     = convert_nexus($out->{powerSupplyNexusID} || 9999);
        }
        else {
            $name      = get_nonempty_string('Name', $out, 'Unknown PSU');
            $state     = get_nonempty_string('State', $out, 'Unknown state');
            $status    = get_nonempty_string('Status', $out, 'Unknown');
            $encl_id   = join q{:}, $out->{ctrl}, $out->{'encl_id'};
            $encl_name = $out->{encl_name};
            $nexus     = join q{:}, $out->{ctrl}, $out->{'encl_id'}, get_nonempty_string('ID', $out, '9999');
        }

        next ENCL_PS if blacklisted('encl_ps', $nexus);

        if ($status eq 'Ok') {
            report('storage',
                   sprintf('%s in enclosure %s [%s] is %s',
                           $name, $encl_id, $encl_name, $state),
                   $E_OK,
                   $nexus);
        }
        else {
            # Anything else is reported with the mapped nagios status
            report('storage',
                   sprintf('%s in enclosure %s [%s] needs attention: %s',
                           $name, $encl_id, $encl_name, $state),
                   $status2nagios{$status},
                   $nexus);
        }
    }

    return;
}
#-----------------------------------------
# STORAGE: Check enclosure temperatures
#-----------------------------------------
sub check_enclosure_temp {
    # Reports the state of the temperature probes in every storage
    # enclosure and, when $opt{perfdata} is defined, collects one
    # performance data entry per probe that has a reading.
    #
    # Data is fetched via SNMP when $snmp is set, otherwise via
    # omreport for each entry in @enclosures. Probes that are
    # blacklisted ('encl_temp') are skipped entirely.
    #
    # The reading and the four thresholds are normalized to either an
    # integer or the placeholder '[N/A]'. The placeholder is never
    # used in a numeric comparison or passed to the unit conversion.

    return if $#controllers == -1;

    my @output = ();

    if ($snmp) {
        # Columns from the temperature probe table (130.11) and the
        # temperature connection table (130.12)
        my %temp_oid
          = (
             '1.3.6.1.4.1.674.10893.1.20.130.11.1.2'  => 'temperatureProbeName',
             '1.3.6.1.4.1.674.10893.1.20.130.11.1.4'  => 'temperatureProbeState',
             '1.3.6.1.4.1.674.10893.1.20.130.11.1.6'  => 'temperatureProbeUnit',
             '1.3.6.1.4.1.674.10893.1.20.130.11.1.7'  => 'temperatureProbeMinWarning',
             '1.3.6.1.4.1.674.10893.1.20.130.11.1.8'  => 'temperatureProbeMinCritical',
             '1.3.6.1.4.1.674.10893.1.20.130.11.1.9'  => 'temperatureProbeMaxWarning',
             '1.3.6.1.4.1.674.10893.1.20.130.11.1.10' => 'temperatureProbeMaxCritical',
             '1.3.6.1.4.1.674.10893.1.20.130.11.1.11' => 'temperatureProbeCurValue',
             '1.3.6.1.4.1.674.10893.1.20.130.11.1.13' => 'temperatureProbeComponentStatus',
             '1.3.6.1.4.1.674.10893.1.20.130.11.1.14' => 'temperatureProbeNexusID',
             '1.3.6.1.4.1.674.10893.1.20.130.12.1.4'  => 'temperatureConnectionEnclosureName',
             '1.3.6.1.4.1.674.10893.1.20.130.12.1.5'  => 'temperatureConnectionEnclosureNumber',
            );

        my $result = undef;
        if ($opt{use_get_table}) {
            my $temperatureProbeTable      = '1.3.6.1.4.1.674.10893.1.20.130.11';
            my $temperatureConnectionTable = '1.3.6.1.4.1.674.10893.1.20.130.12';
            $result = $snmp_session->get_table(-baseoid => $temperatureProbeTable);
            my $ext = $snmp_session->get_table(-baseoid => $temperatureConnectionTable);

            # Fold the connection table into the probe table result
            if (defined $result && defined $ext) {
                foreach my $oid (keys %{ $ext }) {
                    $result->{$oid} = $ext->{$oid};
                }
            }
        }
        else {
            $result = $snmp_session->get_entries(-columns => [keys %temp_oid]);
        }

        # No enclosure temperature probes is OK
        return if !defined $result;

        @output = @{ get_snmp_output($result, \%temp_oid) };
    }
    else {
        # One omreport call per known enclosure; tag the output with
        # the controller and enclosure it belongs to
        foreach my $enc (@enclosures) {
            push @output, @{ run_omreport("storage enclosure controller=$enc->{ctrl} enclosure=$enc->{id} info=temps") };
            map_item('ctrl', $enc->{ctrl}, \@output);
            map_item('encl_id', $enc->{id}, \@output);
            map_item('encl_name', $enc->{name}, \@output);
        }
    }

    # Text for the numeric temperatureProbeState values (SNMP)
    my %temp_state
      = (
         0  => 'Unknown',
         1  => 'Ready',
         2  => 'Failed',
         4  => 'Offline',
         6  => 'Degraded',
         9  => 'Inactive',
         21 => 'Missing',
        );

    # Check temperature probes on each of the enclosures
  TEMP:
    foreach my $out (@output) {
        my ($name, $state, $status, $encl_id, $encl_name, $nexus);
        my ($reading, $max_warn, $max_crit, $min_warn, $min_crit);

        if ($snmp) {
            # NOTE(review): because of "||" a value of 0 for the
            # reading or a threshold is replaced by '[N/A]' here --
            # confirm whether 0 can be a legitimate value.
            $name      = $out->{temperatureProbeName} || 'Unknown temp probe';
            $state     = get_hashval($out->{temperatureProbeState}, \%temp_state) || 'Unknown state';
            $status    = get_snmp_probestatus($out->{temperatureProbeComponentStatus});
            $reading   = $out->{temperatureProbeCurValue} || '[N/A]';
            $max_warn  = $out->{temperatureProbeMaxWarning} || '[N/A]';
            $max_crit  = $out->{temperatureProbeMaxCritical} || '[N/A]';
            $min_warn  = $out->{temperatureProbeMinWarning} || '[N/A]';
            $min_crit  = $out->{temperatureProbeMinCritical} || '[N/A]';
            $encl_id   = $snmp_enclosure{$out->{temperatureConnectionEnclosureNumber}}{nexus};
            $encl_name = $out->{temperatureConnectionEnclosureName} || 'Unknown enclosure';
            $nexus     = convert_nexus(($out->{temperatureProbeNexusID} || 9999));
        }
        else {
            $name      = get_nonempty_string('Name', $out, 'Unknown temp probe');
            $state     = get_nonempty_string('State', $out, 'Unknown state');
            $status    = get_nonempty_string('Status', $out, 'Unknown');
            $reading   = get_nonempty_string('Reading', $out, '[N/A]');
            $max_warn  = get_nonempty_string('Maximum Warning Threshold', $out, '[N/A]');
            $max_crit  = get_nonempty_string('Maximum Failure Threshold', $out, '[N/A]');
            $min_warn  = get_nonempty_string('Minimum Warning Threshold', $out, '[N/A]');
            $min_crit  = get_nonempty_string('Minimum Failure Threshold', $out, '[N/A]');
            $encl_id   = join q{:}, $out->{ctrl}, $out->{'encl_id'};
            $encl_name = $out->{encl_name};
            $nexus     = join q{:}, $out->{ctrl}, $out->{'encl_id'}, get_nonempty_string('ID', $out, '9999');
        }

        next TEMP if blacklisted('encl_temp', $nexus);

        # Make sure these values are integers; anything else becomes
        # the '[N/A]' placeholder. The loop variable aliases the
        # scalars, so they are modified in place.
        foreach my $value ($reading, $max_warn, $max_crit, $min_warn, $min_crit) {
            $value =~ s{\A \s* (-?\d+) \s* C? \s* \z}{$1}xms or $value = '[N/A]';
        }

        # Convert temp units. The placeholder is left alone, it is not
        # a temperature.
        if ($opt{tempunit} ne 'C') {
            foreach my $value ($reading, $max_warn, $max_crit, $min_warn, $min_crit) {
                next if $value eq '[N/A]';
                $value = temp_from_celsius($value, $opt{tempunit});
            }
        }

        # Nagios status used for every non-OK report below
        my $err = $snmp ? $probestatus2nagios{$status} : $status2nagios{$status};

        # Find out which threshold, if any, the reading has crossed.
        # This is only meaningful when there is an actual reading:
        # comparing the placeholder numerically would treat it as 0
        # and could report a bogus "critically low" temperature.
        my $breach = undef;
        if ($status ne 'Ok' && $reading ne '[N/A]') {
            if ($max_crit ne '[N/A]' && $reading > $max_crit) {
                $breach = 'critically high';
            }
            elsif ($max_warn ne '[N/A]' && $reading > $max_warn) {
                $breach = 'too high';
            }
            elsif ($min_crit ne '[N/A]' && $reading < $min_crit) {
                $breach = 'critically low';
            }
            elsif ($min_warn ne '[N/A]' && $reading < $min_warn) {
                $breach = 'too low';
            }
        }

        # Inactive temp probes
        if ($status eq 'Unknown' and $state eq 'Inactive') {
            my $msg = sprintf '%s in enclosure %s [%s] is %s',
              $name, $encl_id, $encl_name, $state;
            report('storage', $msg, $E_OK, $nexus);
        }
        # Reading is outside one of the thresholds
        elsif (defined $breach) {
            my $msg = sprintf '%s in enclosure %s [%s] is %s at %s %s',
              $name, $encl_id, $encl_name, $breach, $reading, $opt{tempunit};
            # NOTE(review): threshold breaches are reported under
            # 'chassis' while all other branches in this sub use
            # 'storage' -- confirm whether that is intended.
            report('chassis', $msg, $err, $nexus);
        }
        # Default
        elsif ($status ne 'Ok') {
            my $msg = sprintf '%s in enclosure %s [%s] is %s',
              $name, $encl_id, $encl_name, $state;
            if (defined $reading && $reading =~ m{\A -?\d+ \z}xms) {
                # take into account that with certain states the
                # reading doesn't exist or is not an integer
                $msg .= sprintf ' at %s %s', $reading, $opt{tempunit};
                if ($min_warn eq '[N/A]' or $min_crit eq '[N/A]') {
                    $msg .= sprintf ' (max=%s/%s)', $max_warn, $max_crit;
                }
                else {
                    $msg .= sprintf ' (min=%s/%s, max=%s/%s)',
                      $min_warn, $min_crit, $max_warn, $max_crit;
                }
            }
            report('storage', $msg, $err, $nexus);
        }
        # Ok
        else {
            my $msg = sprintf '%s in enclosure %s [%s]',
              $name, $encl_id, $encl_name;
            if (defined $reading && $reading ne '[N/A]') {
                # take into account that with certain states the
                # reading doesn't exist or is not an integer
                $msg .= sprintf ' reads %s %s', $reading, $opt{tempunit};
                if ($min_warn eq '[N/A]' or $min_crit eq '[N/A]') {
                    $msg .= sprintf ' (max=%s/%s)', $max_warn, $max_crit;
                }
                else {
                    $msg .= sprintf ' (min=%s/%s, max=%s/%s)',
                      $min_warn, $min_crit, $max_warn, $max_crit;
                }
            }
            else {
                $msg .= sprintf ' is %s', $state;
            }
            report('storage', $msg, $E_OK, $nexus);
        }

        # Collect performance data
        if (defined $opt{perfdata} && $reading ne '[N/A]') {
            # "Temperature Probe N" is shortened to "N" for the id and
            # to "temp_N" for the legacy label
            my $index = $name;
            $index =~ s{\A Temperature\sProbe\s(\d+) \z}{$1}gxms;
            my $legacy_name = $name;
            $legacy_name =~ s{\A Temperature\sProbe\s(\d+) \z}{temp_$1}gxms;
            my $legacy_label = lc "enclosure_${encl_id}_${legacy_name}";
            my $legacy_mini = $legacy_label;
            $legacy_mini =~ s{enclosure_(.+?)_temp_(.+?)}{e$1t$2}xms;
            push @perfdata, {
                             type   => 'E',
                             id     => $opt{perfdata} eq 'minimal' ? "${encl_id}_t${index}" : "${encl_id}_temp_${index}",
                             unit   => $opt{tempunit},
                             label  => q{},
                             legacy => $legacy_label,
                             mini   => $legacy_mini,
                             value  => $reading,
                             warn   => $max_warn,
                             crit   => $max_crit,
                            };
        }
    }

    return;
}
#-----------------------------------------
# STORAGE: Check enclosure management modules (EMM)
#-----------------------------------------
sub check_enclosure_emms {
    # Reports the state of the enclosure management modules (EMMs) in
    # every storage enclosure. Data is fetched via SNMP when $snmp is
    # set, otherwise via omreport for each entry in @enclosures. Each
    # EMM that is not blacklisted ('encl_emm') yields one 'storage'
    # report entry.
    #
    # An EMM whose state is 'Not Installed' and whose status is exactly
    # 'Other' or 'Unknown' is reported as OK.

    return if $#controllers == -1;

    my @output = ();

    if ($snmp) {
        # Columns from the EMM table (130.13) and the EMM connection
        # table (130.14)
        my %emms_oid
          = (
             '1.3.6.1.4.1.674.10893.1.20.130.13.1.2'  => 'enclosureManagementModuleName',
             '1.3.6.1.4.1.674.10893.1.20.130.13.1.4'  => 'enclosureManagementModuleState',
             '1.3.6.1.4.1.674.10893.1.20.130.13.1.11' => 'enclosureManagementModuleComponentStatus',
             '1.3.6.1.4.1.674.10893.1.20.130.13.1.12' => 'enclosureManagementModuleNexusID',
             '1.3.6.1.4.1.674.10893.1.20.130.14.1.4'  => 'enclosureManagementModuleConnectionEnclosureName',
             '1.3.6.1.4.1.674.10893.1.20.130.14.1.5'  => 'enclosureManagementModuleConnectionEnclosureNumber',
            );

        my $result = undef;
        if ($opt{use_get_table}) {
            my $enclosureManagementModuleTable           = '1.3.6.1.4.1.674.10893.1.20.130.13';
            my $enclosureManagementModuleConnectionTable = '1.3.6.1.4.1.674.10893.1.20.130.14';
            $result = $snmp_session->get_table(-baseoid => $enclosureManagementModuleTable);
            my $ext = $snmp_session->get_table(-baseoid => $enclosureManagementModuleConnectionTable);

            # Fold the connection table into the EMM table result
            if (defined $result && defined $ext) {
                foreach my $oid (keys %{ $ext }) {
                    $result->{$oid} = $ext->{$oid};
                }
            }
        }
        else {
            $result = $snmp_session->get_entries(-columns => [keys %emms_oid]);
        }

        # No enclosure EMMs is OK
        return if !defined $result;

        @output = @{ get_snmp_output($result, \%emms_oid) };
    }
    else {
        # One omreport call per known enclosure; tag the output with
        # the controller and enclosure it belongs to
        foreach my $enc (@enclosures) {
            push @output, @{ run_omreport("storage enclosure controller=$enc->{ctrl} enclosure=$enc->{id} info=emms") };
            map_item('ctrl', $enc->{ctrl}, \@output);
            map_item('encl_id', $enc->{id}, \@output);
            map_item('encl_name', $enc->{name}, \@output);
        }
    }

    # Text for the numeric enclosureManagementModuleState values (SNMP)
    my %emms_state
      = (
         0  => 'Unknown',
         1  => 'Ready',
         2  => 'Failed',
         3  => 'Online',
         4  => 'Offline',
         5  => 'Not Installed',
         6  => 'Degraded',
         21 => 'Missing',
        );

    # Check EMMs on each of the enclosures
  EMM:
    foreach my $out (@output) {
        my ($name, $state, $status, $encl_id, $encl_name, $nexus);

        if ($snmp) {
            $name      = $out->{enclosureManagementModuleName} || 'Unknown EMM';
            $state     = get_hashval($out->{enclosureManagementModuleState}, \%emms_state) || 'Unknown state';
            $status    = get_snmp_status($out->{enclosureManagementModuleComponentStatus});
            $encl_id   = $snmp_enclosure{$out->{enclosureManagementModuleConnectionEnclosureNumber}}{nexus};
            $encl_name = $out->{enclosureManagementModuleConnectionEnclosureName} || 'Unknown enclosure';
            $nexus     = convert_nexus(($out->{enclosureManagementModuleNexusID} || 9999));
        }
        else {
            $name      = get_nonempty_string('Name', $out, 'Unknown EMM');
            $state     = get_nonempty_string('State', $out, 'Unknown state');
            $status    = get_nonempty_string('Status', $out, 'Unknown');
            $encl_id   = join q{:}, $out->{ctrl}, $out->{'encl_id'};
            $encl_name = $out->{encl_name};
            $nexus     = join q{:}, $out->{ctrl}, $out->{'encl_id'}, get_nonempty_string('ID', $out, '9999');
        }

        next EMM if blacklisted('encl_emm', $nexus);

        # Not installed. The alternation is grouped so that both
        # anchors apply to both words; without the group the pattern
        # would match anything starting with "Other" or ending with
        # "Unknown".
        if ($status =~ m{\A (?:Other|Unknown) \z}xms and $state eq 'Not Installed') {
            my $msg = sprintf '%s in enclosure %s [%s] is %s',
              $name, $encl_id, $encl_name, $state;
            report('storage', $msg, $E_OK, $nexus);
        }
        # Default
        elsif ($status ne 'Ok') {
            my $msg = sprintf '%s in enclosure %s [%s] needs attention: %s',
              $name, $encl_id, $encl_name, $state;
            report('storage', $msg, $status2nagios{$status}, $nexus);
        }
        # Ok
        else {
            my $msg = sprintf '%s in enclosure %s [%s] is %s',
              $name, $encl_id, $encl_name, $state;
            report('storage', $msg, $E_OK, $nexus);
        }
    }

    return;
}
#-----------------------------------------
# CHASSIS: Check memory modules
#-----------------------------------------
sub check_memory {
    # Reports the state of every memory module and keeps running
    # totals in %count: $count{mem} is increased by the size of each
    # module and $count{dimm} by one for each occupied slot.
    #
    # Data is fetched via SNMP when $snmp is set, otherwise via
    # omreport. Empty slots are not reported. Each module that is not
    # blacklisted ('dimm') yields one 'chassis' report entry; for
    # modules that are not 'Ok' the message lists the failure modes
    # when they are known.

    my @output = ();

    if ($snmp) {
        # Columns of the memory device table that are used below
        my %dimm_oid
          = (
             '1.3.6.1.4.1.674.10892.1.1100.50.1.2.1'  => 'memoryDeviceIndex',
             '1.3.6.1.4.1.674.10892.1.1100.50.1.5.1'  => 'memoryDeviceStatus',
             '1.3.6.1.4.1.674.10892.1.1100.50.1.8.1'  => 'memoryDeviceLocationName',
             '1.3.6.1.4.1.674.10892.1.1100.50.1.14.1' => 'memoryDeviceSize',
             '1.3.6.1.4.1.674.10892.1.1100.50.1.20.1' => 'memoryDeviceFailureModes',
            );

        my $result = undef;
        if ($opt{use_get_table}) {
            my $memoryDeviceTable = '1.3.6.1.4.1.674.10892.1.1100.50.1';
            $result = $snmp_session->get_table(-baseoid => $memoryDeviceTable);
        }
        else {
            $result = $snmp_session->get_entries(-columns => [keys %dimm_oid]);
        }

        # A failed query is fatal here: print the SNMP error, close
        # the session and exit with $E_UNKNOWN
        if (!defined $result) {
            printf "SNMP ERROR [memory]: %s.\n", $snmp_session->error;
            $snmp_session->close;
            exit $E_UNKNOWN;
        }

        @output = @{ get_snmp_output($result, \%dimm_oid) };
    }
    else {
        @output = @{ run_omreport("$omopt_chassis memory") };
    }

    # Note: These values are bit masks, so combination values are
    # possible. If value is 0 (zero), memory device has no faults.
    my %failure_mode
      = (
         1  => 'ECC single bit correction warning rate exceeded',
         2  => 'ECC single bit correction failure rate exceeded',
         4  => 'ECC multibit fault encountered',
         8  => 'ECC single bit correction logging disabled',
         16 => 'device disabled because of spare activation',
        );

  DIMM:
    foreach my $out (@output) {
        my ($index, $status, $location, $size);
        my @failures = ();

        if ($snmp) {
            $index    = ($out->{memoryDeviceIndex} || 10000) - 1;
            $status   = get_snmp_status($out->{memoryDeviceStatus});
            $location = $out->{memoryDeviceLocationName} || 'Unknown location';
            $size     = sprintf '%d MB', ($out->{memoryDeviceSize} || 0)/1024;

            # Only a missing or empty value means "not available"; a
            # value of 0 is valid and means that there are no faults.
            my $raw_modes = $out->{memoryDeviceFailureModes};
            my $modes = (defined $raw_modes && $raw_modes ne q{}) ? $raw_modes : -9999;

            if ($modes > 0) {
                # Walk the bit masks in numerical order so that the
                # failures are always listed in the same, sensible order
                foreach my $mask (sort { $a <=> $b } keys %failure_mode) {
                    if (($modes & $mask) != 0) { push @failures, $failure_mode{$mask}; }
                }
            }
            elsif ($modes == -9999) {
                push @failures, q{ERROR: Failure modes not available via SNMP};
            }
        }
        else {
            my $type  = get_nonempty_string('Type', $out, q{});
            # An empty slot gets no index, which makes it skipped below
            $index    = $type eq '[Not Occupied]' ? undef : get_nonempty_string('Index', $out, 9999);
            $status   = get_nonempty_string('Status', $out, 'Unknown');
            $location = get_nonempty_string('Connector Name', $out, 'Unknown location');
            $size     = get_nonempty_string('Size', $out, 0);
            if (defined $size) {
                $size =~ s{\s\s}{ }gxms;
            }

            # Run 'omreport chassis memory index=X' to get the failures
            if ($status ne 'Ok' && defined $index) {
                foreach my $line (@{ run_command("$omreport $omopt_chassis memory index=$index -fmt ssv") }) {
                    if ($line =~ m/\A Failures; (.+?) \z/xms) {
                        # drop the last character, then split the
                        # rest on periods
                        chop(my $fail = $1);
                        push @failures, split m{\.}xms, $fail;
                    }
                }
            }
        }

        # strip leading and trailing whitespace
        $location =~ s{\A \s*(.*?)\s* \z}{$1}xms;

        # calculate total memory
        my $msize = defined $size ? $size : 0;
        $msize =~ s{\A (\d+) \s MB}{$1}xms;
        $count{mem} += $msize;

        # Ignore empty memory slots
        next DIMM if !defined $index;
        $count{dimm}++;

        next DIMM if blacklisted('dimm', $index);

        if ($status ne 'Ok') {
            my $msg = undef;
            if (scalar @failures == 0) {
                $msg = sprintf 'Memory module %d [%s, %s] needs attention (%s)',
                  $index, $location, $size, $status;
            }
            else {
                $msg = sprintf 'Memory module %d [%s, %s] needs attention: %s',
                  $index, $location, $size, (join q{, }, @failures);
            }
            report('chassis', $msg, $status2nagios{$status}, $index);
        }
        # Ok
        else {
            my $msg = sprintf 'Memory module %d [%s, %s] is %s',
              $index, $location, $size, $status;
            report('chassis', $msg, $E_OK, $index);
        }
    }

    return;
}
#-----------------------------------------
# CHASSIS: Check fans
#-----------------------------------------
sub check_fans {
my $index = undef;
my $status = undef;
my $reading = undef;
my $location = undef;
my $max_crit = undef;
my $max_warn = undef;
my @output = ();
if ($snmp) {
my %cool_oid
= (
'1.3.6.1.4.1.674.10892.1.700.12.1.2.1' => 'coolingDeviceIndex',
'1.3.6.1.4.1.674.10892.1.700.12.1.5.1' => 'coolingDeviceStatus',
'1.3.6.1.4.1.674.10892.1.700.12.1.6.1' => 'coolingDeviceReading',
'1.3.6.1.4.1.674.10892.1.700.12.1.8.1' => 'coolingDeviceLocationName',
'1.3.6.1.4.1.674.10892.1.700.12.1.10.1' => 'coolingDeviceUpperCriticalThreshold',
'1.3.6.1.4.1.674.10892.1.700.12.1.11.1' => 'coolingDeviceUpperNonCriticalThreshold',
);
my $result = undef;
if ($opt{use_get_table}) {
my $coolingDeviceTable = '1.3.6.1.4.1.674.10892.1.700.12.1';
$result = $snmp_session->get_table(-baseoid => $coolingDeviceTable);
}
else {
$result = $snmp_session->get_entries(-columns => [keys %cool_oid]);
}
if ($blade && !defined $result) {
return 0;
}
elsif (!$blade && !defined $result) {
printf "SNMP ERROR [cooling]: %s.\n", $snmp_session->error;
$snmp_session->close;
exit $E_UNKNOWN;
}
@output = @{ get_snmp_output($result, \%cool_oid) };
}
else {
@output = @{ run_omreport("$omopt_chassis fans") };
}
FAN:
foreach my $out (@output) {
if ($snmp) {
$index = ($out->{coolingDeviceIndex} || 10000) - 1;
$status