|
|
@@ -0,0 +1,899 @@
|
|
|
+#!/usr/bin/perl
|
|
|
+#
|
|
|
+# ============================== SUMMARY =====================================
|
|
|
+#
|
|
|
+# Program : check_snmp_temperature.pl
|
|
|
+# Version : 0.41
|
|
|
+# Date : Mar 23, 2012
|
|
|
+# Author : William Leibzon - william@leibzon.org
|
|
|
+# Summary : This is a nagios plugin that checks temperature sensors
|
|
|
+# using SNMP. Dell, HP, Cisco and other types are supported
|
|
|
+# and for other systems OIDs can be easily specified too
|
|
|
+# Licence : GPL - summary below, text at http://www.fsf.org/licenses/gpl.txt
|
|
|
+#
|
|
|
+# =========================== PROGRAM LICENSE =================================
|
|
|
+#
|
|
|
+# This program is free software; you can redistribute it and/or modify
|
|
|
+# it under the terms of the GNU General Public License as published by
|
|
|
+# the Free Software Foundation; either version 2 of the License, or
|
|
|
+# (at your option) any later version.
|
|
|
+#
|
|
|
+# This program is distributed in the hope that it will be useful,
|
|
|
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
+# GNU General Public License for more details.
|
|
|
+#
|
|
|
+# You should have received a copy of the GNU General Public License
|
|
|
+# along with this program; if not, write to the Free Software
|
|
|
+# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
|
+#
|
|
|
+# ===================== INFORMATION ABOUT THIS PLUGIN =========================
|
|
|
+#
|
|
|
+# This Temperature check plugin that retreives temperature sensor values from
|
|
|
+# SNMP and can issue alerts if selected parameters are above given number
|
|
|
+# It also returns performance data for further nagios 2.0 post-processing
|
|
|
+#
|
|
|
+# This program is written and maintained by:
|
|
|
+# William Leibzon - william(at)leibzon.org
|
|
|
+# It is partially based on check_snmp_* plugins by:
|
|
|
+# Patrick Proy (patrick at proy.org)
|
|
|
+#
|
|
|
+# ============================= SETUP NOTES ====================================
|
|
|
+#
|
|
|
+# Make sure to check and if necessary adjust the the path to utils.pm
|
|
|
+# Make sure you have Net::SNMP perl module installed
|
|
|
+#
|
|
|
+# If you want to check Dell servers, HP server, Juniper routers or
|
|
|
+# Cisco Switches/Routers (cisco 7500, 5500, 2948) then you may skip
|
|
|
+# much of the configuration hassles and use pre-programmed settings
|
|
|
+# by using "--type" (or -T) parameter, you do still need to specify
|
|
|
+# though if you want output as C or F with '-o' option (see examples).
|
|
|
+# The plugin currently does not support finding critical & warning
|
|
|
+# thresholds which most systems also report in SNMP, so actual thresholds
|
|
|
+# you will need to specify as well.
|
|
|
+#
|
|
|
+# NOTE: If you've previously used 0.2x version of this plugin to
|
|
|
+# check HP equipment, beware that 0.3 version has "incompatible"
|
|
|
+# change in that it returns human-readable sensor names rather
|
|
|
+# then using HP locale ids to enumerate sensors. If you need
|
|
|
+# old behavior then instead of using '-T hp' as parameter
|
|
|
+# use '-N 1.3.6.1.4.1.232.6.2.6.8.1.3 -D 1.3.6.1.4.1.232.6.2.6.8.1.4'
|
|
|
+#
|
|
|
+# If you're using some other device then you need to check documentation to
|
|
|
+# figure out correct parameters for this plugin, then specify base temperature
|
|
|
+# sensor names table OID with '-N' and values table OID with '-D. You also need
|
|
|
+# to specify what base sensor temperature data type is with "-i" (see below).
|
|
|
+#
|
|
|
+# The way plugin works is to walk the snmp tree from base names OID and find
|
|
|
+# all the sensor names. Then it compares names given with '-a' (names are
|
|
|
+# seperated by ',') to those found in the snmp tree (in '-a' you're expected
|
|
|
+# to specify one word which would be found in the full sensor name and
|
|
|
+# is unique for thaqt `sensor) and uses OID ending (i.e. part of OID after
|
|
|
+# the base) and adds it to base value table OID to create OID to be retrieved
|
|
|
+# (similar to how you find ethernet statistics OIDs based on name of the
|
|
|
+# interface and in fact many of SNMP parameters are like that).
|
|
|
+#
|
|
|
+# Note: If you don't know temperature sensor names on your system do:
|
|
|
+# check_snmp_temperature -v -A '*' ...
|
|
|
+# (using '-v' option forces debugging output that should further help)
|
|
|
+#
|
|
|
+# If your system does not have table with sensor names you can still use
|
|
|
+# this plugin if you know exact temperature data OIDs. Then you specify list
|
|
|
+# of names sensors should be known by with '-n' option and list of data OIDs
|
|
|
+# with '-d' option (this can also be useful if you want to avoid having plugin
|
|
|
+# do snmp table walk each time as retrieving specific list of OIDs is faster).
|
|
|
+# You will still need to specify what is likely the same sensor names you
|
|
|
+# you put in '-n' with '-a' or '-A' option.
|
|
|
+#
|
|
|
+# Request: If you have an new type of device and as per above you figured
|
|
|
+# out SNMP parameters that work, please send me email with this
|
|
|
+# information so that I can add it as a new system type.
|
|
|
+#
|
|
|
+# The values retrieved are compared to specified warning and critical values,
|
|
|
+# but first the temperature has to be converted from base measurement units to
|
|
|
+# measurement units you want. These units are Celsius (C) or Fahrenheit (F)
|
|
|
+# or Kelvin (K) with input measurement unit specified with '-i' and output
|
|
|
+# specified with '-o'. For input you sometimes have situation where sensor
|
|
|
+# reports 10xRealValue, i.e. 33.5C is reported as 335 - this is supported
|
|
|
+# too and then input type is specified as '-i 10C'.
|
|
|
+#
|
|
|
+# Warning and critical values are specified with '-w' and '-c' and each
|
|
|
+# one must have exact same number of values (separated by ',') as number
|
|
|
+# of sensor names specified with '-a'. Any values you dont want to compare
|
|
|
+# you specify as 0 or just not specify (i.e. -w ',50,'). In some cases you
|
|
|
+# might not get data for specific sensor and want to substitute default
|
|
|
+# value - this is supported with '-u' option (note that default values
|
|
|
+# is in fact compared against -w and -c).
|
|
|
+#
|
|
|
+# Additionally if you want performance output then use '-f' option to get all
|
|
|
+# the sensors specified in '-a' or specify particular list of sensors for
|
|
|
+# performance data with '-A' (this list can include names not found in '-a').
|
|
|
+# A special option of -A '*' will allow to get data from all sensors found
|
|
|
+# and is this very useful to find what sensors you have with manual run.
|
|
|
+#
|
|
|
+# ========================= SETUP EXAMPLES ==================================
|
|
|
+#
|
|
|
+# define command {
|
|
|
+# command_name check_cisco_temperature
|
|
|
+# command_line $USER1$/check_snmp_temperature.pl -f -H $HOSTADDRESS$ --type=cisco1 -o F -C $ARG1$ -a $ARG2$ -w $ARG3$ -c $ARG4$
|
|
|
+# }
|
|
|
+#
|
|
|
+# define service{
|
|
|
+# use std-service
|
|
|
+# hostgroup_name cs2948
|
|
|
+# service_description Temperature
|
|
|
+# check_command check_cisco_temperature!foo!Chassis!160!190
|
|
|
+# }
|
|
|
+#
|
|
|
+# define command{
|
|
|
+# command_name check_dell_temperature
|
|
|
+# command_line $USER1$/check_snmp_temperature.pl -H $HOSTADDRESS$ -C public \
|
|
|
+# -N .1.3.6.1.4.1.674.10892.1.700.20.1.8 \
|
|
|
+# -D .1.3.6.1.4.1.674.10892.1.700.20.1.6 -i 10C -o F -u 0 \
|
|
|
+# -a ARG1$ -w $ARG2$ -c $ARG3$ -f
|
|
|
+# }
|
|
|
+#
|
|
|
+# define service {
|
|
|
+# use std-service
|
|
|
+# hostgroup_name dell_1750
|
|
|
+# service_description Temperature
|
|
|
+# check_command check_dell_temperature!CPU,Ambient,Bottom!110,90,0!135,110,0
|
|
|
+# }
|
|
|
+#
|
|
|
+# For some dell systems with all sensors enabled you can replace the above with:
|
|
|
+# check_command check_temperature!'CPU,PROC_1,PROC_2,Ambient,Bottom,BMC Planar,BMC Riser'!110,120,120,90,90,105,105!135,140,140,110,110,125,125
|
|
|
+#
|
|
|
+# ==================== CHANGES/RELEASE, TODO ==================================
|
|
|
+#
|
|
|
+# 0.1 - ??? 2006 : Simple plugin where temperature table OIDs were to be
|
|
|
+# specified directly as parameter. Was used for checking Dell
|
|
|
+# 0.2 - Aug 2006 : Support multiple types of equipment by using config
|
|
|
+# hash/array and --type parameter
|
|
|
+# 0.21 - Dec 2006 : Added support for Juniper and HP
|
|
|
+# 0.22 - Dec 2006 : Added quick hack to interpret 0 value as "dont' check" threshold
|
|
|
+# 0.23 - Dec 2007 : Bug Fixes (especially one involving F as input format)
|
|
|
+# 0.3 - Jan 2008 : Added '-n' and '-d' options to specify exact list of
|
|
|
+# sensor names and oids.
|
|
|
+# Also when you specify 'hp' type, the plugin will now
|
|
|
+# provide human-readable sensor names rather then purely
|
|
|
+# an id of their sensor locale (this is basicly special
|
|
|
+# hack just for HP since I don't know anyone else who
|
|
|
+# hard-coded sensor names by ids into SNMP MIB).
|
|
|
+# 0.31 - Feb 2008 : Bug fix due to report by Michael Timmers. The issue
|
|
|
+# was with sensor list that contains a name which matches
|
|
|
+# by regex with some other later sensor name. In this
|
|
|
+# case it was Juniper with "Routing Engine" which was
|
|
|
+# followed by "Routing Engine PCMCIA Card 0" sensor.
|
|
|
+# 0.32 - May 2008 : Minor bug fixes. Added baytech pdu SNMP OIDs
|
|
|
+# 0.33 - Aug 2008 : Full SNMPv3 support (contrib patch by Nicolas Deffayet)
|
|
|
+# 0.34 - Dec 2011 : Bug and small documentation fixes
|
|
|
+# 0.35 - Jan 2012 : Added reporting warning and critical threshold to
|
|
|
+# performance output (as 'name=temperature;warn;crit'
|
|
|
+# based on what become nagios standard for this info)
|
|
|
+# Documentation history and todo updates (added 0.1 & 0.2
|
|
|
+# versions from below info to above), updated on todo
|
|
|
+# 0.36 - Jan 2012 : If data is missing return "UNKNOWN"
|
|
|
+# Added linux 'lmsensors' as type of device
|
|
|
+# In order to suppot this you need lmsensors package
|
|
|
+# and snmpd compiled as:
|
|
|
+# --with-mib-modules="ucd-snmp/lmSensors ucd-snmp/diskio"
|
|
|
+# 0.40 (beta) - Mar 2012 :
|
|
|
+# Imported newest code from check_mysqld 0.93 to support full nagios
|
|
|
+# threshold specification (including ranges) as well as reporting
|
|
|
+# of warn/crit threshold in performance data. This changes internal
|
|
|
+# processing significantly and it needs to be tested more.
|
|
|
+# 0.41 - Mar 23, 2013: Fixed bug in parse_threshold function, reported by Charlie Langrall
|
|
|
+# official release of 0.4 code branch
|
|
|
+#
|
|
|
+# TODO and older revision history:
|
|
|
+# -- TODO ON TODO --> since most of below is done, it should be cleaned up sometime later
|
|
|
+#
|
|
|
+# 1. [DONE - Aug 2006] To support multiple types of equipment add config
|
|
|
+# array/hash and --type parameter
|
|
|
+# 2. More plugin types for various other equipment need to be added ...
|
|
|
+# [DONE - Dec 2006] - added Juniper & HP
|
|
|
+# 3. [DONE - Mar 2012] Need to update warn & crit parameters parsing code so
|
|
|
+# it would support both low and high values with '<' and '>' prefixed and
|
|
|
+# using '~' for don't check rather then 0
|
|
|
+# [DONE - Dec 2006] - added quick hack to interpret empty values
|
|
|
+# (i.e. -w ",90,") as dont check instead of specifying '0' directly
|
|
|
+# Note: Low temperature value checks are rarely needed for network
|
|
|
+# equipment so this is not high priority right now and will
|
|
|
+# be done together with #4 most likely as part of some general
|
|
|
+# library that would be shared with check_snmp_table and quite
|
|
|
+# likely other plugins where multiple "attributes" are specified
|
|
|
+# 4. [DONE - Mar 2012] Add threshold specification in nagios plugin spec compatible way
|
|
|
+# as was done with check_mysqld 0.9 which uses code similar to this check
|
|
|
+# Add specifying of WARN & CRIT after actual value ';' in the perf output
|
|
|
+# [DONE - Dec 2011] - added WARN & CRIT to perf, threshold spec still on todo
|
|
|
+# 5. Support specifying table OIDs for temperature threshold values.
|
|
|
+# I'll do it only after adding optional file caching so these values
|
|
|
+# can be retrieved about once every day rather then for each check.
|
|
|
+# 6. Support directly querying lmsensors on linux system without SNMP
|
|
|
+# plugin would then be renamed to check_temperature similar to check_netint
|
|
|
+#
|
|
|
+# ========================== START OF PROGRAM CODE ============================
|
|
|
+
|
|
|
+use strict;
|
|
|
+use Getopt::Long;
|
|
|
+use Data::Dumper;
|
|
|
+
|
|
|
+# Nagios specific
|
|
|
+our $TIMEOUT = 30;
|
|
|
+our %ERRORS;
|
|
|
+eval 'use utils qw(%ERRORS $TIMEOUT)';
|
|
|
+if ($@) {
|
|
|
+ $TIMEOUT = 30;
|
|
|
+ %ERRORS = ('OK'=>0,'WARNING'=>1,'CRITICAL'=>2,'UNKNOWN'=>3,'DEPENDENT'=>4);
|
|
|
+}
|
|
|
+
|
|
|
+our $no_snmp=0;
|
|
|
+eval 'use Net::SNMP';
|
|
|
+if ($@) {
|
|
|
+ $no_snmp=1;
|
|
|
+}
|
|
|
+
|
|
|
+# Below is hash array for several types of equipment, format here is that
|
|
|
+# key is name you can specify in "--type" and data for that key is 3-value
|
|
|
+# array with 1st value sensor names table OID (-N option), 2nd is sensor
|
|
|
+# data table OID (-D option) and 3rd is type of temperature reading (-i)
|
|
|
+# Additionally instead of specifying sensor names table OID and sensor data
|
|
|
+# root table OID, the first two arguments to array can be "" and then 4th and
|
|
|
+# 5th argument should be arrays first with list of sensor names and 2nd with
|
|
|
+# list of OIDs for data to be retrieved (see below for how its done for Alteon)
|
|
|
+my %system_types = ( "dell" => [ "1.3.6.1.4.1.674.10892.1.700.20.1.8", "1.3.6.1.4.1.674.10892.1.700.20.1.6", "10C" ],
|
|
|
+ "cisco1" => [ "1.3.6.1.4.1.9.9.13.1.3.1.2", "1.3.6.1.4.1.9.9.13.1.3.1.3", "C" ],
|
|
|
+ "cisco" => [ "1.3.6.1.4.1.9.9.13.1.3.1.2", "1.3.6.1.4.1.9.9.13.1.3.1.3", "C" ], # same as cisco 1 for now, this may change
|
|
|
+ "juniper" => [ "1.3.6.1.4.1.2636.3.1.13.1.5", "1.3.6.1.4.1.2636.3.1.13.1.7", "C" ], # somebody verify it, dont have juniper right now
|
|
|
+ "hp" => [ "1.3.6.1.4.1.232.6.2.6.8.1.3", "1.3.6.1.4.1.232.6.2.6.8.1.4", "C" ],
|
|
|
+ "alteon" => [ "", "", "C", ['RearLeftSensor', 'RearMiddleSensor', 'FrontMiddleSensor', 'FrontRightSensor'], ['1.3.6.1.4.1.1872.2.1.1.6.0','1.3.6.1.4.1.1872.2.1.1.7.0','1.3.6.1.4.1.1872.2.1.1.8.0','1.3.6.1.4.1.1872.2.1.1.9.0'] ], # why do they need to make these alteons so proprietory and hard to deal with?
|
|
|
+ "baytech" => [ "1.3.6.1.4.1.4779.1.3.5.2.1.2", "1.3.6.1.4.1.4779.1.3.5.2.1.8", "10C" ], # baytech pdu
|
|
|
+ "lmsensors" => [ "1.3.6.1.4.1.2021.13.16.2.1.2", "1.3.6.1.4.1.2021.13.16.2.1.3", "1000C" ], #linux with lmsensors
|
|
|
+ "linux" => [ "1.3.6.1.4.1.2021.13.16.2.1.2", "1.3.6.1.4.1.2021.13.16.2.1.3", "1000C" ],
|
|
|
+ );
|
|
|
+# APC OID for the temperature is .1.3.6.1.4.1.318.1.1.2.1.1.0
|
|
|
+# APC OID for the humidity is .1.3.6.1.4.1.318.1.1.2.1.2.0
|
|
|
+# Cisco fans: .1.3.6.1.4.1.9.9.13.1.4.1.3
|
|
|
+# HP switch temperature : .1.3.6.1.4.1.11.2.14.11.1.2.6.1.4.4
|
|
|
+# HP switch fan: .1.3.6.1.4.1.11.2.14.11.1.2.6.1.4.1
|
|
|
+
|
|
|
+my $Version='0.40';
|
|
|
+
|
|
|
+my $o_host= undef; # hostname
|
|
|
+my $o_community= undef; # community
|
|
|
+my $o_port= 161; # SNMP port
|
|
|
+my $o_help= undef; # help option
|
|
|
+my $o_verb= undef; # verbose mode
|
|
|
+my $o_version= undef; # version info option
|
|
|
+my $o_octets= 5000;
|
|
|
+my $o_warn= undef; # warning level option
|
|
|
+my @o_warnL= (); # array for above list
|
|
|
+my $o_crit= undef; # Critical level option
|
|
|
+my @o_critL= (); # array for above list
|
|
|
+my $o_perf= undef; # Performance data option
|
|
|
+my $o_timeout= 15; # Default 15s Timeout
|
|
|
+my $o_version2= undef; # use snmp v2c
|
|
|
+# SNMPv3 specific
|
|
|
+my $o_login= undef; # Login for snmpv3
|
|
|
+my $o_passwd= undef; # Pass for snmpv3
|
|
|
+my $v3protocols=undef; # V3 protocol list.
|
|
|
+my $o_authproto='md5'; # Auth protocol
|
|
|
+my $o_privproto='des'; # Priv protocol
|
|
|
+my $o_privpass= undef; # priv password
|
|
|
+
|
|
|
+my $o_attr= undef; # What attribute(s) to check (specify more then one separated by '.')
|
|
|
+my @o_attrL= (); # array for above list
|
|
|
+my $o_perfattr= undef; # List of attributes to only provide values in performance data but no checking
|
|
|
+my @o_perfattrL=(); # array for above list
|
|
|
+my $o_ounit= 'C'; # Output Temperature Measurement Units - can be 'C', 'F' or 'K'
|
|
|
+my $o_iunit= 'C'; # Incoming Temperature Measurement Units - can prefix with number if its n*temp
|
|
|
+my $oid_names= undef; # OID for base of sensor attribute names
|
|
|
+my $oid_data= undef; # OID for base of actual data for those attributes found when walking name base
|
|
|
+my $o_names= undef; # List of sensor names (as opposed to specifying names table)
|
|
|
+my $o_unkdef= undef; # Default value to report for unknown attributes
|
|
|
+my $o_type= undef; # Type of system to check (predefined values for $oid_names, $oid_data, $oid_iunit)
|
|
|
+my $o_sensornames=undef; # Option specifying list of sensor names that then go into @ar_sensornames array
|
|
|
+my $o_sensoroids=undef; # Option specifying list of sensor oids that then go into @ar_sensoroids array
|
|
|
+my @ar_sensornames=(); # List of sensor names if specified in the sensor_types array
|
|
|
+my @ar_sensoroids=(); # List of sensor data oids if specified in sensor_types array
|
|
|
+
|
|
|
+# This is hack for HP based on cpqHeTemperatureLocale OID from cpqhlth.mib to map reported locale id to real name
|
|
|
+my %hp_locale = ( 1=> ['OTHER',1], 2=> ['UNKNOWN',1], 3=> ['System', 1], 4=> ['SystemBoard',1], 5=> ['ioBoard',1],
|
|
|
+ 6=> ['CPU',1], 7=> ['Memory',1], 8=> ['Storage',1], 9=> ['RemovableMedia',1],
|
|
|
+ 10=> ['PowerSupply',1], 11=> ['Ambient',1], 12=> ['Chassis',1], 13=> ['BridgeCard',1] );
|
|
|
+
|
|
|
+sub print_version { print "$0: $Version\n" };
|
|
|
+
|
|
|
+sub print_usage {
|
|
|
+ print "Usage: $0 [-v] -H <host> -C <snmp_community> [-2] | (-l login -x passwd [-X pass -L <authp>,<privp>]) [-p <port>] [-t <timeout>] -T dell|hp|cisco1|juniper|alteon|lmsensors | [-N <oid_attribnames> -D <oid_attribdata>] | [-n <list of sensor names> -d <list of sensor oids>] [-a <attributes to check> -w <warn levels> -c <crit levels> [-f]] [-A <attributes for perfdata>] [-o <out_temp_unit: C|F|K>] [-i <in_temp_unit>] [-u <unknown_default>] [-V]\n";
|
|
|
+}
|
|
|
+
|
|
|
+# Return true if arg is a number
|
|
|
+sub isnum {
|
|
|
+ my $num = shift;
|
|
|
+ if ( $num =~ /^(\d+\.?\d*)|(^\.\d+)$/ ) { return 1 ;}
|
|
|
+ return 0;
|
|
|
+}
|
|
|
+
|
|
|
+# function used when checking data against critical and warn values
|
|
|
+sub check_threshold {
|
|
|
+ my ($attrib, $data, $th_array, $o_ounit) = @_;
|
|
|
+ my $mod = $th_array->[0];
|
|
|
+ my $lv1 = $th_array->[1];
|
|
|
+ my $lv2 = $th_array->[2];
|
|
|
+
|
|
|
+ # verb("debug check_threshold: $mod : ".(defined($lv1)?$lv1:'')." : ".(defined($lv2)?$lv2:''));
|
|
|
+ return "" if !defined($lv1) || ($mod eq '' && $lv1 eq '');
|
|
|
+ return " " . $attrib . " Temperature is " . $data . $o_ounit . " = " . $lv1.$o_ounit if $mod eq '=' && $data eq $lv1;
|
|
|
+ return " " . $attrib . " Temperature is " . $data . $o_ounit . " != " . $lv1.$o_ounit if $mod eq '!' && $data ne $lv1;
|
|
|
+ return " " . $attrib . " Temperature is " . $data . $o_ounit . " > " . $lv1.$o_ounit if $mod eq '>' && $data>$lv1;
|
|
|
+ return " " . $attrib . " Temperature is " . $data . $o_ounit . " > " . $lv2.$o_ounit if $mod eq ':' && $data>$lv2;
|
|
|
+ return " " . $attrib . " Temperature is " . $data . $o_ounit . " >= ". $lv1.$o_ounit if $mod eq '>=' && $data>=$lv1;
|
|
|
+ return " " . $attrib . " Temperature is " . $data . $o_ounit . " < " . $lv1.$o_ounit if ($mod eq '<' || $mod eq ':') && $data<$lv1;
|
|
|
+ return " " . $attrib . " Temperature is " . $data . $o_ounit . " <= " . $lv1.$o_ounit if $mod eq '<=' && $data<=$lv1;
|
|
|
+ return " " . $attrib . " Temperature is " . $data . $o_ounit ." in range ". $lv1.$o_ounit."..".$lv2.$o_ounit if $mod eq '@' && $data>=$lv1 && $data<=$lv2;
|
|
|
+ return "";
|
|
|
+}
|
|
|
+
|
|
|
+# function called when parsing threshold options data
|
|
|
+sub parse_threshold {
|
|
|
+ my $thin = shift;
|
|
|
+
|
|
|
+ # link to an array that holds processed threshold data
|
|
|
+ # array: 1st is type of check, 2nd is value2, 3rd is value2, 4th is option, 5th is nagios spec string representation for perf out
|
|
|
+ my $th_array = [ '', undef, undef, '', '' ];
|
|
|
+ my $th = $thin;
|
|
|
+ my $at = '';
|
|
|
+
|
|
|
+ # take 3 ways to specify that there is no threshold
|
|
|
+ return $th_array if ($th eq '0' || $th eq '~' || $th eq '');
|
|
|
+
|
|
|
+ $at = $1 if $th =~ s/^(\^?[@|>|<|=|!]?~?)//; # check mostly for my own threshold format
|
|
|
+ $th_array->[3]='^' if $at =~ s/\^//; # deal with ^ option
|
|
|
+ $at =~ s/~//; # ignore ~ if it was entered
|
|
|
+ if ($th =~ /^\:([-|+]?\d+\.?\d*)/) { # :number format per nagios spec
|
|
|
+ $th_array->[1]=$1;
|
|
|
+ $th_array->[0]=($at !~ /@/)?'>':'<=';
|
|
|
+ $th_array->[5]=($at !~ /@/)?('~:'.$th_array->[1]):($th_array->[1].':');
|
|
|
+ }
|
|
|
+ elsif ($th =~ /([-|+]?\d+\.?\d*)\:$/) { # number: format per nagios spec
|
|
|
+ $th_array->[1]=$1;
|
|
|
+ $th_array->[0]=($at !~ /@/)?'<':'>=';
|
|
|
+ $th_array->[5]=($at !~ /@/)?'':'@';
|
|
|
+ $th_array->[5].=$th_array->[1].':';
|
|
|
+ }
|
|
|
+ elsif ($th =~ /([-|+]?\d+\.?\d*)\:([-|+]?\d+\.?\d*)/) { # nagios range format
|
|
|
+ $th_array->[1]=$1;
|
|
|
+ $th_array->[2]=$2;
|
|
|
+ if ($th_array->[1] > $th_array->[2]) {
|
|
|
+ print "Incorrect format in '$thin' - in range specification first number must be smaller then 2nd\n";
|
|
|
+ print_usage();
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+ $th_array->[0]=($at !~ /@/)?':':'@';
|
|
|
+ $th_array->[5]=($at !~ /@/)?'':'@';
|
|
|
+ $th_array->[5].=$th_array->[1].':'.$th_array->[2];
|
|
|
+ }
|
|
|
+ if (!defined($th_array->[1])) {
|
|
|
+ $th_array->[0] = ($at eq '@')?'<=':$at;
|
|
|
+ $th_array->[1] = $th;
|
|
|
+ $th_array->[5] = '~:'.$th_array->[1] if ($th_array->[0] eq '>' || $th_array->[0] eq '>=');
|
|
|
+ $th_array->[5] = $th_array->[1].':' if ($th_array->[0] eq '<' || $th_array->[0] eq '<=');
|
|
|
+ $th_array->[5] = '@'.$th_array->[1].':'.$th_array->[1] if $th_array->[0] eq '=';
|
|
|
+ $th_array->[5] = $th_array->[1].':'.$th_array->[1] if $th_array->[0] eq '!';
|
|
|
+ }
|
|
|
+ if ($th_array->[0] =~ /[>|<]/ && !isnum($th_array->[1])) {
|
|
|
+ print "Numeric value required when '>' or '<' are used !\n";
|
|
|
+ print_usage();
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+ # verb("debug parse_threshold: $th_array->[0] and $th_array->[1]");
|
|
|
+ $th_array->[0] = '=' if !$th_array->[0] && !isnum($th_array->[1]) && $th_array->[1] ne '';
|
|
|
+ if (!$th_array->[0] && isnum($th_array->[1])) { # this is just the number by itself, becomes 0:number check per nagios guidelines
|
|
|
+ $th_array->[2]=$th_array->[1];
|
|
|
+ $th_array->[1]=0;
|
|
|
+ $th_array->[0]=':';
|
|
|
+ $th_array->[5]=$th_array->[2];
|
|
|
+ }
|
|
|
+ return $th_array;
|
|
|
+}
|
|
|
+
|
|
|
+# this function checks that for numeric data warn threshold is within range of critical threshold
|
|
|
+# where within range depends on actual threshold spec and normally just means less
|
|
|
+sub threshold_specok {
|
|
|
+ my ($warn_thar,$crit_thar) = @_;
|
|
|
+ return 0 if (defined($warn_thar->[1]) && !isnum($warn_thar->[1])) || (defined($crit_thar->[1]) && !isnum($crit_thar->[1]));
|
|
|
+ return 1 if defined($warn_thar) && defined($warn_thar->[1]) &&
|
|
|
+ defined($crit_thar) && defined($crit_thar->[1]) &&
|
|
|
+ isnum($warn_thar->[1]) && isnum($crit_thar->[1]) &&
|
|
|
+ $warn_thar->[0] eq $crit_thar->[0] &&
|
|
|
+ (!defined($warn_thar->[3]) || $warn_thar->[3] !~ /\^/) &&
|
|
|
+ (!defined($crit_thar->[3]) || $crit_thar->[3] !~ /\^/) &&
|
|
|
+ (($warn_thar->[1]>$crit_thar->[1] && ($warn_thar->[0] =~ />/ || $warn_thar->[0] eq '@')) ||
|
|
|
+ ($warn_thar->[1]<$crit_thar->[1] && ($warn_thar->[0] =~ /</ || $warn_thar->[0] eq ':')) ||
|
|
|
+ ($warn_thar->[0] eq ':' && $warn_thar->[2]>=$crit_thar->[2]) ||
|
|
|
+ ($warn_thar->[0] eq '@' && $warn_thar->[2]<=$crit_thar->[2]));
|
|
|
+ return 0; # return with 0 means specs check out and are ok
|
|
|
+}
|
|
|
+
|
|
|
+sub help {
|
|
|
+ print "\nSNMP Temperature Monitor for Nagios version ",$Version,"\n";
|
|
|
+ print " by William Leibzon - william(at)leibzon.org\n\n";
|
|
|
+ print_usage();
|
|
|
+ print <<EOD;
|
|
|
+-v, --verbose
|
|
|
+ print extra debugging information
|
|
|
+-h, --help
|
|
|
+ print this help message
|
|
|
+-H, --hostname=HOST
|
|
|
+ name or IP address of host to check
|
|
|
+-C, --community=COMMUNITY NAME
|
|
|
+ community name for the host's SNMP agent (implies v 1 protocol)
|
|
|
+-2, --v2c
|
|
|
+ Use snmp v2c
|
|
|
+-l, --login=LOGIN ; -x, --passwd=PASSWD
|
|
|
+ Login and auth password for snmpv3 authentication
|
|
|
+ If no priv password exists, implies AuthNoPriv
|
|
|
+-X, --privpass=PASSWD
|
|
|
+ Priv password for snmpv3 (AuthPriv protocol)
|
|
|
+-L, --protocols=<authproto>,<privproto>
|
|
|
+ <authproto> : Authentication protocol (md5|sha : default md5)
|
|
|
+ <privproto> : Priv protocole (des|aes : default des)
|
|
|
+-P, --port=PORT
|
|
|
+ SNMP port (Default 161)
|
|
|
+-w, --warn=INT[,INT[,INT[..]]]
|
|
|
+ Warning temperature level(s). The number of values listed here must exactly match number
|
|
|
+ of sensors listed with '-a'. The values specifify threshold for when Nagios should send
|
|
|
+ WARNING alert. All values are numbers and can have the following prefix modifiers:
|
|
|
+ > - warn if data is above this value (default for numeric values)
|
|
|
+ < - warn if data is below this value (must be followed by number)
|
|
|
+ = - warn if data is equal to this value (default for non-numeric values)
|
|
|
+ ! - warn if data is not equal to this value
|
|
|
+ ~ - do not check this data (must not be followed by number or ':')
|
|
|
+ ^ - this disables check that warning < critical
|
|
|
+ Threshold values can also be specified as range in two forms:
|
|
|
+ num1:num2 - warn if data is outside range i.e. if data<num1 or data>num2
|
|
|
+ \@num1:num2 - warn if data is in range i.e. data>=num1 && data<=num2
|
|
|
+-c, --crit=INT[,INT[,INT[..]]]
|
|
|
+ Critical temperature level(s) (if more then one attribute is checked, must have multiple values)
|
|
|
+ The format is the same as with warning threshold levels.
|
|
|
+-f, --perfdata
|
|
|
+ Perfparse compatible output
|
|
|
+-t, --timeout=INTEGER
|
|
|
+ timeout for SNMP in seconds (Default: 5)
|
|
|
+-V, --version
|
|
|
+ prints version number
|
|
|
+-N, --oidtable_attribnames=OID_STRING
|
|
|
+ Base table OID to walk through to find names of those attributes supported and from that corresponding data OIDs
|
|
|
+-D, --oidtable_attribdata=OID_STRING
|
|
|
+ Base table OID for sensor attribute data, one number is added to that to make up full attribute OID
|
|
|
+-n, --sensor_names=STRING[,STRING[..]]
|
|
|
+ List of sensor names when -N is not used and sensors are specified with exeact oids
|
|
|
+-d, --sensor_oids=OID_STRING[,OID_STRING[..]]
|
|
|
+ List of exact data OIDs for sensors specified with -n (specify this when -N and -D are not used)
|
|
|
+-a, --attributes=STRING[,STRING[..]]
|
|
|
+ Which attribute(s) to check. This is used as regex to check if attribute is found in sensor names.
|
|
|
+ As an example for Dell the attribute names to use are: PROC_1, PROC_2, Ambient, Planar, Riser
|
|
|
+-A, --perf_attributes=STRING[,STRING[..]]
|
|
|
+ Which attribute(s) to add to as part of performance data output. These names can be different then the
|
|
|
+ ones listed in '-a' to only output attributes in perf data but not check. Special value of '*' gets them all.
|
|
|
+-f, --perfparse
|
|
|
+ Used only with '-a'. Causes to output data not only in main status line but also as perfparse output
|
|
|
+-o --out_temp_unit=C|F|K
|
|
|
+ What temperature measurement units are used for output and warning/critical - 'C', 'F' or 'K' - default is 'C'
|
|
|
+-i --in_temp_unit=[num]C|F|K
|
|
|
+ What temperature measurement reported by data OID - format is <num>C|F|K (default is 'C')
|
|
|
+ where num is used if data is num*realdata, i.e. if reported data of 330 means 33C, then it is: -i 10C
|
|
|
+-u, --unknown_default=INT
|
|
|
+ If attribute is not found then report the output as this number (i.e. -u 0)
|
|
|
+-T, --type=dell|hp|cisco1|juniper|alteon|lmsensors
|
|
|
+ This allows to use pre-defined system type to set Base, Data OIDs and incoming temperature measurement type
|
|
|
+ Currently support systems types are: dell, hp, cisco1 (7500, 5500, 2948, etc), juniper, alteon, lmsensors (linux using lmsensors package if snmp is compiled to support it)
|
|
|
+EOD
|
|
|
+}
|
|
|
+
|
|
|
+# For verbose output - don't use it right now
|
|
|
+sub verb { my $t=shift; print $t,"\n" if defined($o_verb) ; }
|
|
|
+
|
|
|
+# Get the alarm signal (just in case snmp timout screws up)
|
|
|
+$SIG{'ALRM'} = sub {
|
|
|
+ print ("ERROR: Alarm signal (Nagios time-out)\n");
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+};
|
|
|
+
|
|
|
+# converts temperature from input format unit into output format units
|
|
|
+sub convert_temp {
|
|
|
+ my ($temp, $in_unit, $out_unit) = @_;
|
|
|
+
|
|
|
+ my $in_mult = 1;
|
|
|
+ my $ctemp = undef;
|
|
|
+ $in_mult = $1 if $in_unit =~ /(\d+)\w/;
|
|
|
+ $in_unit =~ s/\d+//;
|
|
|
+
|
|
|
+ # exit quickly avoiding conversion to and from C if both units are the same
|
|
|
+ return $temp / $in_mult if ($in_unit eq $out_unit);
|
|
|
+ # if units are not the same, we convert to/from C
|
|
|
+ $ctemp = $temp / $in_mult if $in_unit eq 'C';
|
|
|
+ $ctemp = ($temp / $in_mult - 32) / 1.8 if $in_unit eq 'F';
|
|
|
+ $ctemp = $temp / $in_mult - 273.15 if $in_unit eq 'K';
|
|
|
+ $ctemp = $temp / $in_mult if !defined($ctemp);
|
|
|
+ return $ctemp if $out_unit eq "C";
|
|
|
+ return $ctemp * 1.8 + 32 if $out_unit eq "F";
|
|
|
+ return $ctemp + 273.15 if $out_unit eq "K";
|
|
|
+ return $ctemp; # should not get here
|
|
|
+}
|
|
|
+
|
|
|
+sub check_options {
|
|
|
+ Getopt::Long::Configure ("bundling");
|
|
|
+ GetOptions(
|
|
|
+ 'v' => \$o_verb, 'verbose' => \$o_verb,
|
|
|
+ 'h' => \$o_help, 'help' => \$o_help,
|
|
|
+ 'H:s' => \$o_host, 'hostname:s' => \$o_host,
|
|
|
+ 'P:i' => \$o_port, 'port:i' => \$o_port,
|
|
|
+ 'C:s' => \$o_community, 'community:s' => \$o_community,
|
|
|
+ 'l:s' => \$o_login, 'login:s' => \$o_login,
|
|
|
+ 'x:s' => \$o_passwd, 'passwd:s' => \$o_passwd,
|
|
|
+ 'X:s' => \$o_privpass, 'privpass:s' => \$o_privpass,
|
|
|
+ 'L:s' => \$v3protocols, 'protocols:s' => \$v3protocols,
|
|
|
+ 't:i' => \$o_timeout, 'timeout:i' => \$o_timeout,
|
|
|
+ 'V' => \$o_version, 'version' => \$o_version,
|
|
|
+ '2' => \$o_version2, 'v2c' => \$o_version2,
|
|
|
+ 'c:s' => \$o_crit, 'critical:s' => \$o_crit,
|
|
|
+ 'w:s' => \$o_warn, 'warn:s' => \$o_warn,
|
|
|
+ 'f' => \$o_perf, 'perfparse' => \$o_perf,
|
|
|
+ 'a:s' => \$o_attr, 'attributes:s' => \$o_attr,
|
|
|
+ 'A:s' => \$o_perfattr, 'perf_attributes:s' => \$o_perfattr,
|
|
|
+ 'o:s' => \$o_ounit, 'out_temp_unit:s' => \$o_ounit,
|
|
|
+ 'i:s' => \$o_iunit, 'in_temp_unit:s' => \$o_iunit,
|
|
|
+ 'u:i' => \$o_unkdef, 'unknown_default:i' => \$o_unkdef,
|
|
|
+ 'N:s' => \$oid_names, 'oid_attribnames:s' => \$oid_names, 'oidtable_attribnames:s' => \$oid_names,
|
|
|
+ 'D:s' => \$oid_data, 'oid_attribdata:s' => \$oid_data, 'oidtable_attribdata:s' => \$oid_data,
|
|
|
+ 'n:s' => \$o_sensornames, 'sensor_names:s' => \$o_sensornames,
|
|
|
+ 'd:s' => \$o_sensoroids, 'sensor_oids:s' => \$o_sensoroids,
|
|
|
+ 'T:s' => \$o_type, 'type:s' => \$o_type
|
|
|
+ );
|
|
|
+ if (defined($o_help) ) { help(); exit $ERRORS{"UNKNOWN"}; }
|
|
|
+ if (defined($o_version)) { print_version(); exit $ERRORS{"UNKNOWN"}; }
|
|
|
+ if ($no_snmp) {
|
|
|
+ print "Can't locate Net/SNMP.pm\n"; print_usage(); exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+ if (! defined($o_host)) { # check host and filter
|
|
|
+ print "No host defined!\n";print_usage(); exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+ # check snmp information
|
|
|
+ if ( !defined($o_community) && (!defined($o_login) || !defined($o_passwd)) )
|
|
|
+ { print "Put snmp login info!\n"; print_usage(); exit $ERRORS{"UNKNOWN"}}
|
|
|
+ if ((defined($o_login) || defined($o_passwd)) && (defined($o_community) || defined($o_version2)) )
|
|
|
+ { print "Can't mix snmp v1,2c,3 protocols!\n"; print_usage(); exit $ERRORS{"UNKNOWN"}}
|
|
|
+ if (defined ($v3protocols)) {
|
|
|
+ if (!defined($o_login)) { print "Put snmp V3 login info with protocols!\n"; print_usage(); exit $ERRORS{"UNKNOWN"}}
|
|
|
+ my @v3proto=split(/,/,$v3protocols);
|
|
|
+ if ((defined ($v3proto[0])) && ($v3proto[0] ne "")) {$o_authproto=$v3proto[0]; } # Auth protocol
|
|
|
+ if (defined ($v3proto[1])) {$o_privproto=$v3proto[1]; } # Priv protocol
|
|
|
+ if ((defined ($v3proto[1])) && (!defined($o_privpass))) {
|
|
|
+ print "Put snmp V3 priv login info with priv protocols!\n"; print_usage(); exit $ERRORS{"UNKNOWN"}}
|
|
|
+ }
|
|
|
+ $o_ounit =~ tr/[a-z]/[A-Z]/;
|
|
|
+ if ($o_ounit ne 'C' && $o_ounit ne 'F' && $o_ounit ne 'K')
|
|
|
+ { print "Invalid output measurement unit specified!\n"; print_usage(); exit $ERRORS{"UNKNOWN"}; }
|
|
|
+ $o_iunit =~ tr/[a-z]/[A-Z]/;
|
|
|
+ if ($o_iunit !~ /\d*[C|K|F]/)
|
|
|
+ { print "Invalid input measurement unit specified!\n"; print_usage(); exit $ERRORS{"UNKNOWN"}; }
|
|
|
+ if (defined ($o_type)) {
|
|
|
+ if (defined($oid_names) || defined($oid_data) || defined($o_sensornames) || defined($o_sensoroids))
|
|
|
+ { print "Please either specify specify system type (-T) OR base SNMP OIDs for name (-N) and data (-D) tables OR exact list of sensor names (-n) and data OIDs (-d) !\n"; print_usage(); exit $ERRORS{"UNKNOWN"}; }
|
|
|
+ if (defined($system_types{$o_type})) {
|
|
|
+ $oid_names = $system_types{$o_type}[0];
|
|
|
+ $oid_data = $system_types{$o_type}[1];
|
|
|
+ $o_iunit = $system_types{$o_type}[2];
|
|
|
+ @ar_sensornames= @{$system_types{$o_type}[3]} if defined($system_types{$o_type}[3]) && !$oid_names;
|
|
|
+ @ar_sensoroids= @{$system_types{$o_type}[4]} if defined($system_types{$o_type}[4]) && !$oid_data;
|
|
|
+ }
|
|
|
+ else { print "Unknown system type $o_type !\n"; print_usage(); exit $ERRORS{"UNKNOWN"}; }
|
|
|
+ }
|
|
|
+ if (defined($o_sensornames) && defined($o_sensoroids)) {
|
|
|
+ if (defined($oid_names) || defined($oid_data)) {
|
|
|
+ print "You can not combine -n / -d options with -N / -D\n"; print_usage(); exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+ else {
|
|
|
+ @ar_sensornames = split(/,/, $o_sensornames);
|
|
|
+ @ar_sensoroids = split(/,/, $o_sensoroids);
|
|
|
+ if (scalar(@ar_sensornames) != scalar(@ar_sensoroids)) {
|
|
|
+ printf "Number of sensor names specified at -n (%d) must be equal to number of data OIDs specified with -d (%d)\n",
|
|
|
+ scalar(@ar_sensornames), scalar(@ar_sensoroids);
|
|
|
+ print_usage();
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+ }
|
|
|
+ }
|
|
|
+ if (scalar(@ar_sensornames)==0 && scalar(@ar_sensoroids)==0 && !(defined($oid_names) && defined($oid_data)))
|
|
|
+ { print "Specify system type (-T) OR base SNMP OIDs for names (-N) and data (-D) tables OR exact list of sensor names (-n) and data OIDs (-d) !\n"; print_usage(); exit $ERRORS{"UNKNOWN"}; }
|
|
|
+
|
|
|
+ # below code is common for number of my plugins, including check_snmp_?, netstat, etc
|
|
|
+ # it is mostly compliant with nagios threshold specification (except use of '~')
|
|
|
+ # and adds number of additional format options using '>','<','!','=' prefixes
|
|
|
+ my (@ar_warnLv,@ar_critLv);
|
|
|
+ if (defined($o_perfattr)) {
|
|
|
+ @o_perfattrL=split(/,/ ,$o_perfattr);
|
|
|
+ }
|
|
|
+ if (defined($o_warn) || defined($o_crit) || defined($o_attr)) {
|
|
|
+ if (defined($o_attr)) {
|
|
|
+ @o_attrL=split(/,/, $o_attr);
|
|
|
+ if (defined($o_warn)) {
|
|
|
+ $o_warn.="~" if $o_warn =~ /,$/;
|
|
|
+ @ar_warnLv=split( /,/ , lc $o_warn );
|
|
|
+ }
|
|
|
+ if (defined($o_crit)) {
|
|
|
+ $o_crit.="~" if $o_crit =~ /,$/;
|
|
|
+ @ar_critLv=split( /,/ , lc $o_crit );
|
|
|
+ }
|
|
|
+ }
|
|
|
+ else {
|
|
|
+ print "Specifying warning and critical levels requires '-a' parameter with list of STATUS variables\n";
|
|
|
+ print_usage();
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+ if (scalar(@ar_warnLv)!=scalar(@o_attrL) || scalar(@ar_critLv)!=scalar(@o_attrL)) {
|
|
|
+ printf "Number of specified warning levels (%d) and critical levels (%d) must be equal to the number of attributes specified at '-a' (%d). If you need to ignore some attribute do it as ',,'\n", scalar(@ar_warnLv), scalar(@ar_critLv), scalar(@o_attrL);
|
|
|
+ verb("Warning Levels: ".join(",",@ar_warnLv));
|
|
|
+ verb("Critical Levels: ".join(",",@ar_critLv));
|
|
|
+ print_usage();
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+ for (my $i=0; $i<scalar(@o_attrL); $i++) {
|
|
|
+ $o_warnL[$i] = parse_threshold($ar_warnLv[$i]);
|
|
|
+ $o_critL[$i] = parse_threshold($ar_critLv[$i]);
|
|
|
+ if (threshold_specok($o_warnL[$i],$o_critL[$i])) {
|
|
|
+ print "Numeric value required for warning and critical thresholds!\n";
|
|
|
+ print "And warning must be less then critical (or greater then when '<' is used)\n";
|
|
|
+ print "(to override warning<critical check prefix warning value with ^)\n";
|
|
|
+ print_usage();
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+ }
|
|
|
+ }
|
|
|
+ if (scalar(@o_attrL)==0 && scalar(@o_perfattrL)==0) {
|
|
|
+ print "You must specify list of attributes with either '-a' or '-A'\n";
|
|
|
+ print_usage();
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+}
|
|
|
+
|
|
|
+########## MAIN #######
|
|
|
+
|
|
|
+check_options();
|
|
|
+
|
|
|
+# Check global timeout if something goes wrong
|
|
|
+if (defined($TIMEOUT)) {
|
|
|
+ verb("Alarm at $TIMEOUT");
|
|
|
+ alarm($TIMEOUT);
|
|
|
+} else {
|
|
|
+ verb("no global timeout defined : $o_timeout + 10");
|
|
|
+ alarm ($o_timeout+10);
|
|
|
+}
|
|
|
+
|
|
|
+# Connect to host
|
|
|
+my ($session,$error);
|
|
|
+if ( defined($o_login) && defined($o_passwd)) {
|
|
|
+ # SNMPv3 login
|
|
|
+ verb("SNMPv3 login");
|
|
|
+ if (!defined ($o_privpass)) {
|
|
|
+ verb("SNMPv3 AuthNoPriv login : $o_login, $o_authproto");
|
|
|
+ ($session, $error) = Net::SNMP->session(
|
|
|
+ -hostname => $o_host,
|
|
|
+ -version => '3',
|
|
|
+ -username => $o_login,
|
|
|
+ -authpassword => $o_passwd,
|
|
|
+ -authprotocol => $o_authproto,
|
|
|
+ -timeout => $o_timeout
|
|
|
+ );
|
|
|
+ } else {
|
|
|
+ verb("SNMPv3 AuthPriv login : $o_login, $o_authproto, $o_privproto");
|
|
|
+ ($session, $error) = Net::SNMP->session(
|
|
|
+ -hostname => $o_host,
|
|
|
+ -version => '3',
|
|
|
+ -username => $o_login,
|
|
|
+ -authpassword => $o_passwd,
|
|
|
+ -authprotocol => $o_authproto,
|
|
|
+ -privpassword => $o_privpass,
|
|
|
+ -privprotocol => $o_privproto,
|
|
|
+ -timeout => $o_timeout
|
|
|
+ );
|
|
|
+ }
|
|
|
+} else {
|
|
|
+ if (defined ($o_version2)) {
|
|
|
+ # SNMPv2 Login
|
|
|
+ verb("SNMP v2c login");
|
|
|
+ ($session, $error) = Net::SNMP->session(
|
|
|
+ -hostname => $o_host,
|
|
|
+ -version => '2',
|
|
|
+ -community => $o_community,
|
|
|
+ -maxmsgsize => $o_octets || 10000,
|
|
|
+ -port => $o_port || 161,
|
|
|
+ -timeout => $o_timeout
|
|
|
+ );
|
|
|
+ } else {
|
|
|
+ # SNMPV1 login
|
|
|
+ verb("SNMP v1 login");
|
|
|
+ ($session, $error) = Net::SNMP->session(
|
|
|
+ -version => '1',
|
|
|
+ -hostname => $o_host,
|
|
|
+ -community => $o_community,
|
|
|
+ -port => $o_port || 161,
|
|
|
+ -timeout => $o_timeout
|
|
|
+ );
|
|
|
+ }
|
|
|
+}
|
|
|
+if (!defined($session)) {
|
|
|
+ printf("ERROR opening session: %s.\n", $error);
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+}
|
|
|
+
|
|
|
+# next part of the code builds list of attributes to be retrieved
|
|
|
+my $i;
|
|
|
+my $oid;
|
|
|
+my $line;
|
|
|
+my $attr;
|
|
|
+my @varlist = ();
|
|
|
+my %dataresults;
|
|
|
+my $result;
|
|
|
+
|
|
|
+for ($i=0;$i<scalar(@o_attrL);$i++) {
|
|
|
+ $dataresults{$o_attrL[$i]} = ["check", undef, undef, 0, 0];
|
|
|
+}
|
|
|
+if (defined($o_perfattr) && $o_perfattr ne '*') {
|
|
|
+ for ($i=0;$i<scalar(@o_perfattrL);$i++) {
|
|
|
+ $dataresults{$o_perfattrL[$i]} = ["perf", undef, undef, 0, 0];
|
|
|
+ }
|
|
|
+}
|
|
|
+
|
|
|
+if (scalar(@ar_sensornames)==0) {
|
|
|
+ verb("Retrieving SNMP table $oid_names to find sensor attribute names");
|
|
|
+ $result = $session->get_table( -baseoid => $oid_names );
|
|
|
+# $result = $session->get_request( -varbindlist => [$oid_names] );
|
|
|
+
|
|
|
+ if (!defined($result)) {
|
|
|
+ printf("ERROR: Problem retrieving OID %s table: %s.\n", $oid_names, $session->error);
|
|
|
+ $session->close();
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+ }
|
|
|
+ L1: foreach $oid (Net::SNMP::oid_lex_sort(keys %{$result})) {
|
|
|
+ $line=$result->{$oid};
|
|
|
+ verb("got $oid : $line");
|
|
|
+ # special hack for HP
|
|
|
+ if (defined($o_type) && $o_type eq 'hp' && exists($hp_locale{$line})) {
|
|
|
+ $line = $hp_locale{$result->{$oid}}[0] ."_". $hp_locale{$result->{$oid}}[1];
|
|
|
+ $hp_locale{$result->{$oid}}[1]++;
|
|
|
+ verb("HP hack: interpreting ".$result->{$oid}." as $line");
|
|
|
+ }
|
|
|
+ if (defined($o_perfattr) && $o_perfattr eq '*') {
|
|
|
+ $oid =~ s/$oid_names/$oid_data/;
|
|
|
+ $dataresults{$line} = ["perf", $oid, undef, 0, 0];
|
|
|
+ unshift(@varlist,$oid);
|
|
|
+ verb("match found based on -A '*', now set to retrieve $oid");
|
|
|
+ }
|
|
|
+ foreach $attr (keys %dataresults) {
|
|
|
+ if ($line =~ /$attr/ && !defined($dataresults{$attr}[1])) {
|
|
|
+ $oid =~ s/$oid_names/$oid_data/;
|
|
|
+ $dataresults{$attr}[1] = $oid;
|
|
|
+ unshift(@varlist,$oid) if !defined($varlist[0]) || $varlist[0] ne $oid;
|
|
|
+ verb("match found for $attr, now set to retrieve $oid");
|
|
|
+ next L1;
|
|
|
+ }
|
|
|
+ }
|
|
|
+ }
|
|
|
+}
|
|
|
+else {
|
|
|
+ my $i;
|
|
|
+ for ($i=0;$i<scalar(@ar_sensornames);$i++) {
|
|
|
+ $line=$ar_sensornames[$i];
|
|
|
+ $oid=$ar_sensoroids[$i];
|
|
|
+ if (defined($o_perfattr) && $o_perfattr eq '*') {
|
|
|
+ $dataresults{$line} = ["perf", $oid, undef, 0, 0];
|
|
|
+ unshift(@varlist,$oid);
|
|
|
+ verb("match found based on -A '*', now set to retrieve $oid");
|
|
|
+ }
|
|
|
+ L2: foreach $attr (keys %dataresults) {
|
|
|
+ if ($line =~ /$attr/ && !defined($dataresults{$attr}[1])) {
|
|
|
+ $dataresults{$attr}[1] = $oid;
|
|
|
+ unshift(@varlist,$oid) if !defined($varlist[0]) || $varlist[0] ne $oid;
|
|
|
+ verb("match found for $attr, now set to retrieve $oid");
|
|
|
+ next L2;
|
|
|
+ }
|
|
|
+ }
|
|
|
+ }
|
|
|
+}
|
|
|
+
|
|
|
+# now we actually retrieve the attributes
|
|
|
+my $statuscode = "OK";
|
|
|
+my $statusinfo = "";
|
|
|
+my $statusdata = "";
|
|
|
+my $perfdata = "";
|
|
|
+my $chk = "";
|
|
|
+
|
|
|
+verb("Getting SNMP data for oids" . join(" ",@varlist));
|
|
|
+$result = $session->get_request(
|
|
|
+ -Varbindlist => \@varlist
|
|
|
+);
|
|
|
+if (!defined($result)) {
|
|
|
+ printf("ERROR: Can not retrieve OID(s) %s: %s.\n", join(" ",@varlist), $session->error);
|
|
|
+ $session->close();
|
|
|
+ exit $ERRORS{"UNKNOWN"};
|
|
|
+}
|
|
|
+else {
|
|
|
+ foreach $attr (keys %dataresults) {
|
|
|
+ if (defined($dataresults{$attr}[1]) && defined($$result{$dataresults{$attr}[1]})) {
|
|
|
+ $dataresults{$attr}[2]=convert_temp($$result{$dataresults{$attr}[1]},$o_iunit,$o_ounit);
|
|
|
+ verb("got $dataresults{$attr}[1] : $attr = $dataresults{$attr}[2]");
|
|
|
+ }
|
|
|
+ else {
|
|
|
+ if (defined($o_unkdef)) {
|
|
|
+ $dataresults{$attr}[2]=$o_unkdef;
|
|
|
+ verb("could not find snmp data for $attr, setting to to default value $o_unkdef");
|
|
|
+ }
|
|
|
+ else {
|
|
|
+ verb("could not find snmp data for $attr");
|
|
|
+ }
|
|
|
+ }
|
|
|
+ }
|
|
|
+}
|
|
|
+
|
|
|
+# loop to check if warning & critical attributes are ok
|
|
|
+for ($i=0;$i<scalar(@o_attrL);$i++) {
|
|
|
+ if (defined($dataresults{$o_attrL[$i]}[2])) {
|
|
|
+ if ($chk = check_threshold($o_attrL[$i],$dataresults{$o_attrL[$i]}[2],$o_critL[$i],$o_ounit)) {
|
|
|
+ $dataresults{$o_attrL[$i]}[3]++;
|
|
|
+ $statuscode = "CRITICAL";
|
|
|
+ $statusinfo .= $chk;
|
|
|
+ }
|
|
|
+ elsif ($chk = check_threshold($o_attrL[$i],$dataresults{$o_attrL[$i]}[2],$o_warnL[$i],$o_ounit)) {
|
|
|
+ $dataresults{$o_attrL[$i]}[3]++;
|
|
|
+ $statuscode="WARNING" if $statuscode eq "OK";
|
|
|
+ $statusinfo .= $chk;
|
|
|
+ }
|
|
|
+ if ($dataresults{$o_attrL[$i]}[3]==0) {
|
|
|
+ $dataresults{$o_attrL[$i]}[3]++;
|
|
|
+ $statusdata .= "," if ($statusdata);
|
|
|
+ $statusdata .= " " . $o_attrL[$i] . " Temperature is " . $dataresults{$o_attrL[$i]}[2] . $o_ounit;
|
|
|
+ }
|
|
|
+ if (defined($o_perf) && $dataresults{$o_attrL[$i]}[4]==0 &&
|
|
|
+ defined($o_warnL[$i][5]) && defined($o_critL[$i][5])) {
|
|
|
+ $dataresults{$o_attrL[$i]}[4]++;
|
|
|
+ $perfdata .= " " . $o_attrL[$i] . "=" . $dataresults{$o_attrL[$i]}[2];
|
|
|
+ $perfdata .= ';' if $o_warnL[$i][5] ne '' || $o_critL[$i][5] ne '';
|
|
|
+ $perfdata .= $o_warnL[$i][5] if $o_warnL[$i][5] ne '';
|
|
|
+ $perfdata .= ';'.$o_critL[$i][5] if $o_critL[$i][5] ne '';
|
|
|
+ }
|
|
|
+ }
|
|
|
+ else {
|
|
|
+ $statusdata .= "," if ($statusdata);
|
|
|
+ $statusdata .= " $o_attrL[$i] data is missing";
|
|
|
+ $statuscode = "UNKNOWN" if $statuscode eq "OK";
|
|
|
+ }
|
|
|
+}
|
|
|
+
|
|
|
+# add data for performance-only attributes
|
|
|
+if (defined($o_perfattr) && $o_perfattr eq '*') {
|
|
|
+ foreach $attr (keys %dataresults) {
|
|
|
+ if ($dataresults{$attr}[0] eq "perf" && defined($dataresults{$attr}[2]) && $dataresults{$attr}[4]==0) {
|
|
|
+ $dataresults{$attr}[4]++;
|
|
|
+ $perfdata .= " " . $attr . "=" . $dataresults{$attr}[2];
|
|
|
+ }
|
|
|
+ }
|
|
|
+}
|
|
|
+else {
|
|
|
+ for ($i=0;$i<scalar(@o_perfattrL);$i++) {
|
|
|
+ if (defined($dataresults{$o_perfattrL[$i]}[2]) && $dataresults{$o_perfattrL[$i]}[4]==0) {
|
|
|
+ $dataresults{$o_perfattrL[$i]}[4]++;
|
|
|
+ $perfdata .= " " . $o_perfattrL[$i] . "=" . $dataresults{$o_perfattrL[$i]}[2];
|
|
|
+ }
|
|
|
+ }
|
|
|
+}
|
|
|
+
|
|
|
+$session->close;
|
|
|
+print $statuscode . $statusinfo;
|
|
|
+print " -".$statusdata if $statusdata;
|
|
|
+print " |".$perfdata if $perfdata;
|
|
|
+print "\n";
|
|
|
+
|
|
|
+exit $ERRORS{$statuscode};
|