-
Notifications
You must be signed in to change notification settings - Fork 57
/
check_memcached.pl
executable file
·993 lines (946 loc) · 44.7 KB
/
check_memcached.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
#!/usr/bin/perl -w
#
# ============================== SUMMARY =====================================
#
# Program : check_memcached.pl
# Version : 0.6
# Date : Apr 6, 2012
# Author : William Leibzon - william@leibzon.org
# Licence : GPL - summary below, full text at http://www.fsf.org/licenses/gpl.txt
#
# =========================== PROGRAM LICENSE =================================
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
#
# ===================== INFORMATION ABOUT THIS PLUGIN =========================
#
# This is Memcached Check plugin. It gets stats variables and allows to set thresholds
# on their value or their rate of change. It can measure response time, calculate
# hitrate, memory utilization and other data. The plugin is based on check_mysqld.pl.
#
# It also returns status variables as perfomance data for further nagios 2.0
# post-processing, you can find graph templates NagiosGrapher & PNP4Nagios at:
# http://william.leibzon.org/nagios/
#
# This program is written and maintained by:
# William Leibzon - william(at)leibzon.org
#
# ============================= SETUP NOTES ====================================
#
# Make sure to install perl Cache::Memcached library from CPAN first.
#
# This plugin checks Memcached and measures response which can be used for
# threshold checks. It also retrieves various statistics data available with
# memcache 'stats' command (what you get when you telnet to the port and
# do 'stats') and allows to set thresholds either on their direct values
# or on rate of change of those variables. Plugin also calculates other useful
# statistics like Hitrate (calculated on rate of change unlike all other plugins
# that do it based on totals for all the time) and Memory Utilization and allows
# to set thresholds on their values. All variables can be returned back as
# performance data for graphing and pnp4nagios template should be available
# with this plugin on the same site you downloaded it from.
#
# For help on what parameters this plugin accepts you can just do
# ./check_memcached.pl --help
#
# 1. Connection Parameters
#
# Plugin currently does not support authentication so the only connection
# parameters are "-H hostname" and "-p port". The default port is 11211
# but you must specify hotname (if localhost specify it as -H 127.0.0.1)
#
# 2. Response Time, HitRate, Memory Utilization
#
# To get response time you use "-T" or "--response_time" option. By itself
# it will cause output of respose time at the status line. You can also us
# it as "-T warn,crit" to specify warning and critical thresholds.
#
# To get hitrate the option needed is "-R" or "--hitrate". If previous
# performance data is not feed to plugin (-P option, see below) the plugin
# calculates it as total hitrate over life of memcached process. If -P
# is specified and previous performance data is feed back, the data is
# based on real hitrate with lifei-long info also given in paramphesis.
# As with -T you can specify -R by itself or with thresholds as -R warn,crit
#
# Memory utilization corresponds to what some others call "size". This is
# percent of max memory currently in use. The option is -U or --utilization
# and as you probably guessed can be used by itself or as -U warn,crit
#
# 3. Memcache Statistics Variables and calculating their Rate of Change
#
# All statistics variables from memcached 'stats' can be checked with the plugin.
# And as some people know there are actually several stats arrays in memcached.
# By default the plugin will get statistics for 'misc' and 'malloc'. You can
# specify a list of statistics array names (corresponding to 'stats name'
# command in memcached) with -s or --stats command. Known arrays are:
# misc, malloc, sizes, maps, cachedump, slabs, items
# And example of trying to retrieve all of them is:
# -s misc,malloc,sizes,maps,cachedump,slabs,items
# However not all of them will have data in your system and arrays like
# sizes provide too much datai (how many items stored on each size)
# for standard use.
#
# To see stat variables in plugin status output line and or specify thresholds
# based on their values you would use -a or --variables argument. For example:
# -a curr_connections,evictions
# You must specify same number of warning and critical thresholds with
# -w or --warn and -c or --crit argument as a number of variables specified
# in -a. If you simply want variable values on status without checking their value
# then either use ~ in place of threshold value or nothing at all. For example:
# -a curr_connections,evictions -w ~,~ -c ~,~
# OR -a curr_connections,evictions -w , -c ,
#
# If you want to check rate of change rather than actual value you can do this
# by specifying it as '&variable' such as "&total_connections" which is similar
# to 'curr_connections'. By default it would be reported in the output as
# '&Delta_variable' and as nagios removed '&' symbol you probably will
# see it as just "Delta_variable" unless you changed nagios.cfg and removed '&'
# from 'illegal_macro_output_chars'. As an alternative you can specify how to
# label these with -L or --rate_label option which specify prefix and/or suffix
# For example '-L dt_' would have the output being "dt_total_connections'
# and '-L ,_rate' would result in 'total_connections_rate' for the name.
# You can use these creates names in -a as well, for example:
# -L ,_rate -a total_connections_rate -w 1000 -c ~
#
# Now in order to be able to calculate rate of change, the plugin needs to
# know values of the variables from when it was run the last time. This
# is done by feeding it previous performance data with a -P option.
# In commands.cfg this would be specified as:
# -P "$SERVICEPERFDATA$"
# And don't forget the quotes, in this case they are not just for documentation.
#
# 4. Threshold Specification
#
# The plugin fully supports Nagios plug-in specification for specifying thresholds:
# http://nagiosplug.sourceforge.net/developer-guidelines.html#THRESHOLDFORMAT
#
# And it supports an easier format with the following one-letter prefix modifiers:
# >value : issue alert if data is above this value (default for numeric value)
# <value : issue alert if data is below this value (must be followed by number)
# =value : issue alert if data is equal to this value (default for non-numeric)
# !value : issue alert if data is NOT equal to this value
#
# There are also two two specifications of range formats:
# number1:number2 issue alert if data is OUTSIDE of range [number1..number2]
# i.e. alert if data<$number1 or data>$number2
# @number1:number2 issue alert if data is WITHIN range [number1..number2]
# i.e. alert if data>=$number and $data<=$number2
#
# The plugin will attempt to check that WARNING values is less than CRITICAL
# (or greater for <). A special prefix modifier '^' can also be used to disable
# checking that warn values are less then (or greater then) critical values.
# A quick example of such special use is '--warn=^<100 --crit=>200' which means
# warning alert if value is < 100 and critical alert if its greater than 200.
#
# 5. Performance Data
#
# Using '-f' option causes values of all variables you specified in -a as
# well as response time from -T, hitrate from -R and memory use from -U
# to go out as performance data for Nagios graphing programs that can use it.
#
# You may also directly specify which variables are to be return as performance data
# and with '-A' option. If you use '-A' by itself and not specify any variables or
# use special special value of '*' (as in '-A *') the plugin will output all variables.
#
# The plugin will output threshold values as part of performance data as specified at
# http://nagiosplug.sourceforge.net/developer-guidelines.html#AEN201
# And don't worry about using non-standard >,<,=,~ prefixes, all of that would get
# converted into nagios threshold for performance output
#
# The plugin is smart enough to add 'c' suffix for known COUNTER variables to
# values in performance data. Known variables are specifed in an array you can
# find at the top of the code (further below) and plugin author does not claim
# to have identified all variables correctly. Please email if you find an error
# or want to add more variables.
#
# As noted above performance data is also used to calcualte rate of change
# by feeding it back with -P option. In that regard even if you did not specify
# -f or -A but you have specified &variable, its actual data would be sent out
# in performance output. Additionally last time plugin was run is also in
# performance data as special _ptime variable.
#
# 6. Example of Nagios Config Definitions
#
# Sample command and service definitions are below:
#
# define command {
# command_name check_memcached
# command_line $USER1$/check_memcached.pl -H $HOSTADDRESS$ -p $ARG1$ -T $ARG2$ -R $ARG3$ -U $ARG4$ -a curr_connections,evictions -w ~,~ -c ~,~ -f -A 'utilization,hitrate,response_time,curr_connections,evictions,cmd_set,bytes_written,curr_items,uptime,rusage_system,get_hits,total_connections,get_misses,bytes,time,connection_structures,total_items,limit_maxbytes,rusage_user,cmd_get,bytes_read,threads,rusage_user_ms,rusage_system_ms,cas_hits,conn_yields,incr_misses,decr_misses,delete_misses,incr_hits,decr_hits,delete_hits,cas_badval,cas_misses,cmd_flush,listen_disabled_num,accepting_conns,pointer_size,pid' -P "$SERVICEPERFDATA$"
# }
#
# Arguments and thresholds are:
# ARG1 : Port
# ARG2 : Hitrate Threshold. Below it is <60% for warning, <30% for critical
# ARG3 : Response Time Threshold. Below it is >0.1s for WARNING, >0.2s for critical
# ARG4 : Utilization/Size Threshold. Below it is >95% for warning, >98% for critical
#
# define service {
# use prod-service
# service_description Memcached: Port 11212
# check_command check_memcached!11212!'>0.1,>0.2'!'<60,<30'!'>95,>98'
# hostgroups memcached
# }
#
# Example of command-line use:
# /usr/lib/nagios/plugins/check_memcached.pl -H localhost -a 'curr_connections,evications' -w ~,~ -c ~,~ -s misc,malloc,sizes -U -A -R -T -f -v
#
# In above the -v option means "verbose" and with it plugin will output some debugging
# information about what it is doing. The option is not intended to be used when plugin
# is called from nagios itself.
#
# ======================= VERSION HISTORY and TODO ================================
#
# The plugins is written by reusing code my check_mysqld.pl which similarly to
# this plugin allows to get STATUS variables and use these for nagios tests.
# check_mysqld.pl has history going back to 2004.
#
# [0.5 - Mar 2012] First version of the code based on check_mysqld.pl 0.93
# This is being released as 0.5 because its coming from
# a very mature code of check_mysqld and has a lot of options
# If there are no major issues found with this plugin, next
# version will be 1.0
# [0.6 - Apr 2012] Added support for re using old performance data to calculate
# rate of change for certain variables. This also changes how
# hitrate is calcualted as now if previous performance data
# is available, hitrate would be #misses/#total from last check
# rather than #misses/#total from start of statistics.
#
# TODO or consider for future:
#
# 1. In plans are to allow long options to specify thresholds for known variables.
# These would mean you specify '--cur_connections' in similar way to '--hitrate'
# Internally these would be convered into -A, -w, -c as appropriate an used
# together with these options. So in practice it will now allow to get any data
# just a different way to specify options for this plugin.
#
# 2. This is currently the most advanced form of code shared by number of my plugins
# such as chec_mysqld.pl, check_netstat.pl, check_snmp_temperature.pl and others.
# Since its getting tiresome to have to port codde from one plugin to another
# when new features are added to common code, the plans are to actually create
# a library (basically alternative to Nagios::Plugin, this plugin by itself
# already has 100% what is in that library and more).
#
# 3. Currently I have no TODO for memcached itself. But perhaps other users
# can recommand a new feature to be added here. If so please email me at
# william@leibzon.org.
# And don't worry, I'm not a company with sme hidden agenda to use your idea
# but an actual person who you can easily get hold of by email, find on forums
# and on Nagios conferences. More info on my nagios work is at:
# http://william.leibzon.org/nagios/
# Above also should have PNP4Nagios template for check_memcached.pl if you
# did not get it from the place you downloaded this plugin from.
#
# ============================ START OF PROGRAM CODE =============================
use strict;
use IO::Socket;
use Cache::Memcached;
use Getopt::Long qw(:config no_ignore_case);
# default mysql hostname, port, database, user and password, see NOTES above
my $HOSTNAME= 'localhost';
my $PORT= 11211;
# Add path to additional libraries if necessary
use lib '/usr/lib/nagios/plugins';
our $TIMEOUT;
our %ERRORS;
eval 'use utils qw(%ERRORS $TIMEOUT)';
if ($@) {
$TIMEOUT = 20;
%ERRORS = ('OK'=>0,'WARNING'=>1,'CRITICAL'=>2,'UNKNOWN'=>3,'DEPENDENT'=>4);
}
my $Version='0.6';
# This is a list of known statistics variables (plus few variables added by plugin),
# used in order to desinate COUNTER variables with 'c' in perfout for graphing programs
my %KNOWN_STATUS_VARS = (
'utilization' => [ 'GAUGE', '%' ], # calculated by plugin
'hitrate' => [ 'GAUGE', '%' ], # calculated by plugin
'response_time' => [ 'GAUGE', 's' ], # measured by plugin
'curr_connections' => [ 'GAUGE', '' ],
'evictions' => [ 'COUNTER', 'c' ],
'bytes' => [ 'GAUGE', 'B' ],
'connection_structures' => [ 'GAUGE', '' ],
'time' => [ 'COUNTER', 's' ],
'total_items' => [ 'COUNTER', 'c' ],
'cmd_set' => [ 'COUNTER', 'c' ],
'bytes_written' => [ 'COUNTER', 'c' ],
'curr_items' => [ 'GAUGE', '' ],
'limit_maxbytes' => [ 'GAUGE', 'B' ],
'uptime' => [ 'COUNTER', 's' ],
'rusage_user' => [ 'COUNTER', 's' ],
'cmd_get' => [ 'COUNTER', 'c' ],
'rusage_system' => [ 'COUNTER', 's' ],
'get_hits' => [ 'COUNTER', 'c' ],
'bytes_read' => [ 'COUNTER', 'c' ],
'threads' => [ 'GAUGE', '' ],
'rusage_user_ms' => [ 'COUNTER', 'c' ], # this is round(rusage_user*1000)
'rusage_system_ms' => [ 'COUNTER', 'c' ], # this is round(rusage_system*1000)
'total_connections' => [ 'COUNTER', 'c' ],
'get_misses' => [ 'COUNTER', 'c' ],
'total_free' => [ 'GAUGE', 'B' ],
'releasable_space' => [ 'GAUGE', 'B' ],
'free_chunks' => [ 'GAUGE', '' ],
'fastbin_blocks' => [ 'GAUGE', '' ],
'arena_size' => [ 'GAUGE', '' ],
'total_alloc' => [ 'GAUGE', 'B' ],
'max_total_alloc' => [ 'GAUGE', '' ],
'mmapped_regions' => [ 'GAUGE', '' ],
'mmapped_space' => [ 'GAUGE', '' ],
'fastbin_space' => [ 'GAUGE', '' ],
'auth_cmds' => [ 'COUNTER', 'c' ],
'auth_errors' => [ 'COUNTER', 'c' ],
);
# ============= MAIN PROGRAM CODE - DO NOT MODIFY BELOW THIS LINE ==============
my $o_host= undef; # hostname
my $o_port= undef; # port
my $o_help= undef; # help option
my $o_verb= undef; # verbose mode
my $o_version= undef; # version info option
my $o_variables=undef; # list of variables for warn and critical
my @o_varsL= (); # array from above list
my $o_perfvars= undef; # list of variables to include in perfomance data
my @o_perfvarsL=(); # array from above list
my $o_warn= undef; # warning level option
my @o_warnL= (); # array of warn data processing threshold
my $o_crit= undef; # Critical level option
my @o_critL= (); # array of critical data processing thresholds
my $o_perf= undef; # Performance data option
my $o_timeout= undef; # Timeout to use - note that normally timeout is take from nagios anyway
my $o_mdsopt= undef; # Stat List to get data for
my @o_mdslist= ('misc','malloc'); # Default List, if -S option is entered, this is replaced
my $o_timecheck=undef; # threshold spec for connection time
my $o_hitrate= undef; # threshold spec for hitrate%
my $o_utilsize= undef; # threshold spec for utilization%
my $o_prevperf= undef; # performance data given with $SERVICEPERFDATA$ macro
my $o_prevtime= undef; # previous time plugin was run $LASTSERVICECHECK$ macro
my $o_ratelabel=undef; # prefix and suffix for creating rate variables
my $o_rsuffix='';
my $o_rprefix="&Delta_"; # default prefix
## Additional global variables
my $memd= undef; # DB connection object
my %prev_perf= (); # array that is populated with previous performance data
my @prev_time= (); # timestamps if more then one set of previois performance data
my $perfcheck_time=undef; # time when data was last checked
sub p_version { print "check_memcached.pl version : $Version\n"; }
sub print_usage {
print "Usage: $0 [-v] -H <host> [-p <port>] [-s <memcache stat arrays>] [-a <memcache statistics variables> -w <variables warning thresholds> -c <variables critical thresholds>] [-A <performance output variables>] [-L <ratevar-prefix>[,<ratevar-suffix>]] [-T [conntime_warn,conntime_crit]] [-R [hitrate_warn,hitrate_crit]] [-U [utilization_size_warn,utilization_size_crit]] [-f] [-T <timeout>] [-V] [-P <previous performance data in quoted string>]\n";
print "For more details on options do: $0 --help\n";
}
sub help {
print "\nMemcache Database Check for Nagios version ",$Version,"\n";
print " by William Leibzon - william(at)leibzon.org\n\n";
print "This monitoring plugin lets you do threshold checks on some status variables\n";
print "which are also returned as performance output for graphing.\n\n";
print_usage();
print <<EOT;
-v, --verbose
print extra debugging information
-h, --help
Print this detailed help screen
-H, --hostname=ADDRESS
Hostname or IP Address to check
-p, --port=INTEGER
port number (default: 3306)
-t, --timeout=NUMBER
Allows to set timeout for execution of this plugin. This overrides nagios default.
-s, --stat=<list of stat arrays>
This allows to list stat arrays that would be queried (separated by ',').
Supported memcache statistics array are:
misc, malloc, sizes, maps, cachedump, slabs, items
If this option is not specified, the plugin will check only 'misc' and 'malloc'
-a, --variables=STRING[,STRING[,STRING...]]
List of variables from memcache statistics data to do threshold checks on.
The default (if option is not used) is not to monitor any variable.
The variable name should be prefixed with '&' to chec its rate of
change over time rather than actual value.
-w, --warn=STR[,STR[,STR[..]]]
This option can only be used if '--variables' (or '-a') option above
is used and number of values listed here must exactly match number
of variables specified with '-a'. The values specify warning threshold
for when Nagios should send WARNING alert. These values are usually
numbers and can have the following prefix modifiers:
> - warn if data is above this value (default for numeric values)
< - warn if data is below this value (must be followed by number)
= - warn if data is equal to this value (default for non-numeric values)
! - warn if data is not equal to this value
~ - do not check this data (must not be followed by number or ':')
^ - for numeric values this disables check that warning < critical
Threshold values can also be specified as range in two forms:
num1:num2 - warn if data is outside range i.e. if data<num1 or data>num2
\@num1:num2 - warn if data is in range i.e. data>=num1 && data<=num2
-c, --crit=STR[,STR[,STR[..]]]
This option can only be used if '--variables' (or '-a') option above
is used and number of values listed here must exactly match number of
variables specified with '-a'. The values specify critical threshold
for when Nagios should send CRITICAL alert. The format is exactly same
as with -w option except no '^' prefix.
-R, --hitrate=[WARN,CRIT]
Calculates Hitrate %: cache_miss/(cache_hits+cache_miss). If this is used
as just -R then this info just goes to output line. With '-R -f' these
go as performance data. You can also specify values for this parameter,
these are interprted as WARNING and CRITICAL thresholds (separated by ',').
The format for WARN and CRIT is same as what you would use in -w and -c.
-U, --utilization=[WARN,CRIT]
This calculates percent of space in use, which is bytes/limit_maxbytes
In some other places this is called size, but since this plugin can
actually get objects of different size, utilization is more appropriate.
If you specify -U by itself, the plugin will just output this info,
with '-f' it will also include it in performance data. You can also specify
parameter value which are interpreted as WARNING and CRITICAL thresholds.
-T, --response_time=[WARN,CRIT]
If this is used as just -T the plugin will measure and output connection
response time in seconds. With -f this would also be provided on perf variables.
You can also specify values for this parameter, these are interprted as
WARNING and CRITICAL thresholds (separated by ',').
-f, --perfparse
This should only be used with '-a' and causes variable data not only as part of
main status line but also as perfparse compatible output (for graphing, etc).
-A, --perfvars=[STRING[,STRING[,STRING...]]]
This allows to list variables which values will go only into perfparse
output (and not for threshold checking). The option by itself (emply value)
is same as a special value '*' and specify to output all variables.
-P, --prev_perfdata
Previous performance data (normally put '-P \$SERVICEPERFDATA\$' in nagios
command definition). This is used to calculate rate of change for counter
statistics variables and for proper calculation of hitrate.
-L, --rate_label=[PREFIX_STRING[,SUFFIX_STRING]]
Lael
-V, --version
Prints version number
EOT
}
# For verbose output
sub verb { my $t=shift; print $t,"\n" if defined($o_verb) ; }
# Return true if arg is a number
sub isnum {
my $num = shift;
if (defined($num) && $num =~ /^[-|+]?((\d+\.?\d*)|(^\.\d+))$/ ) { return 1 ;}
return 0;
}
# load previous performance data
sub process_perf {
my %pdh;
my ($nm,$dt);
foreach (split(' ',$_[0])) {
if (/(.*)=(.*)/) {
($nm,$dt)=($1,$2);
verb("prev_perf: $nm = $dt");
# in some of my plugins time_ is to profile execution time for part of plugin
# $pdh{$nm}=$dt if $nm !~ /^time_/;
$pdh{$nm}=$dt;
$pdh{$nm}=$1 if $dt =~ /(\d+)[cs]/; # 'c' or 's' maybe added
# support for more than one set of previously cached performance data
# push @prev_time,$1 if $nm =~ /.*\.(\d+)/ && (!defined($prev_time[0]) || $prev_time[0] ne $1);
}
}
return %pdh;
}
# this function is used when checking data against critical and warn values
sub check_threshold {
my ($attrib, $data, $th_array) = @_;
my $mod = $th_array->[0];
my $lv1 = $th_array->[1];
my $lv2 = $th_array->[2];
# verb("debug check_threshold: $mod : ".(defined($lv1)?$lv1:'')." : ".(defined($lv2)?$lv2:''));
return "" if !defined($lv1) || ($mod eq '' && $lv1 eq '');
return " " . $attrib . " is " . $data . " = " . $lv1 if $mod eq '=' && $data eq $lv1;
return " " . $attrib . " is " . $data . " != " . $lv1 if $mod eq '!' && $data ne $lv1;
return " " . $attrib . " is " . $data . " > " . $lv1 if $mod eq '>' && $data>$lv1;
return " " . $attrib . " is " . $data . " > " . $lv2 if $mod eq ':' && $data>$lv2;
return " " . $attrib . " is " . $data . " >= " . $lv1 if $mod eq '>=' && $data>=$lv1;
return " " . $attrib . " is " . $data . " < " . $lv1 if ($mod eq '<' || $mod eq ':') && $data<$lv1;
return " " . $attrib . " is " . $data . " <= " . $lv1 if $mod eq '<=' && $data<=$lv1;
return " " . $attrib . " is " . $data . " in range $lv1..$lv2" if $mod eq '@' && $data>=$lv1 && $data<=$lv2;
return "";
}
# this function is called when parsing threshold options data
sub parse_threshold {
my $thin = shift;
# link to an array that holds processed threshold data
# array: 1st is type of check, 2nd is threshold value or value1 in range, 3rd is value2 in range, 4th is option, 5th is nagios spec string representation for perf out
my $th_array = [ '', undef, undef, '', '' ];
my $th = $thin;
my $at = '';
$at = $1 if $th =~ s/^(\^?[@|>|<|=|!]?~?)//; # check mostly for my own threshold format
$th_array->[3]='^' if $at =~ s/\^//; # deal with ^ option
$at =~ s/~//; # ignore ~ if it was entered
if ($th =~ /^\:([-|+]?\d+\.?\d*)/) { # :number format per nagios spec
$th_array->[1]=$1;
$th_array->[0]=($at !~ /@/)?'>':'<=';
$th_array->[5]=($at != /@/)?('~:'.$th_array->[1]):($th_array->[1].':');
}
elsif ($th =~ /([-|+]?\d+\.?\d*)\:$/) { # number: format per nagios spec
$th_array->[1]=$1;
$th_array->[0]=($at !~ /@/)?'<':'>=';
$th_array->[5]=($at != /@/)?'':'@';
$th_array->[5].=$th_array->[1].':';
}
elsif ($th =~ /([-|+]?\d+\.?\d*)\:([-|+]?\d+\.?\d*)/) { # nagios range format
$th_array->[1]=$1;
$th_array->[2]=$2;
if ($th_array->[1] > $th_array->[2]) {
print "Incorrect format in '$thin' - in range specification first number must be smaller then 2nd\n";
print_usage();
exit $ERRORS{"UNKNOWN"};
}
$th_array->[0]=($at !~ /@/)?':':'@';
$th_array->[5]=($at != /@/)?'':'@';
$th_array->[5].=$th_array->[1].':'.$th_array->[2];
}
if (!defined($th_array->[1])) { # my own format (<,>,=,!)
$th_array->[0] = ($at eq '@')?'<=':$at;
$th_array->[1] = $th;
$th_array->[5] = '~:'.$th_array->[1] if ($th_array->[0] eq '>' || $th_array->[0] eq '>=');
$th_array->[5] = $th_array->[1].':' if ($th_array->[0] eq '<' || $th_array->[0] eq '<=');
$th_array->[5] = '@'.$th_array->[1].':'.$th_array->[1] if $th_array->[0] eq '=';
$th_array->[5] = $th_array->[1].':'.$th_array->[1] if $th_array->[0] eq '!';
}
if ($th_array->[0] =~ /[>|<]/ && !isnum($th_array->[1])) {
print "Numeric value required when '>' or '<' are used !\n";
print_usage();
exit $ERRORS{"UNKNOWN"};
}
# verb("debug parse_threshold: $th_array->[0] and $th_array->[1]");
$th_array->[0] = '=' if !$th_array->[0] && !isnum($th_array->[1]) && $th_array->[1] ne '';
if (!$th_array->[0] && isnum($th_array->[1])) { # this is just the number by itself, becomes 0:number check per nagios guidelines
$th_array->[2]=$th_array->[1];
$th_array->[1]=0;
$th_array->[0]=':';
$th_array->[5]=$th_array->[2];
}
return $th_array;
}
# this function checks that for numeric data warn threshold is within range of critical
# where within range depends on actual threshold spec and normally just means less
sub threshold_specok {
my ($warn_thar,$crit_thar) = @_;
return 1 if defined($warn_thar) && defined($warn_thar->[1]) &&
defined($crit_thar) && defined($crit_thar->[1]) &&
isnum($warn_thar->[1]) && isnum($crit_thar->[1]) &&
$warn_thar->[0] eq $crit_thar->[0] &&
(!defined($warn_thar->[3]) || $warn_thar->[3] !~ /\^/) &&
(!defined($crit_thar->[3]) || $crit_thar->[3] !~ /\^/) &&
(($warn_thar->[1]>$crit_thar->[1] && ($warn_thar->[0] =~ />/ || $warn_thar->[0] eq '@')) ||
($warn_thar->[1]<$crit_thar->[1] && ($warn_thar->[0] =~ /</ || $warn_thar->[0] eq ':')) ||
($warn_thar->[0] eq ':' && $warn_thar->[2]>=$crit_thar->[2]) ||
($warn_thar->[0] eq '@' && $warn_thar->[2]<=$crit_thar->[2]));
return 0; # return with 0 means specs check out and are ok
}
# parse command line options
sub check_options {
Getopt::Long::Configure ("bundling");
GetOptions(
'v' => \$o_verb, 'verbose' => \$o_verb,
'h' => \$o_help, 'help' => \$o_help,
'H:s' => \$o_host, 'hostname:s' => \$o_host,
'p:i' => \$o_port, 'port:i' => \$o_port,
't:i' => \$o_timeout, 'timeout:i' => \$o_timeout,
'V' => \$o_version, 'version' => \$o_version,
's:s' => \$o_mdsopt, 'stat:s' => \$o_mdsopt,
'a:s' => \$o_variables, 'variables:s' => \$o_variables,
'c:s' => \$o_crit, 'critical:s' => \$o_crit,
'w:s' => \$o_warn, 'warn:s' => \$o_warn,
'f:s' => \$o_perf, 'perfparse:s' => \$o_perf,
'A:s' => \$o_perfvars, 'perfvars:s' => \$o_perfvars,
'T:s' => \$o_timecheck, 'response_time:s' => \$o_timecheck,
'R:s' => \$o_hitrate, 'hitrate:s' => \$o_hitrate,
'U:s' => \$o_utilsize, 'utilization:s' => \$o_utilsize,
'P:s' => \$o_prevperf, 'prev_perfdata:s' => \$o_prevperf,
'E:s' => \$o_prevtime, 'prev_checktime:s'=> \$o_prevtime,
'L:s' => \$o_ratelabel, 'rate_label:s' => \$o_ratelabel,
);
if (defined($o_help)) { help(); exit $ERRORS{"UNKNOWN"} };
if (defined($o_version)) { p_version(); exit $ERRORS{"UNKNOWN"} };
if (!defined($o_host)) { print "Please specify hostname (-H)\n"; print_usage(); exit $ERRORS{"UNKNOWN"}; }
@o_mdslist=split(/,/, lc $o_mdsopt) if defined($o_mdsopt) && $o_mdsopt ne '';
($o_rprefix,$o_rsuffix)=split(/,/, lc $o_ratelabel) if defined($o_ratelabel) && $o_ratelabel ne '';
# below code is common for number of my plugins, including check_snmp_?, netstat, etc
# it is mostly compliant with nagios threshold specification (except use of '~')
# and adds number of additional format options using '>','<','!','=' prefixes
my (@ar_warnLv,@ar_critLv);
@o_perfvarsL=split( /,/ , lc $o_perfvars ) if defined($o_perfvars) && $o_perfvars ne '*';
$o_perfvars='*' if defined($o_perfvars) && scalar(@o_perfvarsL)==0;
for (my $i=0; $i<scalar(@o_perfvarsL); $i++) {
$o_perfvarsL[$i] = '&'.$1 if $o_perfvarsL[$i] =~ /^$o_rprefix(.*)$o_rsuffix$/;
}
if (defined($o_warn) || defined($o_crit) || defined($o_variables) || (defined($o_timecheck) && $o_timecheck ne '') || (defined($o_hitrate) && $o_hitrate ne '')) {
if (defined($o_variables)) {
@o_varsL=split( /,/ , lc $o_variables );
if (defined($o_warn)) {
$o_warn.="~" if $o_warn =~ /,$/;
@ar_warnLv=split( /,/ , lc $o_warn );
}
if (defined($o_crit)) {
$o_crit.="~" if $o_crit =~ /,$/;
@ar_critLv=split( /,/ , lc $o_crit );
}
}
elsif (!defined($o_timecheck) && !defined($o_hitrate)) {
print "Specifying warning and critical levels requires '-a' parameter with list of STATUS variables\n";
print_usage();
exit $ERRORS{"UNKNOWN"};
}
if (defined($o_timecheck) && $o_timecheck ne '') {
my @o_timeth=split(/,/, lc $o_timecheck);
verb("Processing timecheck thresholds: $o_timecheck");
if (scalar(@o_timeth)!=2) {
printf "Incorrect value '%s' for Connection Time Thresholds. Connection time threshold must include both warning and critical thresholds separated by ','\n", $o_timecheck;
print_usage();
exit $ERRORS{"UNKNOWN"};
}
unshift(@o_varsL,"response_time");
unshift(@ar_warnLv,$o_timeth[0]);
unshift(@ar_critLv,$o_timeth[1]);
}
if (defined($o_hitrate) && $o_hitrate ne '') {
my @o_hrate=split(/,/, lc $o_hitrate);
verb("Processing hitrate thresholds: $o_hitrate");
if (scalar(@o_hrate)!=2) {
printf "Incorrect value '%s' for Hitrate Threshold. You must include both warning and critical thresholds separated by ','\n", $o_hitrate;
print_usage();
exit $ERRORS{"UNKNOWN"};
}
unshift(@o_varsL,"hitrate");
unshift(@ar_warnLv,$o_hrate[0]);
unshift(@ar_critLv,$o_hrate[1]);
}
if (defined($o_utilsize) && $o_utilsize ne '') {
my @o_usize=split(/,/, lc $o_utilsize);
verb("Processing utilization thresholds: $o_utilsize");
if (scalar(@o_usize)!=2) {
printf "Incorrect value '%s' for Utilization Threshold. You must include both warning and critical thresholds separated by ','\n", $o_utilsize;
print_usage();
exit $ERRORS{"UNKNOWN"};
}
unshift(@o_varsL,"utilization");
unshift(@ar_warnLv,$o_usize[0]);
unshift(@ar_critLv,$o_usize[1]);
}
if (scalar(@ar_warnLv)!=scalar(@o_varsL) || scalar(@ar_critLv)!=scalar(@o_varsL)) {
printf "Number of specified warning levels (%d) and critical levels (%d) must be equal to the number of attributes specified at '-a' (%d). If you need to ignore some attribute do it as ',,'\n", scalar(@ar_warnLv), scalar(@ar_critLv), scalar(@o_varsL);
verb("Warning Levels: ".join(",",@ar_warnLv));
verb("Critical Levels: ".join(",",@ar_critLv));
print_usage();
exit $ERRORS{"UNKNOWN"};
}
for (my $i=0; $i<scalar(@o_varsL); $i++) {
$o_varsL[$i] = '&'.$1 if $o_varsL[$i] =~ /^$o_rprefix(.*)$o_rsuffix$/; # always lowercase here
if ($o_varsL[$i] =~ /^&(.*)/) {
if (!defined($o_prevperf)) {
print "Calculating rate variable such as ".$o_varsL[$i]." requires previous performance data. Please add '-P \$SERVICEPERFDATA\$' to your nagios command line.\n";
print_usge();
exit $ERRORS{"UNKNOWN"};
}
if (defined($KNOWN_STATUS_VARS{$1}) && $KNOWN_STATUS_VARS{$1}[0] ne 'COUNTER') {
print "$1 is not a COUNTER variable for which rate of changee should be calculated\n";
print_usage();
exit $ERRORS{"UNKNOWN"};
}
}
$o_warnL[$i] = parse_threshold($ar_warnLv[$i]);
$o_critL[$i] = parse_threshold($ar_critLv[$i]);
if (threshold_specok($o_warnL[$i],$o_critL[$i])) {
print "All numeric warning values must be less then critical (or greater then when '<' is used)\n";
print "Note: to override this check prefix warning value with ^\n";
print_usage();
exit $ERRORS{"UNKNOWN"};
}
}
}
if (defined($o_prevperf)) {
if (defined($o_perf)) {
%prev_perf=process_perf($o_prevperf);
# put last time nagios was checked in timestamp array
if (defined($prev_perf{_ptime})) {
# push @prev_time, $prev_perf{ptime};
$perfcheck_time=$prev_perf{_ptime};
}
elsif (defined($o_prevtime)) {
# push @prev_time, $o_prevtime;
# $prev_perf{ptime}=$o_prevtime;
$perfcheck_time=$o_prevtime;
}
else {
# @prev_time=();
$perfcheck_time=undef;
}
# numeric sort for timestamp array (this is from lowest time to highiest, i.e. to latest)
# my %ptimes=();
# $ptimes{$_}=$_ foreach @prev_time;
# @prev_time = sort { $a <=> $b } keys(%ptimes);
}
else {
print "need -f option first \n"; print_usage(); exit $ERRORS{"UNKNOWN"};
}
}
# if (scalar(@o_varsL)==0 && scalar(@o_perfvarsL)==0) {
# print "You must specify list of attributes with either '-a' or '-A'\n";
# print_usage();
# exit $ERRORS{"UNKNOWN"};
# }
$HOSTNAME = $o_host if defined($o_host);
$PORT = $o_port if defined($o_port);
$TIMEOUT = $o_timeout if defined($o_timeout);
}
# Get the alarm signal (just in case nagios screws up)
$SIG{'ALRM'} = sub {
$memd->disconnect_all if defined($memd);
print ("ERROR: Alarm signal (Nagios time-out)\n");
exit $ERRORS{"UNKNOWN"};
};
########## MAIN #######
check_options();
# Check global timeout if plugin screws up
if (defined($TIMEOUT)) {
verb("Alarm at $TIMEOUT");
alarm($TIMEOUT);
}
else {
verb("no timeout defined : $o_timeout + 10");
alarm ($o_timeout+10);
}
my $sock = new IO::Socket::INET(
PeerAddr => $HOSTNAME,
PeerPort => $PORT,
Proto => 'tcp',
);
if (!$sock) {
print "CRITICAL ERROR - Can not connect to '$HOSTNAME' on port $PORT\n";
exit $ERRORS{'CRITICAL'};
}
close($sock);
my $start_time;
my $dsn = $HOSTNAME.":".$PORT;
verb("connecting to $dsn");
$start_time = [ Time::HiRes::gettimeofday() ] if defined($o_timecheck);
$memd = new Cache::Memcached { 'servers' => [ $dsn ] };
if (!$memd) {
print "CRITICAL ERROR - Memcache error connecting to '$HOSTNAME' on port $PORT\n";
exit $ERRORS{'CRITICAL'};
}
# This returns hashref of various statistics data on memcached
# Basically results of 'stats', 'stats malloc', 'stats sizes', etc.
verb("Requesting statistics on: ".join(',',@o_mdslist));
my $stats = $memd->stats(\@o_mdslist);
my %dataresults;
my $memdversion = "";
my $statuscode = "OK";
my $statusinfo = "";
my $statusdata = "";
my $perfdata = "";
my $vstat;
my $vnam;
my $dnam;
my $vval;
my $chk = "";
my $i;
# load all data into internal hash array
$dataresults{$_} = [undef, 0, 0] foreach(@o_varsL);
$dataresults{$_} = [undef, 0, 0] foreach(@o_perfvarsL);
foreach $vstat (keys %{$stats->{'hosts'}{$dsn}}) {
foreach $vnam (keys %{$stats->{'hosts'}{$dsn}{$vstat}}) {
$vval = $stats->{'hosts'}{$dsn}{$vstat}{$vnam};
if (defined($vval)) {
verb("Stats Data: $vstat($vnam) = $vval");
if ($vnam eq 'version') {
$memdversion = $vval;
}
else {
if ($vstat eq 'misc' || $vstat eq 'malloc') {
$dnam = $vnam;
}
else {
$dnam = $vstat.'_'.$vnam;
}
$dataresults{$dnam}[0] = $vval if exists($dataresults{$dnam});
if (defined($o_perfvars) && $o_perfvars eq '*') { # this adds all status variables variables into performance data when -A '*' is used
$dataresults{$dnam} = [$vval, 0, 0];
push @o_perfvarsL, $dnam;
}
}
}
else {
verb("Stats Data: $vstat($vnam) = NULL");
}
}
}
$memd->disconnect_all;
# Response Time
if (defined($o_timecheck)) {
$dataresults{'response_time'}=[0,0,0] if !defined('response_time');
$dataresults{'response_time'}[0]=Time::HiRes::tv_interval($start_time);;
$statusdata .= sprintf(" response in %.3fs", $dataresults{'response_time'}[0]);
$dataresults{'response_time'}[1]++;
if ($o_timecheck eq '' && defined($o_perf)) {
$perfdata .= ' response_time=' . $dataresults{'response_time'}[0].'s';
}
}
# Memory Use Utilization
if (defined($o_utilsize) && defined($dataresults{'bytes'}) && defined($dataresults{'limit_maxbytes'})) {
$dataresults{'utilization'}=[0,1,0];
if (!defined($dataresults{'limit_maxbytes'}[0]) || $dataresults{'limit_maxbytes'}[0]==0) {
$dataresults{'utilization'}[0]=0;
}
else {
$dataresults{'utilization'}[0]=$dataresults{'bytes'}[0]/$dataresults{'limit_maxbytes'}[0]*100;
}
$statusdata.=',' if $statusdata;
$statusdata .= sprintf(" in use %.2f%% of space", $dataresults{'utilization'}[0]);
if ($o_utilsize eq '' && defined($o_perf)) {
$perfdata .= sprintf(" utilization=%.5f%%", $dataresults{'utilization'}[0]);
}
}
# CPU Use - Converts floating seconds to integer ms
if (defined($dataresults{'rusage_user'})) {
$dataresults{'rusage_user_ms'}=[int($dataresults{'rusage_user'}*100+0.5),0,0];
}
if (defined($dataresults{'rusage_system'})) {
$dataresults{'rusage_system_ms'}=[int($dataresults{'rusage_system'}*100+0.5),0,0];
}
# Calculate rate variables
my $timenow=time();
my $ptime=undef;
my $avar;
$ptime=$prev_perf{'_ptime'} if defined($prev_perf{'_ptime'});
if (defined($o_prevperf) && defined($o_perf)) {
for ($i=0;$i<scalar(@o_varsL);$i++) {
if ($o_varsL[$i] =~ /^&(.*)/) {
$avar = $1;
if (defined($dataresults{$avar}) && $dataresults{$avar}[2]==0) {
$dataresults{$avar}[3]= $avar."=".$dataresults{$avar}[0];
if (defined($KNOWN_STATUS_VARS{$avar})) {
$dataresults{$avar}[3].= $KNOWN_STATUS_VARS{$avar}[1];
}
}
if (defined($prev_perf{$avar}) && defined($ptime)) {
$dataresults{$o_varsL[$i]}=[0,0,0] if !defined($dataresults{$o_varsL[$i]});
$dataresults{$o_varsL[$i]}[0]= sprintf("%.2f",
($dataresults{$avar}[0]-$prev_perf{$avar})/($timenow-$ptime));
verb("Calculating Rate of Change for $avar : ".$o_varsL[$i]."=".$dataresults{$o_varsL[$i]}[0]);
}
}
}
}
# Hitrate
my $hits_total=0;
my $hits_hits=undef;
my $hitrate_all=0;
if (defined($o_hitrate) && defined($dataresults{'get_misses'}) && defined($dataresults{'get_hits'})) {
for $avar ('get_misses', 'get_hits') {
if (defined($o_prevperf) && defined($o_perf) && $dataresults{$avar}[2]==0) {
$dataresults{$avar}[3]= $avar."=".$dataresults{$avar}[0].'c';
}
$hits_hits = $dataresults{'get_hits'}[0] if $avar eq 'get_hits';
$hits_total += $dataresults{$avar}[0];
}
verb("Calculating Hitrate : total=".$hits_total." hits=".$hits_hits);
if (defined($hits_hits) && defined($prev_perf{'get_hits'}) && defined($prev_perf{'get_misses'}) && $hits_hits > $prev_perf{'get_hits'}) {
$hitrate_all = $hits_hits/$hits_total*100 if $hits_total!=0;
$hits_hits -= $prev_perf{'get_hits'};
$hits_total -= $prev_perf{'get_misses'};
$hits_total -= $prev_perf{'get_hits'};
verb("Calculating Hitrate. Adjusted based on previous values. total=".$hits_total." hits=".$hits_hits);
}
if (defined($hits_hits)) {
$dataresults{'hitrate'}=[0,0,0] if !defined($dataresults{'hitrate'});
if ($hits_total==0) {
$dataresults{'hitrate'}[0]=0;
}
else {
$dataresults{'hitrate'}[0]=$hits_hits/$hits_total*100;
}
$statusdata.=',' if $statusdata;
$statusdata .= sprintf(" hitrate is %.2f%%", $dataresults{'hitrate'}[0]);
$statusdata .= sprintf(" (%.2f%% from launch)", $hitrate_all) if ($hitrate_all!=0);
$dataresults{'hitrate'}[1]++;
if ($o_hitrate eq '' && defined($o_perf)) {
$perfdata .= sprintf(" hitrate=%.5f%%", $dataresults{'hitrate'}[0]);
}
}
}
# We split into prefix/suffix again but without lowercasing $o_ratelabel first
($o_rprefix,$o_rsuffix)=split(/,/,$o_ratelabel) if defined($o_ratelabel) && $o_ratelabel ne '';
# main loop to check if warning & critical attributes are ok
for ($i=0;$i<scalar(@o_varsL);$i++) {
$avar=$o_varsL[$i];
my $avar_out = $avar;
if ($avar =~ /^&(.*)/) {
$avar_out = $o_rprefix.$1.$o_rsuffix;
}
if (defined($dataresults{$avar}[0])) {
if ($avar ne 'hitrate' || $dataresults{$avar}[0]>0) {
if ($chk = check_threshold($avar,lc $dataresults{$avar}[0],$o_critL[$i])) {
$dataresults{$avar}[1]++;
$statuscode = "CRITICAL";
$statusinfo .= $chk;
}
elsif ($chk = check_threshold($avar,lc $dataresults{$avar}[0],$o_warnL[$i])) {
$dataresults{$avar}[1]++;
$statuscode="WARNING" if $statuscode eq "OK";
$statusinfo .= $chk;
}
}
if ($dataresults{$avar}[1]==0) {
$dataresults{$avar}[1]++;
$statusdata .= ", " if $statusdata;
$statusdata .= $avar_out . " is " . $dataresults{$avar}[0];
}
if (defined($o_perf) && $dataresults{$avar}[2]==0) {
$dataresults{$avar}[3]=$avar_out."=".$dataresults{$avar}[0];
if (defined($KNOWN_STATUS_VARS{$avar})) {
$dataresults{$avar}[3] .= $KNOWN_STATUS_VARS{$avar}[1];
}
if (defined($o_warnL[$i][5]) && defined($o_critL[$i][5])) {
$dataresults{$avar}[3] .= ';' if $o_warnL[$i][5] ne '' || $o_critL[$i][5] ne '';
$dataresults{$avar}[3] .= $o_warnL[$i][5] if $o_warnL[$i][5] ne '';
$dataresults{$avar}[3] .= ';'.$o_critL[$i][5] if $o_critL[$i][5] ne '';
}
}
}
else {
$statuscode="CRITICAL";
$statusinfo .= " $o_varsL[$i] data is missing";
}
}
# add performance data variables
for ($i=0;$i<scalar(@o_perfvarsL);$i++) {
$avar=$o_perfvarsL[$i];
if (defined($dataresults{$avar}[0]) && $dataresults{$avar}[2]==0) {
if (defined($dataresults{$avar}[3])) {
$perfdata .= " " . $dataresults{$avar}[3];
}
else {
$perfdata .= " " . $avar . "=" . $dataresults{$avar}[0];
if (defined($KNOWN_STATUS_VARS{$avar})) {
$perfdata .= $KNOWN_STATUS_VARS{$avar}[1];
}
}
$dataresults{$avar}[2]++;
}
}
if (defined($o_prevperf)) {
$perfdata .= " _ptime=".$timenow;
}
foreach $avar (keys %dataresults) {
if (defined($dataresults{$avar}[3]) && $dataresults{$avar}[2]==0) {
$perfdata .= " " . $dataresults{$avar}[3];
$dataresults{$avar}[2]++;
}
}
# now output the results
print "MEMCACHED " . $memdversion . ' on ' . $HOSTNAME. ':'. $PORT . ' is '. $statuscode . $statusinfo;
print " -" . $statusdata if $statusdata;
print " |" . $perfdata if $perfdata;
print "\n";
# end exit
exit $ERRORS{$statuscode};