forked from HariSekhon/Nagios-Plugins
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcheck_cassandra_tpstats.pl
executable file
·124 lines (103 loc) · 3.59 KB
/
check_cassandra_tpstats.pl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
#!/usr/bin/perl -T
# nagios: -epn
#
# Author: Hari Sekhon
# Date: 2013-10-15 04:56:49 +0100 (Tue, 15 Oct 2013)
#
# http://github.com/harisekhon
#
# License: see accompanying LICENSE file
#
$DESCRIPTION = "Nagios Plugin to fetch Cassandra's thread pool stats per node by parsing 'nodetool tpstats'.
Checks Pending/Blocked operations against warning/critical thresholds.
Check the baseline first and then set appropriate thresholds since a build up of Pending/Blocked operations is indicative of performance problems.
Also returns Active and Dropped operations with perfdata for graphing.
Can specify a remote host and port otherwise it checks the local node's stats (for calling over NRPE on each Cassandra node)
Written and tested against Cassandra 2.0, DataStax Community Edition";
$VERSION = "0.6";
use strict;
use warnings;
BEGIN {
use File::Basename;
use lib dirname(__FILE__) . "/lib";
}
use HariSekhonUtils;
use HariSekhon::Cassandra::Nodetool;
my $default_warning = 0;
my $default_critical = 0;
$warning = $default_warning;
$critical = $default_critical;
%options = (
%nodetool_options,
"w|warning=s" => [ \$warning, "Warning threshold max (inclusive) for Pending/Blocked operations (default: $default_warning)" ],
"c|critical=s" => [ \$critical, "Critical threshold max (inclusive) for Pending/Blocked operations (default: $default_critical)" ],
);
@usage_order = qw/nodetool host port user password warning critical/;
get_options();
($nodetool, $host, $port, $user, $password) = validate_nodetool_options($nodetool, $host, $port, $user, $password);
validate_thresholds(1, 1, { "simple" => "upper", "integer" => 1, "positive" => 1 } );
vlog2;
set_timeout();
$status = "OK";
my $options = nodetool_options($host, $port, $user, $password);
my $cmd = "${nodetool} ${options}tpstats";
vlog2 "fetching threadpool stats";
my @output = cmd($cmd);
check_nodetool_errors(join(" ", @output));
$output[0] =~ /Pool\s+Name\s+Active\s+Pending\s+Completed\s+Blocked\s+All time blocked\s*$/i or die_nodetool_unrecognized_output($output[0]);
my @stats;
my $i = 1;
foreach(; $i < scalar @output; $i++){
$output[$i] =~ /^\s*$/ and $i++ and last;
$output[$i] =~ /^(\w+)\s+(\d+)\s+(\d+)\s+(\d+)\s+(\d+)\s+(\d+)\s*$/ or die_nodetool_unrecognized_output($output[$i]);
push(@stats,
(
{ "$1_Blocked" => $5, },
{ "$1_Pending" => $3, },
{ "$1_Active" => $2, },
#{ "$1_Completed" => $4, },
#{ "$1_All_time_blocked" => $6, },
)
);
}
foreach(; $i < scalar @output; $i++){
next if $output[$i] =~ /^\s*$/;
last;
}
$output[$i] =~ /^Message type\s+Dropped/ or die_format_changed($output[$i]);
$i++;
my @stats2;
foreach(; $i < scalar @output; $i++){
$output[$i] =~ /^(\w+)\s+(\d+)$/ or die_format_changed($output[$i]);
push(@stats2,
(
{ ucfirst(lc($1)) . "_Dropped" => $2 }
)
);
}
push(@stats2, @stats);
my $msg2;
my $msg3;
my ($thresholds_ok, $thresholds_msg);
foreach(my $i = 0; $i < scalar @stats2; $i++){
foreach my $stat3 ($stats2[$i]){
foreach my $key (keys %$stat3){
$msg2 = "$key=$$stat3{$key} ";
$msg3 .= $msg2;
if($key =~ /Pending|Blocked/i){
($thresholds_ok, $thresholds_msg) = check_thresholds($$stat3{$key}, 1);
unless($thresholds_ok){
$msg2 = uc $msg2;
}
}
$msg .= $msg2;
}
}
}
$msg =~ s/\s$//;
if($verbose or $status ne "OK"){
msg_thresholds();
}
$msg .= "| $msg3";
vlog2;
quit $status, $msg;