centreon-plugins/cloud/prometheus/exporters/nodeexporter/mode/cpudetailed.pm

351 lines
15 KiB
Perl
Raw Normal View History

#
# Copyright 2019 Centreon (http://www.centreon.com/)
#
# Centreon is a full-fledged industry-strength solution that meets
# the needs in IT infrastructure and application monitoring for
# service performance.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
package cloud::prometheus::exporters::nodeexporter::mode::cpudetailed;
use base qw(centreon::plugins::templates::counter);
use strict;
use warnings;
# Declare the counters handled by this mode.
#
# maps_counters_type declares a 'nodes' group (type 3) that nests a 'cpu'
# group (type 1). Both levels expose the same eight usage types, so the two
# counter lists are generated from a single table rather than being written
# out sixteen times. The resulting structures are identical to the
# hand-written ones, in the same order.
sub set_counters {
    my ($self, %options) = @_;

    $self->{maps_counters_type} = [
        { name => 'nodes', type => 3, cb_prefix_output => 'prefix_nodes_output',
          message_multiple => 'All nodes CPU usage are ok', skipped_code => { -10 => 1 },
          counters => [
              { name => 'cpu', type => 1, cb_prefix_output => 'prefix_cpu_output',
                message_multiple => 'All CPU usage are ok', skipped_code => { -10 => 1 } },
          ],
        },
    ];

    # One row per usage type:
    #   [ label suffix (also the perfdata label), key_values name, output title ]
    # Note that the label differs from the key for 'wait' (iowait) and
    # 'interrupt' (irq).
    my @usage_types = (
        [ 'wait',      'iowait',  'Wait' ],
        [ 'user',      'user',    'User' ],
        [ 'softirq',   'softirq', 'Soft Irq' ],
        [ 'interrupt', 'irq',     'Interrupt' ],
        [ 'idle',      'idle',    'Idle' ],
        [ 'steal',     'steal',   'Steal' ],
        [ 'system',    'system',  'System' ],
        [ 'nice',      'nice',    'Nice' ],
    );

    my (@node_counters, @cpu_counters);
    foreach my $usage (@usage_types) {
        my ($label, $key, $title) = @{$usage};

        # Node-level counter: only carries the node name ('display').
        push @node_counters, {
            label => 'node-' . $label,
            set => {
                key_values => [ { name => $key }, { name => 'display' } ],
                output_template => $title . ': %.2f %%',
                perfdatas => [
                    { label => $label, value => $key . '_absolute', template => '%.2f',
                      min => 0, max => 100, unit => '%',
                      label_extra_instance => 1, instance_use => 'display_absolute' },
                ],
            },
        };

        # Cpu-level counter: additionally carries 'multi', which
        # prefix_cpu_output prints as the node name.
        push @cpu_counters, {
            label => 'cpu-' . $label,
            set => {
                key_values => [ { name => $key }, { name => 'multi' }, { name => 'display' } ],
                output_template => $title . ': %.2f %%',
                perfdatas => [
                    { label => $label, value => $key . '_absolute', template => '%.2f',
                      min => 0, max => 100, unit => '%',
                      label_multi_instances => 1, multi_use => 'multi_absolute',
                      label_extra_instance => 1, instance_use => 'display_absolute' },
                ],
            },
        };
    }

    $self->{maps_counters}->{nodes} = \@node_counters;
    $self->{maps_counters}->{cpu} = \@cpu_counters;
}
# Output prefix for a node line.
# Reads the 'display' entry of the instance_value hash passed in %options
# and returns the string "Node '<display>' " (with a trailing space).
sub prefix_nodes_output {
    my ($self, %options) = @_;

    my $node_name = $options{instance_value}->{display};
    return sprintf("Node '%s' ", $node_name);
}
# Output prefix for a cpu line.
# Reads the 'multi' and 'display' entries of the instance_value hash passed
# in %options and returns "Node '<multi>' Cpu '<display>' " (with a trailing
# space).
sub prefix_cpu_output {
    my ($self, %options) = @_;

    my $instance = $options{instance_value};
    return sprintf("Node '%s' Cpu '%s' ", $instance->{multi}, $instance->{display});
}
# Constructor.
# Builds the object through the parent class constructor, sets the mode
# version and registers this mode's command-line options on the options
# object received in $options{options}.
sub new {
    my ($class, %options) = @_;
    my $self = $class->SUPER::new(package => __PACKAGE__, %options);
    bless $self, $class;

    $self->{version} = '1.0';
    $options{options}->add_options(arguments => {
        # The three label options must be complete PromQL matchers; they are
        # validated in check_options and inserted as-is in the query.
        "instance:s"         => { name => 'instance', default => 'instance=~".*"' },
        "cpu:s"              => { name => 'cpu', default => 'cpu=~".*"' },
        "type:s"             => { name => 'type', default => 'mode=~".*"' },
        "extra-filter:s@"    => { name => 'extra_filter' },
        "metric-overload:s@" => { name => 'metric_overload' },
    });

    return $self;
}
# Validate the options and derive the values used by manage_selection:
#   - $self->{metrics}: metric name patterns, optionally overloaded;
#   - $self->{labels}: label name extracted from each of the --instance,
#     --cpu and --type PromQL matchers;
#   - $self->{extra_filter}: extra matchers, each prefixed with a comma;
#   - $self->{prom_timeframe} / $self->{prom_step}: query range settings.
# Reports an option error and calls option_exit() when one of the three
# label options is not written as <label><operator>"<value>".
sub check_options {
    my ($self, %options) = @_;
    $self->SUPER::check_options(%options);

    $self->{metrics} = {
        'cpu' => "^node_cpu.*",
    };
    foreach my $metric (@{$self->{option_results}->{metric_overload}}) {
        # Format is '<metric>,<pattern>'. Split on the FIRST comma so that a
        # pattern which itself contains commas (e.g. a '{1,2}' quantifier) is
        # kept whole instead of being silently ignored.
        next if ($metric !~ /^([^,]*),(.*)/);
        my ($name, $pattern) = ($1, $2);
        # Only metrics known to this mode can be overloaded.
        $self->{metrics}->{$name} = $pattern if (defined($self->{metrics}->{$name}));
    }

    $self->{labels} = {};
    foreach my $label (('instance', 'cpu', 'type')) {
        my $filter = $self->{option_results}->{$label};
        if (defined($filter) && $filter =~ /^(\w+)[!~=]+\".*\"$/) {
            # Keep the label name: it is used to read the label value from
            # each result returned by the query.
            $self->{labels}->{$label} = $1;
            next;
        }
        $self->{output}->add_option_msg(short_msg => "Need to specify --" . $label . " option as a PromQL filter.");
        $self->{output}->option_exit();
    }

    $self->{extra_filter} = '';
    foreach my $filter (@{$self->{option_results}->{extra_filter}}) {
        $self->{extra_filter} .= ',' . $filter;
    }

    # 'timeframe' and 'step' are not declared by this mode's new(); they are
    # presumably registered elsewhere (TODO confirm). Defaults apply otherwise.
    $self->{prom_timeframe} = defined($self->{option_results}->{timeframe}) ? $self->{option_results}->{timeframe} : 900;
    $self->{prom_step} = defined($self->{option_results}->{step}) ? $self->{option_results}->{step} : "1m";
}
# Query the CPU metrics and fill $self->{nodes}.
#
# Resulting layout, per instance label value:
#   $self->{nodes}->{<instance>} = {
#       display => <instance>,
#       <type>  => mean over the node's cpus of the per-cpu averages,
#       cpu     => { <cpu> => { multi => <instance>, display => <cpu>,
#                               <type> => per-cpu average } },
#   }
# Reports an option error and calls option_exit() when no node was collected.
sub manage_selection {
    my ($self, %options) = @_;

    $self->{nodes} = {};

    my $query = '(irate({__name__=~"' . $self->{metrics}->{cpu} . '",' .
        $self->{option_results}->{instance} . ',' .
        $self->{option_results}->{cpu} . ',' .
        $self->{option_results}->{type} .
        $self->{extra_filter} . '}[1m])) * 100';
    my $results = $options{custom}->query_range(
        queries => [ $query ],
        timeframe => $self->{prom_timeframe}, step => $self->{prom_step}
    );

    foreach my $result (@{$results}) {
        my $instance = $result->{metric}->{$self->{labels}->{instance}};
        my $cpu = $result->{metric}->{$self->{labels}->{cpu}};
        my $type = $result->{metric}->{$self->{labels}->{type}};

        # The metric name is matched by pattern, so series lacking one of the
        # three labels can be returned. Skip them: they would otherwise create
        # an empty-named cpu/type entry and distort the node averages below.
        next if (!defined($instance) || !defined($cpu) || !defined($type));

        my $average = $options{custom}->compute(aggregation => 'average', values => $result->{values});

        $self->{nodes}->{$instance}->{display} = $instance;
        # Summed here, turned into a mean over the cpus once all results are read.
        $self->{nodes}->{$instance}->{$type} += $average;

        $self->{nodes}->{$instance}->{cpu}->{$cpu}->{multi} = $instance;
        $self->{nodes}->{$instance}->{cpu}->{$cpu}->{display} = $cpu;
        $self->{nodes}->{$instance}->{cpu}->{$cpu}->{$type} = $average;
    }

    foreach my $node (values %{$self->{nodes}}) {
        my $cpu_count = scalar(keys %{$node->{cpu}});
        foreach my $metric (keys %{$node}) {
            # 'cpu' and 'display' are bookkeeping keys, not usage values.
            # Anchored so that a type merely containing one of these words is
            # still averaged.
            next if ($metric =~ /^(?:cpu|display)$/);
            $node->{$metric} /= $cpu_count;
        }
    }

    if (scalar(keys %{$self->{nodes}}) <= 0) {
        $self->{output}->add_option_msg(short_msg => "No nodes found.");
        $self->{output}->option_exit();
    }
}
1;
__END__
=head1 MODE
Check CPU detailed usage for nodes and each of their cores.
=over 8
=item B<--instance>
Filter on a specific instance (Must be a PromQL filter, Default: 'instance=~".*"')
=item B<--cpu>
Filter on a specific cpu (Must be a PromQL filter, Default: 'cpu=~".*"')
=item B<--type>
Filter on a specific type (Must be a PromQL filter, Default: 'mode=~".*"')
=item B<--warning-*>
Threshold warning.
Can be: 'node-idle', 'node-wait', 'node-interrupt', 'node-nice',
'node-softirq', 'node-steal', 'node-system', 'node-user',
'cpu-idle', 'cpu-wait', 'cpu-interrupt', 'cpu-nice', 'cpu-softirq',
'cpu-steal', 'cpu-system', 'cpu-user'.
=item B<--critical-*>
Threshold critical.
Can be: 'node-idle', 'node-wait', 'node-interrupt', 'node-nice',
'node-softirq', 'node-steal', 'node-system', 'node-user',
'cpu-idle', 'cpu-wait', 'cpu-interrupt', 'cpu-nice', 'cpu-softirq',
'cpu-steal', 'cpu-system', 'cpu-user'.
=item B<--extra-filter>
Add a PromQL filter (Can be multiple)
Example : --extra-filter='name=~".*pretty.*"'
=item B<--metric-overload>
Overload default metrics name (Can be multiple, metric can be 'cpu')
Example : --metric-overload='metric,^my_metric_name$'
=back
=cut