2018-10-05 18:17:24 +02:00
|
|
|
#
|
2019-01-09 09:57:11 +01:00
|
|
|
# Copyright 2019 Centreon (http://www.centreon.com/)
|
2018-10-05 18:17:24 +02:00
|
|
|
#
|
|
|
|
# Centreon is a full-fledged industry-strength solution that meets
|
|
|
|
# the needs in IT infrastructure and application monitoring for
|
|
|
|
# service performance.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
#
|
|
|
|
|
|
|
|
package cloud::prometheus::exporters::nodeexporter::mode::cpudetailed;
|
|
|
|
|
|
|
|
use base qw(centreon::plugins::templates::counter);
|
|
|
|
|
|
|
|
use strict;
|
|
|
|
use warnings;
|
|
|
|
|
|
|
|
sub set_counters {
|
|
|
|
my ($self, %options) = @_;
|
|
|
|
|
|
|
|
$self->{maps_counters_type} = [
|
2018-10-29 13:21:48 +01:00
|
|
|
{ name => 'nodes', type => 3, cb_prefix_output => 'prefix_nodes_output',
|
|
|
|
message_multiple => 'All nodes CPU usage are ok', skipped_code => { -10 => 1 },
|
|
|
|
counters => [ { name => 'cpu', type => 1, cb_prefix_output => 'prefix_cpu_output',
|
|
|
|
message_multiple => 'All CPU usage are ok', skipped_code => { -10 => 1 } } ] },
|
2018-10-05 18:17:24 +02:00
|
|
|
];
|
|
|
|
|
|
|
|
$self->{maps_counters}->{nodes} = [
|
|
|
|
{ label => 'node-wait', set => {
|
|
|
|
key_values => [ { name => 'iowait' }, { name => 'display' } ],
|
|
|
|
output_template => 'Wait: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'wait', value => 'iowait_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%', label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'node-user', set => {
|
|
|
|
key_values => [ { name => 'user' }, { name => 'display' } ],
|
|
|
|
output_template => 'User: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'user', value => 'user_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%', label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'node-softirq', set => {
|
|
|
|
key_values => [ { name => 'softirq' }, { name => 'display' } ],
|
|
|
|
output_template => 'Soft Irq: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'softirq', value => 'softirq_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%', label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'node-interrupt', set => {
|
|
|
|
key_values => [ { name => 'irq' }, { name => 'display' } ],
|
|
|
|
output_template => 'Interrupt: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'interrupt', value => 'irq_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%', label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'node-idle', set => {
|
|
|
|
key_values => [ { name => 'idle' }, { name => 'display' } ],
|
|
|
|
output_template => 'Idle: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'idle', value => 'idle_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%', label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'node-steal', set => {
|
|
|
|
key_values => [ { name => 'steal' }, { name => 'display' } ],
|
|
|
|
output_template => 'Steal: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'steal', value => 'steal_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%', label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'node-system', set => {
|
|
|
|
key_values => [ { name => 'system' }, { name => 'display' } ],
|
|
|
|
output_template => 'System: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'system', value => 'system_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%', label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'node-nice', set => {
|
|
|
|
key_values => [ { name => 'nice' }, { name => 'display' } ],
|
|
|
|
output_template => 'Nice: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'nice', value => 'nice_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%', label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
];
|
|
|
|
$self->{maps_counters}->{cpu} = [
|
|
|
|
{ label => 'cpu-wait', set => {
|
|
|
|
key_values => [ { name => 'iowait' }, { name => 'multi' }, { name => 'display' } ],
|
|
|
|
output_template => 'Wait: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'wait', value => 'iowait_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%',
|
|
|
|
label_multi_instances => 1, multi_use => 'multi_absolute',
|
|
|
|
label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'cpu-user', set => {
|
|
|
|
key_values => [ { name => 'user' }, { name => 'multi' }, { name => 'display' } ],
|
|
|
|
output_template => 'User: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'user', value => 'user_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%',
|
|
|
|
label_multi_instances => 1, multi_use => 'multi_absolute',
|
|
|
|
label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'cpu-softirq', set => {
|
|
|
|
key_values => [ { name => 'softirq' }, { name => 'multi' }, { name => 'display' } ],
|
|
|
|
output_template => 'Soft Irq: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'softirq', value => 'softirq_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%',
|
|
|
|
label_multi_instances => 1, multi_use => 'multi_absolute',
|
|
|
|
label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'cpu-interrupt', set => {
|
|
|
|
key_values => [ { name => 'irq' }, { name => 'multi' }, { name => 'display' } ],
|
|
|
|
output_template => 'Interrupt: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'interrupt', value => 'irq_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%',
|
|
|
|
label_multi_instances => 1, multi_use => 'multi_absolute',
|
|
|
|
label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'cpu-idle', set => {
|
|
|
|
key_values => [ { name => 'idle' }, { name => 'multi' }, { name => 'display' } ],
|
|
|
|
output_template => 'Idle: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'idle', value => 'idle_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%',
|
|
|
|
label_multi_instances => 1, multi_use => 'multi_absolute',
|
|
|
|
label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'cpu-steal', set => {
|
|
|
|
key_values => [ { name => 'steal' }, { name => 'multi' }, { name => 'display' } ],
|
|
|
|
output_template => 'Steal: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'steal', value => 'steal_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%',
|
|
|
|
label_multi_instances => 1, multi_use => 'multi_absolute',
|
|
|
|
label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'cpu-system', set => {
|
|
|
|
key_values => [ { name => 'system' }, { name => 'multi' }, { name => 'display' } ],
|
|
|
|
output_template => 'System: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'system', value => 'system_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%',
|
|
|
|
label_multi_instances => 1, multi_use => 'multi_absolute',
|
|
|
|
label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
{ label => 'cpu-nice', set => {
|
|
|
|
key_values => [ { name => 'nice' }, { name => 'multi' }, { name => 'display' } ],
|
|
|
|
output_template => 'Nice: %.2f %%',
|
|
|
|
perfdatas => [
|
|
|
|
{ label => 'nice', value => 'nice_absolute', template => '%.2f',
|
|
|
|
min => 0, max => 100, unit => '%',
|
|
|
|
label_multi_instances => 1, multi_use => 'multi_absolute',
|
|
|
|
label_extra_instance => 1, instance_use => 'display_absolute' },
|
|
|
|
],
|
|
|
|
}
|
|
|
|
},
|
|
|
|
];
|
|
|
|
}
|
|
|
|
|
|
|
|
sub prefix_nodes_output {
|
|
|
|
my ($self, %options) = @_;
|
|
|
|
|
|
|
|
return "Node '" . $options{instance_value}->{display} . "' ";
|
|
|
|
}
|
|
|
|
|
|
|
|
sub prefix_cpu_output {
|
|
|
|
my ($self, %options) = @_;
|
|
|
|
|
|
|
|
return "Node '" . $options{instance_value}->{multi} . "' " . "Cpu '" . $options{instance_value}->{display} . "' ";
|
|
|
|
}
|
|
|
|
|
|
|
|
sub new {
|
|
|
|
my ($class, %options) = @_;
|
|
|
|
my $self = $class->SUPER::new(package => __PACKAGE__, %options);
|
|
|
|
bless $self, $class;
|
|
|
|
|
|
|
|
$self->{version} = '1.0';
|
|
|
|
$options{options}->add_options(arguments =>
|
|
|
|
{
|
2018-10-29 13:21:48 +01:00
|
|
|
"instance:s" => { name => 'instance', default => 'instance=~".*"' },
|
|
|
|
"cpu:s" => { name => 'cpu', default => 'cpu=~".*"' },
|
|
|
|
"type:s" => { name => 'type', default => 'mode=~".*"' },
|
2018-10-06 14:47:00 +02:00
|
|
|
"extra-filter:s@" => { name => 'extra_filter' },
|
2018-10-19 09:50:35 +02:00
|
|
|
"metric-overload:s@" => { name => 'metric_overload' },
|
2018-10-05 18:17:24 +02:00
|
|
|
});
|
|
|
|
|
|
|
|
return $self;
|
|
|
|
}
|
|
|
|
|
2018-10-19 09:50:35 +02:00
|
|
|
sub check_options {
|
|
|
|
my ($self, %options) = @_;
|
|
|
|
$self->SUPER::check_options(%options);
|
|
|
|
|
|
|
|
$self->{metrics} = {
|
|
|
|
'cpu' => "^node_cpu.*",
|
|
|
|
};
|
|
|
|
foreach my $metric (@{$self->{option_results}->{metric_overload}}) {
|
|
|
|
next if ($metric !~ /(.*),(.*)/);
|
|
|
|
$self->{metrics}->{$1} = $2 if (defined($self->{metrics}->{$1}));
|
|
|
|
}
|
2018-10-24 15:55:59 +02:00
|
|
|
|
2018-10-29 13:21:48 +01:00
|
|
|
$self->{labels} = {};
|
|
|
|
foreach my $label (('instance', 'cpu', 'type')) {
|
|
|
|
if ($self->{option_results}->{$label} !~ /^(\w+)[!~=]+\".*\"$/) {
|
|
|
|
$self->{output}->add_option_msg(short_msg => "Need to specify --" . $label . " option as a PromQL filter.");
|
|
|
|
$self->{output}->option_exit();
|
|
|
|
}
|
|
|
|
$self->{labels}->{$label} = $1;
|
|
|
|
}
|
|
|
|
|
|
|
|
$self->{extra_filter} = '';
|
|
|
|
foreach my $filter (@{$self->{option_results}->{extra_filter}}) {
|
|
|
|
$self->{extra_filter} .= ',' . $filter;
|
|
|
|
}
|
|
|
|
|
2018-10-24 15:55:59 +02:00
|
|
|
$self->{prom_timeframe} = defined($self->{option_results}->{timeframe}) ? $self->{option_results}->{timeframe} : 900;
|
|
|
|
$self->{prom_step} = defined($self->{option_results}->{step}) ? $self->{option_results}->{step} : "1m";
|
2018-10-19 09:50:35 +02:00
|
|
|
}
|
|
|
|
|
2018-10-05 18:17:24 +02:00
|
|
|
sub manage_selection {
|
|
|
|
my ($self, %options) = @_;
|
|
|
|
|
|
|
|
$self->{nodes} = {};
|
|
|
|
|
2018-10-29 13:21:48 +01:00
|
|
|
my $results = $options{custom}->query_range(queries => [ '(irate({__name__=~"' . $self->{metrics}->{cpu} . '",' .
|
|
|
|
$self->{option_results}->{instance} . ',' .
|
|
|
|
$self->{option_results}->{cpu} . ',' .
|
|
|
|
$self->{option_results}->{type} .
|
|
|
|
$self->{extra_filter} . '}[1m])) * 100' ],
|
2018-10-24 15:55:59 +02:00
|
|
|
timeframe => $self->{prom_timeframe}, step => $self->{prom_step});
|
2018-10-05 18:17:24 +02:00
|
|
|
|
2018-10-29 13:21:48 +01:00
|
|
|
foreach my $result (@{$results}) {
|
|
|
|
my $average = $options{custom}->compute(aggregation => 'average', values => $result->{values});
|
|
|
|
$self->{nodes}->{$result->{metric}->{$self->{labels}->{instance}}}->{display} = $result->{metric}->{$self->{labels}->{instance}};
|
|
|
|
$self->{nodes}->{$result->{metric}->{$self->{labels}->{instance}}}->{$result->{metric}->{$self->{labels}->{type}}} += $average;
|
|
|
|
$self->{nodes}->{$result->{metric}->{$self->{labels}->{instance}}}->{cpu}->{$result->{metric}->{$self->{labels}->{cpu}}}->{multi} = $result->{metric}->{$self->{labels}->{instance}};
|
|
|
|
$self->{nodes}->{$result->{metric}->{$self->{labels}->{instance}}}->{cpu}->{$result->{metric}->{$self->{labels}->{cpu}}}->{display} = $result->{metric}->{$self->{labels}->{cpu}};
|
|
|
|
$self->{nodes}->{$result->{metric}->{$self->{labels}->{instance}}}->{cpu}->{$result->{metric}->{$self->{labels}->{cpu}}}->{$result->{metric}->{$self->{labels}->{type}}} = $average;
|
2018-10-05 18:17:24 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
foreach my $node (keys %{$self->{nodes}}) {
|
|
|
|
foreach my $metric (keys %{$self->{nodes}->{$node}}) {
|
|
|
|
next if ($metric =~ /cpu|display/);
|
|
|
|
$self->{nodes}->{$node}->{$metric} /= scalar(keys %{$self->{nodes}->{$node}->{cpu}});
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (scalar(keys %{$self->{nodes}}) <= 0) {
|
|
|
|
$self->{output}->add_option_msg(short_msg => "No nodes found.");
|
|
|
|
$self->{output}->option_exit();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
1;
|
|
|
|
|
|
|
|
__END__
|
|
|
|
|
|
|
|
=head1 MODE
|
|
|
|
|
|
|
|
Check CPU detailed usage for nodes and each of their cores.
|
|
|
|
|
|
|
|
=over 8
|
|
|
|
|
2018-10-29 13:21:48 +01:00
|
|
|
=item B<--instance>
|
|
|
|
|
|
|
|
Filter on a specific instance (Must be a PromQL filter, Default: 'instance=~".*"')
|
|
|
|
|
|
|
|
=item B<--cpu>
|
|
|
|
|
|
|
|
Filter on a specific cpu (Must be a PromQL filter, Default: 'cpu=~".*"')
|
|
|
|
|
|
|
|
=item B<--type>
|
2018-10-06 14:47:00 +02:00
|
|
|
|
2018-10-29 13:21:48 +01:00
|
|
|
Filter on a specific type (Must be a PromQL filter, Default: 'mode=~".*"')
|
2018-10-05 18:17:24 +02:00
|
|
|
|
|
|
|
=item B<--warning-*>
|
|
|
|
|
|
|
|
Threshold warning.
|
|
|
|
Can be: 'node-idle', 'node-wait', 'node-irq', 'node-nice',
|
|
|
|
'node-softirq', 'node-steal', 'node-system', 'node-user',
|
|
|
|
'cpu-idle', 'cpu-wait', 'cpu-irq', 'cpu-nice', 'cpu-softirq',
|
|
|
|
'cpu-steal', 'cpu-system', 'cpu-user'.
|
|
|
|
|
|
|
|
=item B<--critical-*>
|
|
|
|
|
|
|
|
Threshold critical.
|
|
|
|
Can be: 'node-idle', 'node-wait', 'node-irq', 'node-nice',
|
|
|
|
'node-softirq', 'node-steal', 'node-system', 'node-user',
|
|
|
|
'cpu-idle', 'cpu-wait', 'cpu-irq', 'cpu-nice', 'cpu-softirq',
|
|
|
|
'cpu-steal', 'cpu-system', 'cpu-user'.
|
|
|
|
|
2018-10-19 09:50:35 +02:00
|
|
|
=item B<--extra-filter>
|
|
|
|
|
|
|
|
Add a PromQL filter (Can be multiple)
|
|
|
|
|
|
|
|
Example : --extra-filter='name=~".*pretty.*"'
|
|
|
|
|
|
|
|
=item B<--metric-overload>
|
|
|
|
|
|
|
|
Overload default metrics name (Can be multiple, metric can be 'cpu')
|
|
|
|
|
|
|
|
Example : --metric-overload='metric,^my_metric_name$'
|
|
|
|
|
2018-10-05 18:17:24 +02:00
|
|
|
=back
|
|
|
|
|
|
|
|
=cut
|