enh(aws/ec2): instances status mode - add uptime option (#3029)

This commit is contained in:
qgarnier 2021-08-09 16:05:39 +02:00 committed by GitHub
parent 4002186135
commit 6e2a0a5d1c
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 241 additions and 118 deletions

View File

@ -412,7 +412,7 @@ sub ec2_get_instances_status {
foreach (@{$raw_results->{InstanceStatuses}}) {
$instance_results->{$_->{InstanceId}} = {
state => $_->{InstanceState}->{Name},
status => => $_->{InstanceStatus}->{Status}
status => $_->{InstanceStatus}->{Status}
};
}
@ -517,8 +517,8 @@ sub ec2_list_resources {
AvailabilityZone => $instance->{Placement}->{AvailabilityZone},
InstanceType => $instance->{InstanceType},
State => $instance->{State}->{Name},
Tags => join(",", @instance_tags),
KeyName => $instance->{KeyName},
Tags => join(',', @instance_tags),
KeyName => $instance->{KeyName}
};
}
}
@ -526,6 +526,26 @@ sub ec2_list_resources {
return $resource_results;
}
# List EC2 instances through the CLI backend and index them by instance id.
#
# The command options are produced by ec2_list_resources_set_cmd() (called with
# the caller's %options) and handed to execute(); the decoded result is then
# walked as Reservations -> Instances.
#
# Returns a hash reference shaped as:
#   { <InstanceId> => { State => ..., InstanceType => ..., LaunchTime => ... } }
# LaunchTime is copied through unchanged from the result.
sub ec2_get_instances {
    my ($self, %options) = @_;

    my $cmd_options = $self->ec2_list_resources_set_cmd(%options);
    my $raw_results = $self->execute(cmd_options => $cmd_options);

    my %by_id;
    for my $reservation (@{ $raw_results->{Reservations} }) {
        for my $instance (@{ $reservation->{Instances} }) {
            my $id = $instance->{InstanceId};
            $by_id{$id} = {
                State        => $instance->{State}->{Name},
                InstanceType => $instance->{InstanceType},
                LaunchTime   => $instance->{LaunchTime}
            };
        }
    }

    return \%by_id;
}
sub asg_get_resources_set_cmd {
my ($self, %options) = @_;

View File

@ -371,6 +371,33 @@ sub ec2_get_instances_status {
return $instance_results;
}
# List EC2 instances through the Paws SDK backend and index them by instance id.
#
# Obtains an 'EC2' service handle from $self->{paws} for the region stored in
# $self->{option_results}->{region}, calls DescribeInstances(DryRun => 0) and
# walks Reservations -> Instances of the response.
#
# Returns a hash reference shaped as:
#   { <InstanceId> => { Name, InstanceType, State, LaunchTime } }
# where Name is the instance id itself.
#
# Any exception raised while querying or walking the response is reported via
# $self->{output}->add_option_msg() followed by option_exit().
sub ec2_get_instances {
    my ($self, %options) = @_;

    my %by_id;
    eval {
        my $client = $self->{paws}->service('EC2', region => $self->{option_results}->{region});
        my $described = $client->DescribeInstances(DryRun => 0);

        for my $reservation (@{ $described->{Reservations} }) {
            for my $instance (@{ $reservation->{Instances} }) {
                my $id = $instance->{InstanceId};
                $by_id{$id} = {
                    Name         => $id,
                    InstanceType => $instance->{InstanceType},
                    State        => $instance->{State}->{Name},
                    LaunchTime   => $instance->{LaunchTime}
                };
            }
        }
    };
    if ($@) {
        $self->{output}->add_option_msg(short_msg => "error: $@");
        $self->{output}->option_exit();
    }

    return \%by_id;
}
sub ec2spot_get_active_instances {
my ($self, %options) = @_;

View File

@ -24,22 +24,58 @@ use base qw(centreon::plugins::templates::counter);
use strict;
use warnings;
use centreon::plugins::templates::catalog_functions qw(catalog_status_threshold);
use POSIX;
use centreon::plugins::misc;
use centreon::plugins::templates::catalog_functions qw(catalog_status_threshold_ng);
use DateTime;
# Seconds per uptime unit, keyed by the one-letter unit code
# (s, m, h, d, w). Used as the divisor when converting an uptime
# expressed in seconds into the selected unit.
my $unitdiv = { s => 1, w => 604800, d => 86400, h => 3600, m => 60 };
# Long name for each unit code; appended to the perfdata nlabel
# (e.g. "<nlabel>.days").
my $unitdiv_long = { s => 'seconds', w => 'weeks', d => 'days', h => 'hours', m => 'minutes' };
# Emit the uptime perfdata for one instance.
#
# The uptime held in result_values->{uptime_seconds} is converted to the unit
# selected by the mode's 'uptime_unit' option (divided by the matching
# $unitdiv entry and rounded down). The unit's long name is appended to the
# nlabel and the one-letter code is used as the perfdata unit.
sub custom_uptime_perfdata {
    my ($self, %options) = @_;

    my $unit = $self->{instance_mode}->{option_results}->{uptime_unit};
    my $seconds = $self->{result_values}->{uptime_seconds};

    $self->{output}->perfdata_add(
        nlabel    => $self->{nlabel} . '.' . $unitdiv_long->{$unit},
        unit      => $unit,
        instances => $self->{result_values}->{display},
        value     => floor($seconds / $unitdiv->{$unit}),
        warning   => $self->{perfdata}->get_perfdata_for_output(label => 'warning-' . $self->{thlabel}),
        critical  => $self->{perfdata}->get_perfdata_for_output(label => 'critical-' . $self->{thlabel}),
        min       => 0
    );
}
# Evaluate the uptime thresholds for one instance.
#
# The uptime in seconds is converted to the unit selected by the mode's
# 'uptime_unit' option (rounded down) and checked against the
# critical / warning / unknown thresholds registered under this counter's
# thlabel, in that order. Returns whatever threshold_check() returns.
sub custom_uptime_threshold {
    my ($self, %options) = @_;

    my $unit = $self->{instance_mode}->{option_results}->{uptime_unit};
    my $uptime = floor($self->{result_values}->{uptime_seconds} / $unitdiv->{$unit});

    my $levels = [
        { label => 'critical-' . $self->{thlabel}, exit_litteral => 'critical' },
        { label => 'warning-'. $self->{thlabel}, exit_litteral => 'warning' },
        { label => 'unknown-'. $self->{thlabel}, exit_litteral => 'unknown' }
    ];

    return $self->{perfdata}->threshold_check(value => $uptime, threshold => $levels);
}
# Build the per-instance status text from the computed result values.
#
# Reads result_values->{state} and result_values->{status} and returns the
# string "state: <state>, status: <status>".
sub custom_status_output {
    my ($self, %options) = @_;

    # Single return: the earlier form returned a temporary and then carried a
    # second, unreachable return producing the same string.
    return sprintf(
        'state: %s, status: %s',
        $self->{result_values}->{state},
        $self->{result_values}->{status}
    );
}
sub custom_status_calc {
sub prefix_global_output {
my ($self, %options) = @_;
$self->{result_values}->{state} = $options{new_datas}->{$self->{instance} . '_state'};
$self->{result_values}->{status} = $options{new_datas}->{$self->{instance} . '_status'};
$self->{result_values}->{display} = $options{new_datas}->{$self->{instance} . '_display'};
return 0;
return 'Total instances ';
}
# Output prefix for one instance line: "Instance '<display>' " (note the
# trailing space), where <display> comes from $options{instance_value}.
sub prefix_awsinstance_output {
    my ($self, %options) = @_;

    my $display = $options{instance_value}->{display};
    return sprintf("Instance '%s' ", $display);
}
sub set_counters {
@ -48,69 +84,76 @@ sub set_counters {
$self->{maps_counters_type} = [
{ name => 'global', type => 0, cb_prefix_output => 'prefix_global_output' },
{ name => 'aws_instances', type => 1, cb_prefix_output => 'prefix_awsinstance_output',
message_multiple => 'All instances are ok' },
message_multiple => 'All instances are ok', skipped_code => { -10 => 1 } }
];
$self->{maps_counters}->{global} = [
{ label => 'pending', nlabel => 'ec2.instances.status.pending.count', set => {
key_values => [ { name => 'pending' } ],
output_template => "Pending : %s",
output_template => "pending: %s",
perfdatas => [
{ value => 'pending', template => '%d', min => 0 },
],
{ template => '%d', min => 0 }
]
}
},
{ label => 'running', nlabel => 'ec2.instances.status.running.count', set => {
key_values => [ { name => 'running' } ],
output_template => "Running : %s",
output_template => "running: %s",
perfdatas => [
{ value => 'running', template => '%d', min => 0 },
],
{ template => '%d', min => 0 }
]
}
},
{ label => 'shuttingdown', nlabel => 'ec2.instances.status.shuttingdown.count', set => {
key_values => [ { name => 'shutting-down' } ],
output_template => "Shutting Down : %s",
output_template => "shutting down: %s",
perfdatas => [
{ value => 'shutting-down', template => '%d', min => 0 },
],
{ template => '%d', min => 0 }
]
}
},
{ label => 'terminated', nlabel => 'ec2.instances.status.terminated.count', set => {
key_values => [ { name => 'terminated' } ],
output_template => "Terminated : %s",
output_template => "terminated: %s",
perfdatas => [
{ value => 'terminated', template => '%d', min => 0 },
],
{ template => '%d', min => 0 }
]
}
},
{ label => 'stopping', nlabel => 'ec2.instances.status.stopping.count', set => {
key_values => [ { name => 'stopping' } ],
output_template => "Stopping : %s",
output_template => "stopping: %s",
perfdatas => [
{ value => 'stopping', template => '%d', min => 0 },
],
{ template => '%d', min => 0 }
]
}
},
{ label => 'stopped', nlabel => 'ec2.instances.status.stopped.count', set => {
key_values => [ { name => 'stopped' } ],
output_template => "Stopped : %s",
output_template => "stopped: %s",
perfdatas => [
{ value => 'stopped', template => '%d', min => 0 },
],
{ template => '%d', min => 0 }
]
}
}
},
];
$self->{maps_counters}->{aws_instances} = [
{ label => 'status', threshold => 0, set => {
{ label => 'status', type => 2, set => {
key_values => [ { name => 'state' }, { name => 'status' }, { name => 'display' } ],
closure_custom_calc => $self->can('custom_status_calc'),
closure_custom_output => $self->can('custom_status_output'),
closure_custom_perfdata => sub { return 0; },
closure_custom_threshold_check => \&catalog_status_threshold,
closure_custom_threshold_check => \&catalog_status_threshold_ng
}
},
{ label => 'uptime', nlabel => 'ec2.uptime', set => {
key_values => [ { name => 'uptime_seconds' }, { name => 'uptime_human' }, { name => 'display' } ],
output_template => 'uptime: %s',
output_use => 'uptime_human',
closure_custom_perfdata => $self->can('custom_uptime_perfdata'),
closure_custom_threshold_check => $self->can('custom_uptime_threshold')
}
}
];
}
@ -120,9 +163,9 @@ sub new {
bless $self, $class;
$options{options}->add_options(arguments => {
"filter-instanceid:s" => { name => 'filter_instanceid' },
"warning-status:s" => { name => 'warning_status', default => '' },
"critical-status:s" => { name => 'critical_status', default => '' }
'filter-instanceid:s' => { name => 'filter_instanceid' },
'add-uptime' => { name => 'add_uptime' },
'uptime-unit:s' => { name => 'uptime_unit', default => 'd' }
});
return $self;
@ -132,19 +175,34 @@ sub check_options {
my ($self, %options) = @_;
$self->SUPER::check_options(%options);
$self->change_macros(macros => ['warning_status', 'critical_status']);
if ($self->{option_results}->{uptime_unit} eq '' || !defined($unitdiv->{$self->{option_results}->{uptime_unit}})) {
$self->{option_results}->{uptime_unit} = 'd';
}
}
sub prefix_global_output {
sub add_uptime {
my ($self, %options) = @_;
return "Total instances ";
}
return if (!defined($options{instances}->{ $options{instance_id} }));
sub prefix_awsinstance_output {
my ($self, %options) = @_;
return if ($options{state} !~ /running|stopping/);
return "Instance '" . $options{instance_value}->{display} . "' ";
# format: "2021-04-16T07:54:33.000Z"
return if ($options{instances}->{ $options{instance_id} }->{LaunchTime} !~ /^(\d+)-(\d+)-(\d+)T(\d+):(\d+):(\d+)/);
my $dt = DateTime->new(
year => $1,
month => $2,
day => $3,
hour => $4,
minute => $5,
second => $6,
time_zone => 'UTC'
);
$self->{aws_instances}->{ $options{instance_id} }->{uptime_seconds} = time() - $dt->epoch();
$self->{aws_instances}->{ $options{instance_id} }->{uptime_human} = centreon::plugins::misc::change_seconds(
value => $self->{aws_instances}->{ $options{instance_id} }->{uptime_seconds}
);
}
sub manage_selection {
@ -153,8 +211,14 @@ sub manage_selection {
$self->{global} = {
pending => 0, running => 0, 'shutting-down' => 0, terminated => 0, stopping => 0, stopped => 0,
};
$self->{aws_instances} = {};
my $result = $options{custom}->ec2_get_instances_status();
my $instances;
if (defined($self->{option_results}->{add_uptime})) {
$instances = $options{custom}->ec2_get_instances();
}
foreach my $instance_id (keys %{$result}) {
if (defined($self->{option_results}->{filter_instanceid}) && $self->{option_results}->{filter_instanceid} ne '' &&
$instance_id !~ /$self->{option_results}->{filter_instanceid}/) {
@ -165,9 +229,11 @@ sub manage_selection {
$self->{aws_instances}->{$instance_id} = {
display => $instance_id,
state => $result->{$instance_id}->{state},
status => $result->{$instance_id}->{status},
status => $result->{$instance_id}->{status}
};
$self->{global}->{$result->{$instance_id}->{state}}++;
$self->add_uptime(instances => $instances, instance_id => $instance_id, state => $result->{$instance_id}->{state})
if (defined($self->{option_results}->{add_uptime}));
$self->{global}->{ $result->{$instance_id}->{state} }++;
}
if (scalar(keys %{$self->{aws_instances}}) <= 0) {
@ -201,21 +267,31 @@ Example: --filter-counters='^running$'
Filter by instance id (can be a regexp).
=item B<--add-uptime>
Monitor instances uptime.
=item B<--uptime-unit>
Select the unit for uptime threshold. May be 's' for seconds, 'm' for minutes,
'h' for hours, 'd' for days, 'w' for weeks. Default is days.
=item B<--warning-status>
Set warning threshold for status (Default: '').
Set warning threshold for status.
Can use special variables like: %{state}, %{display}
=item B<--critical-status>
Set critical threshold for status (Default: '').
Set critical threshold for status.
Can use special variables like: %{state}, %{display}
=item B<--warning-*> B<--critical-*>
Threshold warning.
Thresholds.
Can be: 'pending', 'running', 'shuttingdown',
'terminated', 'stopping', 'stopped'.
'terminated', 'stopping', 'stopped',
'uptime'.
=back