+ move emc celerra

This commit is contained in:
garnier-quentin 2016-10-07 17:23:02 +02:00
parent a14fa809ea
commit b81605e7b1
3 changed files with 68 additions and 174 deletions

View File

@ -29,24 +29,26 @@ my %map_cs_status = (
11 => 'Secondary Control Station',
);
# No-op load hook: the body does nothing and yields no value.
sub load {
    return;
}
sub check {
my ($self) = @_;
$self->{output}->output_add(long_msg => "Checking control stations");
$self->{components}->{controlstation} = {name => 'control stations', total => 0, skip => 0};
return if ($self->check_exclude(section => 'controlstation'));
return if ($self->check_filter(section => 'controlstation'));
foreach my $line (split /\n/, $self->{stdout}) {
next if ($line !~ /^\s*(\d+)\s+-\s+(\S+)/);
my ($code, $instance) = ($1, $2);
next if (!defined($map_cs_status{$code}));
return if ($self->check_exclude(section => 'controlstation', instance => $instance));
return if ($self->check_filter(section => 'controlstation', instance => $instance));
$self->{components}->{controlstation}->{total}++;
$self->{output}->output_add(long_msg => sprintf("Control station '%s' status is '%s'",
$instance, $map_cs_status{$code}));
my $exit = $self->get_severity(section => 'controlstation', value => $map_cs_status{$code});
my $exit = $self->get_severity(section => 'controlstation', instance => $instance, value => $map_cs_status{$code});
if (!$self->{output}->is_status(value => $exit, compare => 'ok', litteral => 1)) {
$self->{output}->output_add(severity => $exit,
short_msg => sprintf("Control station '%s' status is '%s'",

View File

@ -46,24 +46,26 @@ my %map_dm_status = (
25 => 'DM T2NET Error. Unable to get blade reason code due to management switch problems',
);
# No-op load hook: the body does nothing and yields no value.
sub load {
    return;
}
sub check {
my ($self) = @_;
$self->{output}->output_add(long_msg => "Checking data movers");
$self->{components}->{datamover} = {name => 'data movers', total => 0, skip => 0};
return if ($self->check_exclude(section => 'datamover'));
return if ($self->check_filter(section => 'datamover'));
foreach my $line (split /\n/, $self->{stdout}) {
next if ($line !~ /^\s*(\d+)\s+-\s+(\S+)/);
my ($code, $instance) = ($1, $2);
next if (!defined($map_dm_status{$code}));
return if ($self->check_exclude(section => 'datamover', instance => $instance));
return if ($self->check_filter(section => 'datamover', instance => $instance));
$self->{components}->{datamover}->{total}++;
$self->{output}->output_add(long_msg => sprintf("Data mover '%s' status is '%s'",
$instance, $map_dm_status{$code}));
my $exit = $self->get_severity(section => 'datamover', value => $map_dm_status{$code});
my $exit = $self->get_severity(section => 'datamover', instance => $instance, value => $map_dm_status{$code});
if (!$self->{output}->is_status(value => $exit, compare => 'ok', litteral => 1)) {
$self->{output}->output_add(severity => $exit,
short_msg => sprintf("Data mover '%s' status is '%s'",

View File

@ -20,45 +20,68 @@
package storage::emc::celerra::local::mode::getreason;
use base qw(centreon::plugins::mode);
use base qw(centreon::plugins::templates::hardware);
use strict;
use warnings;
use centreon::plugins::misc;
# Default severity for every known status label, grouped by component section.
#
# Each entry is [label, severity]. get_severity() applies the label as a
# case-insensitive regular expression against the decoded status text, so any
# regex metacharacter that must match literally has to be escaped here.
# Unescaped parentheses would be read as capture groups and the label would
# never match its own status text (the status would fall back to UNKNOWN).
my $thresholds = {
    controlstation => [
        ['Primary Control Station', 'OK'], # 10
        ['Secondary Control Station', 'OK'], # 11
        ['Control Station is ready, but is not running NAS service', 'CRITICAL'], # 6
    ],
    datamover => [
        ['Reset \(or unknown state\)', 'WARNING'],
        ['DOS boot phase, BIOS check, boot sequence', 'WARNING'],
        ['SIB POST failures \(that is, hardware failures\)', 'CRITICAL'],
        ['DART is loaded on Data Mover, DOS boot and execution of boot.bat, boot.cfg', 'WARNING'],
        ['DART is ready on Data Mover, running, and MAC threads started', 'WARNING'],
        ['DART is in contact with Control Station box monitor', 'OK'],
        ['DART is in panic state', 'CRITICAL'],
        ['DART reboot is pending or in halted state', 'WARNING'],
        ['DART panicked and completed memory dump', 'CRITICAL'],
        ['DM Misc problems', 'CRITICAL'], # code 14
        ['Data Mover is flashing firmware. DART is flashing BIOS and/or POST firmware. Data Mover cannot be reset', 'CRITICAL'],
        ['Data Mover Hardware fault detected', 'CRITICAL'],
        ['DM Memory Test Failure. BIOS detected memory error', 'CRITICAL'],
        ['DM POST Test Failure. General POST error', 'CRITICAL'],
        ['DM POST NVRAM test failure. Invalid NVRAM content error', 'CRITICAL'],
        ['DM POST invalid peer Data Mover type', 'CRITICAL'],
        ['DM POST invalid Data Mover part number', 'CRITICAL'],
        ['DM POST Fibre Channel test failure. Error in blade Fibre connection', 'CRITICAL'],
        ['DM POST network test failure. Error in Ethernet controller', 'CRITICAL'],
        ['DM T2NET Error. Unable to get blade reason code due to management switch problems', 'CRITICAL'],
    ],
};
# Configure the hardware-template settings for this mode.
#
# Stores on $self:
#   - the regexp restricting which sections --threshold-overload may name,
#   - the name of the hook ('cmd_execute') registered as cb_hook2,
#   - the default [label, severity] table per component section,
#   - the package path and the list of component modules.
#
# NOTE(review): the labels are presumably applied as case-insensitive regular
# expressions by the template's get_severity (not visible here) - confirm.
# Under that assumption literal parentheses must be escaped, otherwise they act
# as capture groups and the label never matches its own status text.
sub set_system {
    my ($self, %options) = @_;

    $self->{regexp_threshold_overload_check_section_option} =
        '^(controlstation|datamover)$';

    $self->{cb_hook2} = 'cmd_execute';

    $self->{thresholds} = {
        controlstation => [
            ['Primary Control Station', 'OK'], # 10
            ['Secondary Control Station', 'OK'], # 11
            ['Control Station is ready, but is not running NAS service', 'CRITICAL'], # 6
        ],
        datamover => [
            ['Reset \(or unknown state\)', 'WARNING'],
            ['DOS boot phase, BIOS check, boot sequence', 'WARNING'],
            ['SIB POST failures \(that is, hardware failures\)', 'CRITICAL'],
            ['DART is loaded on Data Mover, DOS boot and execution of boot.bat, boot.cfg', 'WARNING'],
            ['DART is ready on Data Mover, running, and MAC threads started', 'WARNING'],
            ['DART is in contact with Control Station box monitor', 'OK'],
            ['DART is in panic state', 'CRITICAL'],
            ['DART reboot is pending or in halted state', 'WARNING'],
            ['DART panicked and completed memory dump', 'CRITICAL'],
            ['DM Misc problems', 'CRITICAL'], # code 14
            ['Data Mover is flashing firmware. DART is flashing BIOS and/or POST firmware. Data Mover cannot be reset', 'CRITICAL'],
            ['Data Mover Hardware fault detected', 'CRITICAL'],
            ['DM Memory Test Failure. BIOS detected memory error', 'CRITICAL'],
            ['DM POST Test Failure. General POST error', 'CRITICAL'],
            ['DM POST NVRAM test failure. Invalid NVRAM content error', 'CRITICAL'],
            ['DM POST invalid peer Data Mover type', 'CRITICAL'],
            ['DM POST invalid Data Mover part number', 'CRITICAL'],
            ['DM POST Fibre Channel test failure. Error in blade Fibre connection', 'CRITICAL'],
            ['DM POST network test failure. Error in Ethernet controller', 'CRITICAL'],
            ['DM T2NET Error. Unable to get blade reason code due to management switch problems', 'CRITICAL'],
        ],
    };

    $self->{components_path} = 'storage::emc::celerra::local::mode::components';
    $self->{components_module} = ['controlstation', 'datamover'];
}
# Run the configured command and keep the first value returned by
# centreon::plugins::misc::execute in $self->{stdout}.
sub cmd_execute {
    my ($self, %options) = @_;

    # Arguments that are always passed as-is.
    my %exec_args = (
        output  => $self->{output},
        options => $self->{option_results},
    );

    # Arguments copied one-to-one from the parsed command-line options.
    foreach my $key (qw(sudo command command_path command_options)) {
        $exec_args{$key} = $self->{option_results}->{$key};
    }

    ($self->{stdout}) = centreon::plugins::misc::execute(%exec_args);
}
sub new {
my ($class, %options) = @_;
my $self = $class->SUPER::new(package => __PACKAGE__, %options);
my $self = $class->SUPER::new(package => __PACKAGE__, %options, no_absent => 1, no_performance => 1);
bless $self, $class;
$self->{version} = '1.0';
@ -74,144 +97,11 @@ sub new {
"command:s" => { name => 'command', default => 'getreason' },
"command-path:s" => { name => 'command_path', default => '/nas/sbin' },
"command-options:s" => { name => 'command_options', default => '2>&1' },
"exclude:s" => { name => 'exclude' },
"component:s" => { name => 'component', default => '.*' },
"no-component:s" => { name => 'no_component' },
"threshold-overload:s@" => { name => 'threshold_overload' },
});
$self->{components} = {};
$self->{no_components} = undef;
return $self;
}
# Validate the parsed options and derive the settings used by the checks.
#
# - --no-component: stores the requested severity in $self->{no_components},
#   using 'critical' when the option is given with an empty value.
# - --threshold-overload: each value must look like "section,status,regexp";
#   valid entries are grouped by section in $self->{overload_th}, in the order
#   given. A malformed value or an unknown status is reported through the
#   output object's add_option_msg/option_exit.
sub check_options {
    my ($self, %options) = @_;
    $self->SUPER::init(%options);

    my $no_component = $self->{option_results}->{no_component};
    if (defined($no_component)) {
        $self->{no_components} = ($no_component ne '') ? $no_component : 'critical';
    }

    $self->{overload_th} = {};
    foreach my $overload (@{$self->{option_results}->{threshold_overload}}) {
        unless ($overload =~ /^(.*?),(.*?),(.*)$/) {
            $self->{output}->add_option_msg(short_msg => "Wrong threshold-overload option '" . $overload . "'.");
            $self->{output}->option_exit();
        }
        my ($section, $status, $filter) = ($1, $2, $3);

        if ($self->{output}->is_litteral_status(status => $status) == 0) {
            $self->{output}->add_option_msg(short_msg => "Wrong threshold-overload status '" . $overload . "'.");
            $self->{output}->option_exit();
        }

        # The per-section list is created on first use by the push below.
        push @{$self->{overload_th}->{$section}}, {filter => $filter, status => $status};
    }
}
# Entry point of the mode: run the command, load and execute the selected
# component checks, then print the summary and exit.
sub run {
    my ($self, %options) = @_;

    ($self->{stdout}) = centreon::plugins::misc::execute(
        output => $self->{output},
        options => $self->{option_results},
        sudo => $self->{option_results}->{sudo},
        command => $self->{option_results}->{command},
        command_path => $self->{option_results}->{command_path},
        command_options => $self->{option_results}->{command_options},
        no_quit => 1
    );

    # Components whose name matches the --component regexp.
    my @selected = grep { /$self->{option_results}->{component}/ } ('controlstation', 'datamover');

    # Load every selected module first, so a load failure is reported before any check runs.
    foreach my $component (@selected) {
        my $mod_name = "storage::emc::celerra::local::mode::components::$component";
        centreon::plugins::misc::mymodule_load(output => $self->{output}, module => $mod_name,
                                               error_msg => "Cannot load module '$mod_name'.");
    }
    if (scalar(@selected) == 0) {
        $self->{output}->add_option_msg(short_msg => "Wrong option. Cannot find component '" . $self->{option_results}->{component} . "'.");
        $self->{output}->option_exit();
    }

    foreach my $component (@selected) {
        my $mod_name = "storage::emc::celerra::local::mode::components::$component";
        my $check = $mod_name->can('check');
        $check->($self);
    }

    # Build the "checked/total name" summary, one part per non-empty section.
    my $total_components = 0;
    my @summary_parts;
    foreach my $section (sort(keys %{$self->{components}})) {
        my $entry = $self->{components}->{$section};
        # Skipping short msg when no components
        next if ($entry->{total} == 0 && $entry->{skip} == 0);

        my $section_count = $entry->{total} + $entry->{skip};
        $total_components += $section_count;
        push @summary_parts, $entry->{total} . '/' . $section_count . ' ' . $entry->{name};
    }

    $self->{output}->output_add(severity => 'OK',
                                short_msg => sprintf("All %s components are ok [%s].",
                                                     $total_components,
                                                     join(', ', @summary_parts))
                                );

    if (defined($self->{option_results}->{no_component}) && $total_components == 0) {
        $self->{output}->output_add(severity => $self->{no_components},
                                    short_msg => 'No components are checked.');
    }

    $self->{output}->display();
    $self->{output}->exit();
}
# Tell whether a section, or one instance of a section, is excluded by --exclude.
#
# Options:
#   section  - section name to look up in the exclude list.
#   instance - optional instance name; when given, only an entry of the form
#              "section...#instance#" excludes it, and the section's skip
#              counter is incremented.
#
# Returns 1 (after logging a "Skipping ..." long message) when excluded,
# 0 otherwise.
sub check_exclude {
    my ($self, %options) = @_;

    if (defined($options{instance})) {
        if (defined($self->{option_results}->{exclude}) && $self->{option_results}->{exclude} =~ /(^|\s|,)${options{section}}[^,]*#\Q$options{instance}\E#/) {
            $self->{components}->{$options{section}}->{skip}++;
            # Names go through %s placeholders: used as the format itself, a
            # '%' inside a name would be interpreted as a conversion.
            $self->{output}->output_add(long_msg => sprintf("Skipping %s section %s instance.", $options{section}, $options{instance}));
            return 1;
        }
    } elsif (defined($self->{option_results}->{exclude}) && $self->{option_results}->{exclude} =~ /(^|\s|,)$options{section}(\s|,|$)/) {
        $self->{output}->output_add(long_msg => sprintf("Skipping %s section.", $options{section}));
        return 1;
    }
    return 0;
}
# Map a status text to a severity for the given section.
#
# Options:
#   section - section whose rules are consulted.
#   value   - status text to classify.
#
# User overloads ($self->{overload_th}) are tried first, then the default
# table; in both, the first rule whose pattern matches the value
# (case-insensitively, as a regular expression) wins. Returns 'UNKNOWN' when
# nothing matches.
sub get_severity {
    my ($self, %options) = @_;

    my $overloads = $self->{overload_th}->{$options{section}};
    if (defined($overloads)) {
        foreach my $rule (@{$overloads}) {
            return $rule->{status} if ($options{value} =~ /$rule->{filter}/i);
        }
    }

    foreach my $default (@{$thresholds->{$options{section}}}) {
        return $default->[1] if ($options{value} =~ /$default->[0]/i);
    }

    return 'UNKNOWN'; # default
}
1;
__END__
@ -227,10 +117,10 @@ Check control stations and data movers status (use 'getreason' command).
Which component to check (Default: '.*').
Can be: 'controlstation', 'datamover'.
=item B<--exclude>
=item B<--filter>
Exclude some parts (comma separated list) (Example: --exclude=datamover)
Can also exclude specific instance: --exclude='datamover#slot_2#'
Exclude some parts (comma separated list) (Example: --filter=datamover)
Can also exclude specific instance: --filter=datamover,slot_2
=item B<--no-component>
@ -239,7 +129,7 @@ If total (with skipped) is 0. (Default: 'critical' returns).
=item B<--threshold-overload>
Set to overload default threshold values (syntax: section,status,regexp)
Set to overload default threshold values (syntax: section,[instance,]status,regexp)
It is used before default thresholds (order stays).
Example: --threshold-overload='datamover,CRITICAL,^(?!(normal)$)'