mars/userspace/mars-status

774 lines
27 KiB
Plaintext
Raw Normal View History

2012-01-27 14:58:33 +00:00
#!/usr/bin/perl -w
# (c) 2012 Joerg Mann / 1&1 Internet AG
2012-01-27 14:58:33 +00:00
#
# $Id: 5a8a13c09fa23ae74858e48fc010e7f61f90dc02 $
# last update at now ...
2012-01-27 14:58:33 +00:00
# TODO:
# add todo-global delete-logfiles
2012-02-22 14:52:02 +00:00
# anzeige bandbreite / i/o-load wenn dieser genutzt wird
# bugix fuer nachtaegliches join (log-v-4 ...)
2012-01-27 14:58:33 +00:00
###
use warnings;
use strict;
use English;
use Getopt::Long;
2012-01-27 14:58:33 +00:00
use Term::ANSIColor;
use Date::Language;
2012-02-22 14:52:02 +00:00
use POSIX qw(strftime);
use File::Basename;
2012-01-27 14:58:33 +00:00
### defaults
my $version = "0.068e";
2012-01-27 14:58:33 +00:00
my $alife_timeout = "99"; # sec
my $is_tty = 0;
my $mars_dir = '/mars';
my $himself = `uname -n` or die "cannot determine my network node name\n";
my $clearscreen = `clear`;
my $StatusCode = 'OK';
my $StatusLine = '';
my @StatusLines = ();
2012-01-27 14:58:33 +00:00
chomp $himself;
### ARGV
# Optionen in Hash-Ref parsen
my $params = {};
GetOptions( $params, 'help', 'h', 'version', 'v', 'monitor', 'resource=s', 'interval=i', 'long', 'history', 'debug' );
if($params->{help} || $params->{h}) {
2012-06-05 14:34:37 +00:00
print "Usage: mars-status [--help]\n";
print "Usage: mars-status [--version]\n";
print "Usage: mars-status (without specification of parameters, an abstract of all the informations spent)\n";
print "Usage: mars-status [--resource <RESNAME>] [--interval <seconds>] [--long [--history] [--debug]]\n";
print " --resource : limits the display to the specified resource\n";
print " --interval : refreshes the display every second xxx\n";
print " --long : displays more detailed information\n";
print " --history : shows information about the log files, version numbers and their status\n";
print " --debug : additional display error messages and warnings to internal\n";
print " --monitor : indicator to use for monitoring (not available)\n";
print "\nAdvanced information are also available here: http://http://wiki.intranet.1and1.com/bin/view/PO/ProjektTEC1603\n";
exit;
}
# Farbe zuruecksetzen
$SIG{INT} = sub {
2012-06-05 14:34:37 +00:00
print color 'reset';
print $clearscreen;
exit;
};
2012-01-27 14:58:33 +00:00
### figure out TTY
my $tty = readlink '/dev/stdout';
while ( my $temp = readlink $tty ) {
2012-06-05 14:34:37 +00:00
$tty = $temp;
2012-01-27 14:58:33 +00:00
}
if ( $tty =~ /^\/dev\/pts\// ) {
2012-06-05 14:34:37 +00:00
$is_tty = 1;
2012-01-27 14:58:33 +00:00
} elsif ( $tty =~ /^\/dev\/tty/ ) {
2012-06-05 14:34:37 +00:00
$is_tty = 1;
2012-01-27 14:58:33 +00:00
}
#########################################################################################
### subs
sub check_link {
2012-06-05 14:34:37 +00:00
my $dir = shift;
my $result = readlink $dir;
if ( !$result ) {
return 0;
} else {
return $result;
}
2012-01-27 14:58:33 +00:00
}
### print color
2012-06-05 14:34:37 +00:00
sub print_screen {
my $text = shift;
my $color = shift;
if (!$color) {$color = 'FAINT';}
if ( $params->{'monitor'} ) {
chomp $text;
my $Monitor = $text;
$Monitor =~ s/.*---> TODO:.*/ERROR/;
$Monitor =~ s/.*---> HINT:.*/WARNING/;
$Monitor =~ s/.*---> WORK:.*/OK/;
$text =~ s/ = \(.*//g;
$text =~ s/[\n\t]//g;
chomp $Monitor;
if ( $Monitor eq '') {
return;
} elsif (( $Monitor eq 'ERROR' ) && ( $color eq 'red' )) {
$StatusCode = 'ERROR';
$text =~ s/.*TODO: //;
push @StatusLines, $Monitor.$text;
} elsif (( $Monitor eq 'WARNING' ) || ( $Monitor eq 'ERROR' )) {
if ( $StatusCode ne 'ERROR') { $StatusCode = 'WARNING'; }
$text =~ s/.*(HINT|TODO): //;
push @StatusLines, $Monitor.$text;
} elsif ( $Monitor eq 'OK' ) {
if (( $StatusCode ne 'ERROR') && ( $StatusCode ne 'WARNING' )) { $StatusCode = 'OK'; }
$text =~ s/.*WORK: //;
push @StatusLines, $Monitor.$text;
}
} else {
print color "$color" if ( $is_tty );
print "$text";
print color 'reset' if ( $is_tty );
}
2012-01-27 14:58:33 +00:00
}
### read links
sub convert_link {
2012-06-05 14:34:37 +00:00
my $link = shift;
$link = check_link "$link";
if (( !$link ) || ( $link eq 0 )) {
2012-06-05 14:34:37 +00:00
print_screen "off", 'red';
} else {
print_screen "on", 'green';
}
return $link;
2012-01-27 14:58:33 +00:00
}
#########################################################################################
### sub display resource-partner
sub display_partner {
my %p = @_;
2012-06-05 14:34:37 +00:00
my $PRes = $p{ressource};
my $PName = $p{nodename};
my $PSize = $p{ressource_size};
my $ref_ResPartner = $p{res_partner};
my $ref_ResInReplay = $p{res_inreplay};
my $ref_ResInSync = $p{res_insync};
2012-06-05 14:34:37 +00:00
my $ref_AULogfile = $p{res_AULogfile};
my $PStatus = check_link "$mars_dir/$PRes/primary";
my $PDevice = check_link "$mars_dir/$PRes/device-$PName";
my $Ljoined = check_link "$mars_dir/$PRes/device-$himself";
### status
if ( $PStatus eq $PName ) {
print_screen "as Primary, ",'blue';
} else {
2012-01-27 14:58:33 +00:00
if ( $PDevice eq 0 ) {
2012-06-05 14:34:37 +00:00
print_screen "not joined, ",'red';
} else {
print_screen "as Secondary, ",'blue';
2012-01-27 14:58:33 +00:00
}
2012-06-05 14:34:37 +00:00
}
### alive
my @PAlive = lstat("$mars_dir/alive-$PName");
if ( !$PAlive[9] ) { $PAlive[9]=0 };
my $PAlive = time()- $PAlive[9] - $alife_timeout;
if ( $PAlive > 1 ) {
print_screen "Status: unknown (last message before $PAlive sec) !!!\n", 'red';
} else {
print_screen "Status: connected\n",'blue';
}
### device
# joined ?
if ( $PDevice eq 0 ) {
if ( $params->{'long'} ) { print_screen " -> Resource is not joined to this node\n", 'red'; }
return;
}
if ( $params->{'long'} ) {
print_screen "\tDevice : ".check_link "$mars_dir/$PRes/data-$PName";
print_screen ", used as $PDevice";
2012-06-05 14:34:37 +00:00
my $ASize = check_link "$mars_dir/$PRes/actsize-$PName";
if ( $PSize eq $ASize) {
print_screen ", not resized";
} else {
print_screen "\n\t\t---> HINT: resizing used ($PSize != $ASize)",'red';
}
2012-06-05 14:34:37 +00:00
# check mountpint
if ( $himself eq $PName ) {
my $PUDevice = "/dev/mars/$PDevice";
if ( stat( $PUDevice) ) {
open my $fh, '<', '/proc/mounts' or die $!;
$PUDevice = ( grep { /^$PUDevice / } <$fh> )[0];
if ( $PUDevice ) {
$PUDevice = ( split / /, $PUDevice )[1];
print_screen " and mountet as $PUDevice\n",'blue';
} else {
print_screen "\n\t\t---> TODO: enable to mount\n",'green';
}
} else {
print_screen "\n\t\t---> HINT: unable to mount, Device is Secondary or mars is starting\n",'blue';
2012-06-05 14:34:37 +00:00
}
} else {
print_screen "\n";
2012-01-27 14:58:33 +00:00
}
2012-06-05 14:34:37 +00:00
}
$$ref_ResPartner++;
### sync
my $PSyncsize = check_link "$mars_dir/$PRes/syncstatus-$PName";
my $SStatus = sprintf("%.2f", ($PSyncsize / $PSize * 100));
if ( $params->{'long'} ) {
print_screen (sprintf "\tSync : %s bytes (%.3fTB) synced = ", $PSyncsize, ( $PSyncsize/1024/1024/1024/1024));
if ( $SStatus < 100) {
print_screen "$SStatus%\n";
print_screen "\t\t---> WORK: Sync in progress = ($SStatus% < 100.00%)\n", 'red';
} else {
print_screen "$SStatus%\n", 'green';
}
}
$$ref_ResInSync = $SStatus;
### work by resize ...
#print "\n$PSize\n$PSyncsize\n$PName";
2012-06-05 14:34:37 +00:00
### logfile
my @PLogFile = split (',', check_link "$mars_dir/$PRes/replay-$PName" );
my @PLogLink = split ("-", $PLogFile[0]);
# TODO: kein Logfile vorhanden ...
my $PLogName = "$PLogLink[0]-$PLogLink[1]";
my $PLogSize = -s "$mars_dir/$PRes/$PLogFile[0]";
if ( !$PLogFile[1] ) { $PLogFile[1] = 0; $PLogFile[2] = 0; }
if (( !$PLogSize ) || ( $PLogSize eq 0 )) { $PLogSize = 0.0001; }
if ( $params->{'long'} ) {
2012-07-18 07:40:16 +00:00
print_screen (sprintf "\tLogfile : %s bytes (%.3fGB) in %s active\n", $PLogSize, ( $PLogSize/1024/1024/1024 ), $PLogName);
2012-06-05 14:34:37 +00:00
if ( $Ljoined eq "0" || $PLogSize eq "0.0001" ) {
print_screen "\t\t---> WORK: Logfile inactive or empty = (Size: $PLogSize)\n", 'red';
2012-06-05 14:34:37 +00:00
}
if ( ( $ref_AULogfile ) && !($PLogName eq $ref_AULogfile) ) {
print_screen "\t\t---> HINT: Logfile Version not actual = ($PLogName ! $ref_AULogfile)\n", 'red';
2012-06-05 14:34:37 +00:00
}
}
2012-01-27 14:58:33 +00:00
2012-06-05 14:34:37 +00:00
### replay
my $RStatus = sprintf("%.2f", ( $PLogFile[1] / $PLogSize * 100));
if ( $Ljoined eq "0" || $PLogSize eq "1" ) { $RStatus = 0; }
2012-07-18 07:40:16 +00:00
if (( $PLogFile[1] ne $PLogSize ) && ( $RStatus eq "100.00" )) { $RStatus = 99.99; }
2012-06-05 14:34:37 +00:00
if ( $params->{'long'} ) {
2012-07-18 07:40:16 +00:00
print_screen sprintf ("\tReplayed: %s bytes (%.3fGB) now replayed, Todo %d (%.3fGB) = ",
$PLogFile[1], ( $PLogFile[1]/1024/1024/1024 ), $PLogFile[2], ( $PLogFile[2]/1024/1024/1024 ));
2012-06-05 14:34:37 +00:00
if (( $RStatus < 1 ) && ( $PLogSize != 0.0001 )) {
print_screen "$RStatus%\n";
print_screen "\t\t---> HINT: Replay not started, Logfile inactive or empty = (Size: $PLogSize)\n", 'red';
2012-06-05 14:34:37 +00:00
} elsif (( $RStatus < 100 ) && ( $PLogSize != 0.0001 )) {
print_screen "$RStatus%\n";
print_screen "\t\t---> WORK: Replay in progress = ($RStatus% < 100.00%)\n", 'red';
2012-06-05 14:34:37 +00:00
} elsif ( $PLogFile[2] > 0 ) {
$RStatus = sprintf("%.2f", ($PLogFile[1]-$PLogFile[2])/$PLogFile[1] * 100);
print_screen "$RStatus%\n", 'red';
} elsif ( $PLogSize = 0.0001 ) {
$RStatus = "100.00";
print_screen "$RStatus%\n", 'green';
} else {
print_screen "$RStatus%\n", 'green';
}
### start work speed
#if $params->{'interval'} ...
#if nicht lokale ressource ...
### end work speed
2012-06-05 14:34:37 +00:00
}
$$ref_ResInReplay = $RStatus;
2012-01-27 14:58:33 +00:00
2012-06-05 14:34:37 +00:00
2012-01-27 14:58:33 +00:00
2012-06-05 14:34:37 +00:00
if ( $params->{'long'} ) {
### actual
my $ActStatus = check_link "$mars_dir/$PRes/actual-$PName/is-primary";
if ( $ActStatus eq 1 ) {
print_screen "\tActual : Status Primary, used Device=";
convert_link "$mars_dir/$PRes/actual-$PName/device-$PDevice";
print_screen "\n";
2012-06-05 14:34:37 +00:00
} else {
print_screen "\tActual : Status Secondary, Syncstatus=";
convert_link "$mars_dir/$PRes/actual-$PName/copy-syncstatus-$PName";
print_screen ", Logfileupdate=";
convert_link "$mars_dir/$PRes/actual-$PName/logfile-update";
print_screen "\n";
2012-01-27 14:58:33 +00:00
}
2012-06-05 14:34:37 +00:00
### switch
print_screen "\tSwitch : Attach=";
convert_link "$mars_dir/$PRes/todo-$PName/attach";
print_screen ", Connect=";
convert_link "$mars_dir/$PRes/todo-$PName/connect";
print_screen ", Sync=";
convert_link "$mars_dir/$PRes/todo-$PName/sync";
print_screen ", AllowReplay=";
convert_link "$mars_dir/$PRes/todo-$PName/allow-replay";
print_screen "\n";
2012-06-05 14:34:37 +00:00
}
return $PLogName;
2012-01-27 14:58:33 +00:00
}
#########################################################################################
###
sub check_logfile {
2012-06-05 14:34:37 +00:00
my $LResource = shift;
my $LPartner = shift;
my $oldEqual = 0;
my $LogCount = 0;
my $LogCountSum = 0;
my $LogCountNow = 1;
my $LogFailed = 0;
2012-06-05 14:34:37 +00:00
print_screen " -> History Replay/Status\n",'blue';
my @logfile = <$mars_dir/$LResource/log*>;
### mal fix zaehlen ...
foreach (@logfile) {
$LogCountSum++;
}
2012-06-05 14:34:37 +00:00
foreach my $logfile (@logfile) {
my $LVersion = $logfile;
$LVersion =~ s/^.*log-([0-9]+)-.*$/$1/;
my $LogStatus = check_link "$logfile";
my $allEqual = 1;
if ( $LogStatus eq 0 ) {
### found logfile
2012-06-05 14:34:37 +00:00
my $OldCheck;
my $OldSize;
my $LogSize = -s "$logfile";
print_screen "\tLogfile Version: $LVersion - Size: $LogSize\n";
2012-06-05 14:34:37 +00:00
### check other ...
2012-06-05 14:34:37 +00:00
my @LVersion = <$mars_dir/$LResource/version-$LVersion*>;
foreach my $LVersion (@LVersion) {
my @LogDetail = split (',', check_link "$LVersion" );
my $LogServer = $LVersion;
$LogServer =~ s/.*[0-9]-//;
$LogCount++;
print_screen "\t\tSource: $LogServer, Check: $LogDetail[0], ReplayPosition: $LogDetail[2], Todo: $LogDetail[3] blocks\n";
2012-06-05 14:34:37 +00:00
# Initial Values
if ( !defined $OldCheck ) {
# new
$OldCheck = $LogDetail[0];
$OldSize = $LogDetail[2];
$allEqual = 1;
} elsif (!(( $LogDetail[0] eq $OldCheck ) and ( $LogDetail[2] eq $OldSize ))) {
# not same
$allEqual = 0;
if ( !($LogDetail[0] eq $OldCheck) && ($LogDetail[2] eq $OldSize) ) {
print_screen "\t\t---> TODO: Logfiles has not equal Checksums and same size !!!\n",'red';
2012-06-05 14:34:37 +00:00
$LogFailed = 1;
} elsif ( $LogFailed eq 0 ) {
$LogFailed = 1;
}
} else {
# same
$allEqual = 1;
}
2012-02-27 13:56:17 +00:00
2012-06-05 14:34:37 +00:00
# check bad values
if ( $LogDetail[3] < 0 ) {
print_screen "\t\t---> TODO: Found bad values = ($LogDetail[3])it's ok ???\n", 'red';
2012-06-05 14:34:37 +00:00
$LogFailed = 1;
2012-01-27 14:58:33 +00:00
}
2012-06-05 14:34:37 +00:00
} # end foreach
if ( $allEqual eq 1 ) {
$oldEqual = 1;
} else {
$oldEqual = 0;
}
### check Count Logfiles
2012-06-05 14:34:37 +00:00
if ( !($LogCount eq $LPartner) ) {
print_screen "\t\t---> TODO: Count of Logfiles different = (have:$LPartner found:$LogCount)\n", 'red';
2012-06-05 14:34:37 +00:00
$LogFailed = 1;
$oldEqual = 0;
} elsif ( $LogFailed eq 1 ) {
print_screen "\t\t---> WORK: Logfiles has not equal Checksums and different size\n", 'red';
} elsif (( $LogCountSum eq $LogCountNow ) && ( $LogFailed eq 0 )) {
print_screen "\t\t---> WORK: logfiles are actual and unused.\n",'green';
} elsif (( $oldEqual eq 1 ) && ( $LogFailed eq 0 ) && ( $OldSize eq 0 )) {
print_screen "\t\t---> WORK: Logfiles are actual and unused.\n",'green';
} elsif (( $oldEqual eq 1 ) && ( $LogFailed eq 0 )) {
print_screen "\t\t---> WORK: Logfiles has all equal Sizes and Checksums, can be deleted?\n",'green';
2012-06-05 14:34:37 +00:00
} elsif (( $oldEqual eq 1 ) && ( $LogFailed ne 0 )) {
print_screen "\t\t---> TODO: Logfiles has same other errors - Please check History of Logfiles\n",'red';
2012-06-05 14:34:37 +00:00
}
### check delete infos
$logfile =~ m|/log-(.*)$|;
my $DelLogfile = "log-$1";
my @DeleteFiles = <$mars_dir/todo-global/delete-*>;
foreach my $DeleteFiles (@DeleteFiles) {
2012-07-18 07:40:16 +00:00
if ( !(readlink $DeleteFiles) ) {
$DeleteFiles = "n/a";
} else {
$DeleteFiles = basename (readlink $DeleteFiles);
}
if ( $DeleteFiles eq $DelLogfile ) {
print_screen "\t\t---> HINT: LogFile ist marked for delete ($DeleteFiles).\n",'green';
}
}
$LogCount=0;
2012-06-05 14:34:37 +00:00
} # end logstatus
$LogCountNow++;
2012-06-05 14:34:37 +00:00
} # end foreach
2012-01-27 14:58:33 +00:00
}
2012-02-22 14:52:02 +00:00
#########################################################################################
### diskfull
sub check_disk_is_full {
2012-06-05 14:34:37 +00:00
my @diskfull = glob("$mars_dir/rest-space-*");
my $diskfull_mars = "";
print_screen "-> Diskspace on Cluster:", 'bold';
if ( @diskfull ) {
foreach ( @diskfull) {
my $diskfull_space = check_link "$_";
my $diskfull_system = $_;
$diskfull_system =~ s!/mars/rest-space-!!;
if ( $diskfull_space < 1 ) {
$diskfull_space = sprintf ("%.2f", $diskfull_space / 1024 );
if ( $diskfull_system eq $himself ) {
print_screen "\n\t-> TODO ! Local Partition $mars_dir full ($diskfull_space kb Limit) !!! mars is stopping !!!\n\n", "red";
2012-06-05 14:34:37 +00:00
$diskfull_mars = "$diskfull_mars,$diskfull_system";
} else {
print_screen "\n\t-> TODO ! Remotesystem $diskfull_system have mars-disk full ($diskfull_space kb Limit) !!!\n\n", "red";
2012-06-05 14:34:37 +00:00
$diskfull_mars = "$diskfull_mars,$diskfull_system";
}
}
}
}
# TODO /0
if ( !$diskfull_mars ) {
print_screen " ok\n", 'green';
}
2012-02-22 14:52:02 +00:00
}
#########################################################################################
### check /proc/sys/mars/warnings
sub check_mars_warn {
2012-06-05 14:34:37 +00:00
if ( open (MARS_WARN, "< /proc/sys/mars/warnings") ) {
my $mars_warn = "";
while ( <MARS_WARN> ) {
if ( m/^(\d+\.\d+)/ ) {
s/^(\d+\.\d+)/strftime("%a %b %e %H:%M:%S %Y:", localtime($1))/e;
} else {
$_ = localtime(0) . ': ' . $_;
}
s/MARS_WARN\s+//;
$mars_warn = "$mars_warn\t$_";
}
close MARS_WARN;
if ( $mars_warn ne "" ) { print_screen "-> MARS WARNINGS:\n", 'red'; print_screen "$mars_warn" }
2012-06-05 14:34:37 +00:00
}
2012-03-09 15:10:48 +00:00
}
2012-02-22 14:52:02 +00:00
#########################################################################################
### check /proc/sys/mars/errors
sub check_mars_error {
2012-06-05 14:34:37 +00:00
if ( open (MARS_ERROR, "< /proc/sys/mars/errors") ) {
my $mars_error = "";
while ( <MARS_ERROR> ) {
if ( m/^(\d+\.\d+)/ ) {
s/^(\d+\.\d+)/strftime("%a %b %e %H:%M:%S %Y:", localtime($1))/e;
} else {
$_ = localtime(0) . ': ' . $_;
}
s/MARS_ERROR\s+//;
$mars_error = "$mars_error\t$_";
2012-03-09 15:10:48 +00:00
}
2012-06-05 14:34:37 +00:00
close MARS_ERROR;
if ( $mars_error ne "" ) { print_screen "-> MARS ERRORS:\n", 'red'; print_screen "$mars_error" }
2012-06-05 14:34:37 +00:00
}
2012-02-22 14:52:02 +00:00
}
#########################################################################################
2012-06-05 14:34:37 +00:00
### info version
sub info_version {
### module
my %mars_info;
open ( my $lsmod_handle,'-|','lsmod | grep mars' ) || die "blub ... $!";
if (!<$lsmod_handle>) {
print_screen "Module Mars not running\n",'red';
sleep(10);
next;
}
open ( my $modinfo_handle, '-|', 'modinfo mars' ) || die "cannot run modinfo mars: $!";
while ( my $line = <$modinfo_handle> ) {
chomp $line;
my ( $key, $value) = split /: +/, $line;
if ( $value) {
$mars_info{$key} = $value;
}
2012-06-05 14:34:37 +00:00
}
if ( $mars_info{author} eq "") {
print_screen "Module Mars not running\n",'red';
next;
}
### status
print_screen "MARS Status - $himself, $version",'blue';
if ( $params->{'resource'} ) { print_screen ", Ressource: $params->{'resource'}",'blue'; }
print_screen "\n";
2012-06-05 14:34:37 +00:00
### marsadm
my $MAVersion = qx"marsadm version";
print_screen "MARS Admin - $MAVersion",'blue';
### module
print_screen "MARS Module - $mars_info{version}\n",'blue';
### kernel
my $KVersion = '/proc/version';
open my $Kfh, '<', "$KVersion" or die $!;
$KVersion = ( grep { /^Linux/ } <$Kfh> )[0];
$KVersion = ( split / /, $KVersion )[2];
print_screen "MARS Kernel - $KVersion\n",'blue';
print_screen "-------------------------------------------------------------------------------\n";
2012-06-05 14:34:37 +00:00
}
2012-06-05 14:34:37 +00:00
#########################################################################################
### check ressources
sub check_ressource {
opendir my $dirhandle, $mars_dir or die "Cannot open $mars_dir: $!";
my @resources = grep { /^res/ && -d "$mars_dir/$_" } readdir $dirhandle;
if ( !@resources ) {
print_screen "---> HINT: no resources found\n", 'red';
next;
2012-06-05 14:34:37 +00:00
}
2012-06-05 14:34:37 +00:00
foreach my $res (@resources) {
my $ResPartner = 0;
my $ResInReplay = 0;
my $ResInReplaySum = 0;
my $ResInReplayPar = 0;
my $ResInSync = 0;
my $ResInSyncSum = 0;
my $ResInSyncPar = 0;
my $res_name = $res;
$res_name =~ s/^resource-//;
if ( $params->{'resource'} ) {
if (!( $params->{'resource'} eq $res_name)) {
next;
}
}
my $res_size = check_link "$mars_dir/$res/size";
if ( $res_size eq 0 ) { $res_size = 1 };
my $res_tbsize = ( $res_size) / 1024 / 1024 /1024 / 1024;
my $res_master = check_link "$mars_dir/$res/primary";
if ( $res_master eq 0 ) { $res_master = "unknown" };
print_screen sprintf("-> check resource %s, with %d bytes (%.3fTB), Primary Node is %s\n", $res_name, $res_size, $res_tbsize, $res_master), 'bold';
2012-06-05 14:34:37 +00:00
### him self
print_screen " -> local node ($himself) ",'bold';
my $ActualUsedLogfile = display_partner(
ressource => $res,
nodename => $himself,
2012-06-05 14:34:37 +00:00
ressource_size => $res_size,
res_partner => \$ResPartner,
res_inreplay => \$ResInReplay,
res_insync => \$ResInSync,
res_AULogfile => "",
2012-06-05 14:34:37 +00:00
);
if ($ResInReplay ne "100.00") {
$ResInReplaySum = $ResInReplaySum + $ResInReplay;
$ResInReplayPar = $ResInReplayPar + 1;
}
if ($ResInSync ne "100.00") {
$ResInSyncSum = $ResInSyncSum + $ResInSync;
$ResInSyncPar = $ResInSyncPar + 1;
}
# end him self
2012-06-05 14:34:37 +00:00
### joined ...
if ( $ResPartner eq 1) {
### partners
opendir my $server_dh, "$mars_dir/$res" or die "Cannot open $mars_dir/$res: $!";
my @servers = grep { /^data/ && readlink "$mars_dir/$res/$_" } readdir $server_dh;
@servers = sort (@servers);
foreach my $partner (@servers) {
$partner =~ s/^data-//;
if ( $partner eq $himself ) { next; }
print_screen " -> remote node ($partner) ", 'bold';
display_partner(
ressource => $res,
nodename => $partner,
2012-06-05 14:34:37 +00:00
ressource_size => $res_size,
res_partner => \$ResPartner,
res_inreplay => \$ResInReplay,
res_insync => \$ResInSync,
res_AULogfile => $ActualUsedLogfile,
2012-06-05 14:34:37 +00:00
);
if ($ResInReplay ne "100.00") {
$ResInReplaySum = $ResInReplaySum + $ResInReplay;
$ResInReplayPar = $ResInReplayPar + 1;
}
if ($ResInSync ne "100.00") {
$ResInSyncSum = $ResInSyncSum + $ResInSync;
$ResInSyncPar = $ResInSyncPar + 1;
}
2012-06-05 14:34:37 +00:00
}
} # end joined
2012-06-05 14:34:37 +00:00
### modus
if ( $ResPartner eq 0 ) {
2012-06-05 14:34:37 +00:00
if ( $params->{'long'} ) { print_screen " -> modus for $res_name is remote ($ResPartner nodes)\n",'bold'; }
} elsif ( $ResPartner eq 1 ) {
if ( $params->{'long'} ) { print_screen " -> modus for $res_name is standalone ($ResPartner node)\n",'bold'; }
} else {
print_screen " -> modus for $res_name is clustered ($ResPartner nodes), ",'bold';
if ( $ResInReplayPar eq 0 ) {
$ResInReplaySum = "100.00";
} else {
$ResInReplaySum = sprintf("%.2f", $ResInReplaySum / $ResInReplayPar );
}
if ( $ResInSyncPar eq 0 ) {
$ResInSyncSum = "100.00";
} else {
$ResInSyncSum = sprintf("%.2f", $ResInSyncSum / $ResInSyncPar );
}
print_screen "ClusterSummary: ";
2012-06-05 14:34:37 +00:00
if ( $ResInReplaySum eq "100.00" ) {
print_screen "in replay ($ResInReplaySum%),", 'green';
} elsif ( $ResInReplaySum eq "0.00" ) {
print_screen "replay inaktiv ($ResInReplaySum%),", 'red';
2012-06-05 14:34:37 +00:00
} else {
print_screen "not in replay ($ResInReplaySum%),", 'red';
}
if ( $ResInSyncSum eq "100.00" ) {
print_screen " in sync ($ResInSyncSum%)\n", 'green';
} else {
print_screen " not in sync ($ResInSyncSum%)\n", "red";
}
} # end modus
2012-06-05 14:34:37 +00:00
### debug output
if ( $params->{'long'} ) {
### history
if ( $params->{'history'} ) {
check_logfile( $res, $ResPartner );
}
} # end debug
} # end foreach
2012-02-22 14:52:02 +00:00
2012-06-05 14:34:37 +00:00
}
2012-02-22 14:52:02 +00:00
#########################################################################################
### avg_limit
sub check_jammed {
my $jammed = check_link "$mars_dir/jammed-$himself";
print_screen "-> Mars-Transaktion ", 'bold';
if (( !$jammed ) || ( $jammed ne 0 )) {
print_screen "running normaly\n", 'green';
} else {
print_screen "and Replication not runnunig !!!\n", 'red';
}
}
#########################################################################################
### limit's auslesen ...
sub check_limit {
my $LimitL = shift;
my $LimitT = shift;
my $LimitE = shift;
my $mars_limit;
if ( open (MARS_LIMIT, "< /proc/sys/mars/$LimitL") ) {
while (<MARS_LIMIT>) {
$mars_limit = $_;
$mars_limit =~ s/[\n\t]//g;
}
close MARS_LIMIT;
}
print_screen "-> $LimitT: ", 'bold';
if (( !$mars_limit ) || ( $mars_limit < "1" )) {
print_screen "unset, used full speed\n", '';
} else {
print_screen "is $mars_limit $LimitE\n", 'red';
}
}
2012-06-05 14:34:37 +00:00
#########################################################################################
### main loop ...
while(1) {
my $dateFormat = Date::Language->new('English');
### version only
if ( $params->{version} || $params->{v}) {
info_version;
exit 0;
}
#########################################################################################
### main run
print $clearscreen;
### set long by monitor as default
if ( $params->{'monitor'} ) {
$params->{'long'} = 1;
$params->{'history'} = 1;
}
2012-06-05 14:34:37 +00:00
### read mars infos
if ( $params->{'long'} ) {
# read mars info
info_version;
# check system limits
check_limit "loadavg_limit", "AVG-Limit", "";
check_limit "network_traffic_limit_kb", "Network-Traffic-Limit", "kb/s";
check_limit "percent_mem_limit_kb", "Memory-Limit", "kb/s";
check_limit "server_io_limit_mb", "Server-IO-Limit", "mb/s";
check_limit "free_space_mb", "Free-Space-Limit on /mars", "mb";
check_limit "logdel_auto_gb", "Free-Space-Limit for Auto-Log-Delete", 'gb';
check_limit "logrot_auto_gb", "Free-Space-Limit for Auto-Log-Rotate", 'gb';
# check system params
check_jammed;
check_disk_is_full;
2012-06-05 14:34:37 +00:00
}
### check resources
check_ressource;
### debug output
if ( $params->{'long'} ) {
### mars-warn/error
if ( $params->{'debug'} ) {
check_mars_warn;
check_mars_error;
}
}
2012-02-22 14:52:02 +00:00
### end, exit for monitor
if ( $params->{'monitor'} ) {
my %hilf;
foreach (@StatusLines) {
$hilf{$_} = 1;
}
print "$StatusCode : ";
print join(" || ", keys %hilf);
if ( $StatusCode eq 'ERROR') {
exit 1;
} else {
exit 0;
}
}
### end, next loop
2012-06-05 14:34:37 +00:00
print color 'reset';
exit if (not $params->{'interval'});
sleep($params->{'interval'});
2012-01-27 14:58:33 +00:00
}
exit;