mars/userspace/marsadm

432 lines
13 KiB
Plaintext
Raw Normal View History

2011-02-23 20:48:06 +00:00
#!/usr/bin/perl -w
# (c) 2010 Thomas Schoebel-Theuer / 1&1 Internet AG
use strict;
use English;
use warnings;
# Root of the symlink tree that every command below reads and writes.
my $mars = "/mars";

# Local node name as printed by `uname -n`; used as suffix of per-host entries.
my $host = `uname -n` or die "cannot determine my network node name\n";
chomp $host;

# Extract one IPv4 address from the `ip a` listing, skipping 127.0.* entries.
# Because the leading `.*` is greedy, the last matching "inet" entry is used.
my $ip = `ip a` or die "cannot determine my IP address\n";
$ip =~ s/\A.*inet +(?!127\.0\.)([0-9]+\.[0-9]+\.[0-9]+\.[0-9]+).*?\Z/$1/ms or die "cannot parse my IP address\n";
chomp $ip;
print "my IP is $ip\n";

# Everything created from here on is accessible to the owner only.
umask 0077;

# $EUID (provided by "use English") is the effective user id; checking it
# directly avoids spawning whoami(1) and depending on the account being
# literally named "root".
die "only root may use this tool\n" unless $EUID == 0;
2011-02-23 20:48:06 +00:00
##################################################################
# syntactic checks
# Validate an identifier given on the command line.
# Dies unless it starts with a letter or underscore, continues with letters,
# digits, '_' or '-', and is at most 16 characters long.
sub check_id {
    my ($ident) = @_;
    if ($ident !~ m/^[A-Za-z_][-A-Za-z0-9_]*$/) {
        die "identifier '$ident' has disallowed characters";
    }
    if (length($ident) > 16) {
        die "identifier '$ident' is too long (only 16 chars allowed)";
    }
}
##################################################################
# semantic checks
# Resolve a user-supplied resource name to the name of an existing resource.
#
# If "$mars/resource-$res" is a directory, $res is returned unchanged.
# Otherwise ("do what I mean") $res is compared against the targets of the
# local device-$host symlinks of all resources and, only if none of those
# matches, against the part after the last comma of the _direct-*-$host
# symlink targets.  Exactly one match is required; the resource owning that
# link is then returned and a warning about the substitution is emitted.
# Dies when there is no match or the match is ambiguous.
sub check_res {
    my $res = shift;
    return $res if -d "$mars/resource-$res";

    # Each entry: [glob pattern, whether to strip everything up to the last comma].
    my @lookups = (
        ["$mars/resource-*/device-$host",    0],
        ["$mars/resource-*/_direct-*-$host", 1],
    );
    my @matches;
    foreach my $lookup (@lookups) {
        my ($pattern, $strip_prefix) = @$lookup;
        foreach my $link (glob($pattern)) {
            my $target = readlink($link);
            # Entries that are not (or no longer) symlinks cannot match.
            next unless defined $target;
            $target =~ s/^.*,// if $strip_prefix;
            push @matches, $link if $target eq $res;
        }
        # The second lookup is only a fallback for the first one.
        last if @matches;
    }

    my $count = scalar @matches;
    die "resource '$res' does not exist ($count replacements found)\n" unless $count == 1;

    # Reduce the matching link path to the name of its resource directory.
    my $found = $matches[0];
    $found =~ s:^.*/resource-(.*)/.*$:$1:;
    warn "substituting bad resource name '$res' by uniquely matching resource name '$found'\n";
    return $found;
}
2011-02-27 14:17:58 +00:00
# Die unless this host has a data-$host entry in the given resource,
# i.e. unless it has already joined the resource.
sub check_res_member {
    my ($res) = @_;
    my $marker = "$mars/resource-$res/data-$host";
    if (!-e $marker) {
        die "sorry, I have not yet joined to resource '$res'\n";
    }
}
# Parse a size specification such as "4096", "10g" or "1.5T" into bytes.
#
# Accepted: a non-negative decimal number, optionally followed by one of the
# binary suffixes k, m, g, t, p (case-insensitive, powers of 1024).
# Returns the size as a whole number of bytes (fractions are truncated),
# or -1 if the argument is not a well-formed size, e.g. a device path.
sub get_size {
    my $arg = shift;
    return -1 unless defined $arg;
    # Exactly one number with at most one decimal point, then the suffix.
    return -1 unless $arg =~ m/\A([0-9]+(?:\.[0-9]*)?|\.[0-9]+)([kmgtp]?)\z/i;
    my ($number, $suffix) = ($1, lc $2);
    my %exponent_of = ('' => 0, k => 1, m => 2, g => 3, t => 4, p => 5);
    return int($number * 1024 ** $exponent_of{$suffix});
}
##################################################################
2011-02-27 14:17:58 +00:00
# helpers
2011-03-03 09:02:10 +00:00
# Run `modprobe mars_proc` and then write "1" to /proc/sys/mars through the
# shell.  Output of the write is discarded and the exit status is not checked.
# NOTE(review): presumably this prompts the kernel module to re-read the
# symlink tree -- confirm against the kernel side.
sub _trigger {
    my $shell_cmd = "modprobe mars_proc; (echo 1 > /proc/sys/mars) >/dev/null 2>&1";
    system($shell_cmd);
}
2011-02-27 14:17:58 +00:00
# Set an on/off switch, represented as a symlink whose target is "1" or "0".
#
#   $cmd   command name used in progress messages; no messages if empty
#   $res   resource name, used in messages only
#   $path  path of the switch symlink
#   $on    true to set the switch to "1", false to set it to "0"
#
# Nothing is changed when the switch already has the requested value.
# Otherwise a new symlink is created under a temporary name and renamed over
# $path, so the switch is replaced in one step.  Dies if the symlink cannot be
# created or renamed.
sub _switch {
    my ($cmd, $res, $path, $on) = @_;
    my $src = $on ? "1" : "0";
    my $old = readlink($path);
    # Test definedness, not truth: an existing "0" switch is a false value.
    if (defined $old && $old eq $src) {
        print "${cmd} on resource $res is already activated\n" if $cmd;
        return;
    }
    # Temporary name ".tmp.<name>" in the same directory as the switch itself.
    my $tmp = $path;
    $tmp =~ s{/([^/]+)\z}{/.tmp.$1} or $tmp = ".tmp.$path";
    # A leftover from an interrupted run would make symlink() fail.
    unlink($tmp);
    symlink($src, $tmp) or die "cannot create switch symlink\n";
    rename($tmp, $path) or die "cannot rename switch symlink\n";
    print "successfully started ${cmd} on resource $res\n" if $cmd;
}
# Set or clear the owner-write bit of $path.
#
#   $path  file whose mode is changed
#   $on    true to add owner write permission, false to remove it
#
# Only the owner bits (0700) of the current mode are carried over; group and
# other bits end up cleared.  Old and new mode are printed as decimal numbers.
# Dies if the file cannot be examined or its mode cannot be changed.
sub _writable {
    my ($path, $on) = @_;
    my @st = lstat($path) or die "cannot stat '$path'\n";
    my $oldmode = $st[2] & 0700;
    my $newmode = $on ? $oldmode | 0200 : $oldmode & ~0200;
    print "chmod '$path' $oldmode $newmode\n";
    chmod($newmode, $path) == 1 or die "cannot chmod '$path'\n";
}
##################################################################
2011-02-23 20:48:06 +00:00
# commands
# Handler for commands that are accepted but do nothing:
# prints a notice and terminates the program with exit status 0.
sub ignore_cmd {
    my $cmd = shift;
    my $res = shift;
    print "ignoring command '$cmd' on resource '$res'\n";
    exit 0;
}
# Handler for commands that have no meaning here:
# prints a notice and terminates the program with exit status 0.
sub senseless_cmd {
    my $cmd = shift;
    print "command '$cmd' makes no sense with MARS (ignoring)\n";
    exit 0;
}
# Handler for commands that are refused outright: always dies.
sub forbidden_cmd {
    my $cmd = shift;
    die "command '$cmd' cannot be used with MARS (it is impossible to carry out uniquely and could therefore lead to a disaster)\n";
}
# Handler for commands that are recognised but not implemented: always dies.
sub nyi_cmd {
    my $cmd = shift;
    die "command '$cmd' is not yet implemented\n";
}
2011-03-23 08:09:00 +00:00
# Create the basic directory layout below $mars (ips, defaults,
# defaults-$host) if it is missing, and register this host's IP address as
# the symlink $mars/ips/ip-$host.
#
# The arguments are accepted for symmetry with the command handlers but are
# not used.  Dies if a missing directory cannot be created.
sub _create_system {
    my ($cmd, $peer, $force) = @_;
    foreach my $dir ($mars, "$mars/ips", "$mars/defaults", "$mars/defaults-$host") {
        next if -d $dir;
        mkdir($dir) or die "cannot create directory '$dir': $!\n";
    }
    # Deliberately unchecked: the link already exists on every call but the first.
    symlink($ip, "$mars/ips/ip-$host");
}
# Command handler: set up the basic directory layout.
# Refuses to run when $mars/ips already exists, unless a true third
# argument ($force) is given.
sub create_system {
    my ($cmd, $peer, $force) = @_;
    if (!$force && -d "$mars/ips") {
        die "system is already created\n";
    }
    _create_system(@_);
}
2011-02-23 20:48:06 +00:00
# Command handler: join the system that $peer belongs to.
#
#   $cmd    command name (unused here)
#   $peer   host name of a node that is already part of the system
#   $force  must contain "--force" if local resources already exist
#
# Creates the local directory layout, copies the peer's $mars/ips/ directory
# here with rsync, registers the local IP, and copies the directory back to
# the peer.  Dies if local resources exist without --force or if an rsync
# run fails.
sub join_system {
    my ($cmd, $peer, $force) = @_;
    # List context: we only want to know whether any resource exists.
    my @existing = glob("$mars/resource-*");
    if (@existing) {
        die "Sorry, some resources already exist!\nThis is dangerous!\nIf you are sure that no resource clash is possible, re-invoke this command with '--force' option\n" unless ($force and $force =~ m/--force/);
    }
    print "joining system via rsync (peer='$peer')\n";
    _create_system(@_);
    # List-form system(): arguments reach rsync without passing through a shell.
    my @rsync = ("rsync", "--recursive", "--links", "-v");
    system(@rsync, "$peer:$mars/ips/", "$mars/ips/") == 0 or die "oops\n";
    symlink($ip, "$mars/ips/ip-$host");
    system(@rsync, "$mars/ips/", "$peer:$mars/ips/") == 0 or die "oops\n";
}
# Command handler for "create-resource" and "join-resource".
#
#   $cmd     "create-resource" creates a new resource; any other value joins
#            an existing one
#   $res     resource name
#   $dev     either a size (see get_size) or the absolute path of a block device
#   $appear  optional name under which the resource appears in /dev/mars/
#
# With a size argument a sparse file data-$host of that size is created; with
# a device argument data-$host becomes a symlink to the device.  A new
# resource is assembled in "$mars/.tmp.$res" and renamed into place at the
# end; joining works directly inside the existing resource directory.
# Dies on any inconsistency or failed step.
sub create_res {
    my ($cmd, $res, $dev, $appear) = @_;
    use Fcntl qw(SEEK_SET SEEK_END);
    my $create = ($cmd eq "create-resource");
    die "undefined device or size argument\n" unless $dev;
    check_id($appear) if $appear;
    if ($create) {
        die "resource '$res' already exists\n" if -d "$mars/resource-$res";
        print "creating new resource '$res'\n";
    } else {
        print "joining to existing resource '$res'\n";
    }

    # Decide whether $dev is a size or a block device and determine the size.
    my $size = get_size($dev);
    if ($size > 0) {
        $dev = "";
    } else {
        die "block device '$dev' does not exist\n" unless -b $dev;
        die "block device '$dev' must be an absolute path starting with '/'\n" unless $dev =~ m/^\//;
        open(my $probe, "<", $dev) or die "cannot open device for reading\n";
        # Seeking to the end yields the device size in bytes.
        $size = sysseek($probe, 0, SEEK_END);
        close($probe);
        die "cannot determine size of device '$dev'\n" unless defined $size;
        print "device size = $size bytes\n";
        die "implausible size" unless $size > 0;
    }

    my $tmp = "$mars/.tmp.$res";
    my $primary;
    my $replay;
    if ($create) {
        _create_system(@_);
        # Remove leftovers of an earlier, interrupted attempt.
        system("rm", "-rf", $tmp);
        mkdir($tmp) or die "could not create resource '$res'\n";
        symlink($size, "$tmp/size") or die "cannot create size indicator symlink\n";
    } else {
        $tmp = "$mars/resource-$res";
        die "resource '$res' does not exist\n" unless -d $tmp;
        $primary = readlink("$tmp/primary") or die "cannot determine primary\n";
        die "resource '$res' is already joined\n" if -e "$tmp/data-$host";
        die "my ip '$ip' is not registered -- please run 'join-system' first\n" unless -l "$mars/ips/ip-$host";
        my $oldsize = readlink("$tmp/size") or die "cannot determine old size\n";
        # NOTE(review): a smaller local size is silently raised to the resource
        # size, even when $dev is a real device -- confirm this is intended.
        if ($size < $oldsize) {
            print "adjusting size to $oldsize\n";
            $size = $oldsize;
        }
        die "sizes differ: real size = $oldsize, but requested size = $size\n" unless $oldsize == $size;
        # Start from the primary's replay position, rewritten to our host name.
        $replay = readlink("$tmp/replay-$primary") or die "cannot read replay status of primary '$primary'\n";
        # \Q..\E: host names may contain regex metacharacters such as '.'.
        $replay =~ s/-\Q$primary\E,/-$host,/ or die "something is wrong here\n";
    }

    my $file = "$tmp/data-$host";
    if (!$dev) {
        print "creating sparse file '$file' with size $size\n";
        open(my $out, ">", $file) or die "could not open '$file'\n";
        my $pos = sysseek($out, $size - 1, SEEK_SET);
        die "could not seek\n" unless defined $pos && $pos == $size - 1;
        # Double quotes are required: '\0' would be a backslash followed by '0'.
        my $written = syswrite($out, "\0", 1);
        die "cannot init sparse file\n" unless defined $written && $written == 1;
        close($out) or die "cannot close '$file'\n";
    } else {
        print "using existing device '$dev'\n";
        symlink($dev, $file) or die "cannot create device symlink\n";
    }

    if ($appear) {
        # TODO: check for uniqueness of $appear
        print "resource '$res' will appear as local device '/dev/mars/$appear'\n";
        unlink("$tmp/device-$host");
        symlink($appear, "$tmp/device-$host") or die "cannot create symlink for local device appearance\n";
    }

    # Per-host directories and initial switch settings.  These calls are
    # unchecked, as in the original.
    mkdir("$tmp/defaults") unless -d "$tmp/defaults";
    mkdir("$tmp/defaults-$host");
    mkdir("$tmp/actual-$host");
    mkdir("$tmp/switch-$host");
    symlink("1", "$tmp/switch-$host/attach");
    symlink("0", "$tmp/switch-$host/connect");
    symlink("0", "$tmp/switch-$host/sync");

    if ($create) {
        symlink($host, "$tmp/primary") or die "cannot create primary symlink\n";
        symlink("log-000000001-$host,0,0", "$tmp/replay-$host") or die "cannot create replay status\n";
        # Publish the fully assembled resource in one step.
        rename($tmp, "$mars/resource-$res") or die "cannot finalize resource '$res'\n";
        print "successfully created resource '$res'\n";
    } else {
        unlink("$tmp/replay-$host");
        symlink($replay, "$tmp/replay-$host") or die "cannot create replay status\n";
        unlink("$tmp/syncstatus-$host");
        symlink("0", "$tmp/syncstatus-$host") or die "cannot start initial sync\n";
        unlink("$tmp/connect-$host");
        symlink($primary, "$tmp/connect-$host") or die "cannot create peer connect symlink\n";
        symlink($host, "$tmp/connect-$primary") unless -l "$tmp/connect-$primary";
        print "successfully joined resource '$res'\n";
    }
}
# Command handler for "attach" and "detach": sets this host's attach switch
# of the resource to on, or to off when $cmd is "detach".
sub attach_res {
    my ($cmd, $res) = @_;
    my $enable = ($cmd ne "detach");
    my $switch = "$mars/resource-$res/switch-$host/attach";
    _switch($cmd, $res, $switch, $enable);
}
# Command handler for "connect" and "disconnect": sets this host's connect
# switch of the resource to on, or to off when $cmd is "disconnect".
sub connect_res {
    my ($cmd, $res) = @_;
    my $enable = ($cmd ne "disconnect");
    my $switch = "$mars/resource-$res/switch-$host/connect";
    _switch($cmd, $res, $switch, $enable);
}
# Command handler for "pause-sync" and "resume-sync": sets this host's sync
# switch of the resource to off for "pause-sync" and to on otherwise.
sub pause_res {
    my ($cmd, $res) = @_;
    my $enable = ($cmd ne "pause-sync");
    my $switch = "$mars/resource-$res/switch-$host/sync";
    _switch($cmd, $res, $switch, $enable);
}
# Command handler for "up" and "down".
# "down" pauses sync, disconnects and detaches, in that order; anything else
# attaches, connects and resumes sync.
sub up_res {
    my ($cmd, $res) = @_;
    # Each step is [handler, sub-command passed to the handler].
    my @steps = ($cmd eq "down")
        ? ([\&pause_res,   "pause-sync"],
           [\&connect_res, "disconnect"],
           [\&attach_res,  "detach"])
        : ([\&attach_res,  "attach"],
           [\&connect_res, "connect"],
           [\&pause_res,   "resume-sync"]);
    foreach my $step (@steps) {
        my ($handler, $subcmd) = @$step;
        $handler->($subcmd, $res);
    }
}
# Command handler for "primary" and "secondary".
#
# "secondary": allowed only while this host is the primary; the primary link
#              of the resource is then set to "(none)".
# "primary":   does nothing if this host is already primary.  Otherwise, if a
#              syncstatus-$host link exists, its value must have reached the
#              resource size before the primary link is set to this host.
#
# The primary link is replaced by creating a temporary symlink and renaming it
# over the old one.  Dies when the switch is not permitted or a step fails.
sub primary_res {
    my ($cmd, $res) = @_;
    my $sec = ($cmd eq "secondary");
    my $pri = "$mars/resource-$res/primary";
    my $old = readlink($pri) or die "cannot determine current primary\n";
    # Keep the new link target in a local variable: the file-level $host must
    # stay intact for the remaining resources of an "all" run.
    my $new = $host;
    if ($sec) {
        die "for safety reasons, switching to secondary is only allowed when I am primary\n" if ($old ne $host);
        $new = "(none)";
    } elsif ($old eq $host) {
        print "I am already primary.\n";
        # Return instead of exiting, so an "all" run continues with the next resource.
        return;
    } else {
        my $lnk = "$mars/resource-$res/syncstatus-$host";
        if (lstat($lnk)) {
            my $syncstatus = readlink($lnk);
            # Something that is not a symlink counts as "nothing transferred".
            $syncstatus = 0 unless defined $syncstatus;
            my $size = readlink("$mars/resource-$res/size") or die "cannot read size\n";
            die "sync has not yet finished, only $syncstatus / $size bytes transferred\n" unless $syncstatus >= $size;
        }
    }
    # TODO: check whether we can switch without interrupting service....
    my $tmp = "$mars/resource-$res/.tmp.primary";
    unlink($tmp);
    symlink($new, $tmp) or die "cannot create new primary symlink\n";
    rename($tmp, $pri) or die "cannot install new primary symlink\n";
    print "primary changed from '$old' to '$new'\n";
}
2011-02-27 14:17:58 +00:00
# Command handler for "invalidate": resets this host's syncstatus link of the
# resource to "0".  Refused when this host is the current primary.
sub invalidate_res {
    my ($cmd, $res) = @_;
    my $resdir = "$mars/resource-$res";
    my $old = readlink("$resdir/primary") or die "cannot determine current primary\n";
    my $dst = "$resdir/syncstatus-$host";
    if ($old eq $host) {
        die "primary side cannot be invalidated\n";
    }
    system("rm -f $dst");
    symlink("0", $dst) or die "cannot create invalidation symlink '$dst'\n";
}
2011-02-23 20:48:06 +00:00
# Command handler for "role" and "state": prints "primary" if the resource's
# primary link names this host, "secondary" otherwise.
sub role_cmd {
    my ($cmd, $res) = @_;
    my $current = readlink("$mars/resource-$res/primary") or die "cannot determine current primary\n";
    my $role = ($current eq $host) ? "primary" : "secondary";
    print "$role\n";
}
##################################################################
# Dispatch table: command keyword => handler.
# Handlers are called as handler($cmd, $res, @remaining_arguments).
my %cmd_table = (
    # new keywords
    "create-system"     => \&create_system,
    "join-system"       => \&join_system,
    "create-resource"   => \&create_res,
    "join-resource"     => \&create_res,

    # compatible keywords
    "attach"            => \&attach_res,
    "detach"            => \&attach_res,
    "connect"           => \&connect_res,
    "disconnect"        => \&connect_res,
    "syncer"            => \&ignore_cmd,
    "up"                => \&up_res,
    "down"              => \&up_res,
    "primary"           => \&primary_res,
    "secondary"         => \&primary_res,
    "invalidate"        => \&invalidate_res,
    "invalidate-remote" => \&forbidden_cmd,
    "resize"            => \&nyi_cmd,
    "create-md"         => \&senseless_cmd,
    "get-gi"            => \&ignore_cmd,
    "show-gi"           => \&ignore_cmd,
    "dump-md"           => \&senseless_cmd,
    "outdate"           => \&ignore_cmd,
    "adjust"            => \&ignore_cmd,
    "wait-connect"      => \&nyi_cmd,
    "role"              => \&role_cmd,
    "state"             => \&role_cmd,
    "cstate"            => \&nyi_cmd,
    "status"            => \&nyi_cmd,
    "dump"              => \&senseless_cmd,
    "verify"            => \&nyi_cmd,
    "pause-sync"        => \&pause_res,
    "resume-sync"       => \&pause_res,
    "new-current-uuid"  => \&senseless_cmd,
    "dstate"            => \&nyi_cmd,
    "hidden-commands"   => \&ignore_cmd,
);
# Command line: <command> <resource> [further arguments...].
# Both leading arguments are mandatory; the command must be a known keyword
# and the resource argument must be a valid identifier.
my $cmd = shift(@ARGV) || die "command argument is missing\n";
my $res = shift(@ARGV) || die "resource argument is missing\n";
unless (exists $cmd_table{$cmd}) {
    die "unknown command '$cmd'\n";
}
check_id($res);
2011-03-02 16:20:36 +00:00
# Run one command on one resource.
#
#   $cmd  command keyword; must be a key of %cmd_table
#   $res  resource name (or peer name for the *-system commands)
#   @_    remaining arguments, passed through to the handler
#
# Except for commands that operate before the resource exists, the resource
# name is first resolved with check_res() and membership of this host is
# verified with check_res_member().
sub do_res {
    my $cmd = shift;
    my $res = shift;
    # create-system, join-system and create-resource run before the named
    # resource exists, so no existing resource can be looked up for them.
    $res = check_res($res) unless $cmd =~ m/^((create|join)-system|create-resource)$/;
    check_res_member($res) unless $cmd =~ m/^(join|create)-(system|resource)$/;
    my $func = $cmd_table{$cmd};
    $func->($cmd, $res, @_);
}
# Dispatch: the pseudo resource "all" runs the command on every resource this
# host has a data-$host entry in; any other name runs it on that resource.
# Afterwards _trigger() is called.
if ($res ne "all") {
    do_res($cmd, $res, @ARGV);
} else {
    foreach $res (glob("$mars/resource-*")) {
        # Skip resources this host has not joined.
        next unless -e "$res/data-$host";
        # Reduce the directory path to the bare resource name.
        $res =~ s/^.*\/resource-(.*)$/$1/;
        print "--------- resource $res\n";
        do_res($cmd, $res, @ARGV);
    }
}
_trigger();