#LyX 2.3 created this file. For more info see http://www.lyx.org/
\lyxformat 544
\begin_document
\begin_header
\save_transient_properties true
\origin unavailable
\textclass scrreprt
\begin_preamble
\usepackage{listings}
\end_preamble
\options abstracton,most,usenames,dvipsnames
\use_default_options true
\begin_modules
customHeadersFooters
enumitem
fixltx2e
tcolorbox
\end_modules
\maintain_unincluded_children false
\language english
\language_package default
\inputencoding auto
\fontencoding global
\font_roman "default" "default"
\font_sans "default" "default"
\font_typewriter "default" "default"
\font_math "auto" "auto"
\font_default_family rmdefault
\use_non_tex_fonts false
\font_sc false
\font_osf false
\font_sf_scale 100 100
\font_tt_scale 100 100
\use_microtype false
\use_dash_ligatures false
\graphics default
\default_output_format default
\output_sync 0
\bibtex_command default
\index_command default
\paperfontsize 10
\spacing single
\use_hyperref true
\pdf_title "MARS User Manual"
\pdf_author "Thomas Schöbel-Theuer"
\pdf_bookmarks true
\pdf_bookmarksnumbered false
\pdf_bookmarksopen true
\pdf_bookmarksopenlevel 2
\pdf_breaklinks true
\pdf_pdfborder true
\pdf_colorlinks true
\pdf_backref section
\pdf_pdfusetitle true
\papersize a4paper
\use_geometry true
\use_package amsmath 1
\use_package amssymb 1
\use_package cancel 1
\use_package esint 1
\use_package mathdots 1
\use_package mathtools 1
\use_package mhchem 1
\use_package stackrel 1
\use_package stmaryrd 1
\use_package undertilde 1
\cite_engine basic
\cite_engine_type default
\biblio_style plain
\use_bibtopic false
\use_indices false
\paperorientation portrait
\suppress_date false
\justification true
\use_refstyle 1
\use_minted 0
\index Index
\shortcut idx
\color #008000
\end_index
\leftmargin 3.7cm
\topmargin 2.7cm
\rightmargin 2.8cm
\bottommargin 2.3cm
\secnumdepth 3
\tocdepth 3
\paragraph_separation indent
\paragraph_indentation default
\is_math_indent 0
\math_numbering_side default
\quotes_style english
\dynamic_quotes 0
\papercolumns 1
\papersides 2
\paperpagestyle headings
\tracking_changes false
\output_changes false
\html_math_output 0
\html_css_as_file 0
\html_be_strict false
\end_header
\begin_body
\begin_layout Standard
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
title{MARS User Manual}
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\begin_inset CommandInset include
LatexCommand input
preview true
filename "common-front-matter.lyx"
\end_inset
\end_layout
\begin_layout Chapter*
Preface
\end_layout
\begin_layout Section*
Introduction
\end_layout
\begin_layout Standard
\begin_inset CommandInset include
LatexCommand input
preview true
filename "common-introduction.lyx"
\end_inset
\end_layout
\begin_layout Section*
Purpose
\end_layout
\begin_layout Standard
This document explains how to install, setup and run a storage replication
system on a Linux based platform using MARS.
\end_layout
\begin_layout Standard
MARS is free software under GPL.
The terms and conditions of the GPL apply.
This documentation is
\emph on
best effort
\emph default
and may contain bugs (no warranty, according to the GPL).
\end_layout
\begin_layout Section*
Scope
\end_layout
\begin_layout Standard
The following topics are covered withing this document:
\end_layout
\begin_layout Itemize
preconditions: what you need.
\end_layout
\begin_layout Itemize
creating a Linux kernel module for MARS.
\end_layout
\begin_layout Itemize
creation of a MARS cluster.
\end_layout
\begin_layout Itemize
creation and operation of MARS resources.
\end_layout
\begin_layout Itemize
dynamic creation / deletion of additional replicas, and how migrate data
this way.
\end_layout
\begin_layout Itemize
hints for monitoring.
\end_layout
\begin_layout Itemize
troubleshooting
\end_layout
\begin_layout Section*
Audience
\end_layout
\begin_layout Standard
This document is written for experienced sysadmins with working knowledge
on the following methods and technologies:
\end_layout
\begin_layout Itemize
Setup and operation of LVM (Logical Volume Manager) under Linux.
\end_layout
\begin_layout Itemize
Operation of storage systems.
\end_layout
\begin_layout Itemize
Ability to patch and to compile and install a customized Linux kernel.
Most patches are already provided ready-to-use, so no full developer knowledge
is needed.
\end_layout
\begin_layout Section*
How to use this document
\end_layout
\begin_layout Standard
Please start with the very short introduction
\begin_inset CommandInset ref
LatexCommand formatted
reference "chap:Briefing:-how-MARS"
plural "false"
caps "false"
noprefix "false"
\end_inset
\begin_inset CommandInset ref
LatexCommand nameref
reference "chap:Briefing:-how-MARS"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Standard
If you want to install MARS, read
\begin_inset CommandInset ref
LatexCommand nameref
reference "chap:Quick-Start-Guide"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Standard
If you just want to operate a MARS installation which is already set up,
go on to
\begin_inset CommandInset ref
LatexCommand nameref
reference "chap:HOWTO-operation-of"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Standard
If you already have some experiences with MARS and just need some details
about marsadm commands, chapter
\begin_inset CommandInset ref
LatexCommand nameref
reference "chap:The-Sysadmin-Interface"
plural "false"
caps "false"
noprefix "false"
\end_inset
is a kind of
\begin_inset Quotes eld
\end_inset
reference
\begin_inset Quotes erd
\end_inset
for you.
\end_layout
\begin_layout Standard
Users who want to go deeper into tuning should read
\begin_inset CommandInset ref
LatexCommand nameref
reference "chap:Tuning,-tips-and"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Standard
Automation via interfacing to
\family typewriter
systemd
\family default
is described in
\begin_inset CommandInset ref
LatexCommand nameref
reference "chap:Advanced-users:-automation"
plural "false"
caps "false"
noprefix "false"
\end_inset
, as well as tips for writing your own automation scripts.
\end_layout
\begin_layout Standard
Appendix
\begin_inset CommandInset ref
LatexCommand vref
reference "chap:FAQ"
plural "false"
caps "false"
noprefix "false"
\end_inset
answers a few
\begin_inset CommandInset ref
LatexCommand nameref
reference "chap:FAQ"
plural "false"
caps "false"
noprefix "false"
\end_inset
s by the inventor of MARS.
\end_layout
\begin_layout Standard
Appendix
\begin_inset CommandInset ref
LatexCommand vref
reference "chap:Technical-Data-MARS"
plural "false"
caps "false"
noprefix "false"
\end_inset
contains some estimations for typical datacenter hardware, called
\begin_inset CommandInset ref
LatexCommand nameref
reference "chap:Technical-Data-MARS"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Standard
Some non-standard expert tricks (e.g.
for mass operation of thousands of instances) can be found in the following
appendices.
\end_layout
\begin_layout Section*
Related documents
\end_layout
\begin_layout Itemize
\family typewriter
mars-architecture-guide.pdf
\family default
: explains usage scenarios.
\end_layout
\begin_layout Itemize
\family typewriter
football-user-manual.pdf
\family default
: for sysadmins and userspace developers who want to use Football.
\end_layout
\begin_layout Itemize
\family typewriter
mars-for-kernel-developers.pdf
\family default
: some infos for kernel developers.
\end_layout
\begin_layout Standard
\begin_inset CommandInset toc
LatexCommand tableofcontents
\end_inset
\end_layout
\begin_layout Chapter
Briefing: how MARS works
\begin_inset CommandInset label
LatexCommand label
name "chap:Briefing:-how-MARS"
\end_inset
\end_layout
\begin_layout Section
Typical MARS replication setup
\begin_inset CommandInset label
LatexCommand label
name "sec:Typical-MARS-replication"
\end_inset
\end_layout
\begin_layout Standard
Typical recommended usage is replication of multiple Logical Volumes (LVs)
directly at bare metal (never inside of VMs), similar to DRBD:
\end_layout
\begin_layout Standard
\noindent
\align center
\begin_inset Graphics
filename images/typical-mars-setup.fig
width 100col%
\end_inset
\end_layout
\begin_layout Standard
\noindent
At the primary (active) side A, the applications are running.
At each of the secondary (passive) sides B and C, only the underlying LV
replicas are updated via the replication network traffic.
The filesystem is not mounted at any secondary side, and the applications
are not running there.
However, the roles may be switched at any time, and then the application
will for example run at Datacenter B in primary role, while the corresponding
LV replicas will then be in secondary (passive) role at datacenters A and
C.
\end_layout
\begin_layout Standard
An advantage of multiple LV replication is that primary and secondary roles
can be
\series bold
\emph on
individually
\emph default
switched at runtime
\series default
.
For example, if you have 10 LVs in each of your servers, 6 LVs may currently
run in datacenter A in primary role, while the other 4 LVs are running
in datacenter B, while datacenter C is dimensioned for less CPU power,
and is mainly intended for additional
\begin_inset Quotes eld
\end_inset
emergency backup
\begin_inset Quotes erd
\end_inset
replicas.
For instance, such a 3-datacenter configuration may be used for load balancing
during overload peaks, or for switchover due to kernel security updates,
and much more.
\end_layout
\begin_layout Standard
Further setups are also possible.
For example, you might replicate physical disks.
However, this would be less flexible because your volumes must then uniformly
run in the
\emph on
same
\emph default
datacenter at the same time.
\end_layout
\begin_layout Standard
In addition, MARS' replicated block devices may be exported via iSCSI or
other protocols.
Filesystems residing on top of MARS may be exported via NFS or glusterfs,
etc.
For more details, please consult
\family typewriter
mars-architecture-guide.pdf
\family default
.
\end_layout
\begin_layout Section
The Transaction Logger
\begin_inset CommandInset label
LatexCommand label
name "sec:The-Transaction-Logger"
\end_inset
\end_layout
\begin_layout Standard
\noindent
\align center
\begin_inset Graphics
filename images/MARS_Data_Flow.pdf
lyxscale 60
width 100text%
\end_inset
\end_layout
\begin_layout Standard
\noindent
The basic idea of MARS is to record all changes made to your LV in a so-called
\series bold
transaction logfile
\series default
.
\emph on
Any
\emph default
write reqeuest is treated like a transaction which changes the contents
of your LV.
\end_layout
\begin_layout Standard
This is similar in concept to some database systems (c.f.
MySQL replication), but there exists no separate
\begin_inset Quotes eld
\end_inset
commit
\begin_inset Quotes erd
\end_inset
operation:
\emph on
any
\emph default
write request is acting like a commit.
\end_layout
\begin_layout Standard
The picture shows the flow of write requests.
Let's start with the primary node.
\end_layout
\begin_layout Standard
Write requests directed at the virtual block device
\family typewriter
/dev/mars/mydata
\family default
are first buffered in a
\emph on
temporary
\emph default
kernel memory buffer.
\end_layout
\begin_layout Standard
The temporary kernel memory buffer serves multiple purposes:
\end_layout
\begin_layout Itemize
It keeps track of the
\series bold
order
\series default
of write operations.
\end_layout
\begin_layout Itemize
Additionally, it keeps track of the positions in the underlying LV
\family typewriter
/dev/lv-x/mydata
\family default
.
In particular, it detects when the same block is overwritten multiple times.
\end_layout
\begin_layout Itemize
Writeback to the underlying LV may occur in a different order than submission
order.
On magnetic disk media, this may lead to a noticeable
\series bold
performance boost
\series default
, as shown in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:IO-Performance-Tuning"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Itemize
During pending write operations, any concurrent reads from the same locations
are served from the temporary memory buffer.
\end_layout
\begin_layout Standard
After the write has been buffered in the temporary memory buffer, the internal
transaction logger kernel thread creates a so-called
\emph on
log entry
\emph default
and starts an
\begin_inset Quotes eld
\end_inset
append
\begin_inset Quotes erd
\end_inset
operation on the transaction logfile.
The log entry contains vital information such as the logical block number
in the underlying LV, the length of the data, a timestamp, some header
magic in order to detect corruption, the log entry sequence number, of
course the data itself, and optional information like an MD5 checksum or
compression information.
\end_layout
\begin_layout Standard
Once the log entries
\begin_inset Foot
status open
\begin_layout Plain Layout
Notice that the order of log records present in the transaction log defines
a total order among the write requests which is
\emph on
compatible
\emph default
to the partial order of write requests issued on
\family typewriter
/dev/mars/mydata
\family default
.
\end_layout
\begin_layout Plain Layout
Also notice that despite its sequential nature, the transaction logfile
is typically
\emph on
not
\emph default
the performance bottleneck of the system.
At least on magnetic media, appending to a logfile is almost purely sequential
IO, it runs much faster than random IO.
\end_layout
\end_inset
have been written through to the
\family typewriter
/mars/
\family default
filesystem via
\family typewriter
fsync()
\family default
, the application waiting for the write operation at
\family typewriter
/dev/mars/mydata
\family default
is signalled that the write was successful
\begin_inset Foot
status open
\begin_layout Plain Layout
In order to reclaim the temporary memory buffer, its content must be written
back to the underlying disk
\family typewriter
/dev/lv-x/mydat
\family default
a somewhen.
After writeback, the temporary space is freed.
The writeback can do the following optimizations:
\end_layout
\begin_layout Enumerate
writeback may be in
\emph on
any
\emph default
order; in particular, it is
\emph on
sorted
\emph default
according to ascending sector ´numbers.
This reduces the average seek distances of magnetic disks in general.
\end_layout
\begin_layout Enumerate
when the same sector is overwritten multiple times, only the
\begin_inset Quotes eld
\end_inset
last
\begin_inset Quotes erd
\end_inset
version need to be written back, skipping some intermediate versions.
\end_layout
\end_inset
.
\end_layout
\begin_layout Standard
This usually happens
\emph on
before
\emph default
the writeback to the underlying LV
\family typewriter
/dev/lv-x/mydata
\family default
has started.
Even when you power off the system right now, the information is not lost:
it is present in the logfile, and will be reconstructed from there after
restart from power loss (Recovery phase).
This is similar to Recovery of database systems after unexpected power
loss.
\end_layout
\begin_layout Standard
In case the primary node crashes during writeback, it suffices to replay
the log entries from some point in the past until the end of the transaction
logfile.
It does no harm if you accidentally replay some log entries twice or even
more often: since the replay is in the original total order.
Thus any temporary inconsistency will be
\emph on
healed
\emph default
\begin_inset Foot
status open
\begin_layout Plain Layout
\noindent
In mathematics, the property that you can apply your logfile twice to your
data (or even as often as you want), is called
\series bold
idempotence
\series default
.
This is a very desirable property: it ensures that nothing goes wrong when
replaying
\begin_inset Quotes eld
\end_inset
too much
\begin_inset Quotes erd
\end_inset
/ starting your replay
\begin_inset Quotes eld
\end_inset
too early
\begin_inset Quotes erd
\end_inset
.
Idempotence is even more beneficial: in case anything should go wrong with
your data on your disk (e.g.
IO errors), replaying your logfile once more often may even
\series bold
heal
\series default
some defects.
\end_layout
\end_inset
by logfile application.
Good news for desperate sysadmins forced to work with old or flaky hardware!
\end_layout
\begin_layout Standard
The basic idea of asynchronous replication by MARS is rather simple: just
transfer the logfiles to your secondary nodes, and replay them onto their
LV replica (aka copy of the disk data, aka mirror).
\end_layout
\begin_layout Standard
Replay is always in the same write order as the total order defined by the
primary.
\end_layout
\begin_layout Standard
Therefore, a mirror of your data on any secondary may be outdated, but it
always corresponds to some version which was valid in the past.
This property is called
\series bold
anytime consistency
\begin_inset Foot
status open
\begin_layout Plain Layout
Your secondary nodes are always
\series bold
strictly consistent
\series default
in themselves.
Notice that this kind of consistency is a
\emph on
local
\emph default
consistency model.
At global level, MARS is
\series bold
eventually consistent
\series default
.
Strict global consistency is generally not possible over long distances.
Reasons are (1) Einstein's law (speed of light), and (2) the CAP theorem
and its sister theorems.
The front-cover pictures showing the planets Earth and Mars tries to lead
your imagination away from global consistency models, in order to prepare
you mentally for local consistency as in
\begin_inset Quotes eld
\end_inset
MARS Think
\begin_inset Formula $^{(tm)}$
\end_inset
\begin_inset Quotes erd
\end_inset
.
\end_layout
\end_inset
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
As you can see in the picture, the logfile transfer process is
\emph on
independent
\emph default
from the replay process.
Both processes can be switched on / off separately (see commands
\family typewriter
marsadm {dis,}connect
\family default
and
\family typewriter
marsadm {pause,resume}-replay
\family default
in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Operation-of-the"
\end_inset
).
This may be
\emph on
exploited
\emph default
: for example, you may replicate your logfiles as soon as possible (to protect
against catastrophic failures), but deliberately wait one hour until it
is replayed (under regular circumstances).
If your data inside your filesystem
\family typewriter
/mydata/
\family default
at the primary site is accidentally destroyed by
\family typewriter
rm -rf /mydata/
\family default
, you have an old copy at the secondary site.
This way, you can substitute
\emph on
some parts
\begin_inset Foot
status open
\begin_layout Plain Layout
Please note that MARS cannot
\emph on
fully
\emph default
substitute a backup system, because it can keep only
\emph on
physical
\emph default
copies, and does not create logical copies.
\end_layout
\end_inset
\emph default
of conventional backup functionality by MARS.
In case you need the actual version, just replay in
\begin_inset Quotes eld
\end_inset
fast-forward
\begin_inset Quotes erd
\end_inset
mode (similar to old-fashioned video tapes).
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Future versions of MARS are planned to also allow
\begin_inset Quotes eld
\end_inset
fast-backward
\begin_inset Quotes erd
\end_inset
rewinding, of course at some cost.
\end_layout
\begin_layout Section
The State of MARS
\begin_inset CommandInset label
LatexCommand label
name "sec:The-State-of"
\end_inset
\end_layout
\begin_layout Standard
In general, MARS tries to
\emph on
hide
\emph default
any network failures from you as best as it can.
After a network problem, any internal low-level socket connections are
\emph on
transparently
\emph default
tried to re-open ASAP, without need for sysadmin intervention.
In difference to DRBD, network failures will
\emph on
not
\emph default
automatically alter the state of MARS, such as switching to
\family typewriter
disconnected
\family default
after a
\family typewriter
ko_timeout
\family default
or similar.
From a high-level sysadmin viewpoint, communication may just take a very
long time to succeed.
\end_layout
\begin_layout Standard
When the behaviour of MARS is different from DRBD, it is usually intended
as a feature.
\end_layout
\begin_layout Standard
MARS is not only an
\series bold
asynchronous
\series default
system at block IO level, but also
\series bold
at control level
\series default
.
\end_layout
\begin_layout Standard
This is
\emph on
necessary
\emph default
because in a widely distributed long-distance system running on slow or
even temporarily failing networks, actions may take a long time, and there
may be many actions
\series bold
started in parallel
\series default
.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Synchronous concepts are generally not sufficient for expressing that.
Because of inherent asynchronicity and of dynamic creation / joining of
resources, it is neither possible to comprehensively depict a complex distribut
ed MARS system, nor a comprehensive standalone snippet of MARS, as a finite
state transition diagram
\begin_inset Foot
status open
\begin_layout Plain Layout
Probably it could be possible to formally model MARS as a Petri net.
However, complete Petri nets are tending to become very conplex, and to
describe lots of low-level details.
Expressing hierarchy, in a top-down fashion, is cumbersome.
We find no clue in trying to do so.
\end_layout
\end_inset
.
\end_layout
\begin_layout Chapter
HOWTO setup MARS
\begin_inset CommandInset label
LatexCommand label
name "chap:Quick-Start-Guide"
\end_inset
\end_layout
\begin_layout Standard
This chapter is for impatient but experienced sysadmins.
For more detailed information, refer to chapter
\begin_inset CommandInset ref
LatexCommand nameref
reference "chap:The-Sysadmin-Interface"
\end_inset
.
\end_layout
\begin_layout Section
Description: what you Need
\begin_inset CommandInset label
LatexCommand label
name "sec:Preparation:-What-you"
\end_inset
\end_layout
\begin_layout Standard
This section describes the hardware you will need to buy and deploy, and
which software components to install.
Step-by-step setup instructions are following in the next section (starting
with section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:MARS-Kernel-Module"
plural "false"
caps "false"
noprefix "false"
\end_inset
).
\end_layout
\begin_layout Standard
Typically, you will install MARS at many bare metal servers for replication
of many LVs
\emph on
between
\begin_inset Foot
status open
\begin_layout Plain Layout
Many other solutions, even from commercial storage vendors, will not work
reliably over distances greater than
\begin_inset Formula $\approx50$
\end_inset
km, and/or when your network is not
\emph on
extremely
\emph default
reliable, and/or when you try to push huge masses of data from high-performance
applications through a network bottleneck.
If you ever encountered suchalike problems (or try to avoid them in advance),
MARS is for you.
More information can be found in
\family typewriter
mars-architecture-guide.pdf
\family default
.
\end_layout
\end_inset
\emph default
multiple datacenters.
Do
\emph on
not
\emph default
use MARS inside of VMs (see explanation of Dijkstra's layering rules in
\family typewriter
mars-architecture-guide.pdf
\family default
).
\end_layout
\begin_layout Standard
You can use MARS both at dedicated storage servers (e.g.
for serving Windows clients over iSCSI), or at standalone Linux servers
where CPU and storage are
\emph on
not
\emph default
separated.
\end_layout
\begin_layout Standard
Here is a list of software to be installed at your servers (with distro-specific
tools like
\family typewriter
dpkg
\family default
/
\family typewriter
aptitude
\family default
/
\family typewriter
rpm
\family default
/
\family typewriter
yum
\family default
/
\family typewriter
zypper
\family default
/ etc):
\end_layout
\begin_layout Itemize
\family typewriter
ssh
\end_layout
\begin_layout Itemize
\family typewriter
ssh-agent
\family default
(such that
\family typewriter
ssh root@hostA
\family default
will work without password)
\end_layout
\begin_layout Itemize
\family typewriter
rsync
\end_layout
\begin_layout Itemize
\family typewriter
perl
\end_layout
\begin_layout Itemize
\family typewriter
lvm
\end_layout
\begin_layout Itemize
Further standard Linux tools like
\family typewriter
modprobe
\family default
, typically already present at servers.
When necessary, you typically can install them from typical OpenSource
/ Linux Distro repos.
\end_layout
\begin_layout Itemize
Only if you don't have an already pre-built MARS kernel module, and only
at your workstation, not necessarily at your server: everything you need
for compiling a customized kernel.
Optionally, the tools for building a Debian or rpm package.
Details are distro-specific.
\end_layout
\begin_layout Standard
In order to protect your server data from low-level disk failures, you should
use a
\series bold
hardware RAID controller with BBU
\series default
.
Software RAID is currently
\emph on
not
\emph default
recommended, because it generally provides worse performance due to the
lack of a hardware BBU (for some benchmark comparisons with/out BBU, see
\begin_inset Flex URL
status open
\begin_layout Plain Layout
https://github.com/schoebel/blkreplay/raw/master/doc/blkreplay.pdf
\end_layout
\end_inset
).
\end_layout
\begin_layout Standard
For many application workloads, RAID-6 provides a good compromize between
cost and performance.
Reads are very fast due to RAID-6 striping, while the slow RAID-6 writes
are partially compensated by the MARS kernel memory buffer (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:IO-Performance-Tuning"
plural "false"
caps "false"
noprefix "false"
\end_inset
).
\end_layout
\begin_layout Standard
For almost double the cost per TiB, you can speed up write operations by
RAID-10.
However, checkout RAID-6 first.
A good tool to measure your
\emph on
real
\emph default
application performance is
\family typewriter
blktrace
\family default
plus blkreplay, see
\begin_inset Flex URL
status open
\begin_layout Plain Layout
https://github.com/schoebel/blkreplay/raw/master/doc/blkreplay.pdf
\end_layout
\end_inset
.
\end_layout
\begin_layout Standard
For much higher cost per TiB, typically by about a factor of 10, you can
of course also use SSDs in place of HDDs.
While relatively small-sized database workloads are nowadays typically
on SSDs, big mass data is typically remaining on HDDs for cost reasons.
\end_layout
\begin_layout Standard
Typically, you should build more than one RAID set
\begin_inset Foot
status open
\begin_layout Plain Layout
For low-cost storage, RAID-5 is no longer regarded safe for today's typical
storage sizes, because the error rate is regarded too high.
Therefore, use RAID-6.
If you need more than 15 disks in total, create multiple RAID sets (each
having at most 15 disks, better about 12 disks) and stripe them via LVM
(or via your hardware RAID controller if it supports RAID-60).
\end_layout
\end_inset
if you have more than 12 to 15 spindles in total.
Therefore, the step-by-step HOWTO from this best-effort manual will show
you some examples with LVM striping over 2 physical volumes (PVs).
\end_layout
\begin_layout Standard
LVM is highly recommended
\begin_inset Foot
status open
\begin_layout Plain Layout
In principle, you may combine MARS with commercial storage boxes connected
over Fibrechannel or iSCSI.
At 1&1, there is not yet operational experience with such setups.
\end_layout
\end_inset
for maximum flexibility.
When used in static space allocation mode (as opposed to thin provisioning
mode), LVM involves no measurable overhead (within the measurement tolerances
of
\family typewriter
blkreplay
\family default
).
Although LVM thin provisioning could potentially save some cost, it may
lead to massive performance degradation as observed with certain types
of application behaviour.
In order to stay at the safe side of operations, you should dimension your
RAID storage size accordingly.
\end_layout
\begin_layout Standard
MARS' tolerance of networking problems comes with some cost.
You will need some extra space for the transaction logfiles of MARS, residing
at the
\family typewriter
/mars/
\family default
filesystem.
\end_layout
\begin_layout Standard
The exact space requirements for
\family typewriter
/mars/
\family default
depend on the
\emph on
average write rate
\emph default
of your application, not on the size of your data.
An example: in 1&1 Shared Hosting Linux (ShaHoLin), we found that only
few applications are writing more than 1 TB per day during ordinary
\begin_inset Foot
status open
\begin_layout Plain Layout
Exception: restores from backup.
\end_layout
\end_inset
operations.
Most are writing even less than 100 GB per day, because the observed average
filesystem data change rate is only about 1% per day
\begin_inset Foot
status open
\begin_layout Plain Layout
Within some limits, the distribution is an exponential one, according to
Zipf's law.
\end_layout
\end_inset
.
Of course, there exist other applications like backup where the write rate
is much higher.
Please try to determine your actual write rates from system tools like
\family typewriter
sar
\family default
.
Usually, you want to dimension
\family typewriter
/mars/
\family default
such that you can survive a network loss lasting 3 days / about one weekend.
\end_layout
\begin_layout Standard
This can be achieved rather easily, in one of the following ways:
\end_layout
\begin_layout Enumerate
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
sloppy
\end_layout
\end_inset
Create an LV for
\family typewriter
/mars
\family default
on top of your application VG, typically named
\family typewriter
/dev/vg/mars
\family default
or similar (see step-by-step instructions in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Setup-LVM"
plural "false"
caps "false"
noprefix "false"
\end_inset
).
This is the easiest solution if you are anyway using LVM on top of a hardware
BBU.
This is also most flexible: it can be
\series bold
resized during operation
\series default
.
Therefore, you may start with a size of around 500 GiB, and later be extended
with increasing demands.
\begin_inset Newline newline
\end_inset
This variant is also recommended if you have very expensive SSD storage.
Depending on write rates, you could for example start with 100 GiB, and
extend dynamically as far as needed, for example by some alerting scripts,
or even using some cron job.
\end_layout
\begin_layout Enumerate
Alternatively, you may use one
\series bold
dedicated HDD
\series default
with a capacity of 4 TB or more.
Typically, this will provide you with plenty of headroom even for bigger
networking incidents.
Performace of a single HDD over a BBU is typically good enough for
\family typewriter
/mars
\family default
because the transaction logs are involving mostly
\emph on
sequential
\emph default
reads and writes in larger chunks.
However, there exist some workloads where striping could be necessary for
maximizing sequential throughput.
\end_layout
\begin_layout Enumerate
Alternatively, if you are concerned about both performance and reliability,
use two dedicated spindles over hardware RAID-1 with BBU.
For maximum flexibility, put another VG on top of the dediactedRAID-1 set.
For example, if
\family typewriter
/dev/sdc
\family default
is your RAID-1 set, create a PV and a VG called
\family typewriter
mars
\family default
on top of it.
This is most flexible, since you might later migrate your
\family typewriter
/mars
\family default
even during runtime, for example when replacing small disks with bigger
ones, or when replacing HDDs with SSDs during runtime.
\end_layout
\begin_layout Enumerate
For extemely high performance, separate SSD sets for the user data VG and
for
\family typewriter
/mars
\family default
might be beneficial.
However, check whether it really pays off.
Notice that a hardware BBU is nothing but a RAM cache, which is faster
than any SSD, and there
\emph on
exist
\emph default
some workloads where sequntial IO to HDDs is faster than to SSDs.
Sometimes, there are hidden performance bottlenecks, such as SAS busses,
or some old-generation RAID controllers.
\end_layout
\begin_layout Standard
Dedicated HDDs for
\family typewriter
/mars/
\family default
have another advantage: their mechanical head movement is completely independen
t from your data head movements.
For best performance, attach the corresponding disks to your hardware RAID
controller with BBU, building a separate RAID set (even if it consists
only of a single disk – notice that the
\series bold
hardware BBU
\series default
is the crucial point).
\end_layout
\begin_layout Standard
If you are concerned about reliability, use two disks configured as a relatively
small RAID-1 set.
For extremely high performance demands, you may consider (and check) RAID-10
and/or SSD storage.
However, SSDs are reported as less reliable.
While failures of HDDs are typically detectable in advance by upcoming
SMART media error counts, SSDs are typically failing suddenly and unexpectedly
\begin_inset Foot
status open
\begin_layout Plain Layout
Notice: the component failure rate is not the crucial point.
Even if some types of SSDs have a better MTBF than typical HDDs: when you
can detect failure in advance, you can prevent
\end_layout
\end_inset
.
And their failure is not statistically independent in general.
Building a RAID-1 on top of SSDs bears an increased risk that
\emph on
both
\emph default
SSDs are unexpectedly failing both at the same time
\begin_inset Foot
status open
\begin_layout Plain Layout
Preliminary replacement of SSDs after a certain amount of write may help.
But it will increase cost.
\end_layout
\end_inset
.
\end_layout
\begin_layout Standard
If you want to build extremely cheap low-cost storage, for example for low-perfo
rmance backup systems or similar use cases: cheap but high-capacity nearline-SAS
\begin_inset Foot
status open
\begin_layout Plain Layout
Even cheaper SATA disks are not recommended for professional datacenter
usage.
Typically, they are not rated for 24/7/365 usage.
Even for some use cases like backup, experiences are worse.
\end_layout
\end_inset
disks may be sufficient, because the transaction logfiles are highly sequential
in their access pattern.
However, check with
\family typewriter
blkreplay
\family default
that performance is
\emph on
really
\emph default
sufficient, when compared with
\begin_inset Quotes eld
\end_inset
better
\begin_inset Quotes erd
\end_inset
disks.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Do not import the block device for
\family typewriter
/mars/
\family default
over iSCSI.
This would sacrifice both reliability and performance.
MARS is constructed for exploiting a hardware BBU cache with a typical
IO parallelism degree of 1000 parallel IO requests, over fast local DMA.
See also section
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:IO-Performance-Tuning"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Consequence: never run MARS inside of a VM (other than for functional component
testing).
See also Dijkstra's layering rules in
\family typewriter
mars-architecture-guide.pdf
\family default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Notice that the filesystem
\family typewriter
/mars/
\family default
has nothing to do with an ordinary filesystem.
It is completely reserved for MARS internal purposes, namely as a
\series bold
storage container
\series default
for MARS' persistent data.
It does not obey any userspace rules like FHS (filesystem hierarchy standard),
and it should not be accessed by any userspace tool execpt the official
\family typewriter
marsadm
\family default
tool.
Its internal data format should be a regarded as a
\series bold
blackbox
\series default
by you.
The internal data format may change in future, or the complete
\family typewriter
/mars/
\family default
filesystem may be even replaced by a totally different container format,
while the official
\family typewriter
marsadm
\family default
interface and its primitive macros are supposed to remain stable.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
That said, you might look into its contents
\emph on
by hand
\emph default
for curiosity or for
\emph on
debugging purposes
\emph default
, and only as root.
But don't program any tools / monitoring scripts / etc bypassing the official
\family typewriter
marsadm
\family default
tool.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Like DRBD, the current version of MARS has
\series bold
no security
\series default
built in.
MARS assumes that it is running in a
\series bold
trusted network
\series default
.
Anyone who can connect to the MARS ports (default 7777 to 7779) can potentially
breach in and become root.
Therefore, you
\series bold
must
\series default
protect your network by appropriate means, such as firewalling and/or encrypted
VPN.
\end_layout
\begin_layout Standard
Currently, MARS provides no shared secret like DRBD, because a simple shared
secret is way too weak to provide any real security (potentially misleading
people about the real level of security).
Future versions of MARS might provide some 2-factor authorization, and
encryption via dynamic session keys.
Until that is implemented
\begin_inset Foot
status open
\begin_layout Plain Layout
There is fundamental argument: network traffic between datacenters belongs
to a higher level than a single component like MARS.
Thus its security requirements must be solved at that higher level, but
not at the lower level of MARS.
\end_layout
\end_inset
, use a secured VPN instead.
And don't forget to
\emph on
audit
\emph default
it for security holes.
\end_layout
\begin_layout Section
MARS Kernel Module
\begin_inset CommandInset label
LatexCommand label
name "sec:MARS-Kernel-Module"
\end_inset
\end_layout
\begin_layout Standard
Always use the newest stable version (master branch) from
\begin_inset Flex URL
status open
\begin_layout Plain Layout
https://github.com/schoebel/mars
\end_layout
\end_inset
.
Please consult the file
\family typewriter
ChangeLog
\family default
there.
\end_layout
\begin_layout Standard
The MARS kernel module should be available or can be built via one of the
following methods:
\end_layout
\begin_layout Itemize
As an external Debian or rpm kernel module, as provided by a package contributor
(or hopefully by standard distros in the future).
\end_layout
\begin_layout Itemize
Via
\family typewriter
dkms
\family default
.
Although there is an example file
\family typewriter
contrib/mars-dkms.dkms
\family default
in the official MARS repo at
\begin_inset Flex URL
status open
\begin_layout Plain Layout
https://github.com/schoebel/mars
\end_layout
\end_inset
which could serve as a base for Linux distro vendors, it would suffer from
\emph on
serious performance degradation
\emph default
if it would be compiled
\emph on
without
\emph default
the MARS pre-patch.
Don't use such a version for any serious application.
With pre-patch,
\family typewriter
dkms
\family default
would be no problem.
You can check whether some already built
\family typewriter
mars.ko
\family default
kernel module has been compiled with pre-patch or not:
\begin_inset Newline newline
\end_inset
\family typewriter
modinfo mars
\family default
\begin_inset Newline newline
\end_inset
which displays the version for the currently active kernel, or any other
version via
\begin_inset Newline newline
\end_inset
\family typewriter
modinfo /path/to/mars.ko
\family default
\begin_inset Newline newline
\end_inset
This should display something like
\begin_inset Newline newline
\end_inset
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
io_driver: aio
\end_layout
\begin_layout Plain Layout
prepatch: has_prepatch
\end_layout
\end_inset
Do not use a kernel module for production if the io_driver either reports
\family typewriter
sio
\family default
in place of
\family typewriter
aio
\family default
, or if no pre-patch is detected.
\end_layout
\begin_layout Itemize
As a
\emph on
separate
\emph default
kernel module, only recommended for
\emph on
experienced
\emph default
\begin_inset Foot
status open
\begin_layout Plain Layout
You should be familiar with the problems arising from orthogonal combination
of different kernel versions with different MARS module versions and with
different
\family typewriter
marsadm
\family default
userspace tool versions at the package management level.
Hint:
\family typewriter
modinfo
\family default
is your friend.
\end_layout
\end_inset
sysadmins: see file
\family typewriter
Makefile.dist
\family default
(tested with some older versions of Debian; may need some extra work with
other distros).
\end_layout
\begin_layout Itemize
Following are recommended build instructions for senior sysadmins or developers,
inplace in the kernel source tree.
Look into the subdirectory
\family typewriter
pre-patches/
\family default
of the MARS repo for the right version of the pre-patches.
\end_layout
\begin_layout Standard
Here are example instructions for LTS kernel 4.4, building everything from
scratch at your Linux workstation, using
\family typewriter
git
\family default
.
Actions marked
\begin_inset Quotes eld
\end_inset
for safety
\begin_inset Quotes erd
\end_inset
are not generally necessary, but may be appropriate for recovery from previous
build failures.
\end_layout
\begin_layout Enumerate
\family typewriter
git clone git://git.kernel.org/pub/scm/linux/kernel/git/stable/linux-stable.git
linux-stable.git
\end_layout
\begin_layout Enumerate
\family typewriter
cd linux-stable.git
\end_layout
\begin_layout Enumerate
\family typewriter
git checkout linux-4.4.y
\end_layout
\begin_layout Enumerate
For safety:
\begin_inset Newline newline
\end_inset
\family typewriter
git pull
\end_layout
\begin_layout Enumerate
Get an appropriate old
\family typewriter
.config
\family default
file.
For example at some OpenSuSE distro:
\begin_inset Newline newline
\end_inset
\family typewriter
cp /boot/config-4.12.14-lp151.28.13-default .config
\family default
\begin_inset Newline newline
\end_inset
Notice: there are several other methods which are outside the scope of this
manual.
When in doubt, consult somebody with kernel build experience.
\end_layout
\begin_layout Enumerate
\family typewriter
make oldconfig || make olddefconfig
\end_layout
\begin_layout Enumerate
\family typewriter
cd block/
\end_layout
\begin_layout Enumerate
\family typewriter
git clone --recurse-submodules https://github.com/schoebel/mars
\end_layout
\begin_layout Enumerate
For safety, ensure you always have the newest MARS version:
\begin_inset Newline newline
\end_inset
\family typewriter
cd mars
\family default
/
\begin_inset Newline newline
\end_inset
\family typewriter
git checkout master
\begin_inset Newline newline
\end_inset
git pull
\begin_inset Newline newline
\end_inset
cd ..
\end_layout
\begin_layout Enumerate
Go back to the root of Linux git:
\begin_inset Newline newline
\end_inset
\family typewriter
cd ..
\end_layout
\begin_layout Enumerate
To avoid mixup of later actions with upstream patches:
\family typewriter
\begin_inset Newline newline
\end_inset
git branch -D mars-patches-for-4.4 || echo IGNORE THIS ERROR
\begin_inset Newline newline
\end_inset
git checkout -b mars-patches-for-4.4
\end_layout
\begin_layout Enumerate
Apply
\emph on
all(!)
\emph default
the patches from
\family typewriter
block/mars/pre-patches/vanilla-$version
\family default
.
For example with kernel 4.4:
\end_layout
\begin_deeper
\begin_layout Enumerate
For safety:
\family typewriter
\begin_inset Newline newline
\end_inset
git reset --hard; git clean -f
\end_layout
\begin_layout Enumerate
\family typewriter
git am block/mars/pre-patches/vanilla-4.4/*.patch
\end_layout
\end_deeper
\begin_layout Enumerate
\family typewriter
make menuconfig
\family default
(or another variant like
\family typewriter
make xconfig
\family default
)
\end_layout
\begin_deeper
\begin_layout Enumerate
Go to
\begin_inset Quotes eld
\end_inset
Enable the block layer
\begin_inset Quotes erd
\end_inset
\end_layout
\begin_layout Enumerate
Select MARS as a module (by moving the cursor and then typing
\family typewriter
m
\family default
)
\end_layout
\begin_layout Enumerate
A lot of sub-options for MARS will pop up.
Leave them at their default.
\end_layout
\begin_layout Enumerate
Save the Kconfig options to
\family typewriter
.config
\family default
and exit.
\end_layout
\end_deeper
\begin_layout Enumerate
Build the kernel, typically something like one of:
\end_layout
\begin_deeper
\begin_layout Enumerate
For Debian / Ubuntu / etc:
\begin_inset Newline newline
\end_inset
\family typewriter
make deb-pkg
\end_layout
\begin_layout Enumerate
For Redhat / CentOS / SuSE / etc:
\begin_inset Newline newline
\end_inset
\family typewriter
make rpm-pkg
\end_layout
\begin_layout Enumerate
Classical with local install:
\begin_inset Newline newline
\end_inset
\family typewriter
make -j 12 && make install modules_install
\end_layout
\begin_layout Enumerate
...
see some more variants and make targets:
\begin_inset Newline newline
\end_inset
\family typewriter
make help
\end_layout
\end_deeper
\begin_layout Enumerate
Copy and install the new Debian or rpm package to the destination servers,
activate them (system-dependent, like
\family typewriter
update-grub
\family default
or similar), and reboot your servers with the modified kernel.
\end_layout
\begin_layout Enumerate
Check that the MARS kernel module is installed (but do not yet load it):
\begin_inset Newline newline
\end_inset
\family typewriter
modinfo mars
\end_layout
\begin_layout Standard
Further / more accurate / latest instructions may be found in
\family typewriter
README
\family default
and in
\family typewriter
INSTALL
\family default
.
You must not only install the kernel and the
\family typewriter
mars.ko
\family default
kernel module to all of your bare metal cluster nodes, but also the
\family typewriter
marsadm
\family default
userspace tool.
\end_layout
\begin_layout Standard
Installing marsadm by hand is rather simple: just copy it to
\family typewriter
/usr/bin/
\family default
or
\family typewriter
/usr/local/bin
\family default
.
For example:
\end_layout
\begin_layout Itemize
\family typewriter
cp -a block/mars/userspace/marsadm /usr/local/bin/
\end_layout
\begin_layout Itemize
Alternatively, create a Debian or rpm package (named
\family typewriter
mars-utils
\family default
or
\family typewriter
mars-tools
\family default
or similar).
Since
\family typewriter
marsadm
\family default
is a basic Perl script which requires no other Perl modules, the only package
dependency is from the Perl interpreter.
Since Perl is typically already installed on virtually every Linux server,
leaving out this dependency won't be a show stopper.
\end_layout
\begin_layout Standard
With newer versions of MARS, a prepatch for vanilla kernels 3.2 through 4.9
(or even later) is no longer needed, at least in theory.
However,
\series bold
IO performance
\series default
is currently
\emph on
much
\emph default
worse when the pre-patch is not applied.
This will be hopefully addressed in a future release.
At the moment, don't use pre-patch-less MARS on any production system.
It has extremely limited IO parallelism because some performance-critical
kernel interfaces are not accessible without the pre-patch.
The command
\family typewriter
modinfo mars
\family default
will report whether the pre-patch is present at your kernel, or not (see
description of
\family typewriter
dkms
\family default
above).
\end_layout
\begin_layout Standard
Pre-patches for various kernel version can be found in the
\family typewriter
pre-patches/
\family default
subdirectory of the MARS source tree.
Following are the types of pre-patches:
\end_layout
\begin_layout Itemize
\family typewriter
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
sloppy
\end_layout
\end_inset
\begin_inset Flex URL
status open
\begin_layout Plain Layout
0001-mars-minimum-pre-patch-for-mars.patch
\end_layout
\end_inset
\family default
or similar.
Please prefer this one (when present for your kernel version) in front
of any old / deprecated
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
0001-mars-generic-pre-patch-for-mars.patch
\end_layout
\end_inset
\family default
or similar.
The latter should not be used anymore, except for testing or as an emergency
fallback.
\end_layout
\begin_layout Itemize
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
0002-mars-SPECIAL-for-in-tree-build.patch
\end_layout
\end_inset
\family default
or similar.
This is
\emph on
only
\emph default
needed when building the MARS kernel module together with all other kernel
modules in a single
\family typewriter
make
\family default
pass.
For separate external module builds (e.g.
with
\family typewriter
dkms
\family default
, or with
\family typewriter
rpmbuild
\family default
etc), this patch
\emph on
must not
\emph default
be applied (but the pre-patch
\emph on
strongly should
\emph default
if somehow possible).
When using this patch, please apply the aforementioned pre-patch also,
because your kernel will be patched anyway.
\end_layout
\begin_layout Itemize
For certain kernels like 4.14, some additional fixes may be necessary.
These are in the respective
\family typewriter
vanilla-*/
\family default
subdirectory, indicated by filename
\family typewriter
*fix*
\family default
.
Sometimes, these are
\emph on
absolutely
\emph default
needed.
For example, an endless loop in unfixed upstream vanilla kernels >= 4.10
may occur upon network timeouts.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Starting from version
\family typewriter
mars0.1stable56
\family default
or
\family typewriter
mars0.1abeta8
\family default
,
\series bold
submodules
\series default
have been added to the github repo of MARS.
If you have an old git checkout, please say
\family typewriter
git pull --recurse-submodules=yes
\family default
or similar.
Otherwise you may be missing an important future part of the MARS release,
without notice (depending on your local
\family typewriter
git
\family default
version and its local configuration).
\end_layout
\begin_layout Section
Setup Primary and Secondary Cluster Nodes
\begin_inset CommandInset label
LatexCommand label
name "sec:Setup-Primary-and"
\end_inset
\end_layout
\begin_layout Standard
If you already have some production data on your bare metal servers via
LVM, you may skip some of the following subsections.
\end_layout
\begin_layout Standard
In case your data is already replicated with DRBD, you may migrate to MARS
(or even back from MARS to DRBD) if you use
\emph on
external
\begin_inset Foot
status open
\begin_layout Plain Layout
\emph on
Internal
\emph default
DRBD metadata should also work as long as the filesystem inside your block
device / disk already exists and is not re-created.
The latter would destroy the DRBD metadata, but even that will not hurt
you really: you can always switch back to DRBD using
\emph on
external
\emph default
metadata, as long as you have some small spare space somewhere.
\end_layout
\end_inset
\emph default
DRBD metadata (which is not touched by MARS).
Internal DRBD metadata is reported to also work, because it resides at
the end of the block device.
However, you will waste some small amount of storage.
\end_layout
\begin_layout Standard
Migrating back to DRBD is also possible, provided you re-initialize the
DRBD meta-data again.
\end_layout
\begin_layout Standard
For the following instructions to work, you must be
\family typewriter
root
\family default
on your servers.
\end_layout
\begin_layout Subsection
Setup Hardware
\begin_inset CommandInset label
LatexCommand label
name "subsec:Setup-Hardware"
\end_inset
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Do not use MARS inside of VMs.
Only use at bare metal!
\end_layout
\begin_layout Standard
When using hardware RAID controllers with hardware BBU (as is highly recommended
), you will need to build your RAID sets with the corresponding tools.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Don't set your hardware BBU cache to
\begin_inset Quotes eld
\end_inset
writethrough
\begin_inset Quotes erd
\end_inset
mode.
This may lead to tremendous performance degradation.
Use the default
\begin_inset Quotes eld
\end_inset
writeback
\begin_inset Quotes erd
\end_inset
strategy instead.
It should be operationally safe, because in case of power loss the BBU
cache content will be preserved thanks to the battery, and/or thanks to
goldcaps for saving the cache content into some flash chips.
\end_layout
\begin_layout Standard
In the following sections, we assume that two RAID sets are already built,
and are accessible as
\family typewriter
/dev/sdb
\family default
and
\family typewriter
/dev/sdc
\family default
.
\end_layout
\begin_layout Subsection
Setup the Network
\begin_inset CommandInset label
LatexCommand label
name "subsec:Setup-the-Network"
\end_inset
\end_layout
\begin_layout Standard
Here are only brief recommendations.
Network setup is outside the scope of this manual.
Recommended are the following basics:
\end_layout
\begin_layout Itemize
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Avoid layer 2 coupling
\emph on
between
\emph default
datacenters.
MARS requires only TCP/IP (typically over IPv4 default ports 7776\SpecialChar ldots
7779)
for replication traffic, so layer 4 coupling (aka routing) is sufficient.
Of course, the lower layers are always present inside the
\emph on
same
\emph default
datacenter, so just avoid
\emph on
unnecessary
\emph default
lower-layer coupling
\emph on
between
\emph default
datacenters.
Any problems caused by the network and its setup are up to your own.
\end_layout
\begin_layout Itemize
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
As explained in
\begin_inset Flex URL
status open
\begin_layout Plain Layout
architecture-guide-geo-redundancy.pdf
\end_layout
\end_inset
, dedicated replication networks are
\emph on
recommended
\emph default
for
\emph on
long-distance
\emph default
replication of hundreds or thousands of servers.
\end_layout
\begin_layout Itemize
Best practice: ensure that
\emph on
each
\emph default
of your cluster hosts can
\family typewriter
ping
\family default
to
\emph on
each
\emph default
other (which means
\begin_inset Formula $O(k^{2})$
\end_inset
potential network connections), via their
\emph on
pure hostname.
\begin_inset Newline newline
\end_inset
\emph default
Example on hostA:
\family typewriter
ping hostB
\end_layout
\begin_layout Itemize
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
If you have only 1 server IP over 1 physical ethernet interface, classical
datacenter-internal DNS (as typically used for sysadmin
\family typewriter
ssh
\family default
access etc) is sufficient.
If you have a separate replication network, e.g.
a separate physical ethernet interface
\family typewriter
eth1
\family default
in addition to classical
\family typewriter
eth0
\family default
, you
\emph on
might
\emph default
omit another DNS entry
\emph on
theoretically
\emph default
.
Although several
\family typewriter
marsadm
\family default
commands are supporting separate
\family typewriter
$host_ip
\family default
parameters for circumvention of DNS, working directly on IP addresses is
\emph on
not
\emph default
a best practice.
Out of many alternatives, try to
\emph on
avoid
\emph default
separate DNS names for the
\family typewriter
eth1
\family default
-specific master IP, but
\emph on
consider
\emph default
to use
\emph on
local routing
\emph default
for the MARS ports 7776 to 7779 over
\family typewriter
eth1
\family default
, while other ports may remain on
\family typewriter
eth0
\family default
.
Such a port-specific routing setup will make you
\emph on
independent
\emph default
from changes in the network or hardware setup, and it will make the DNS
less complex.
Your scripting will also benefit from simplicity.
On the other hand, beware of (internal or external) routing problems.
However, operations of professional datacenters needs to deal with suchalike
playgrounds anyway.
This MARS-specific guide cannot dive into details.
\end_layout
\begin_layout Itemize
Firewalling is also OT = Off Topic here.
Recommendation: KISS = Keep It Simple and Stupid.
\end_layout
\begin_layout Itemize
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Avoid FQDNs for any testing, and do not encode domain names into any scripting.
See also section
\begin_inset CommandInset ref
LatexCommand vref
reference "sec:Setup-OS"
plural "false"
caps "false"
noprefix "false"
\end_inset
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:Setup-OS"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Section
Setup / Install OS
\begin_inset CommandInset label
LatexCommand label
name "sec:Setup-OS"
\end_inset
\end_layout
\begin_layout Standard
Installing a Linux distribution is outside the scope of this manual.
There are dozens of methods, each of them working differently in detail.
Here are only some rough hints for avoidance of problems with MARS:
\end_layout
\begin_layout Itemize
Hostnames need to be entered into typical installers, e.g.
as used by major Linux distros.
In case you have selected a bad name, you can typically change it, e.g.
via your favourite tool like
\family typewriter
yast
\family default
or
\family typewriter
zypper
\family default
or
\family typewriter
yum
\family default
or the equivalent Debian / Ubuntu tools, and os on, or manally like
\family typewriter
vi /etc/hostname
\family default
followed by reboot, or similar.
However, do this
\series bold
only
\emph on
before
\emph default
MARS is configured
\series default
.
Here are
\series bold
pitfalls you need to know
\series default
:
\end_layout
\begin_deeper
\begin_layout Enumerate
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
As is best practice since decades: only use
\emph on
plain
\emph default
hostnames,
\emph on
separated from
\emph default
domain names.
This means: the shell command
\family typewriter
hostname
\family default
\series bold
\series default
(and siblings like
\family typewriter
uname -n
\family default
)
\series bold
must
\series default
deliver exactly 1 word, without any dot.
Only use
\emph on
this
\emph default
name in later marsadm commands.
\end_layout
\begin_layout Enumerate
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Of course, you
\emph on
may
\emph default
also set a
\series bold
domain name
\series default
as is typically reported by the shell command
\family typewriter
domainname
\family default
.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Do not enter any domain name into the
\family typewriter
hostname
\family default
field of several major Linux distros.
Typically, the entered domainname will then become
\emph on
part of
\emph default
the hostname, which will not only ENDAGER YOUR DATA, but is also a well-known
fault in the Linux and UNIX ecosystems since decades.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Always enter any domainname
\emph on
separately
\emph default
, typically into a different field, or via a different shell command, or
similarly.
If this is not possible during installation, do it later, and
\emph on
do not forget it
\emph default
.
Ensure that the shell command
\family typewriter
hostname
\family default
(or any other host-based command) will never report
\emph on
any part
\emph default
of any / the domainname!
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Why? because there exist OS setups where a host can be member of
\emph on
multiple domains
\emph default
, all in parallel.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Historically, there were
\emph on
several types of domains
\emph default
, e.g.
from YP ~ NIS driven Sun setups.
Some alternate domain setups are used today, e.g.
by Microsoft, or by non-DNS driven network protocols, by CIFS, or by some
printer domains, and so on.
\end_layout
\begin_layout Enumerate
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\emph on
Never
\emph default
use domain names in later
\family typewriter
marsadm
\family default
commands! This will pay off, because you typically can change the domainname(s)
later, e.g.
when your machine is expedited to a different location (like moves of whole
datacenters), or you may configure
\emph on
multiple
\emph default
domainnames under certain circumstances.
Only the
\emph on
hostname
\emph default
has to be treated as a
\emph on
unique
\emph default
\series bold
immutable ID of your machine
\series default
.
Other hardware or software configurations like MAC addresses or IP addresses
or DNS zones etc will be typically reconfigurable (when done properly).
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Q: why is the
\family typewriter
hostname
\family default
used as a dot-less machine ID, although there exist a
\emph on
multitude
\emph default
of UUIDs at hardware level?
\begin_inset Newline newline
\end_inset
A: because defective hardware is actually repaired in big datacenters, e.g.
new mainboards, new CPUs, or even (partially)
\series bold
preconfigured spare machines
\series default
where
\emph on
nothing
\emph default
has survived from the old hardware.
MARS supports a
\series bold
variety of repair strategies
\series default
by placing MARS' machine ID into the
\emph on
traditional
\emph default
\family typewriter
hostname
\family default
, independently from any number of domain or DNS names etc, and their contradict
ory shortcomings.
This is a
\emph on
feature
\emph default
, not a bug, and you
\emph on
agreed
\emph default
to this built-in feature of MARS by
\emph on
usage
\emph default
, see the GPL and its license terms and conditions like FITNESS FOR A PARTICULAR
PURPOSE.
\end_layout
\begin_layout Enumerate
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Best practice: start your immutable hostname with a lowercase letter from
\family typewriter
a
\family default
to
\family typewriter
z
\family default
, and avoid uppercase letters completely.
Avoid non-English letters from other languages.
Avoid utf-8 etc.
You may include some numbers, and the
\family typewriter
marsadm
\family default
tool will later automatically sort these parts numerically, even when the
number of digits is varying.
Do not use the underscore symbol
\family typewriter
_
\family default
.
When separators are necessary, simply replace it with an
\emph on
infix
\emph default
dash.
\end_layout
\begin_layout Enumerate
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint: use
\emph on
short
\emph default
but
\emph on
recognizable
\emph default
hostnames according to the Unix Philosophy.
You will likely type these names very often in the following years! In
a huge company, prefer a
\emph on
systematic
\emph default
naming + numbering scheme which is easyly usable by a bigger sysadmin team.
\end_layout
\begin_layout Enumerate
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint: for long-distance replication, you should encode the
\emph on
datacenter name
\emph default
resp the
\emph on
datacenter region
\emph default
(or similar) with 2 or 3 lowercase letters.
This makes it
\series bold
less risky
\series default
for humans during midnight incidents to get caught by
\series bold
typos
\series default
!
\begin_inset Newline newline
\end_inset
Example: pair the hostname
\family typewriter
cpu-wc1234
\family default
with
\family typewriter
cpu-me1234
\family default
where cpu denotes the machine class,
\family typewriter
wc
\family default
means the
\begin_inset Quotes eld
\end_inset
west coast
\begin_inset Quotes erd
\end_inset
datacenter while
\family typewriter
me
\family default
means the
\begin_inset Quotes eld
\end_inset
middle east
\begin_inset Quotes erd
\end_inset
datacenter, and 1234 is the
\emph on
cluster
\emph default
number, not a sequential machine number.
Thus you don't need to lookup partner machine names or numbers from some
database, even when you just woke up from your sleep at midnight.
\end_layout
\begin_layout Enumerate
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Do not use silly
\begin_inset Foot
status open
\begin_layout Plain Layout
As a protection against sillyness, the list of silly basic names in
\family typewriter
marsadm
\family default
may be extended in future.
\end_layout
\end_inset
hostnames like
\family typewriter
none
\family default
/
\family typewriter
all
\family default
/
\family typewriter
any
\family default
/
\family typewriter
undefined
\family default
/
\family typewriter
local
\family default
/
\family typewriter
localhost
\family default
which are reserved specifiers for
\family typewriter
marsadm
\family default
.
When unsure, consult
\family typewriter
marsadm --help
\family default
.
\end_layout
\begin_layout Enumerate
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
NEVER EVER modify the hostname
\emph on
after
\emph default
and/or
\emph on
during
\emph default
MARS is already installed, or is already running!
\series bold
Any (human) error is your fault!
\begin_inset Newline newline
\end_inset
See also the GPL: NO WARRANTY
\begin_inset Newline newline
\end_inset
11.
BECAUSE THE PROGRAM IS LICENSED FREE OF CHARGE, THERE IS NO WARRANTY FOR
THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW.
EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER
PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER
EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH
YOU.
SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY
SERVICING, REPAIR OR CORRECTION.
\end_layout
\begin_layout Enumerate
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
You are FULLY RESPONSIBLE if you do any of the following.
There is NO WARRANTY according to the GPL.
If you
\emph on
really
\emph default
need to change the hostname, first stop all of your applications, then
decommission MARS
\emph on
fully
\emph default
via
\family typewriter
marsadm leave-resource
\family default
and
\family typewriter
marsadm leave-cluster
\family default
commands (see later descriptions), and unload the MARS kernel module via
\family typewriter
rmmod mars
\family default
.
Afterwards, you MUST re-create the
\family typewriter
/mars
\family default
filesystem for safety, typically via
\family typewriter
mkfs.ext4
\family default
.
Be
\series bold
100% sure
\series default
that all of this has
\emph on
fully succeeded
\emph default
.
After decommisioning and deconfiguration of the stack parts
\emph on
above
\emph default
of
\family typewriter
/dev/lv/mydata
\family default
(see the following sections), you can
\emph on
try
\emph default
to change the hostname.
CHECK YOUR WHOLE SETUP, and finally you are
\emph on
fully responsible
\emph default
for re-configuration of the formerly deconfigured parts under the new hostname,
as described in the following sections.
\end_layout
\begin_layout Enumerate
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint: by not decommissioning your disks
\family typewriter
/dev/lv/mydata
\family default
, you may keep your valuable data.
However, you are also fully responsible for any error in device naming,
device location, device content, etc.
\end_layout
\end_deeper
\begin_layout Subsection
Setup LVM
\begin_inset CommandInset label
LatexCommand label
name "subsec:Setup-LVM"
\end_inset
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Execute the following instructions only once after bare metal hardware
deployment, or if you want to
\emph on
fully
\emph default
re-install your server.
Otherwise, you may delete existing data.
\end_layout
\begin_layout Enumerate
First step is create the LVM meta-information on the RAID sets
\family typewriter
/dev/sdc
\family default
and
\family typewriter
/dev/sdc
\family default
:
\begin_inset Newline newline
\end_inset
\family typewriter
pvcreate /dev/sdb
\family default
\begin_inset Newline newline
\end_inset
\family typewriter
pvcreate /dev/sdc
\end_layout
\begin_layout Enumerate
Check your physical volumes:
\begin_inset Newline newline
\end_inset
\family typewriter
pvs
\end_layout
\begin_layout Enumerate
Create a volume group:
\begin_inset Newline newline
\end_inset
\family typewriter
vgcreate vg /dev/sdb /dev/sdc
\end_layout
\begin_layout Enumerate
Check your volume group:
\begin_inset Newline newline
\end_inset
\family typewriter
vgs
\end_layout
\begin_layout Enumerate
Create a LV for /mars:
\begin_inset Newline newline
\end_inset
\family typewriter
lvcreate -i 2 -L 100G -n mars lv
\end_layout
\begin_layout Enumerate
Check your list of LVs:
\begin_inset Newline newline
\end_inset
\family typewriter
lvs
\end_layout
\begin_layout Subsection
Setup Cluster Nodes
\begin_inset CommandInset label
LatexCommand label
name "subsec:Setup-your-Cluster"
\end_inset
\end_layout
\begin_layout Standard
For your cluster, you need at least two bare metal nodes.
In the following, they will be called hostA and hostB.
In the beginning, hostA will have the
\family typewriter
primary
\family default
role, while hostB will be your initial
\family typewriter
secondary
\family default
.
The roles may change later.
\end_layout
\begin_layout Enumerate
On each of hostA and hostB, create the
\family typewriter
/mars/
\family default
mountpoint:
\begin_inset Newline newline
\end_inset
\family typewriter
mkdir /mars
\end_layout
\begin_layout Enumerate
On each host, create an
\family typewriter
ext4
\family default
filesystem on your separate disk / RAID set via
\family typewriter
mkfs.ext4
\begin_inset Foot
status open
\begin_layout Plain Layout
Don't use
\family typewriter
xfs
\family default
for
\family typewriter
/mars
\family default
.
Its late allocation strategy may lead to deadlocks and other problems,
at least with some elder kernel versions.
\end_layout
\end_inset
\family default
\begin_inset Newline newline
\end_inset
\family typewriter
mkfs.ext4 /dev/vg/mars
\end_layout
\begin_layout Enumerate
On each host, mount that filesystem to
\family typewriter
/mars/
\family default
.
It is advisable to add an entry to
\family typewriter
/etc/fstab
\family default
., or to create a systemd unit
\family typewriter
mars.mount
\family default
.
Here we just mount it by hand:
\begin_inset Newline newline
\end_inset
\family typewriter
mount /dev/vg/mars /mars
\end_layout
\begin_layout Enumerate
For security reasons, execute
\family typewriter
chmod 0700 /mars
\family default
everyhwere after
\family typewriter
/mars/
\family default
has been mounted.
If you forget this step, any following
\family typewriter
marsadm
\family default
command will drop you a warning, but will fix the problem for you.
\end_layout
\begin_layout Enumerate
On hostA:
\family typewriter
marsadm create-cluster
\family default
\begin_inset Newline newline
\end_inset
This must be done
\emph on
exactly once
\emph default
, on exactly one node of your cluster (the
\emph on
first
\emph default
node).
Never do this twice or on different hosts, because that would create two
different clusters which would have nothing to do with each other.
The
\family typewriter
marsadm
\family default
tool protects you against accidentally joining / merging two different
clusters.
If you accidentally created two different clusters, just umount that
\family typewriter
/mars/
\family default
partition and start over with step 2.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Nodenames (see
\family typewriter
uname -n
\family default
and
\family typewriter
man 1 uname
\family default
and
\family typewriter
man 2 uname
\family default
) are the most critical part of your setup.
They
\series bold
must
\series default
be
\series bold
globally unique
\series default
, and they
\series bold
must never change, perpetually.
Any (human) error is your fault!
\begin_inset Newline newline
\end_inset
See also the GPL: NO WARRANTY
\begin_inset Newline newline
\end_inset
11.
BECAUSE THE PROGRAM IS LICENSED FREE OF CHARGE, THERE IS NO WARRANTY FOR
THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW.
EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER
PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER
EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH
YOU.
SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY
SERVICING, REPAIR OR CORRECTION.
\end_layout
\begin_layout Enumerate
Except for historic versions
\begin_inset Foot
status open
\begin_layout Plain Layout
\begin_inset CommandInset label
LatexCommand label
name "foot:port_problems-1"
\end_inset
Old versions of MARS before mars0.1astable101 needed a working
\family typewriter
ssh
\family default
connection from hostB to hostA (as
\family typewriter
root
\family default
), and also in the opposite direction, and between
\emph on
all
\emph default
(current and future) cluster members.
The following is an advice for a historic method.
Test ssh on hostB:
\end_layout
\begin_layout Itemize
\paragraph_spacing other 0
\noindent
\family typewriter
ssh hostA w
\end_layout
\begin_layout Plain Layout
\noindent
This needs to work without entering a password.
Ensure that it also works in the opposite direction.
In addition,
\family typewriter
rsync
\family default
must be installed.
\end_layout
\begin_layout Plain Layout
Hints:
\emph on
very useful
\emph default
is
\family typewriter
ssh-agent
\family default
and
\family typewriter
ssh -A
\family default
preconfigured via
\family typewriter
/etc/ssh/ssh{,d}_config
\family default
.
Hint 2 (experiences from the
\family typewriter
football
\family default
project): if you don't use
\family typewriter
ssh-agent
\family default
(or if you
\emph on
disallow
\emph default
it explicitly by default and allow it only exceptionally), then you will
waste a lot of time and energy with trivial basics.
\family typewriter
marsadm
\family default
has got some provisionary workarounds, like internal fallback to an internal
list of
\family typewriter
ssh
\family default
ports, but suchalike isn't recommended.
Just configure your
\family typewriter
ssh
\family default
infrastructure in such a ways that it works
\emph on
smoothly
\emph default
.
\end_layout
\begin_layout Plain Layout
Similar waste of time and energy will occur if you follow the ill-belief
that (static or dynamic) firewalling on the MARS ports 7776 to 7779 would
be a
\begin_inset Quotes eld
\end_inset
clever
\begin_inset Quotes erd
\end_inset
idea, and/or if you
\begin_inset Quotes eld
\end_inset
sell
\begin_inset Quotes erd
\end_inset
some
\begin_inset Quotes eld
\end_inset
features
\begin_inset Quotes erd
\end_inset
like
\emph on
port knocking
\emph default
on MARS ports to the management.
The quality of such ideas could be disguised if you noticed that your dedicated
replication network
\emph on
is
\emph default
already separated by construction, or it
\emph on
could
\emph default
be done (e.g.
via
\emph on
simple
\emph default
network-level firewalling) with
\emph on
less effort
\emph default
.
Simply, and frankly:
\series bold
do not shoot yourself in your foot
\series default
.
\end_layout
\begin_layout Plain Layout
Another way for damaging yourself is usage of old MARS versions.
Notice that MARS has drastically improved in functional and non-functional
aspects during the last years.
\end_layout
\begin_layout Plain Layout
Some historic hint for those who
\emph on
want to
\emph default
shoot themselves, or are
\emph on
forced
\emph default
to non-productively
\emph on
test
\emph default
something from the ancient world: in old MARS versions, you
\emph on
must not
\emph default
modprobe before join-cluster is executed.
In newer versions, it is vice versa.
\begin_inset CommandInset label
LatexCommand label
name "foot:port_problems-2"
\end_inset
\end_layout
\end_inset
of MARS, execute on
\emph on
both
\emph default
hosts hostA and hostB:
\begin_inset Newline newline
\end_inset
\family typewriter
modprobe mars
\end_layout
\begin_layout Enumerate
On hostB
\family typewriter
:
\begin_inset Newline newline
\end_inset
marsadm join-cluster hostA
\end_layout
\begin_layout Enumerate
When not yet done, do on each of your hosts:
\begin_inset Newline newline
\end_inset
\family typewriter
modprobe mars
\end_layout
\begin_layout Enumerate
Check that mars is running everywhere:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm view all
\end_layout
\begin_layout Enumerate
Ignore any warnings that no resources are yet defined.
But you should check that no warnings about network connections are appearing.
Both cluster nodes should be able to communicate with each other over the
MARS ports (default 7777 to 7779).
\end_layout
\begin_layout Enumerate
Additional checks, to be executed on
\emph on
all
\emph default
of your hosts:
\begin_inset Newline newline
\end_inset
\family typewriter
netstat -lp --tcp | grep 777
\begin_inset Newline newline
\end_inset
netstat --tcp | grep 777
\begin_inset Newline newline
\end_inset
\family default
Both variants should show up some healty connections.
If not, fix your network configuration and/or firewalling etc.
Details are outside of the scope of this manual.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Beware of
\emph on
asymmetric connections
\emph default
, e.g.
caused by inappropriate networking or firewall rules.
\emph on
Any
\emph default
host must be able to communicate with
\emph on
any
\emph default
other host,
\emph on
at least
\emph default
in the
\emph on
same
\emph default
cluster.
See also the big footnote
\begin_inset CommandInset ref
LatexCommand ref
reference "foot:port_problems-1"
plural "false"
caps "false"
noprefix "false"
\end_inset
starting
\begin_inset CommandInset ref
LatexCommand vpageref
reference "foot:port_problems-1"
plural "false"
caps "false"
noprefix "false"
\end_inset
(ending
\begin_inset CommandInset ref
LatexCommand vpageref
reference "foot:port_problems-2"
plural "false"
caps "false"
noprefix "false"
\end_inset
).
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Do not shoot yourself in your foot by the ill-belief that it would be easy
to control the (replication) network traffic and/or to manage fine-granular
firewalling on hundreds or thousands of machines, whether a single huge
BigCluster or many smaller clusters, e.g.
pairwise and/or according to the current LV replica situation etc.
Big systems (as such) are not only prone to sporadics like defective hardware,
they also tend to
\emph on
some dynamic behaviour
\emph default
like growth and hardware lifecyle.
Thus they need
\emph on
updates
\emph default
and housekeeping in an
\emph on
incremental
\begin_inset Foot
status open
\begin_layout Plain Layout
Big systems are often
\series bold
close to 24/7/365
\series default
und thus need
\emph on
incremental
\emph default
updates / housekeeping at
\series bold
\emph on
every
\emph default
layer
\series default
, including networking and many sub-components.
\end_layout
\end_inset
\emph default
manner.
They aren't static piles of metal and fibres.
Networking and its configuration should also obey: KISS = Keep It Simple
and Stupid.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Well-done
\emph on
coarse
\emph default
granularity at network level is your friend.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
If you try to reduce the risk, or are already hit by asymmetric MARS connection
s, e.g.
for some historic reasons or due to sporadic ARP-cache overflows etc: regularly
check (e.g.
via monitoring, and/or via long-running background jobs) that
\emph on
all
\emph default
MARS ports are operational, and in
\emph on
all combinations
\emph default
from each server to each other server.
\end_layout
\begin_layout Section
Setup Housekeeping Cron Job
\begin_inset CommandInset label
LatexCommand label
name "subsec:Logfile-Rotation"
\end_inset
\end_layout
\begin_layout Standard
As explained in section
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:The-Transaction-Logger"
\end_inset
, all changes to your resource data are recorded in transaction logfiles
residing on the
\family typewriter
/mars/
\family default
filesystem.
These files are always growing over time.
In order to avoid filesystem overflow, the following must be executed in
regular time intervals:
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm cron
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Best practice is to run
\family typewriter
marsadm cron
\family default
in a
\family typewriter
cron
\family default
job, such as
\family typewriter
/etc/cron.d/mars
\family default
.
An example cronjob can be found in the
\family typewriter
userspace/cron.d/
\family default
subdirectory of the git repo.
\color gray
Of course, alternatives to
\family typewriter
crontab
\family default
may be also used, but please ensure that
\family typewriter
marsadm cron
\family default
processes aren't invoked in high parallelism to each other on the
\emph on
same
\emph default
cluster host.
On
\emph on
different
\emph default
hosts / distributed systems, parallelism is of course fully OK.
Just avoid any
\emph on
unnecessary
\emph default
local parallelism.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
In addition, you should establish some regular monitoring of the free space
present in the
\family typewriter
/mars/
\family default
filesystem.
\end_layout
\begin_layout Standard
More detailed information about about avoidance of
\family typewriter
/mars/
\family default
overflow is in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Defending-Overflow"
\end_inset
.
\end_layout
\begin_layout Standard
Here is some more background information if you want to configure your system
cronjob manually.
In most installations, a 10 minute cron interval should be sufficient.
Here is an example line, to be placed in a file like
\family typewriter
/etc/cron.d/mars
\family default
:
\end_layout
\begin_layout Enumerate
\family typewriter
*/10 * * * * root if [ -L /mars/uuid ] ; then marsadm cron ; fi > /dev/null
2>&1
\end_layout
\begin_layout Standard
Here is some background explanation about some internal intermediate steps,
as executed by
\family typewriter
marsadm cron
\family default
.
The following is DEPRECATED.
Use cron for operations.
Skip the following except for debugging:
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm log-rotate all
\family default
\begin_inset Newline newline
\end_inset
This starts appending to a new logfile on all of your resources.
The logfiles are automatically numbered by an increasing 9-digit logfile
number.
This will suffice for many centuries even if you would logrotate once a
minute.
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm log-delete-all all
\family default
\begin_inset Newline newline
\end_inset
This determines all logfiles from all resources which are no longer needed
(i.e.
which are
\emph on
fully
\emph default
replayed, on
\emph on
all
\emph default
relevant secondaries).
All superfluous logfiles are then deleted, including all copies on all
secondaries.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
The current version of MARS deletes either
\emph on
all
\emph default
replicas of a logfile everywhere, or
\emph on
none
\emph default
of the replicas.
This is a simple rule, but has the drawback that one node may hinder other
nodes from freeing space in
\family typewriter
/mars/
\family default
.
In particular, the command
\family typewriter
marsadm pause-replay $res
\family default
(as well as
\family typewriter
marsadm disconnect $res
\family default
) will freeze the space reclamation in the whole cluster when the pause
is lasting very long.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
During such space accumulation, also the number of so-called deletions
will accumulate in /mars/todo-global/ and sibling directories.
In very big installations consisting of thousands of nodes, it is a good
idea to regularly monitor the number of deletions similarly to the following:
\family typewriter
$(find /mars/ -name
\begin_inset Quotes eld
\end_inset
delete-*
\begin_inset Quotes erd
\end_inset
| wc -l)
\family default
should not exceed a limit of ~150 entries.
\end_layout
\begin_layout Standard
Please prefer the short form
\family typewriter
marsadm cron
\family default
both for human usage, and as an equivalent to scripting two separate commands
\family typewriter
marsadm log-rotate all
\family default
and
\family typewriter
marsadm log-delete-all all
\family default
.
The short form is not only easier to remember, but also future-proof in
case some new MARS features should be added.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Optional, only when running
\emph on
masses
\emph default
of
\family typewriter
marsadm leave-cluster
\family default
or
\family typewriter
leave-resource
\family default
or
\family typewriter
split-cluster
\family default
in
\emph on
huge
\emph default
masses (e.g.
when running
\family typewriter
Football
\family default
for hardware lifecyle or for long-term load balancing over a very long
time): newer versions of
\family typewriter
marsadm
\family default
can also delete some very old remains, which could accumulate over a very
long time (typically years).
Just run
\family typewriter
marsadm cron --autoclean
\family default
everywhere once per month, or once per year.
\end_layout
\begin_layout Section
Creating and Maintaining Resources
\begin_inset CommandInset label
LatexCommand label
name "sec:Creating-and-Maintaining"
\end_inset
\end_layout
\begin_layout Standard
For the sake of simplicity, the underlying LV as well as its later logical
resource name as well as its later virtual device name will all be named
uniformly by the same suffix
\family typewriter
mydata
\family default
.
In general, you might name each of them differently, but suchalike is not
recommended, since it may easily lead to confusion in larger installations.
\end_layout
\begin_layout Standard
You may have some already pre-existing
\family typewriter
/dev/lv/mydata
\family default
at the initially primary hostA.
Before using it for MARS, it must be unused for any other purpose (such
as being mounted, or used by DRBD, etc).
MARS will require
\series bold
exclusive access
\series default
to it.
\end_layout
\begin_layout Standard
If
\family typewriter
/dev/lv/mydata
\family default
already exists and contains some data (e.g.
previously used by DRBD), you should skip the first three steps, otherwise
you may destroy your data.
\end_layout
\begin_layout Enumerate
On both hostA and hostB, create a LV.
In this example, its size is 50G:
\begin_inset Newline newline
\end_inset
\family typewriter
lvcreate -i 2 -L 50G -n mydata lv
\end_layout
\begin_layout Enumerate
On each node, check that the new LV is occurring in each of the following
lists:
\begin_inset Newline newline
\end_inset
\family typewriter
lvs
\end_layout
\begin_layout Enumerate
Only on hostA, you may create a new filesystem:
\begin_inset Newline newline
\end_inset
\family typewriter
mkfs.xfs /dev/vg/mydata
\family default
\begin_inset Newline newline
\end_inset
Alternatively, here is a variant for creation of a zfs filesystem:
\begin_inset Newline newline
\end_inset
\family typewriter
zpool create /dev/vg/mydata
\family default
\begin_inset Newline newline
\end_inset
\family typewriter
zpool export /dev/vg/mydata
\end_layout
\begin_layout Enumerate
Only on hostA, say
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm create-resource mydata /dev/lv/mydata
\family default
\begin_inset Newline newline
\end_inset
As a result, a directory
\family typewriter
/mars/resource-mydata/
\family default
will be created on hostA, containing some symlinks.
hostA will automatically start in the primary role for this resource.
Therefore, a new pseudo-device
\family typewriter
/dev/mars/mydata
\family default
will appear after a few seconds.
\begin_inset Newline newline
\end_inset
Note that the initial content of
\family typewriter
/dev/mars/mydata
\family default
will be
\emph on
exactly
\emph default
the same as in your pre-existing LV
\family typewriter
/dev/lv/mydata
\family default
.
\begin_inset Newline newline
\end_inset
If you like, you may now use
\family typewriter
/dev/mars/mydata
\family default
for mounting your already pre-existing data, or for creating a fresh filesystem
, or for exporting via iSCSI, and so on.
You may do so even before any other cluster node has joined the resource
(so-called
\begin_inset Quotes eld
\end_inset
standalone mode
\begin_inset Quotes erd
\end_inset
).
But you can also do so later after setup of (one ore many) secondaries.
\end_layout
\begin_layout Enumerate
On hostB:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm wait-cluster
\family default
\begin_inset Newline newline
\end_inset
Check that the directory
\family typewriter
/mars/resource-mydata/
\family default
and its symlink content is also appearing on hostB.
If not, check your network and/or firewall setup.
\end_layout
\begin_layout Enumerate
On hostB:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm join-resource mydata /dev/lv/mydata
\family default
\begin_inset Newline newline
\end_inset
As a result, the initial full-sync from node A to node B should start automatica
lly.
\end_layout
\begin_layout Enumerate
On hostB, check that the sync is running after a few seconds:
\begin_inset Newline newline
\end_inset
\family typewriter
watch marsadm view all
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Of course, now any old content
\family typewriter
/dev/lv/mydata
\family default
at hostB (and
\emph on
only
\emph default
there!) is overwritten by the version from hostA.
This is just what you wanted to do by setting up MARS replication.
If you didn't check that your old contents at hostB didn't contain any
valuable data (or if you accidentally provided a wrong LV device argument),
it is too late now.
Therefore, double-check that you are running
\family typewriter
create-resource
\family default
and
\family typewriter
join-resource
\family default
at the right sides of your cluster, and with the right block device names.
Accidental confusion of the right sides, or accidental confusion of LV
names may overwrite valuable data with wrong data, or even with uninitialized
trash
\begin_inset Foot
status open
\begin_layout Plain Layout
Trying to mount unintitialized LV data is bad practice.
It may even crash your kernel.
\end_layout
\end_inset
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
In order to reduce suchalike risks,
\family typewriter
marsadm
\family default
does some basic checks.
It checks that the disk device argument is really a block device, and that
exclusive access to it is possible, as well as some further safety checks,
e.g.
whether the size is big enough.
Notice that bigger replica device sizes are allowed at secondaries, although
then you will waste some space.
In such a case,
\family typewriter
marsadm view all
\family default
will display a warning.
This behaviour is necessary as an intermediate step for online resizing
via
\family typewriter
marsadm resize
\family default
.
\end_layout
\begin_layout Standard
MARS cannot know the
\emph on
purpose
\emph default
of your generic block device.
MARS (as well as DRBD) is completely ignorant of the
\emph on
contents
\emph default
of a generic block device; it does not interpret it in any way.
Therefore, you may use MARS (as well as DRBD) for mirroring Windows filesystems
, or raw devices from databases, or virtual machines, or whatever.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Check that state
\family typewriter
Orphan
\family default
is left after a while on hostB.
Notice that
\family typewriter
join-resource
\family default
is only
\emph on
starting
\emph default
a new replica, but does not wait for its completion.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
By default, MARS uses the so-called
\begin_inset Quotes eld
\end_inset
fast fullsync
\begin_inset Quotes erd
\end_inset
algorithm.
It works similar to
\family typewriter
rsync
\family default
, first reading the data on both sides and computing an md5 checksum for
each block.
Heavy-weight data is only transferred over the long-distance network upon
checksum mismatch.
This is extremely fast if your data is already (almost) identical on both
sides.
Conversely, if you know in advance that your initial data is completely
different on both sides, you may choose to switch off the fast fullsync
algorithm via
\family typewriter
echo 0 > /proc/sys/mars/do_fast_fullsync
\family default
in order to save the additional IO overhead and network latencies introduced
by the separate checksum comparison steps.
\end_layout
\begin_layout Enumerate
Optionally, only for experienced sysadmins who
\emph on
really
\emph default
know what they are doing: if you will create a
\emph on
new
\emph default
filesystem on
\family typewriter
/dev/mars/mydata
\family default
\emph on
after(!)
\emph default
having created the MARS resource as well as
\emph on
after
\emph default
having already joined it on every replica, you may abandon the fast fullsync
phase
\emph on
before
\emph default
creating the fresh filesystem, because the old content of
\family typewriter
/dev/mars/mydata
\family default
will then be just garbage not used by the freshly created filesystem
\begin_inset Foot
status open
\begin_layout Plain Layout
It is
\emph on
vital
\emph default
that the transaction logfile contents created by
\family typewriter
mkfs
\family default
is
\emph on
fully
\emph default
propagated to the secondaries and then replayed there.
\end_layout
\begin_layout Plain Layout
Analogously, another exception is also possible, but at your own risk (be
careful, really!): when migrating your data from DRBD to MARS, and you
have ensured that (1) at the end of using DRBD both your replicas were
really equal (you should have checked that), and (2) before and after setting
up any side of MARS (
\family typewriter
create-resource
\family default
as well as
\family typewriter
join-resource
\family default
) nothing has been written at all to it (i.e.
no usage, neither of
\family typewriter
/dev/lv/mydata
\family default
nor of
\family typewriter
/dev/mars/mydata
\family default
has occurred in any way), the first transaction logfile
\family typewriter
/mars/resource-mydata/log-000000001-$primary
\family default
created by MARS will be empty.
Check whether this is really true! Then, and only then, you may also issue
a
\family typewriter
fake-sync
\family default
.
\end_layout
\end_inset
.
Then, and only then, you may say
\family typewriter
marsadm fake-sync mydata
\family default
in order to abort the sync operation.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Never do a
\family typewriter
fake-sync
\family default
unless you are
\series bold
absolutely sure
\series default
that you really don't need to sync the data! Otherwise, you are
\emph on
guaranteed
\emph default
to have produced harmful inconsistencies.
If you accidentally issued
\family typewriter
fake-sync
\family default
, you may startover the fast full sync at your secondary side by saying
\family typewriter
marsadm invalidate mydata
\family default
(analogously to the corresponding DRBD command).
\end_layout
\begin_layout Chapter
HOWTO operation of MARS resources
\begin_inset CommandInset label
LatexCommand label
name "chap:HOWTO-operation-of"
\end_inset
\end_layout
\begin_layout Section
Inspecting the State of MARS
\begin_inset CommandInset label
LatexCommand label
name "sec:Inspecting-the-State"
\end_inset
\end_layout
\begin_layout Standard
The main command for viewing the current state of MARS is
\end_layout
\begin_layout Itemize
\family typewriter
marsadm view mydata
\end_layout
\begin_layout Standard
or its more specialized variant
\end_layout
\begin_layout Itemize
\family typewriter
marsadm view-
\emph on
$macroname
\emph default
mydata
\end_layout
\begin_layout Standard
where
\family typewriter
\emph on
$macroname
\family default
\emph default
is one of the macros described in the following section
\begin_inset CommandInset ref
LatexCommand nameref
reference "subsec:Standard-marsadm-view"
plural "false"
caps "false"
noprefix "false"
\end_inset
, or in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:The-macro-processor"
plural "false"
caps "false"
noprefix "false"
\end_inset
, or another macro which has been written by yourself.
\end_layout
\begin_layout Standard
You may replace the resource name
\family typewriter
mydata
\family default
with the special keyword
\family typewriter
all
\family default
in order to get the state of all locally joined resources, as well as a
list of all those resources.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
When using the variant
\family typewriter
marsadm view all
\family default
, additionally the global communication status will be displayed.
This helps humans in diagnosing problems.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint: use the compound command
\family typewriter
watch marsadm view all
\family default
for continuous display of the current state of MARS.
When starting this side-by-side in
\family typewriter
ssh
\family default
terminal windows for all your cluster nodes, you can easily watch what's
going on in the whole cluster.
\end_layout
\begin_layout Subsection
Standard
\family typewriter
marsadm view
\begin_inset CommandInset label
LatexCommand label
name "subsec:Standard-marsadm-view"
\end_inset
\end_layout
\begin_layout Standard
The following predefined complex macros try to address the information needs
of
\series bold
humans
\series default
.
Use them only in scripts when you are prepared about the fact that the
output format may change during development of MARS.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
default
\family default
This is equivalent to
\family typewriter
marsadm view mydata
\family default
without
\family typewriter
\emph on
-maroname
\family default
\emph default
suffix.
It shows a one-line status summary for each resource, optionally followed
by informational lines such as progress bars whenever a sync or a fetch
of logfiles is currently running.
The status line has the following fields:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
%{res}
\family default
resource name.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
[
\emph on
this_count
\emph default
/
\emph on
total_count
\emph default
]
\family default
number of replicas of this resource (see join-resource & co), total number
of cluster peers (see join-cluster & co).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
%include{diskstate}
\family default
see
\family typewriter
diskstate
\family default
macro below.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
%include{replstate}
\family default
see
\family typewriter
replstate
\family default
macro below.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
%include{flags}
\family default
see
\family typewriter
flags
\family default
macro below.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
%include{role}
\family default
see
\family typewriter
role
\family default
macro below.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
%include{primarynode}
\family default
see
\family typewriter
primarynode
\family default
macro below.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
%include{commstate}
\family default
see
\family typewriter
commstate
\family default
macro below.
\end_layout
\end_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\begin_inset space ~
\end_inset
After that, optional lines such as progress bars are appearing only when
something unusual is happening.
These lines are subject to future changes.
For examples, wasted disk space due to missing
\family typewriter
resize
\family default
is reported when
\family typewriter
%{threshold}
\family default
is exceeded.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Customization via your own macros (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Creating-your-own"
\end_inset
) is explicitly encouraged for experienced sysadmins and userspace developers.
It would be nice if a vibrant user community would emerge, helping each
other by exchange of macros.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint: in order to produce your own customized inspection / monitoring tools,
you may ask the author for an official reservation of a macro sub-namespace
such as
\family typewriter
*-
\emph on
yourcompanyname
\family default
\emph default
.
You will be fully responsible for your own reserved namespace and can do
with it whatever you want.
The official MARS release will guarantee that
\emph on
no name clashes
\emph default
with your reserved sub-namespace will occur in future.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
default-global
\family default
Currently, this just calls
\family typewriter
comminfo
\family default
(see below).
May be extended in future.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-info
\family default
When present, shows the status of /dev/mars/mydata in human-readyble form.
Shows the empty string when /dev/mars/mydata is not present.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
diskstate
\family default
Shows the status of the underlying disk device, in the following order
of precedence
\begin_inset Foot
status open
\begin_layout Plain Layout
When an earlier list item is displayed, no combinations with following items
are possible.
This kind of
\begin_inset Quotes eld
\end_inset
hiding effect
\begin_inset Quotes erd
\end_inset
can lead to an
\emph on
information loss
\emph default
.
In order to get a non-lossy picture from the state of your system, please
look at the
\family typewriter
flags
\family default
which are able to display cartesian combinations of more detailed internal
states.
\end_layout
\end_inset
:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
NotJoined
\family default
(cf
\family typewriter
%get-disk{}
\family default
) No underlying disk device is configured.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
NotPresent
\family default
(cf
\family typewriter
%disk-present{}
\family default
) The underlying disk device (as configured, see
\family typewriter
marsadm view-get-disk
\family default
) does not exist or the device node is not accessible.
Therefore MARS cannot work.
Check that LVM or other software is properly configured and running.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
Detached
\family default
(cf
\family typewriter
InConsistent
\family default
,
\family typewriter
NeedsReplay
\family default
,
\family typewriter
%todo-attach{}
\family default
,
\family typewriter
%is-attach{}
\family default
) The underlying disk is willingly switched off (see
\family typewriter
marsadm detach
\family default
), and it actually is no longer opened by MARS.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
Detaching
\family default
(cf
\family typewriter
%todo-attach{}
\family default
and
\family typewriter
%is-attach{}
\family default
) Access to the underlying disk is switched off, but actually not yet
\family typewriter
close()
\family default
d by MARS.
This can happen for a long time on a primary when other secondaries are
accessing the disk remotely for syncing.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
IncompleteLog[
\emph on
description-text
\emph default
] or
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
InitializedLogRecord[
\emph on
description-text
\emph default
] or
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
DefectiveLog[
\emph on
description-text
\emph default
]
\family default
(cf
\family typewriter
%replay-code{}
\family default
) Typicially this indicates a checksum error in a transaction logfile, or
another (hardware / filesystem) defect.
This occurs extremely rarely in practice, but has been observed more frequently
during a massive failure of air conditioning in a datacenter, when disk
temperatures raised to more than 80° Celsius.
Notice that a secondary
\series bold
refuses
\series default
to apply any knowingly defective logfile data to the disk.
Although this message is
\emph on
not directly
\emph default
referring to the underlying disk, it is mentioned here because of its superior
\series bold
relevance
\series default
for the diskstate.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint for expert sysadmins: when desperate, read the sourcecode of the
\family typewriter
marsadm
\family default
Perl script.
The otherwise undocumented table
\family typewriter
%errno2names
\family default
could hint you at a lot of potential problems, in
\emph on
addition
\emph default
to the standard Unix codes as documented in
\family typewriter
man errno
\family default
.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
A damaged transaction logfile will always affect the
\emph on
actuality
\emph default
of the disk, but not its
\emph on
integrity
\emph default
(by itself).
What to do in such cases?
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Enumerate
When the damage is only at one of your secondaries, and the primary continues
working: first you should ensure that the primary has a good logfile after
a
\family typewriter
marsadm cron
\family default
, wait for the secondary to get this knowlege over the network, and try
\family typewriter
marsadm invalidate
\family default
at the damaged secondary.
It is crucial that the primary has a fresh correct logfile behind the error
position, and that it is
\emph on
continuously(!)
\emph default
operating correctly, without any interruption.
\end_layout
\begin_layout Enumerate
When
\emph on
all
\emph default
of your secondaries are reporting
\family typewriter
DefectiveLog
\family default
or relatives, the primary could have
\emph on
produced
\emph default
a damaged logfile (e.g.
in RAM, in a DMA channel, etc) while continuing to operate, and all of
your secondaries got that defective logfile.
Please consider more lowlevel messages as reported by
\family typewriter
marsadm view mydata
\family default
.
Check the internet what hardware-dependent cleartext messages might mean,
or some hints like
\begin_inset Quotes eld
\end_inset
Bad magic has repeated pattern
\shape italic
$some_hex_code
\shape default
\begin_inset Quotes erd
\end_inset
.
When a hex code is present, and when it is the
\emph on
same
\emph default
hex number appearing on all of your secondaries, this
\emph on
might
\emph default
tell you something.
For example, certain hex-coded patterns may stem from various HDD or SSD
models, under certain operational conditions like uninitialized media,
or defective BBU caches, etc.
What to do in such cases?
\begin_inset Newline newline
\end_inset
After
\family typewriter
marsadm cron
\family default
, you can check this by comparing the
\family typewriter
md5sum
\family default
of the first primary logfile (having the lowest serial number) with the
versions on your replicas.
The problem is that you don't know whether the primary side has a silent
corruption on any of its disks, or not.
You will need to take an operational decision whether to switchover to
a secondary via
\family typewriter
primary --force
\family default
, or whether to continue operation at the primary and
\family typewriter
invalidate
\family default
your secondaries.
\end_layout
\begin_layout Enumerate
When the original primary is affected in a very bad way, such that it crashed
badly and afterwards even recovery of the
\emph on
primary
\emph default
is impossible
\begin_inset Foot
status open
\begin_layout Plain Layout
In such a rare case, the
\emph on
original primary
\emph default
(but not any other host)
\series bold
refuses
\series default
to come up during recovery with
\emph on
his own
\emph default
logfile originally produced by
\emph on
himself
\emph default
.
This is not a bug, but saves you from incorrectly assuming that your original
primary disk were consistent - it is
\emph on
known
\emph default
to be inconsistent, but recovery is impossible due to the damaged logfile.
Thus
\emph on
this one
\emph default
replica is trapped by defective hardware.
The other replicas shouldn't.
\end_layout
\end_inset
due to this error (which typically occurs extremely rarely, observed two
times during 7 millions of operating hours on defective hardware), you
need to take an operational decision between the following alternatives:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Enumerate
switchover to a former secondary via
\family typewriter
primary --force
\family default
, producing a split brain, and producing some (typically small) data loss.
However, integrity is more important than actuality in such an extreme
case.
\end_layout
\begin_layout Enumerate
deconstruction of the resource at
\emph on
all
\emph default
replicas via
\family typewriter
leave-resource --force
\family default
, running
\family typewriter
fsck
\family default
or similar tools by hand at the underlying disks, selecting the best replica
out of them, and finally re-constructing the resource again.
\end_layout
\begin_layout Enumerate
restore your backup.
\end_layout
\end_deeper
\end_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
Orphan
\family default
The secondary cannot replay data anymore, because it has been kicked out
for avoidance of emergency mode.
The data is not recent anymore.
Typically,
\family typewriter
marsadm invalidate
\family default
needs to be done.
\begin_inset Newline newline
\end_inset
There is an execption: shortly after
\family typewriter
join-resource
\family default
or
\family typewriter
invalidate
\family default
, it may take some time until state
\family typewriter
Orphan
\family default
may be left, and until the newest logfile has appeared at your secondary
site (depending on the size of logfiles, and on your network).
In case of network problems, this may take very long.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
This state tells you that your replica is not current, and currently not
being updated at all.
Don't forget to
\series bold
monitor
\series default
for longer occurrences of this state! Otherwise you may get a big surprise
when you need a forceful emergency failover, but your replica is very old
or even does not really exist at all.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
NoAttach
\family default
(cf
\family typewriter
%is-attach{}
\family default
) The underlying disk is currently not opened by MARS.
Reasons may be that the kernel module is not loaded, or an exclusive
\family typewriter
open()
\family default
is currently not possible because somebody else has already opened it.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
InConsistent
\family default
(cf
\family typewriter
%is-consistent{}
\family default
) A logfile replay and/or sync is known to be needed / or to complete (e.g.
after
\family typewriter
invalidate
\family default
has started) in order to restore local consistency (for details, look at
\family typewriter
flags
\family default
).
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint: in the current implementation of MARS, this will never happen on secondari
es during ordinary replay (but only when either sync has not yet finished,
or when the
\emph on
initial
\emph default
logfile replay after the sync has not yet finished), because the ordinary
logfile replay always maintains anytime consistency once a consistent state
had been reached.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\emph on
Only
\emph default
in case of a primary node crash, and
\emph on
only
\emph default
after attempts have failed to become primary again (e.g.
IO errors, etc), this
\emph on
can
\emph default
(but need not) mean that something went wrong.
Even in such an extremely unlikely event, chances are high that
\family typewriter
fsck
\family default
can fix any remaining problems (and, of course, you can also switchover
to a former secondary).
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
When this message appears, simply start MARS again (e.g.
\family typewriter
modprobe mars; marsadm up all
\family default
), in whatever role you are intending.
This will
\emph on
automatically
\emph default
go into phase
\family typewriter
Recovery
\family default
, i.e.
try to replay any necessary transaction logfile(s) in order to fix any
inconsistency.
Only if the automatic fix fails and this message persists for a long time
without progress, you
\emph on
might
\emph default
have a problem.
Typically, as observed at a large installation at 1&1, this happens extremely
rarely, and even then it just indicated that hardware was defective.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
OutDated[FR]
\family default
(cf
\family typewriter
%work-reached{}
\family default
) Only at secondaries.
Tells whether it is
\emph on
currently known
\emph default
that the disk has any lag-behind when compared to the
\emph on
currently known
\emph default
state of the current designated primary (if there exists one).
Only meaningful if a current designated primary exists.
Notice that this kind of status display is subject to
\emph on
natural races
\emph default
, for example when new logfile data has been produced in parallel, or network
propagation is very slow.
Additional information is in brackets:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
[F]
\family default
Fetch is known to be needed.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
[R]
\family default
Replay is known to be needed.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
[FR]
\family default
Both are known to be needed.
\end_layout
\end_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
WriteBack[
\emph on
amount
\emph default
]
\family default
(cf
\family typewriter
%is-primary{}
\family default
and amount via
\family typewriter
%writeback-rest{}
\family default
) Appears only at actual primaries (whether designated or not), when the
writeback from the RAM buffer is active (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:The-Transaction-Logger"
\end_inset
).
The
\emph on
amount
\emph default
is displayed in human readable form, and may be used for a very rough estimatio
n of recovery time after a primary crash.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
Recovery
\family default
(cf
\family typewriter
%todo-primary{}
\family default
) Appears only at the designated primary before it actually has become primary.
Similar to database recovery, this indicates the recovery phase after a
crash
\begin_inset Foot
status open
\begin_layout Plain Layout
In some cases,
\family typewriter
primary --force
\family default
may also trigger this message.
\end_layout
\end_inset
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
EmergencyMode
\family default
(cf
\family typewriter
%is-emergency{}
\family default
) A current designated primary exists, and it is known that this host has
entered emergency mode.
See section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Emergency-Mode"
\end_inset
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
UpToDate
\family default
Displayed when none of the above has been detected.
\end_layout
\end_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
replstate
\family default
Shows the status of the replication in the following order of precedence:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
ModuleNotLoaded
\family default
(cf
\family typewriter
%is-module-loaded{}
\family default
) No kernel module is loaded, and as a consequence no
\family typewriter
/proc/sys/mars/
\family default
does exist.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
UnResponsive
\family default
(cf
\family typewriter
%is-alive{%{host}}
\family default
) The main thread
\family typewriter
mars_main
\family default
did not do any noticable work for more than
\family typewriter
%{window}
\family default
(default 60) seconds.
Notice that this may happen when deleting
\emph on
extremely
\emph default
large logfiles (up to hundreds of gigabytes or terabytes).
If this happens for a
\emph on
very
\emph default
long time, you should check
\family typewriter
dmesg
\family default
whether you might need a reboot in order to fix the hang.
The time window may be changed by
\family typewriter
--window=$seconds
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
NotJoined
\family default
(cf
\family typewriter
%get-disk{}
\family default
) No underlying disk device is configured for this resource.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
NotStarted
\family default
(cf
\family typewriter
%todo-attach{}
\family default
) Replication has not been started.
\end_layout
\begin_layout Itemize
When the current host is designated as a primary, the rest of the precedence
list looks as follows:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
EmergencyMode
\family default
(cf.
\family typewriter
%is-emergency{}
\family default
) See section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Emergency-Mode"
\end_inset
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
Replicating
\family default
(cf.
\family typewriter
%is-primary{}
\family default
) Primary mode has been entered.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
NotYetPrimary
\family default
(catchall) This means the current host
\emph on
should
\emph default
act as a primary (see
\family typewriter
marsadm primary
\family default
or
\family typewriter
marsadm primary --force
\family default
), but currently doesn't (yet).
This happens during logfile replay, before primary mode is actually entered.
Notice that replay of very big logfiles may take a long time.
\end_layout
\end_deeper
\begin_layout Itemize
When the current host is
\emph on
not
\emph default
designated as a primary:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
PausedSync
\family default
(cf.
\family typewriter
%sync-rest{}
\family default
and
\family typewriter
%todo-sync{}
\family default
) Some data needs to be synced, but sync is currently switched off.
See
\family typewriter
marsadm {pause,resume}-sync
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
Syncing
\family default
(cf.
\family typewriter
%is-sync{}
\family default
) Sync is currently running.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
PausedFetch
\family default
(cf.
\family typewriter
%todo{fetch}
\family default
) Fetch is currently switched off.
See
\family typewriter
marsadm {pause,resume}-fetch
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
PausedReplay
\family default
(cf.
\family typewriter
%todo{replay}
\family default
) Replay is currently switched off.
See
\family typewriter
marsadm {pause,resume}-replay
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
NoPrimaryDesignated
\family default
(cf.
\family typewriter
%get-primary{}
\family default
) A
\family typewriter
secondary
\family default
command has been given somewhere in the cluster.
Thus no designated primary exists.
All resource members are in state
\family typewriter
Secondary
\family default
or try to approach it.
Sync and other operations are not possible.
This state is therefore not recommended.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
PrimaryUnreachable
\family default
(cf.
\family typewriter
%is-alive{}
\family default
) A current designated primary has been set, but this host has not been
remotely updated for more than 60 seconds (see also
\family typewriter
--window=$seconds
\family default
).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
Orphan
\family default
The secondary cannot replay data anymore, because it has been kicked out
for avoidance of emergency mode.
The data is not recent anymore.
Typically,
\family typewriter
marsadm invalidate
\family default
needs to be done.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
Replaying
\family default
(catchall) None of the previous conditions have triggered.
\end_layout
\end_deeper
\end_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
flags
\family default
For each of disk, consistency, attach, sync, fetch, and replay, show exactly
one character.
Each character is either a capital one, or the corresponding lowercase
one, or a dash.
The meaning is as follows:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
disk/device:
\family typewriter
D
\family default
= the device
\family typewriter
/dev/mars/mydata
\family default
is present,
\family typewriter
d
\family default
= only the underlying disk
\family typewriter
/dev/lv-x/mydata
\family default
is present,
\family typewriter
-
\family default
= none present / configured.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
consistency: this relates to the
\emph on
underlying disk
\emph default
, not to
\family typewriter
/dev/mars/mydata
\family default
!
\family typewriter
C
\family default
= locally consistent,
\family typewriter
c
\family default
= maybe inconsistent (no guarantee), - = cannot determine.
Notice: this does not tell anything about
\emph on
actuality
\emph default
.
Notice: like the other flags, this flag is subject to races and therefore
should be relied on only in
\emph on
detached
\emph default
state! See also description of macro
\family typewriter
is-consistent
\family default
below.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
attach:
\family typewriter
A
\family default
= attached,
\family typewriter
a
\family default
= currently trying to attach/detach but not yet ready (intermediate state),
\family typewriter
-
\family default
= attach is switched off.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
sync:
\family typewriter
S
\family default
= sync finished,
\family typewriter
s
\family default
= currently syncing,
\family typewriter
-
\family default
= sync is switched off.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
fetch:
\family typewriter
F
\family default
= according to knowlege, fetched logfiles are up-to-date,
\family typewriter
f
\family default
= currently fetching (some parts of) a logfile,
\family typewriter
-
\family default
= fetch is switched off.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
replay:
\family typewriter
R
\family default
= all fetched logfiles are replayed,
\family typewriter
r
\family default
= currently replaying,
\family typewriter
-
\family default
= replay is switched off.
\end_layout
\end_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
todo-role
\family default
Shows the
\emph on
designated
\emph default
state:
\family typewriter
None
\family default
,
\family typewriter
Primary
\family default
or
\family typewriter
Secondary
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
role
\family default
Shows the
\emph on
actual
\emph default
state:
\family typewriter
None
\family default
,
\family typewriter
NotYetPrimary
\family default
,
\family typewriter
Primary
\family default
,
\family typewriter
RemainsPrimary
\family default
,
\family typewriter
ForcedPrimary
\family default
or
\family typewriter
Secondary
\family default
.
Any differences to the designated state are indicated by a prefix to the
keyword
\family typewriter
Primary
\family default
:
\family typewriter
NotYet
\family default
means that it
\emph on
should
\emph default
become primary, but actually hasn't.
Vice versa,
\family typewriter
Remains
\family default
means that it
\emph on
should
\emph default
leave primary state in order to become secondary, but actually cannot do
that because the
\family typewriter
/dev/mars/mydata
\family default
device is currently in use .
\family typewriter
ForcedPrimary
\family default
indicates that
\emph on
multiple
\emph default
cluster hosts (see
\family typewriter
%nr-primary{}
\family default
) are claiming to be in actual primary role, e.g.
when another one is in role
\family typewriter
RemainsPrimary
\family default
, or when network interruption is preventing role change information from
propagating.
\begin_inset Newline newline
\end_inset
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
%todo-primary{} == 0
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
%todo-primary{} == 1
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
%is-primary{} == 0
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
None
\family default
/
\family typewriter
Secondary
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
NotYetPrimary
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
%is-primary{} == 1
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
RemainsPrimary
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
Primary / ForcedPrimary
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
primarynode
\family default
Display
\family typewriter
(none)
\family default
or the hostname of the designated primary.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
commstate
\family default
When the last metadata communication to the designated primary is longer
ago than
\family typewriter
${window}
\family default
(see also
\family typewriter
--window=
\emph on
seconds
\family default
\emph default
option), display that age in human readable form.
See also primitive macro
\family typewriter
%alive-age{}
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
syncinfo
\family default
Shows an informational progress bar when sync is running.
Intended for humans.
Scripts should not rely on any details from this.
Scripts may use this only as an
\emph on
approximate
\emph default
means for detecting progress (when comparing the
\emph on
full
\emph default
output text to a prior version and finding
\emph on
any
\emph default
difference, they may conclude that some progress has happened, how small
whatsoever).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
replinfo
\family default
Shows an informational progress bar when fetch is running.
This should not be used for scripting at all, because it contains realtime
information in human-readable form.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
fetch-line
\family default
Additional details, called by
\family typewriter
replinfo
\family default
.
Shows the amount of data to be fetched, as well as the current transfer
rate and a very rough estimation of the future duration.
When primitive macros
\family typewriter
%fetch-age{}
\family default
or
\family typewriter
%fetch-lag{}
\family default
exceed
\family typewriter
${window}
\family default
, their values are also displayed for human informational purposes.
See description of these primitive macros.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
replay-line
\family default
Additional details, called by
\family typewriter
replinfo
\family default
.
Shows the amount of data to be replayed, as well as the current replay
rate and a very rough estimation of the future duration.
When primitive macro
\family typewriter
%replay-age{}
\family default
exceeds
\family typewriter
${window}
\family default
, it is also displayed for human informational purposes.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
comminfo
\family default
When the network communication is in an unusual condition, display it.
Otherwise, don't produce any output.
\end_layout
\begin_layout Section
Switch Primary / Secondary Roles
\begin_inset CommandInset label
LatexCommand label
name "sec:Switch-Primary-/"
\end_inset
\end_layout
\begin_layout Standard
\noindent
\align center
\begin_inset Graphics
filename images/switching.fig
width 90col%
\end_inset
\end_layout
\begin_layout Standard
\noindent
MARS distinguishes between
\emph on
intended
\emph default
and
\emph on
forced
\emph default
switching.
This distinction is necessary due to the communication architecture (asynchrono
us communication vs synchronous communication, see explanation of Lamport
Clock in
\family typewriter
mars-for-kernel-developers.pdf
\family default
).
\end_layout
\begin_layout Standard
Asynchronous communication means that (in worst case) a message may take
(almost) arbitrary time in a distorted network to propagate to another
node.
As a consequence, the risk for accidentally creating an (unintended) split
brain is increased (as compared to a synchronous system like DRBD).
\end_layout
\begin_layout Standard
In order to minimize this risk, MARS has invested a lot of effort into an
internal handover protocol when you start an
\emph on
intended
\emph default
primary switch.
\end_layout
\begin_layout Subsection
Intended Switching / Planned Handover
\begin_inset CommandInset label
LatexCommand label
name "subsec:Intended-Switching"
\end_inset
\end_layout
\begin_layout Standard
Before starting a planned handover from your old primary
\family typewriter
hostA
\family default
to a new primary
\family typewriter
hostB
\family default
, you should check the replication of the resource.
As a human, use
\family typewriter
marsadm view mydata
\family default
.
For scripting, use the macros from section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Predefined-Trivial-Macros"
\end_inset
(see also section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Scripting-HOWTO"
\end_inset
; an example can be found in
\begin_inset Flex URL
status open
\begin_layout Plain Layout
contrib/example-scripts/check-mars-switchable.sh
\end_layout
\end_inset
).
The network should be OK, and the amount of replication delay should be
as low as possible.
Otherwise, handover may take a very long time.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Best practice is to
\series bold
prepare
\begin_inset Foot
status open
\begin_layout Plain Layout
Precondition for a plain
\family typewriter
marsadm primary
\family default
(without
\family typewriter
systemd
\family default
) is that you are up, that means in attached and connected state (cf.
\family typewriter
marsadm up
\family default
), that you are no sync target anymore, and (only when
\family typewriter
systemd
\family default
isn't configured to automatically stop the application at the old site)
that any old primary (in this case
\family typewriter
A
\family default
) does not use its
\family typewriter
/dev/mars/mydata
\family default
device any longer, and that the network is healthy.
If some (parts of) logfiles are not yet (fully) transferred to the new
primary, you will need enough space on
\family typewriter
/mars/
\family default
at the target side.
If one of the preconditions described in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Operation-of-the"
\end_inset
is violated,
\family typewriter
marsadm primary
\family default
may refuse to start.
\end_layout
\begin_layout Plain Layout
These preconditions try to protect you from doing silly things, such as
accidentally provoking a split brain error state.
We try to avoid split brain as best as we can.
Therefore, we distinguish between
\emph on
intended
\emph default
and
\emph on
emergeny
\emph default
switching.
Intended switching will try to avoid split brain
\emph on
as best as it can
\emph default
.
\end_layout
\end_inset
a planned handover
\series default
by the following steps:
\end_layout
\begin_layout Enumerate
Check the network and the replication lag.
It should be low (a few hundred megabytes, or a low number of gigabytes
– see also the rough time forecast shown by
\family typewriter
marsadm view mydata
\family default
when there is a larger replication delay, or directly access the forecast
by
\family typewriter
marsadm view-replinfo
\family default
).
\end_layout
\begin_layout Enumerate
Only when the
\family typewriter
systemd
\family default
method from section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:systemd-Templates"
\end_inset
is
\emph on
not
\emph default
used: stop your application on hostA, then say on hostA:
\begin_inset Newline newline
\end_inset
\family typewriter
umount /dev/mars/mydata
\begin_inset Newline newline
\end_inset
\family default
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
If you use the automatic handover method provided by systemd templates (see
section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:systemd-Templates"
\end_inset
), this step is
\emph on
not needed
\emph default
.
\end_layout
\begin_layout Enumerate
Only when systemd templates are
\emph on
not
\emph default
used, and only for increased safety on hostA:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm wait-umount mydata
\begin_inset Newline newline
\end_inset
\family default
This will reduce the risk of
\series bold
hanging umounts
\series default
leading to long-lasting waits at the future primary hostB.
Such problems will be detected earlier, so you have more possibilties for
fixing them.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Also good practice: use
\family typewriter
lsof /dev/mars/mydata
\family default
before umount for even earlier detection of hanging processes.
\end_layout
\begin_layout Enumerate
Optionally, and only when the
\family typewriter
systemd
\family default
method from section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:systemd-Templates"
\end_inset
is
\emph on
not
\emph default
used: on host
\family typewriter
B
\family default
, wait until
\family typewriter
marsadm view-diskstate mydata
\family default
shows
\family typewriter
UpToDate
\family default
.
This way, you are gaining more control over the
\emph on
duration
\emph default
of the handover.
In case of unexpected network problems, disk space problems, etc, you can
script a compensation action like giving up much earlier, and restarting
your application at the old primary hostA much earlier.
\end_layout
\begin_layout Enumerate
On hostB:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm primary mydata
\family default
\begin_inset Newline newline
\end_inset
When combined with the
\family typewriter
systemd
\family default
method (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:systemd-Templates"
\end_inset
), this will even automatically stop the application at hostA, wait for
handover, and start the application at hostB.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
The most important difference to DRBD: don't use an intermediate
\family typewriter
marsadm secondary mydata
\family default
at hostA.
Although it is possible, there are severeral
\emph on
disadvantages
\emph default
\begin_inset Foot
status open
\begin_layout Plain Layout
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\family typewriter
marsadm secondary
\family default
is
\emph on
discouraged
\emph default
for several reasons.
It tells the
\emph on
whole cluster
\emph default
that
\emph on
nobody
\emph default
is designated as primary anymore.
\emph on
All
\emph default
nodes should go into secondary mode, globally.
In the current version of MARS, the secondaries will no long fetch any
logfiles, since in split brain situations they don't know which version
is the
\begin_inset Quotes eld
\end_inset
right
\begin_inset Quotes erd
\end_inset
one.
When a primary host is designated, this is the
\begin_inset Quotes eld
\end_inset
right
\begin_inset Quotes erd
\end_inset
one by definition.
Syncing is also not possible when there is no designated primary.
When the device
\family typewriter
/dev/mars/mydata
\family default
is in use somewhere, it will remain in
\emph on
actual
\emph default
primary mode during that time, and the secondaries will sync therefrom.
As soon as the local
\family typewriter
/dev/mars/mydata
\family default
is released, the node will
\emph on
actually
\emph default
go into secondary mode if it is no longer designated as primary.
\end_layout
\end_inset
from losing the primary state.
In case of an unexpected crash at the wrong moment, nobody might know anymore
where the primary was running before.
Best practice is to always switch
\emph on
directly
\emph default
from the old primary hostA to the new primary hostB.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
If you need the local device
\family typewriter
/dev/mars/mydata
\family default
to disappear
\emph on
everywhere
\emph default
in the whole cluster, you don't need the discouraged
\family typewriter
marsadm secondary
\family default
command.
\family typewriter
marsadm detach
\family default
or
\family typewriter
marsadm down
\family default
can do it also, without destroying knowledge about the former designated
primary.
There is only one use case where
\family typewriter
marsadm secondary
\family default
is really needed: final destruction of a resource before
\family typewriter
marsadm delete-resource
\family default
is executed.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
In contrast to DRBD, MARS remembers the designated primary, even when your
system crashes and reboots.
With DRBD, you typically will have to re-setup the DRBD roles with (scripted)
commands like
\family typewriter
drbdadm up
\begin_inset Formula $\ldots$
\end_inset
; drbdadm primary
\begin_inset Formula $\ldots$
\end_inset
\family default
.
Instead, MARS will
\series bold
automatically resume
\series default
its former roles just by saying
\family typewriter
modprobe mars
\family default
.
When combined with a proper
\family typewriter
systemd
\family default
setup (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:systemd-Templates"
\end_inset
), this will even automatically re-start your application after the crash.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Another fundamental difference to DRBD: when the network is healthy, there
can only exist
\emph on
one
\emph default
designated primary at a time.
By saying
\family typewriter
marsadm primary mydata
\family default
on host
\family typewriter
B
\family default
,
\series bold
all other
\series default
hosts (including
\family typewriter
hostA
\family default
) will
\series bold
automatically go into secondary role
\series default
after a while.
You don't need to tell them explicitly, because MARS is automatically propagati
ng the information for you.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
A
\emph on
very rough
\emph default
estimation of the time to become
\family typewriter
UpToDate
\family default
is displayed by
\family typewriter
marsadm view mydata
\family default
or other macros (e.g.
\family typewriter
view-replinfo
\family default
).
However, on very flaky networks, the estimation may be flickering.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Planned handover is refused
\emph on
by default
\emph default
when some sync is running somewhere, even at a third hostC.
By adding the option
\family typewriter
--ignore-sync
\family default
, you are no longer protected by this
\emph on
safety measure
\emph default
, and you are willing to accept that any already running sync at any hostC
or hostD will restart from point 0, in order to ensure consistency.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Tip: newer versions of
\family typewriter
mars
\family default
+
\family typewriter
marsadm
\family default
are supporting the option
\family typewriter
--parallel
\family default
combined with
\family typewriter
all
\family default
, e.g.
\family typewriter
marsadm primary all --parallel
\family default
.
Instead of waiting until
\emph on
all
\emph default
the resources have left the primary role at the old primary (barrier synchoniza
tion), the handover speed of each resource is treated
\emph on
individually
\emph default
.
Slow resources will no longer retard fast ones, minimizing total downtime.
However, check that your cluster manager can deal with a rather high parallelis
m degree.
At the moment, the
\family typewriter
systemd
\family default
interface is not yet prepared for this.
\end_layout
\begin_layout Subsection
Forced Switching
\begin_inset CommandInset label
LatexCommand label
name "subsec:Forced-Switching"
\end_inset
\end_layout
\begin_layout Standard
In case of an incident, the connection to the old primary hostA may be lost
for several reasons.
Then, at hostB, we just don't know anything about its
\emph on
current
\emph default
state (which may deviate from its
\emph on
last known
\emph default
state).
The following command sequence will skip many checks (essentially you just
need to be attached and you must not be a current sync target) and tell
hostB to become primary forcefully:
\end_layout
\begin_layout Enumerate
On hostB:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm pause-fetch mydata
\family default
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
notice that this is similar to
\family typewriter
drbdadm disconnect mydata
\family default
as you might be used from DRBD.
For better compatibility with DRBD, you may use the alternate syntax
\family typewriter
marsadm disconnect mydata
\family default
instead.
However, there is a subtle difference to DRBD: DRBD will drop
\emph on
both
\emph default
sides of its single bi-directional connection and no longer try to re-connect
from any of both sides.
In contrast,
\family typewriter
marsadm pause-fetch
\family default
is equivalent to
\family typewriter
pause-fetch-local
\family default
, which instructs only the
\emph on
local
\emph default
host to stop fetching logfiles.
Other members of the cluster, including the former primary, are
\emph on
not
\emph default
instructed to do so.
They may continue fetching logfiles over their own private TCP connections,
potentially using many connections in parallel, potentially distributed
over multiple routes, and potentially even from any
\emph on
other
\emph default
member of the resource, if they think they can get the data from there.
In order to instruct
\begin_inset Foot
status open
\begin_layout Plain Layout
Notice that not all such instructions may arrive at all sites when the network
is interrupted (or extremely slow).
\end_layout
\end_inset
\emph on
all
\emph default
members of the resource to stop fetching logfiles, you may use
\family typewriter
marsadm pause-fetch-global mydata
\family default
instead (cf section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Operation-of-the"
\end_inset
).
\end_layout
\end_deeper
\begin_layout Enumerate
On hostB:
\family typewriter
\begin_inset Newline newline
\end_inset
marsadm primary --force mydata
\family default
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Standard
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
this is the forceful failover.
Depending on the current replication lag, you may lose some data.
Use
\family typewriter
--force
\family default
only if you know what you are doing!
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
When
\family typewriter
systemd
\family default
is configured properly (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:systemd-Templates"
\end_inset
), your application will start automatically at the new primary site.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
when the replication network is interrupted while the old primary hostA
continues
\begin_inset Foot
status open
\begin_layout Plain Layout
Notice: in certain network outage scenarios, you may not be able to remotely
login to the console and to check whether a server is running.
Therefore it may happen that you erronously think hostA is dead, while
in reality it continues running.
Even if you would know it, you might not be able to remotely kill it in
a STONITH-like manner.
\end_layout
\end_inset
running, it cannot know that hostB is the new designated primary.
Therefore hostA will continue running by default.
This means that your application will run twice! Only when the metadata
exchange is working again (by default on port 7777), the old hostA will
be automatically shut down by its local
\family typewriter
systemd
\family default
configuration, when configured properly (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:systemd-Templates"
\end_inset
).
In difference to the
\emph on
planned
\emph default
handover from section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Intended-Switching"
\end_inset
, this may happen much later.
In case of very long-last network outages, it may take even days or weeks.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Running both sites in parallel for a long time may seriously damage your
business.
Ensure that any
\series bold
customer traffic
\series default
cannot go to the old site! Be sure to configure your BGP in a proper way,
such that
\emph on
only
\emph default
, and
\emph on
only
\emph default
the new site will receive any customer traffic from both inside and outside
networks, like the internet.
\end_layout
\end_deeper
\begin_layout Enumerate
For safety on hostB:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm resume-fetch mydata
\family default
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Standard
The new primary would not really need this, because primaries are producing
their own logfiles without need for fetching.
This is only to undo the previous
\family typewriter
pause-fetch
\family default
, in order to avoid future surprises when the new primary will somewhen
change to secondary mode again (in the far-distant future), and you have
forgotten to remember the fact that fetching had been switched off.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Newer marsadm versions, starting from
\family typewriter
mars0.1astable113
\family default
, do not need this step anymore.
After successful activation of
\family typewriter
/dev/mars/mydata
\family default
, the equivalent of
\family typewriter
marsadm up mydata
\family default
is executed automatically.
\end_layout
\end_deeper
\begin_layout Standard
When using
\family typewriter
--force
\family default
, many precondition checks and other internal checks are skipped, in particular
the internal handover protocol for split brain avoidance.
\end_layout
\begin_layout Standard
In general, use of
\family typewriter
--force
\family default
is
\emph on
likely
\emph default
to
\series bold
provoke a split brain
\series default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\series bold
Split brain
\series default
is always an
\series bold
erroneous state
\series default
which should be never entered without reason! Once you have entered it
accidentally, you
\series bold
must
\series default
resolve it ASAP (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Split-Brain-Resolution"
\end_inset
), otherwise you cannot operate your resource in the long term.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
In case of
\emph on
connection loss
\emph default
(e.g.
networking problems / network partitions), you may not be able to reliably
detect whether a split brain has actually occured, or not.
\end_layout
\begin_layout Paragraph
Some Background (may be skipped)
\end_layout
\begin_layout Standard
In contrast to DRBD, split brain situations are handled differently by MARS
.
When two primaries are accidentally active at the same time, each of them
writes into different logfiles
\family typewriter
/mars/resource-mydata/log-000000001-hostA
\family default
and
\family typewriter
/mars/resource-mydata/log-000000001-hostB
\family default
where the
\emph on
origin
\emph default
host is always recorded in the filename.
Therefore, both nodes
\emph on
can theoretically
\emph default
run in primary mode independently from each other, at least for some time.
They
\emph on
might
\emph default
even cron (historic
\family typewriter
log-rotate
\family default
) independently from each other.
However, this is really no good idea.
The replication to third nodes will likely get stuck, and your
\family typewriter
/mars/
\family default
filesystem(s) will eventually run out of space.
Any further secondary node (when having
\begin_inset Formula $k>2$
\end_inset
replicas) will certainly get into serious problems: it simply does not
know which split-brain version it should follow.
Therefore, you will certainly loose the actuality of your redundancy.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Split brain situations are detected
\emph on
passively
\emph default
by secondaries.
Whenever a secondary detects that somewhere a split brain has happend,
it refuses to replay any logfiles behind the split point (and also to fetch
them when possible), or anywhere where something appears suspect or ambiguous.
This tries to keep its local disk state always being
\begin_inset Quotes eld
\end_inset
as consistent as possible
\begin_inset Quotes erd
\end_inset
, but outdated with respect to any of the split brain versions.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\family typewriter
marsadm primary –force
\family default
is rejected in newer marsadm versions
\begin_inset Foot
status open
\begin_layout Plain Layout
Beware: older versions before
\family typewriter
mars0.1stable52
\family default
did deliberately skip this check because a few years ago somebody at 1&1
placed a
\emph on
requirement
\emph default
on this.
Fortunately, the requirement now has gone, so a safee behaviour could be
implemented.
The new behaviour is for your safety, to prevent you from doing
\begin_inset Quotes eld
\end_inset
silly
\begin_inset Quotes erd
\end_inset
things in case you are under pressure during an incident (try to safeguard
human error as best as possible).
\end_layout
\end_inset
if your replica is a current sync target.
This is not a bug: it should prevent you from forcing an inconsistent replica
into primary mode, which will
\emph on
certainly
\emph default
lead to inconsistent data.
However, in extremely rare cases of severe damage of
\emph on
all
\emph default
of your replicas, you may be desperate.
Only in such a rare case, and only then, you might decide to force any
of your replicas (e.g.
based on their last sync progress bar) into primary role although none
of the re-syncs had finished before.
In such a case, and only if you really know what you are doing, you may
use
\family typewriter
marsadm fake-sync
\family default
to first mark your inconsistent replica as UpToDate (which is a
\series bold
lie
\series default
) and then force it to primary as explained above.
Afterwards, you will certainly need
\family typewriter
fsck
\family default
or another type of repair before you can restart your application.
Good luck! And don't forget to check the size of
\family typewriter
lost+found
\family default
afterwards.
This is really your
\emph on
very last
\emph default
chance if nothing else had succeeded before.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Tip: newer versions of
\family typewriter
mars
\family default
+
\family typewriter
marsadm
\family default
are supporting the option
\family typewriter
--parallel
\family default
combined with
\family typewriter
all
\family default
, e.g.
\family typewriter
marsadm primary --force all --parallel
\family default
.
This may potentially speed up startup.
However, check that your cluster manager can deal with a rather high parallelis
m degree.
At the moment, the
\family typewriter
systemd
\family default
interface is not yet prepared for this.
\end_layout
\begin_layout Section
Split Brain Resolution
\begin_inset CommandInset label
LatexCommand label
name "subsec:Split-Brain-Resolution"
\end_inset
\end_layout
\begin_layout Standard
Split brain can naturally occur during a long-lasting network outage (aka
network partition) when you (forcefully) switch primaries inbetween, or
due to final loss of your old primary node (fatal node crash) when not
all logfile data had been transferred immediately before the final crash.
\end_layout
\begin_layout Standard
In general,
\series bold
split brain is unavoidable
\series default
in
\emph on
any
\emph default
distributed system, even if you use a passive crossover cable with DRBD,
and when the crossover cable fails at the wrong moment.
Please search Wikipedia for the CAP theorem, or read the corresponding
section in
\family typewriter
mars-architecture-guide.pdf
\family default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Remember that split brain is an
\series bold
erroneous state
\series default
which must be resolved as soon as possible!
\end_layout
\begin_layout Standard
Whenever split brain occurs for whatever reason, you have two choices for
resolution: either destroy one of your versions, or retain it under a different
resource name.
\end_layout
\begin_layout Standard
In any of both cases, do the following steps ASAP:
\end_layout
\begin_layout Enumerate
\series bold
Manually
\series default
check which (surviving) version is the
\begin_inset Quotes eld
\end_inset
right
\begin_inset Quotes erd
\end_inset
one.
Any error is up to you: destroying the wrong version is
\emph on
your
\emph default
fault.
\begin_inset Newline newline
\end_inset
Newer versions of
\family typewriter
marsadm view
\family default
are supporting your decision by telling you the amount of logfile data
you would destroy when destroying a certain version of a certain host.
Typically, the smaller version is a candidate for destruction.
However, there are situations where this may be wrong, such as amok-running
applications running like endless loops, or Spammer attacks against databases,
or similar.
MARS cannot know about this.
\end_layout
\begin_layout Enumerate
If you did not already switch your primary to the final destination determined
in the previous step, do it now (see description in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Forced-Switching"
\end_inset
).
Don't use an intermediate
\family typewriter
marsadm secondary
\family default
command (as known from DRBD):
\emph on
directly
\emph default
switch to the new designated primary!
\end_layout
\begin_layout Enumerate
Unless
\family typewriter
systemd
\family default
is configured properly (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:systemd-Templates"
\end_inset
), do the following manually: on each non-right version (which you don't
want to retain) which had been primary before, umount your
\family typewriter
/dev/mars/mydata
\family default
or otherwise stop using it (e.g.
stop iSCSI or other users of the device).
Wait until each of them has actually left primary state and until their
local logfile(s) have been fully written back to the underlying disk.
\end_layout
\begin_layout Enumerate
Wait until the network works again.
All your (surviving) cluster nodes
\emph on
must
\emph default
\begin_inset Foot
status open
\begin_layout Plain Layout
If you are a MARS expert and you really know what you are doing (in particular,
you can anticipate the effects of the Lamport clock and of the symlink
update protocol including the
\begin_inset Quotes eld
\end_inset
eventually consistent
\begin_inset Quotes erd
\end_inset
behaviour including any not-yet-consistent intermediate states), you may
deviate from this requirement, at your own risk.
\end_layout
\end_inset
be able to communicate with each other.
If this is not possible, or if it would take too long, fall back to one
of the method described in appendix ......
......
section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Final-Destroy-of"
\end_inset
, but do this only when necessary.
\end_layout
\begin_layout Standard
The next steps are different for different use cases:
\end_layout
\begin_layout Paragraph
Destroying a Wrong Split Brain Version
\end_layout
\begin_layout Standard
Continue with the following steps, each on those cluster node(s) where you
do not want to retain its split-brain version.
In preference, start with the old
\begin_inset Quotes eld
\end_inset
wrong
\begin_inset Quotes erd
\end_inset
primaries first (see advice at the end of this section):
\end_layout
\begin_layout Enumerate-Resume
On
\series bold
all
\series default
affected secondary nodes hostX where SPLIT BRAIN is reported:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm invalidate mydata
\family default
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
setcounter{enumi}{4}
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\noindent
Typically, no split brain is reported anymore after that (via
\family typewriter
marsadm view all
\family default
), and you are done.
\end_layout
\begin_layout Standard
In rare cases (when
\family typewriter
/mars
\family default
is almost full somewhere, or when emergency mode has occured somewhere),
you may need to run
\family typewriter
marsadm cron
\family default
at the primary host, and to repeat
\family typewriter
marsadm invalidate
\family default
on any SPLIT BRAIN host.
In extremely rare of overloaded nodes, you may need to repeat this several
times.
\end_layout
\begin_layout Standard
In very rare cases, when things are screwed up very heavily (e.g.
a partly destroyed
\family typewriter
/mars/
\family default
partition), you may try an alternate method described in appendix
\begin_inset CommandInset ref
LatexCommand ref
reference "chap:Alternative-Methods-for"
\end_inset
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Check that state
\family typewriter
Orphan
\family default
is left after a while.
Notice that
\family typewriter
invalidate
\family default
is only
\emph on
restarting
\emph default
an existing replica, but does not wait for its completion.
\end_layout
\begin_layout Paragraph
Retaining a Split Brain Version (optionally, typically not needed, may be
skipped)
\begin_inset CommandInset label
LatexCommand label
name "par:Retaining-a-Split"
\end_inset
\end_layout
\begin_layout Standard
On those cluster nodes where you want to retain some SPLIT BRAIN version
(e.g.
for inspection or debugging purposes, or as a kind of
\begin_inset Quotes eld
\end_inset
emergengy backup
\begin_inset Quotes erd
\end_inset
):
\end_layout
\begin_layout Enumerate-Resume
\family typewriter
marsadm down mydata
\end_layout
\begin_layout Enumerate-Resume
\family typewriter
marsadm leave-resource mydata
\end_layout
\begin_layout Enumerate-Resume
After having done this on
\emph on
all
\emph default
those cluster nodes, check that the split brain is gone (e.g.
by saying
\family typewriter
marsadm view mydata
\family default
at the primary).
In very rare cases, you might also need a
\family typewriter
log-purge-all
\family default
at the primary (see page
\begin_inset CommandInset ref
LatexCommand pageref
reference "log-purge-all$res"
\end_inset
).
\end_layout
\begin_layout Enumerate-Resume
Rename the underlying local
\family typewriter
/dev/lv/mydata
\family default
is into something like
\family typewriter
/dev/lv/mydata
\family default
-backup.
For example:
\begin_inset Newline newline
\end_inset
\family typewriter
lvrename lv mydata mydata-backup
\family default
\begin_inset Newline newline
\end_inset
For details, see
\family typewriter
man lvrename
\family default
.
This is
\emph on
extremely
\emph default
recommended to avoid confusion with the old resource name.
\end_layout
\begin_layout Enumerate-Resume
For safety: check that each underlying local disk
\family typewriter
/dev/lv/mydata-backup
\family default
is really usable afterwards, e.g.
by test-mounting it (and
\family typewriter
fsck
\family default
when needed).
If all is OK, don't forget to umount it before proceeding with the next
step.
\end_layout
\begin_layout Enumerate-Resume
Finally, you may either delete your backup somewhen via
\family typewriter
lvremove
\family default
, or you may create a completely new MARS resource out of it, but
\emph on
under a different name
\emph default
.
See description in section
\begin_inset CommandInset ref
LatexCommand vref
reference "sec:Creating-and-Maintaining"
\end_inset
.
\end_layout
\begin_layout Enumerate-Resume
Optionally, if you have enough disk space (check with
\family typewriter
vgs
\family default
): re-create your replica by freshly creating a new
\family typewriter
/dev/vg/mydata
\family default
with the right size, and
\family typewriter
marsadm join-resource mydata /dev/vg/mydata
\family default
.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Generally:
\series bold
best practice
\series default
is to always keep your LV names equal to your MARS resource names.
This can avoid a
\emph on
lot
\emph default
of unnecessary confusion.
\end_layout
\begin_layout Paragraph
Keeping a Good Version (typically no actions needed)
\end_layout
\begin_layout Standard
When you had a secondary which did not participate in the split brain, but
just got confused and therefore stopped replaying logfiles immediately
before the split-brain point, it will typically
\begin_inset Foot
status open
\begin_layout Plain Layout
In general, such a
\begin_inset Quotes eld
\end_inset
good
\begin_inset Quotes erd
\end_inset
behaviour cannot be guaranteed for all secondaries.
Race conditions in complex networks may asynchronously transfer
\begin_inset Quotes eld
\end_inset
wrong
\begin_inset Quotes erd
\end_inset
logfile data to a secondary much earlier than conflicting
\begin_inset Quotes eld
\end_inset
good
\begin_inset Quotes erd
\end_inset
logfile data which will be marked
\begin_inset Quotes eld
\end_inset
good
\begin_inset Quotes erd
\end_inset
only in the
\emph on
future.
\emph default
It is impossible to predict this in advance.
\end_layout
\end_inset
resume replay after the SPLIT BRAIN has been resolved at the other nodes.
Then you don't need to do any action for it.
\end_layout
\begin_layout Standard
When all SPLIT BRAIN versions have disappeared from the cluster (by
\family typewriter
invalidate
\family default
or
\family typewriter
leave-resource
\family default
as described before), the confusion should be over, and the secondary should
automatically resume tracking of the new unique version.
\end_layout
\begin_layout Standard
Please check that
\emph on
all
\emph default
of your secondaries are no longer stuck.
You need to execute split brain resolution only for
\emph on
stuck
\emph default
nodes.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint / advice for
\begin_inset Formula $k>2$
\end_inset
replicas: it is a good idea to start split brain resolution
\emph on
first
\emph default
with those (few) nodes which had been (accidentally) primary before, but
are not the new designated primary.
Usually, you had 2 primaries during split brain, so this will apply only
to
\emph on
one
\emph default
of them.
Leave the other one intact, by not umounting
\family typewriter
/dev/mars/mydata
\family default
at all, and keeping your applications running.
Even during emergency mode, see section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Emergency-Mode"
\end_inset
.
\emph on
First
\emph default
resolve the problem of the
\begin_inset Quotes eld
\end_inset
wrong
\begin_inset Quotes erd
\end_inset
primary(s) via
\family typewriter
invalidate
\family default
or
\family typewriter
leave-resource
\family default
.
Wait for a short while.
Then check the rest of your secondaries, whether they now are already following
the new (unique) primary, and finally check whether the split brain warning
reported by
\family typewriter
marsadm view all
\family default
is gone everywhere.
This way, you can often skip unnecessary invalidations of replicas.
\end_layout
\begin_layout Section
Final Destruction of a Damaged Node
\begin_inset CommandInset label
LatexCommand label
name "subsec:Final-Destroy-of"
\end_inset
\end_layout
\begin_layout Standard
When a node has eventually died (e.g.
defective hardware),
\series bold
do not forget
\series default
\begin_inset Foot
status open
\begin_layout Plain Layout
If you forget this,
\family typewriter
/mars
\family default
will fill up forever.
Finally, emergency mode will be triggered.
\end_layout
\end_inset
the following steps ASAP:
\end_layout
\begin_layout Enumerate
\emph on
Physically
\emph default
remove the dead node from your network.
Unplug all network cables! Failing to do so might provoke a disaster in
case it somehow resurrects in an uncontrolled manner, such as a partly-damaged
\family typewriter
/mars/
\family default
filesystem, a half-defective kernel, RAM / kernel memory corruption, disk
corruption, or whatever.
Although MARS has some provisions like md5 checksums in its transaction
logfiles: don't risk any
\series bold
unpredictable behaviour
\series default
!
\end_layout
\begin_layout Enumerate
\series bold
Manually
\series default
check which of the surviving versions will be the
\begin_inset Quotes eld
\end_inset
right
\begin_inset Quotes erd
\end_inset
one.
Any human error is up to you: resurrecting an unnecessarily old / outdated
version and/or decommissioning the productive primary server will be
\emph on
your
\emph default
fault.
\end_layout
\begin_layout Enumerate
If you did not already switch your primary to the final destination determined
in the previous step, do it now (see description in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Forced-Switching"
\end_inset
).
\end_layout
\begin_layout Enumerate
On a surviving node, give the following commands:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Enumerate
\family typewriter
marsadm --host=your-damaged-host down mydata --force
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm --host=your-damaged-host leave-resource mydata --force
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Check for misspellings, in particular the hostname of the dead node, and
check the command syntax before typing return! Otherwise, you may forcefully
destroy the wrong
\begin_inset Foot
status open
\begin_layout Plain Layout
That said, MARS appears to be rather tolerant of human errors.
As long as your
\family typewriter
/dev/vg/mydata
\family default
is not removed at LVM level, you have a chance for recovery.
Once a sysadmin destroyed a whole cluster by accident, including all of
its resources, and while it was continuously running in primary role.
Even transaction logging did continue on some orphan logfiles, but
\family typewriter
/mars
\family default
was filling up
\begin_inset Quotes eld
\end_inset
unexpectedly
\begin_inset Quotes erd
\end_inset
.
Fortunately, this behaviour led to a monitoring alert and to detection
of the problem.
It was early enough for a correction without causing any extraordinary
customer downtime outside of accepted SLAs, and no data loss at all.
\end_layout
\end_inset
node!
\end_layout
\end_deeper
\begin_layout Enumerate
Repeat the same with
\emph on
all
\emph default
resources which were formerly present at
\family typewriter
your-damaged-host
\family default
.
\end_layout
\begin_layout Enumerate
Finally, say
\family typewriter
\begin_inset Newline newline
\end_inset
marsadm --host=$your_damaged_host leave-cluster --force
\end_layout
\begin_layout Standard
Now all your surviving nodes should
\emph on
believe
\emph default
that the old node
\family typewriter
$your_damaged_host
\family default
does no longer exist, and that it does no longer participate in any resource.
For safety, check this via
\family typewriter
marsadm view
\family default
everywhere.
\end_layout
\begin_layout Standard
As another safeguard, any re-attempt to
\begin_inset Quotes eld
\end_inset
surrect
\begin_inset Quotes erd
\end_inset
a
\begin_inset Quotes eld
\end_inset
zombie
\begin_inset Quotes erd
\end_inset
from its
\begin_inset Quotes eld
\end_inset
claimed death
\begin_inset Quotes erd
\end_inset
and/or from its
\begin_inset Quotes eld
\end_inset
real death
\begin_inset Quotes erd
\end_inset
should
\emph on
spit at you
\emph default
with some tons of warnings.
These warnings are a
\emph on
feature
\emph default
, not a bug.
If you
\emph on
really
\emph default
are an expert and if you
\emph on
really
\emph default
know what you are doing, you may ignore this AT YOUR OWN RISK.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Even if your dead node comes to life again in some way: always ensure that
the mars kernel module cannot run any more on such a zombie server.
\emph on
Never
\emph default
do a
\family typewriter
modprobe mars
\family default
on a node marked as dead this way!
\end_layout
\begin_layout Standard
Further advice for complicated cases of destruction are in appendix
\begin_inset CommandInset ref
LatexCommand ref
reference "chap:Alternative-De--and"
\end_inset
and
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Cleanup-in-case"
\end_inset
.
\end_layout
\begin_layout Section
Online Resizing during Operation
\begin_inset CommandInset label
LatexCommand label
name "sec:Online-Resizing-during"
\end_inset
\end_layout
\begin_layout Standard
You need LVM or some other means of increasing the physical size of your
disk (e.g.
via firmware of some RAID controllers).
The network must be healthy.
Do the following steps:
\end_layout
\begin_layout Enumerate
Increase your local disks (usually
\family typewriter
/dev/vg/mydata
\family default
)
\emph on
everywhere
\emph default
in the whole cluster.
In order to avoid wasting space, increase them
\emph on
uniformly
\emph default
to the same size (when possible).
For example, on both hostA and hostB:
\begin_inset Newline newline
\end_inset
\family typewriter
lvresize -L +100G /dev/vg/mydata
\end_layout
\begin_layout Enumerate
For safety, say on both hostA and hostB
\family typewriter
\begin_inset Newline newline
\end_inset
marsadm up mydata
\end_layout
\begin_layout Enumerate
For safety, say on both hostA and hostB
\family typewriter
\begin_inset Newline newline
\end_inset
marsadm wait-cluster
\end_layout
\begin_layout Enumerate
Only at the primary hostA:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm resize mydata
\end_layout
\begin_layout Enumerate
A
\emph on
partial
\emph default
fast full-sync will start at hostB.
Only the
\emph on
new
\emph default
portion of the block device will be synced.
Check that sync is running, or has already finished.
\end_layout
\begin_layout Enumerate
If you have intermediate layers such as iSCSI, you may need some
\family typewriter
iscsiadm
\family default
update or other commands.
\end_layout
\begin_layout Enumerate
Generally not needed, only for
\emph on
extreme
\emph default
safety / paranoia: you may wait until the partial sync has finished.
This is not really needed, but it may
\emph on
slightly(!)
\emph default
reduce the risk in case of an unplanned incident at the primary side.
If you execute the last step before the sync has finished, some data might
have been already written to the new portions of the underlying LV.
These writes will be written to the transaction log, and will be replicated.
Thus there is no real danger, and your secondary will be
\series bold
logically consistent
\series default
in reality, although it will be
\emph on
reported
\emph default
as
\family typewriter
InConsistent
\family default
by marsadm in the meantime.
If you want to avoid confusion about state
\family typewriter
Consistent
\family default
, and/or if you want extremely high protection against damaged logfiles
by hardware defects at the wrong moment (although the transaction logfiles
are already protected by md5 checksums), and/or if you are paranoid, it
may be helpful to wait until the sync has finished.
Normally, this is not needed, and you may immediately proceed to the last
step:
\end_layout
\begin_layout Enumerate
Now you may increase your filesystem.
This is specific for the filesystem type and documented elsewhere.
Some filesystems are able to increase their size while they are mounted
and while the applications are running on top of them, but others cannot
do this.
For example, an xfs online resize during operation can be triggered at
primary hostA where
\family typewriter
/dev/mars/mydata
\family default
is currently mounted:
\begin_inset Newline newline
\end_inset
\family typewriter
xfs_growfs /mountpoint/of/mydata
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint: in general, the sync of the new portions is not really needed, because
the new junk data just does not care at filesystem level.
If you are not paranoid and if you know what you are doing, you may use
\family typewriter
marsadm fake-sync mydata
\family default
to abort unnecessary network traffic.
\end_layout
\begin_layout Section
Defending Overflow of
\family typewriter
/mars/
\begin_inset CommandInset label
LatexCommand label
name "sec:Defending-Overflow"
\end_inset
\end_layout
\begin_layout Standard
This section describes an important difference to DRBD.
The metadata of DRBD is allocated
\emph on
statically
\emph default
at
\emph on
creation
\emph default
\emph on
time
\emph default
of the resource.
In contrast, the MARS transaction logfiles are allocated
\emph on
dynamically
\emph default
at
\emph on
runtime
\emph default
.
\end_layout
\begin_layout Standard
This leads to a potential risk from the perspective of a sysadmin: what
happens if the
\family typewriter
/mars/
\family default
filesystem runs out of space?
\end_layout
\begin_layout Standard
In practice, no harm will occur to your data.
MARS will automatically go into the so-called emergency mode.
Resolution of emergency mode is very similar to resolution of split brain
(section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Resolution-of-Split"
plural "false"
caps "false"
noprefix "false"
\end_inset
): at all of your secondaries, type (repeatedly)
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm invalidate all
\end_layout
\begin_layout Standard
This is all you need to know.
If you are impatient, you may now skip the rest of this section.
\end_layout
\begin_layout Standard
For some background explanations, keep reading on.
\end_layout
\begin_layout Standard
Overflow and its treatment is
\emph on
unavoidable
\emph default
for long-distance replication.
If you want a system which can survive long-lasting network outages, while
keeping your replicas consistent as long as possible (called
\series bold
anytime consistency
\series default
), then you
\emph on
need
\emph default
dynamic storage.
It is
\emph on
impossible
\emph default
to solve with static pre-allocated memory
\begin_inset Foot
status open
\begin_layout Plain Layout
The bitmaps used by DRBD cannot preserve the
\emph on
order
\emph default
of write operations.
They cannot do that, because their space is
\begin_inset Formula $O(k)$
\end_inset
for some constant
\begin_inset Formula $k$
\end_inset
.
In contrast, MARS preserves the order.
Preserving the order as such (even when only
\emph on
facts
\emph default
about the order were recorded without recording the actual data contents)
requires
\begin_inset Formula $O(n)$
\end_inset
space where
\begin_inset Formula $n$
\end_inset
is infinitely growing over time.
\end_layout
\end_inset
.
A true solution would need
\emph on
infinite memory
\emph default
.
But suchalike does not exist on earth.
\end_layout
\begin_layout Standard
It would be an even worse idea to statically pre-allocate a lot of space
for
\emph on
each
\emph default
of your resources.
The latter would waste a lot of space, because some resources will likely
fill much more quickly than others.
MARS deals with this by using a
\emph on
common
\emph default
filesystem /mars which is
\emph on
shared
\emph default
by the transaction logs of
\emph on
all
\emph default
of your resources.
\end_layout
\begin_layout Standard
Although the size of /mars is statically allocated at cluster generation
time, there is a workaround for the problem.
When
\family typewriter
/mars
\family default
fills up during a network outage, and you have some spare space on your
VG, and when the network outage will be repaired shortly, you may decide
to dynamically extend /mars during operation.
\end_layout
\begin_layout Standard
Because of these fundamental differences, DRBD and MARS have different applicati
on areas.
If you just want a simple system for mirroring your data over short distances
via passive
\begin_inset Foot
status open
\begin_layout Plain Layout
Notice: newer generation 10GBit technologies like SFP+ are no longer passive.
They involve some active chips, which may fail independently from your
servers.
In case of a failure, the CAP theorem property P is violated, and you only
have the choice between C and A.
For details, see
\family typewriter
mars-architecture-guide.pdf
\family default
.
\end_layout
\end_inset
crossover cable, and when failures of the crossover cables are very unlikely,
DRBD will be a suitable choice.
However, if you need to replicate over longer distances, or if you need
higher levels of reliability even when multiple failures may accumulate
(such as network loss during a
\emph on
re
\emph default
sync of DRBD), the transaction logs of MARS can solve it, but at some
\emph on
cost
\emph default
.
\end_layout
\begin_layout Subsection
Countermeasures against overflow
\end_layout
\begin_layout Subsubsection
Dimensioning of
\family typewriter
/mars/
\begin_inset CommandInset label
LatexCommand label
name "subsec:Dimensioning-of-/mars/"
\end_inset
\end_layout
\begin_layout Standard
The first (and most important) measure against overflow of
\family typewriter
/mars/
\family default
is simply to dimension it large enough to survive longer-lasting problems,
preferably one weekend.
\end_layout
\begin_layout Standard
Recommended size is at least one dedicated disk, residing at a hardware
RAID controller with BBU (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Preparation:-What-you"
\end_inset
).
During normal operation, that size is needed only for a small fraction,
typically a few percent or even less than one percent.
However, it is your
\series bold
safety margin
\series default
.
Keep it high enough!
\end_layout
\begin_layout Subsubsection
Monitoring
\end_layout
\begin_layout Standard
The next (equally important) measure is
\series bold
monitoring in userspace
\series default
.
\end_layout
\begin_layout Standard
Following is a list of countermeasures both in userspace and in kernelspace,
in the order of
\begin_inset Quotes eld
\end_inset
defensive walling
\begin_inset Quotes erd
\end_inset
:
\end_layout
\begin_layout Enumerate
Regular userspace monitoring must throw an INFO if a certain freespace limit
\begin_inset Formula $l_{1}$
\end_inset
of
\family typewriter
/mars/
\family default
is undershot.
Typical values for
\begin_inset Formula $l_{1}$
\end_inset
are 30%.
Typical actions are automated calls of
\family typewriter
marsadm cron
\family default
.
\end_layout
\begin_layout Enumerate
Regular userspace monitoring must throw a WARNING if a certain freespace
limit
\begin_inset Formula $l_{2}$
\end_inset
of
\family typewriter
/mars/
\family default
is undershot.
Typical values for
\begin_inset Formula $l_{2}$
\end_inset
are 20%.
Typical actions are (in addition to
\family typewriter
cron
\family default
) alarming human supervisors via SMS and/or further stronger automated actions.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Frequently large space is occupied by files stemming from debugging output,
or from other programs or processes.
A hot candidate is
\begin_inset Quotes eld
\end_inset
forgotten
\begin_inset Quotes erd
\end_inset
removal of debugging output to
\family typewriter
/mars/
\family default
.
Sometimes, an
\family typewriter
rm -rf $(find /mars/ -name
\begin_inset Quotes eld
\end_inset
*.log
\begin_inset Quotes erd
\end_inset
)
\family default
can work miracles.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Another source of space hogging is a
\begin_inset Quotes eld
\end_inset
forgotten
\begin_inset Quotes erd
\end_inset
\family typewriter
pause-sync
\family default
or
\family typewriter
disconnect
\family default
.
Therefore, a simple
\family typewriter
marsadm up all
\family default
may also work miracles (if you didn't want to freeze some mirror deliberately).
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
If you just wanted to freeze a mirror at an outdated state for a very long
time, you simply
\emph on
cannot
\emph default
do that without causing infinite growth of space consumption in
\family typewriter
/mars/
\family default
.
Therefore, a
\family typewriter
marsadm leave-resource $res
\family default
at
\emph on
exactly that(!)
\emph default
secondary site where the mirror is frozen, can also work miracles.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint: you can / should start some of these measures even earlier at the
INFO level (see item 1), or even earlier.
\end_layout
\begin_layout Enumerate
Regular userspace monitoring must throw an ERROR if a certain freespace
limit
\begin_inset Formula $l_{3}$
\end_inset
of
\family typewriter
/mars/
\family default
is undershot.
Typical values for
\begin_inset Formula $l_{3}$
\end_inset
are 10%.
Typical actions are alarming the CEO via SMS and/or even stronger automated
actions.
For example, you may choose to automatically call
\family typewriter
marsadm leave-resource $res
\family default
on some or all secondary nodes, such that the primary will be left alone
and now has a chance to really delete its logfiles because no one else
is any longer potentially needing it.
\end_layout
\begin_layout Enumerate
First-level kernelspace action, automatically executed when
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_free_space_4_gb
\end_layout
\end_inset
\family default
+
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_free_space_3_gb
\end_layout
\end_inset
\family default
+
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_free_space_2_gb
\end_layout
\end_inset
\family default
+
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_free_space_1_gb
\end_layout
\end_inset
\family default
is undershot:
\begin_inset Newline newline
\end_inset
a warning will be issued.
\end_layout
\begin_layout Enumerate
Second-level kernelspace action, automatically executed when
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_free_space_3_gb
\end_layout
\end_inset
\family default
+
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_free_space_2_gb
\end_layout
\end_inset
\family default
+
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_free_space_1_gb
\end_layout
\end_inset
\family default
is undershot:
\begin_inset Newline newline
\end_inset
all locally secondary resources will delete local copies of transaction
logfiles which are no longer needed locally.
This is a desperate action of the kernel module.
\end_layout
\begin_layout Enumerate
Third-level kernelspace action, automatically executed when
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_free_space_2_gb
\end_layout
\end_inset
\family default
+
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_free_space_1_gb
\end_layout
\end_inset
\family default
is undershot:
\begin_inset Newline newline
\end_inset
all locally secondary resources will stop fetching transaction logfiles.
This is a more desperate action of the kernel module.
You don't want to get there (except for testing).
\end_layout
\begin_layout Enumerate
Last desperate kernelspace action when all else has failed and
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_free_space_1_gb
\end_layout
\end_inset
\family default
is undershot:
\begin_inset Newline newline
\end_inset
all locally primary resources will enter
\series bold
emergency mode
\series default
(see description below in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Emergency-Mode"
\end_inset
).
This is the most desperate action of the kernel module.
You don't want to get there (except for testing).
\end_layout
\begin_layout Standard
In addition, the kernel module obeys a general global limit
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/required_total_space_0_gb
\end_layout
\end_inset
+
\family default
the sum of all of the above limits.
When the
\emph on
total size
\emph default
of
\family typewriter
/mars/
\family default
undershots that sum, the kernel module refuses to start at all, because
it assumes that it is senseless to try to operate MARS on a system with
such low memory resources.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
The current level of emergency kernel actions may be viewed at any time
via
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/mars_emergency_mode
\end_layout
\end_inset
\family default
.
\end_layout
\begin_layout Subsubsection
Throttling
\begin_inset CommandInset label
LatexCommand label
name "subsec:Throttling"
\end_inset
\end_layout
\begin_layout Standard
This not generally recommended.
It may harm the IO performance from the viewpoint of your customers.
Thus use it only as a
\emph on
desperate
\emph default
defense against overflow, by
\series bold
throttling your performance pigs
\series default
.
\end_layout
\begin_layout Standard
Motivation: in rare cases, some users with
\family typewriter
ssh
\family default
access can do
\emph on
very
\emph default
silly things.
For example,
\end_layout
\begin_layout Itemize
some users are creating their own backups via user-cron jobs, and they do
it every 5 minutes.
Some example guy created a zip archive (almost 1GB) by regularly copying
his old zip archive into a new one, then appending deltas to the new one,
and finally deleting the old archive.
Every 5 minutes.
Although almost never any new files were added to the archive.
Essentially, he copied over his archive, for nothing.
This led to massive bulk write requests, for ridiculous reasons.
\end_layout
\begin_layout Itemize
another user wrote his own shell script for his own private backup of his
website, although there already is a daily system backup.
He regularly made a complete copy of his entire webspace (more than 60GiB)
via
\family typewriter
cp -a
\family default
, then created a tarball out of the copy, uploaded it into the cloud, finally
removed both the tarball and the complete filesystem copy.
Each time, about 100GB was temporarily allocated (and replicated via MARS).
\end_layout
\begin_layout Standard
Typically, your hard disks / RAID systems allow much higher write IO rates
than you can ever transport over a standard TCP network from your primary
site to your secondary, at least over longer distances.
Therefore, it is easy to create a such a high write load that it will be
\emph on
impossible
\emph default
to replicate it over the network,
\emph on
by construction
\emph default
.
\end_layout
\begin_layout Standard
MARS has some mechanism for throttling bulk writers whenever the network
is weaker than your IO subsystem.
It is off by default.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Notice that DRBD will
\emph on
always
\emph default
throttle your writes whenever the network forms a bottleneck, due to its
synchronous operation mode.
In contrast, MARS allows for buffering of performance peaks in the transaction
logfiles.
\emph on
Only when
\emph default
your buffer in
\family typewriter
/mars/
\family default
runs short (cf subsection
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Dimensioning-of-/mars/"
\end_inset
), MARS may be used for throttling your application writes.
\end_layout
\begin_layout Standard
There are a lot of screws named
\family typewriter
/proc/sys/mars/write_throttle_*
\family default
with the following meaning:
\end_layout
\begin_layout Description
\family typewriter
write_throttle_start_percent
\family default
Whenever the used space in
\family typewriter
/mars/
\family default
is below this threshold, no throttling will occur at all.
Only when this threshold is exceeded, throttling will start
\emph on
slowly
\emph default
.
Defaul value is 0, which means
\begin_inset Quotes eld
\end_inset
off
\begin_inset Quotes erd
\end_inset
.
Practical values for this coule be around 80%.
\end_layout
\begin_layout Description
\family typewriter
write_throttle_end_percent
\family default
Maximum throttling will occur once this space threshold is reached, i.e.
the throttling is now at its maximum effect.
A practical value is 90%, which is the default.
When the actual space in
\family typewriter
/mars/
\family default
lies between
\family typewriter
write_throttle_start_percent
\family default
and
\family typewriter
write_throttle_end_percent
\family default
, the strength of throttling will be interpolated linearly between the extremes.
In practice, this should lead to an equilibrum between new input flow into
\family typewriter
/mars/
\family default
and output flow over the network to secondaries.
\end_layout
\begin_layout Description
\family typewriter
write_throttle_size_threshold_kb
\family default
(readonly) This parameter shows the internal strength calculation of the
throttling.
Only write
\begin_inset Foot
status open
\begin_layout Plain Layout
Read requests are never throttled at all.
\end_layout
\end_inset
requests exceeding this size (in KB) are throttled at all.
Typically, this will hurt the bulk performance pigs first, while leaving
ordinary users (issuing small requests) unaffected.
\end_layout
\begin_layout Description
\family typewriter
write_throttle_ratelimit_kb
\family default
Set the global IO rate in KB/s for those write requests which are throttled.
In case of strongest
\begin_inset Foot
status open
\begin_layout Plain Layout
In case of lighter throttling, the input flow into
\family typewriter
/mars/
\family default
may be higher because small requests are not throttled.
\end_layout
\end_inset
throttling, this parameters determines the input flow into
\family typewriter
/mars/
\family default
.
The default value is 10.000 KB/s.
Please adjust this value to your application needs and to your environment.
\end_layout
\begin_layout Description
\family typewriter
write_throttle_rate_kb
\family default
(readonly) Shows the current rate of exactly those requests which are actually
throttled (in contrast to
\emph on
all
\emph default
requests).
\end_layout
\begin_layout Description
\family typewriter
write_throttle_cumul_kb
\family default
(logically readonly) Same as before, but the cumulative sum of all throttled
requests since startup / reset.
This value can be reset from userspace in order to prevent integer overflow.
\end_layout
\begin_layout Description
\family typewriter
write_throttle_count_ops
\family default
(logically readonly) Shows the cumulative number of throttled requests.
This value can be reset from userspace in order to prevent integer overflow.
\end_layout
\begin_layout Description
\family typewriter
write_throttle_maxdelay_ms
\family default
Each request is delayed at most for this timespan.
Smaller values will improve the responsiveness of your userspace application,
but at the cost of potentially retarding the requests not sufficiently.
\end_layout
\begin_layout Description
\family typewriter
write_throttle_minwindow_ms
\family default
Set the minimum length of the measuring window.
The measuring window is the timespan for which the average (throughput)
rate is computed (see
\family typewriter
write_throttle_rate_kb
\family default
).
Lower values can increase the responsiveness of the controller algorithm,
but at the cost of accuracy.
\end_layout
\begin_layout Description
\family typewriter
write_throttle_maxwindow_ms
\family default
This parameter must be set sufficiently much greater than
\family typewriter
write_throttle_minwindow_ms
\family default
.
In case the flow of throttled operations pauses for some natural reason
(e.g.
switched off, low load, etc), this parameter determines when a completely
new rate calculation should be started over
\begin_inset Foot
status open
\begin_layout Plain Layout
Motivation: if requests would pause for one hour, the measuring window could
become also an hour.
Of course, that would lead to completely meaningless results.
Two requests in one hour is
\begin_inset Quotes eld
\end_inset
incorrect
\begin_inset Quotes erd
\end_inset
from a human point of view: we just have to ensure that averages are computed
with respect to a reasonable maximum time window in the magnitude of 10s.
\end_layout
\end_inset
.
\end_layout
\begin_layout Section
Emergency Mode and its Resolution
\begin_inset CommandInset label
LatexCommand label
name "subsec:Emergency-Mode"
\end_inset
\end_layout
\begin_layout Standard
This section explains some implementation details.
You may skip it.
\end_layout
\begin_layout Standard
When
\family typewriter
/mars/
\family default
is almost full and there is really absolutely no chance of getting rid
of any local transaction logfile (or free some space in any other way),
there is only one exit strategy: stop creating new logfile data.
\end_layout
\begin_layout Standard
This means that the ability for replication gets lost.
\end_layout
\begin_layout Standard
When entering emergency mode, the kernel module will execute the following
steps for all resources where the affected host is acting as a primary:
\end_layout
\begin_layout Enumerate
Do a kind of
\begin_inset Quotes eld
\end_inset
logrotate
\begin_inset Quotes erd
\end_inset
, but create a
\emph on
hole
\emph default
in the sequence of transaction logfile numbers.
The
\begin_inset Quotes eld
\end_inset
new
\begin_inset Quotes erd
\end_inset
logfile is left empty, i.e.
no data is written to it (for now).
The hole in the numbering will prevent any secondaries from replaying any
logfiles behind the hole (should they ever contain some data, e.g.
because the emergency mode has been left again).
This works because the secondaries are regularly checking the logfile numbers
for contiguity, and they will refuse to replay anything which is not contiguous.
As a result, the secondaries will be left in a consistent, but outdated
state (at least if they already were consistent before that).
\end_layout
\begin_layout Enumerate
The kernel module writes back all data present in the temporary memory buffer
(see figure in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:The-Transaction-Logger"
\end_inset
).
This may lead to a (short) delay of user write requests until that has
finished (typically fractions of a second or a few seconds).
The reason is that the temporary memory buffer must not be increased in
parallel during this phase (race conditions).
\end_layout
\begin_layout Enumerate
After the temporary memory buffer is empty, all local IO requests (whether
reads or writes) are directly going to the underlying disk.
This has the same effect as if MARS would not be present anymore.
Transaction logging does no longer take place.
\end_layout
\begin_layout Enumerate
Any sync from any secondary is stopped ASAP.
In case they are resuming their sync somewhen later, they will start over
from the beginning (position
\begin_inset Formula $0$
\end_inset
).
\end_layout
\begin_layout Standard
In order to leave emergency mode, the sysadmin should do the following steps:
\end_layout
\begin_layout Enumerate
Free enough space.
For example, delete any foreign files on
\family typewriter
/mars/
\family default
which have nothing to do with MARS, or resize the
\family typewriter
/mars/
\family default
filesystem, or whatever.
\end_layout
\begin_layout Enumerate
The following control is intended for testing.
If
\family typewriter
\begin_inset Flex URL
status open
\begin_layout Plain Layout
/proc/sys/mars/mars_reset_emergency
\end_layout
\end_inset
\family default
is off, now is the time to set it.
By default, it should be already set.
\end_layout
\begin_layout Enumerate
Notice: as long as not enough space has been freed, a message containing
\family typewriter
\begin_inset Quotes eld
\end_inset
EMEGENCY MODE HYSTERESIS
\begin_inset Quotes erd
\end_inset
\family default
(or similar) will be displayed by
\family typewriter
marsadm view all
\family default
.
As a consequence, any sync will be automatically halted.
This applies to freshly invoked syncs also, for example created by
\family typewriter
invalidate
\family default
or
\family typewriter
join-resource
\family default
.
\end_layout
\begin_layout Enumerate
On the secondaries, use
\family typewriter
marsadm invalidate $res
\family default
in order to request updating your outdated mirrors.
\end_layout
\begin_layout Enumerate
On the primary:
\family typewriter
marsadm cron
\end_layout
\begin_layout Enumerate
As soon as emough space has been freed everywhere to leave the
\family typewriter
EMEGENCY MODE HYSTERESIS
\family default
, sync should really start.
Until that it had been halted.
\end_layout
\begin_layout Enumerate
Recommendation: check at secondaries that state
\family typewriter
Orphan
\family default
has been left after a while.
\end_layout
\begin_layout Standard
Alternatively, there is a more complicated method, which keeps more intermediate
emergency backup replicas:
\end_layout
\begin_layout Enumerate
On
\emph on
all
\emph default
of your secondaries hostX:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm leave-resource mydata
\end_layout
\begin_layout Enumerate
At the primary hostA:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm cron
\end_layout
\begin_layout Enumerate
Wait until
\family typewriter
df /mars
\family default
shows no longer an overflow.
\end_layout
\begin_layout Enumerate
On the first secondary hostB:
\begin_inset Newline newline
\end_inset
\family typewriter
marsadm join-resource mydata /dev/lv/mydata
\end_layout
\begin_layout Enumerate
Wait until sync has finished at hostB.
\end_layout
\begin_layout Enumerate
If you have more than 2 replicas in total: proceed with step 4 at hostC,
and so on.
This time, you could join multipe resources in parallel, because you already
have a life replica at hostB.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Expert advice, if you have only 2 replicas, and provided you have enough
VG space: analogously to paragraph
\begin_inset CommandInset ref
LatexCommand vref
reference "par:Retaining-a-Split"
plural "false"
caps "false"
noprefix "false"
\end_inset
you may use
\family typewriter
lvrename
\family default
for keeping an outdated emergency backup before creating a new LV with
the old name, and before re-joining the latter.
Don't forget to remove your backup LV after sync has finished!
\end_layout
\begin_layout Chapter
Working with
\family typewriter
marsadm
\family default
commands
\family typewriter
\begin_inset CommandInset label
LatexCommand label
name "chap:The-Sysadmin-Interface"
\end_inset
\end_layout
\begin_layout Standard
This chapter is a kind of reference about the
\family typewriter
marsadm
\family default
tool.
The sub-commands of
\family typewriter
marsadm
\family default
are grouped according to the topic they deal with.
\end_layout
\begin_layout Standard
Since MARS work
\emph on
asynchronously
\emph default
at metadata propagation level (which is
\emph on
necessary
\emph default
for long-distance replication over flaky networks), several commands are
only
\emph on
triggering
\emph default
an action, but do not wait for its completion.
\end_layout
\begin_layout Standard
Such cases are indicated by the term
\begin_inset Quotes eld
\end_inset
after a while
\begin_inset Quotes erd
\end_inset
.
Please be aware that this
\begin_inset Quotes eld
\end_inset
while
\begin_inset Quotes erd
\end_inset
may last very long in case of network outages or bad firewall rules.
\end_layout
\begin_layout Standard
In the following tables, column
\begin_inset Quotes eld
\end_inset
Cmp
\begin_inset Quotes erd
\end_inset
means compatibility with DRBD.
Please note that 100% exact compatibility is not possible, because of the
asynchronous communication paradigm.
\end_layout
\begin_layout Standard
The following table documents common options, typically working in combination
with (almost) any
\family typewriter
marsadm
\family default
command (unless documented differently):
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Option
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--dry-run
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Run the command without actually creating symlinks or touching files or
executing rsync.
This option
\emph on
should
\emph default
be used first at any dangerous command, in order to check what would happen.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Don't use in scripts! Only use by hand!
\end_layout
\begin_layout Plain Layout
\size scriptsize
This option does not change the internal waiting logic for thois commands
which emulate synchronous behaviour on top of the asynchronous communication
paradigm.
Many commands are waiting until the desired effect has succeeded.
However, with
\family typewriter
--dry-run
\family default
the desired effect will never happen, so the command may wait forever (or
abort with a timeout).
\end_layout
\begin_layout Plain Layout
\size scriptsize
In addition, this option can lead to additional aborts of the commands due
to unmet conditions, which cannot be met because the symlinks are not actually
created / altered.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Thus this option can give only a
\series bold
rough estimate
\series default
of what would happen later.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--force
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
almost
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Some preconditions are skipped, i.e.
the command will / should work although some (more or less) vital preconditions
are violated.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Instead of giving
\family typewriter
--force
\family default
, you may alternatively prefix your command with
\family typewriter
force-
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
THIS OPTION IS DANGEROUS!
\end_layout
\begin_layout Plain Layout
\size scriptsize
Use it only when you are absolutely sure that you know what you are doing!
\end_layout
\begin_layout Plain Layout
\size scriptsize
Use it only as a last resort if the same command without
\family typewriter
--force
\family default
has failed
\emph on
for no good reason
\emph default
!
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--parallel
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Only makes sense in combination with
\family typewriter
all
\family default
.
This is roughly equivalent to forking a bunch of parallel
\family typewriter
marsdm
\family default
processes, like in pseudo shell script notation:
\family typewriter
for i in $resource_list; do marsadm $parameters $i & done; wait
\family default
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Several cluster managers are not re-entrant and may deadlock.
First check whether this option is usable in your concrete environment!
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--parallel=$number
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Like
\family typewriter
--parallel
\family default
, but limit the parallelism degree to a maximum number of parallel processes.
This may be useful for limiting the parallelism of startup processes, e.g.
when kernel caches are cold, so the machine would get
\emph on
overloaded
\emph default
when too many resources would be starting in parallel.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Several cluster managers are not re-entrant and may deadlock.
First check whether this option is usable in your concrete environment!
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--ignore-sync
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Use this for a
\emph on
planned
\emph default
handover instead of
\family typewriter
--force
\family default
.
Only one precondition is relaxed: some sync may be running somewhere.
\end_layout
\begin_layout Plain Layout
\size scriptsize
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Careful when using this on extremely huge LVs where the sync may take serveral
days, or weeks.
It is your sysadmin decision what you want to prefer: restarting the sync,
or planned handover.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--ignore-deleted-peers=$number
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Only for experts - usually not needed - may be harmful - read the sourcecode!
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--verbose
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Some (few) commands will become more speaky.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--timeout=$seconds
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Some commands require response from either the local kernel module, or from
other cluster nodes.
In order to prevent infinite waiting in case of network outages or other
problems, the command will fail after the given timeout has been reached.
\end_layout
\begin_layout Plain Layout
\size scriptsize
When $seconds is -1, the command will wait forever.
\end_layout
\begin_layout Plain Layout
\size scriptsize
When $seconds is 0, the command will not wait in case any precondition is
not met, und abort without performing an action..
\end_layout
\begin_layout Plain Layout
\size scriptsize
The default timeout is 5s.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--window=$seconds
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
The time window for checking the aliveness of other nodes in the network.
When no symlink updates have been transferred from the other host since
more than the window time, the host is considered dead.
Default is 60s.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--stuck-seconds=$seconds
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Silencing period.
When replay is hanging
\emph on
unecpectedly
\emph default
for a longer time, spit a WARNING.
Nevertheless, there might be valid reasons, such as completely overloaded
hardware.
Therefore the default is much higher than
\family typewriter
--window
\family default
, around 3600s (1 hour).
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--keep-backup-hours=$hours
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Only relevant for
\family typewriter
cron
\family default
and
\family typewriter
link-purge-all
\family default
.
Old remains from dead / unreachable machines, and some backup data produced
by join-cluster and split-cluster (potentially useful for experts), will
be purged after this age.
Default is 24 * 7 hours.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--autoclean
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Only relevant for
\family typewriter
cron
\family default
.
Very old
\emph on
historic
\emph default
remains from
\emph on
decommissioned
\emph default
machines will be purged after this age.
Default is an age of the remains of more than 1 month.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--threshold=$size
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
The macros containing the substring
\family typewriter
-threshold-
\family default
or
\family typewriter
-almost-
\family default
are using this as a default value for approximation whether some data transfer
(e.g.
logfile and/or sync) has approximately completed.
Default is 10MiB.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Notice: when data is continuously appended to the logfile, completeness
may
\emph on
never
\emph default
be reached.
Some data may always fly around somewhere in the network transfer channels.
\end_layout
\begin_layout Plain Layout
\size scriptsize
The $size argument may be a number optionally followed by one the lowercase
characters k m g t p for indicating kilo mega giga tera or peta bytes as
multiples of 1000.
When using the corresponding uppercase character, multiples of 1024 are
formed instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--host=$host
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
The command acts as if the command were executed on another host $host.
This option should not be used regularly, because the local information
in the symlink tree may be outdated or even wrong.
Additionally, some local information like remote sizes of physical devices
(e.g.
remote disks) is not present in the symlink tree at all, or is wrong (reflectin
g only the
\emph on
local
\emph default
state).
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
THIS OPTION IS DANGEROUS!
\end_layout
\begin_layout Plain Layout
\size scriptsize
Use it only for final destruction of dead cluster nodes, see section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Final-Destroy-of"
\end_inset
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--ssh-port=$number
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
(deprecated) Only useful when the old
\family typewriter
ssh
\family default
-based or
\family typewriter
rsync
\family default
-based
\family typewriter
{join,merge,split}-cluster
\family default
or
\family typewriter
join-resource
\family default
commands are used.
When newer
\family typewriter
mars.ko
\family default
and
\family typewriter
marsadm
\family default
versions are installed throughout the whole cluster, this is not needed
anymore.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--no-ssh
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Avoid any potential timeouts / hangs caused by networks or firewalls, by
explicitly disabling the old ssh-based communication method, and relying
on the new MARS communication protocol (by defaut on port 7777).
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--ip=$ip
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
hfill
\end_layout
\end_inset
or
\begin_inset Newline newline
\end_inset
--ip-$peer=$ip
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Override the IP information for the local host or
\family typewriter
$peer
\family default
at the command line.
When this option is
\emph on
not
\emph default
given, the following rules apply in the following order:
\end_layout
\begin_layout Enumerate
\size scriptsize
lookup the IP for
\family typewriter
$peer
\family default
from the symlink tree in directory
\family typewriter
/mars/ips/
\family default
.
\end_layout
\begin_layout Enumerate
\size scriptsize
so-called
\emph on
probe data
\emph default
from other hosts in the cluster.
This tries to retrieve preliminary information as best as possible.
It can however only work when the other peers are reachable, which also
implies that in turn
\emph on
their
\emph default
currently configurred local peer IP must be correct.
\end_layout
\begin_layout Enumerate
\size scriptsize
Backups in
\family typewriter
/mars/backup-$timestamp/
\family default
as automatically created by several commands like
\family typewriter
merge-cluster
\family default
and
\family typewriter
split-cluster
\family default
.
When multiple historic backups are available, the
\emph on
youngest
\emph default
version will always win.
\end_layout
\begin_layout Enumerate
\size scriptsize
fallback to a DNS query via
\family typewriter
/usr/bin/host
\family default
.
\end_layout
\begin_layout Enumerate
\size scriptsize
all local network interfaces are scanned by
\family typewriter
/sbin/ip
\family default
for IPv4 adresses, and the
\emph on
first
\emph default
one is taken.
This may lead to wrong decisions if you have multiple network interfaces.
\end_layout
\begin_layout Plain Layout
\size scriptsize
In order to override this type of error-prone automatic IP detection and
to explicitly tell the IP address of your
\emph on
storage network
\emph default
(which might be different from the ordinary IP address of your host), please
use this option for maximum safety.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Usually you will need this only at
\family typewriter
{create,join,merge}-cluster
\family default
to determine any not yet known addresses.
Typically,
\family typewriter
{leave,split}-cluster
\family default
are able to automatically detect historic information from the backups.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
--verbose
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Some (few) commands will become more speaky.
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Section
Cluster Operations
\begin_inset CommandInset label
LatexCommand label
name "sec:Cluster-Operations"
\end_inset
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
create-cluster
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the
\family typewriter
/mars/
\family default
filesystem must be mounted and it must be empty (
\family typewriter
mkfs.ext4
\family default
, see instructions in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Setup-your-Cluster"
\end_inset
).
The
\family typewriter
mars.ko
\family default
kernel module must
\emph on
not
\emph default
be loaded.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the initial symlink tree is created in
\family typewriter
/mars/
\family default
.
Additionally, the
\family typewriter
/mars/uuid
\family default
symlink is created for later distribution in the cluster.
It uniquely indentifies the cluster in the world.
\end_layout
\begin_layout Plain Layout
\size scriptsize
This must be called exactly once at the initial primary.
\end_layout
\begin_layout Plain Layout
\size footnotesize
Hint: use the
\family typewriter
--ip=
\family default
option if you have multiple network interfaces.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Example on hostA:
\family typewriter
marsadm --ip=192.168.2.101 create-cluster
\end_layout
\begin_layout Plain Layout
\size footnotesize
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Nodenames (see
\family typewriter
uname -n
\family default
and
\family typewriter
man 1 uname
\family default
and
\family typewriter
man 2 uname
\family default
) are the most critical part of your setup.
They
\series bold
must
\series default
be
\series bold
globally unique
\series default
, and they
\series bold
must never change, perpetually.
Any (human) error is your fault!
\begin_inset Newline newline
\end_inset
See also the GPL: NO WARRANTY
\end_layout
\begin_layout Plain Layout
\series bold
\size footnotesize
11.
BECAUSE THE PROGRAM IS LICENSED FREE OF CHARGE, THERE IS NO WARRANTY FOR
THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW.
EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER
PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER
EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH
YOU.
SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY
SERVICING, REPAIR OR CORRECTION.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
join-cluster
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$host
\end_layout
\begin_layout Plain Layout
-or-
\end_layout
\begin_layout Plain Layout
\family typewriter
\size scriptsize
join-cluster
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$host
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$host_ip
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Preconditions: the cluster must have been already created with
\family typewriter
create-cluster
\family default
at another node
\family typewriter
$host
\family default
(optionally supplying an alternative IP address
\family typewriter
$host_ip
\family default
).
At your local node, the
\family typewriter
/mars/
\family default
filesystem must be mounted and it must be empty (
\family typewriter
mkfs.ext4
\family default
, see instructions in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Setup-your-Cluster"
\end_inset
).
,
\begin_inset space ~
\end_inset
The
\family typewriter
mars.ko
\family default
kernel module must be loaded
\begin_inset Foot
status open
\begin_layout Plain Layout
\size scriptsize
In ancient MARS versions before mars0.1astable101 the kernel module
\emph on
must not
\emph default
be loaded, and a working ssh connecttion to
\family typewriter
$host
\family default
must work as root (without password), and
\family typewriter
rsync
\family default
must be installed at all cluster nodes.
PROVISIONARY: in
\emph on
some
\emph default
newer MARS versions >= mars0.1astable101, the old ssh-based method is automatica
lly used as a fallback when the kernel module is forgotten to load; however
this provisionary workaround shall disappear in future.
\end_layout
\end_inset
.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the initial symlink tree
\family typewriter
/mars/
\family default
is replicated from the remote host
\family typewriter
$host
\family default
, and the local host has been added as another cluster member.
\end_layout
\begin_layout Plain Layout
\size scriptsize
This must be called exactly once at every initial secondary node.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Hint: use the
\family typewriter
--ip=
\family default
option if you have
\emph on
multiple
\emph default
interfaces on your
\emph on
local
\emph default
hostB, and thus the local IP detection is not unique.
Be sure to use the right IP, e.g.
if you have a dedicated replication network.
Similarly, use the optional
\family typewriter
$host_ip
\family default
parameter if the current primary hostA
\emph on
also
\emph default
has
\emph on
multiple
\emph default
IP addresses, and thus the partner IP (in the replication network) is also
not uniquely deducable from the hostname.
\begin_inset Newline newline
\end_inset
Full example on hostB:
\family typewriter
marsadm --ip=192.168.2.102 join-cluster hostA 192.168.2.101
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
leave-cluster
\begin_inset CommandInset label
LatexCommand label
name "leave-cluster"
\end_inset
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the
\family typewriter
/mars/
\family default
filesystem must be mounted and it must contain a valid MARS symlink tree
produced by the other
\family typewriter
marsadm
\family default
commands.
The local node must no longer be member of any resource (see
\family typewriter
marsadm leave-resource
\family default
).
The kernel module should be loaded and the network should be operating
in order to also propogate the effect to the other cluster nodes.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the local node is removed from the replicated symlink tree
\family typewriter
/mars/
\family default
such that other nodes will cease to communicate with it after a while.
The converse it not true: the local node
\emph on
may
\emph default
continue
\begin_inset Foot
status open
\begin_layout Plain Layout
\size scriptsize
Reason:
\family typewriter
leave-cluster
\family default
removes only its
\emph on
own
\emph default
IP address from
\family typewriter
/mars/ips/
\family default
, but does not destroy the usual symmetry of the symlink tree by leaving
the other IPs intact.
Therefore, the local node will continue fetching updates from all nodes
present in
\family typewriter
/mars/ips/
\family default
.
As an effect, the local node will
\emph on
passively
\emph default
mirror the symlinks of other cluster members, but not vice versa.
There is no communication from the local node to the other ones, turning
the local node into a
\series bold
whitness
\series default
according to some terminology from Distributed Systems.
This is a feature, not a bug.
It could be used for porst-mortem analysis, or for monitoring purposes.
However,
\emph on
deletions
\emph default
of symlinks are not guaranteed to take place, so your whitness may
\emph on
accumulate
\emph default
thousands of old symlinks over a long time.
If you want to eventually stop all communication to the local node, just
run
\family typewriter
rmmod
\family default
.
\end_layout
\end_inset
passivley fetching the symlink tree.
In order to really stop all communication, the kernel module should be
unloaded afterwards (rmmod mars).
The local
\family typewriter
/mars/
\family default
filesystem should be manually destroyed thereafte,r, e.g.
for decommissioning of hardware.
This is
\emph on
strongly receommended
\emph default
for preventing
\begin_inset Quotes eld
\end_inset
zombies
\begin_inset Quotes erd
\end_inset
to resurrect by accident (human error, which is always AT YOUR RSIK).
\end_layout
\begin_layout Plain Layout
\size scriptsize
In case of an unintended hardware destruction (e.g.
fire, water, ...) this command should be used on another healty cluster node
$helper in order to finally remove $damaged from the cluster via the command
\family typewriter
marsadm leave-cluster --host=$damaged --force
\family default
.
An example is explained in section
\begin_inset CommandInset ref
LatexCommand vref
reference "subsec:Final-Destroy-of"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Before leave-cluster, ensure that all other cluster nodes know that it is
no longer participating in
\emph on
any
\emph default
resource!
\end_layout
\begin_layout Plain Layout
\size scriptsize
Hint: this can be usually achieved by
\family typewriter
marsadm leave-resource $resource --host=$damaged --force
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
In case you cannot use
\family typewriter
leave-cluster
\family default
for any reason (e.g.
complete network shutdown, no communication anymore possible at all), here
is an ADVICE for a last resort AT YOUR RISK: destroy the
\family typewriter
/mars/
\family default
filesystem on the host
\family typewriter
$deadhost
\family default
you want to remove (e.g.
by
\family typewriter
mkfs
\family default
), or take other measures to
\emph on
ensure
\emph default
that it cannot be accidentally re-used in any way (e.g.
physical destruction of the underlying RAID,
\family typewriter
lvremove
\family default
, etc).
On all other hosts, do
\family typewriter
rmmod mars
\family default
, then delete the symlink
\family typewriter
/mars/ips/ip-$deadhost
\family default
everywhere by hand, and finally
\family typewriter
modprobe mars
\family default
again.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
Notice that the last
\family typewriter
leave-resource
\family default
operation does not delete the cluster as such.
It just creates an
\emph on
empty
\emph default
cluster which has no longer any members.
In particular, the cluster ID
\family typewriter
/mars/uuid
\family default
is
\emph on
not
\emph default
removed, deliberately
\begin_inset Foot
status open
\begin_layout Plain Layout
\size scriptsize
This is a feature, not a bug.
The
\family typewriter
uuid
\family default
is created once, but alterered anywhere.
An exception is
\family typewriter
marsadm merge-cluster
\family default
(see there).
The only way to get rid of the uuid is
\emph on
external
\emph default
deletion (not by
\family typewriter
marsadm
\family default
)
\emph on
together(!)
\emph default
with all other contents of
\family typewriter
/mars/
\family default
.
This prevents you from accidentally merging half-dead remains which could
have survived a disaster for any reason, such as snapshotting filesystems
/ VMs or whatever.
\end_layout
\end_inset
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Before you can re-use
\emph on
any
\emph default
left-over
\family typewriter
/mars/
\family default
filesystem for re-joining the old cluster, or for creating / joining a
new / different cluster, you
\emph on
must
\emph default
create a fresh filesystem (see instructions in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Setup-your-Cluster"
\end_inset
) via
\family typewriter
mkfs.ext4
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
merge-cluster
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$host
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Preconditions: The set of resources at the local cluster (transitively)
and at the other cluster as addressed by some foreign member
\family typewriter
$host
\family default
(transitively) must be disjoint.
\emph on
All(!)
\emph default
hosts must be mutually reachable via the MARS ports (default 7777 to 7779).
Since
\family typewriter
mars0.1astable114,
\family default
\family typewriter
ssh
\family default
and
\family typewriter
rsync
\family default
are no longer required, provided that
\emph on
both
\emph default
clusters have been fully updated.
Otherwise ssh must be working between all members of both clusters, without
password (e.g.
via ssh-agent).
\end_layout
\begin_layout Plain Layout
\size scriptsize
Create the union of both clusters, consisting of the union of all participating
machines (transitively).
Resource memberships are unaffected.
This is useful for creating a
\begin_inset Quotes eld
\end_inset
virtual LVM cluster
\begin_inset Quotes erd
\end_inset
where resources can be migrated later via
\family typewriter
join-resource
\family default
/
\family typewriter
leave-resource
\family default
operations.
Usage examples can be found in the Football sub-project of MARS.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
Attention! use a newer version of MARS.
The old branch
\family typewriter
0.1.y
\family default
does not scale well in number of cluter members, because it evolved from
a lab prototype with
\begin_inset Formula $O(n^{2})$
\end_inset
behaviour at metadata exchange.
Never exceed the maximum cluster members as described in appendix
\begin_inset CommandInset ref
LatexCommand vref
reference "chap:Technical-Data-MARS"
\end_inset
.
For safety, you should better stay at 1/2 of the numbers mentioned there.
Use
\family typewriter
split-cluster
\family default
for going back to smaller clusters again after your background data migration
has completed.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Future versions of MARS will be constructed for very big clusters in the
range of thousands of nodes.
Development has not yet stabilized there, and operational experiences are
missing at the moment.
Be careful until official announcements are appearing in the ChangeLog,
reporting of operational experiences from the 1&1 big cluster at metadata
level.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
merge-cluster-check
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$host
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Check in advance whether the set of resources at the local cluster and at
the other cluster
\family typewriter
$host
\family default
are disjoint.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
split-cluster
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
This is almost the inverse operation of
\family typewriter
merge-cluster
\family default
: it determines the minimum sub-cluster groups participating in some common
resources.
Then it splits the cluster memberships such that unnecessary connections
between non-related nodes are interrupted.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Use this for avoidance of too big clusters.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Since
\family typewriter
mars0.1astable114,
\family default
\family typewriter
ssh
\family default
and
\family typewriter
rsync
\family default
are no longer required, provided that
\emph on
all
\emph default
hosts are mutually reachable over the default metadata communication port
7777.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
wait-cluster
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
See section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Waiting"
\end_inset
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
update-cluster
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
See section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Waiting"
\end_inset
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
create-uuid
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
Deprecated.
Only for compatibility with very old version light0.1beta05 or earlier.
Will disappear somewhen in future.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Precondition: the
\family typewriter
/mars/
\family default
filesystem must be mounted.
A
\family typewriter
uuid
\family default
(such as automatically created by recent versions of
\family typewriter
marsadm create-cluster
\family default
) must not already exist; i.e.
you have a very old and outdated symlink tree.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the
\family typewriter
/mars/uuid
\family default
symlink is created for later distribution in the cluster.
It uniquely indentifies the cluster in the world.
\end_layout
\begin_layout Plain Layout
\size scriptsize
This must be called at most once at the current primary.
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Section
Resource Operations
\begin_inset CommandInset label
LatexCommand label
name "sec:Resource-Operations"
\end_inset
\end_layout
\begin_layout Standard
Common precondition for all resource operations is that the
\family typewriter
/mars/
\family default
filesystem is mounted, that it contains a valid MARS symlink tree produced
by other
\family typewriter
marsadm
\family default
commands (including a unique
\family typewriter
uuid
\family default
), that your current node is a valid member of the cluster, and that the
kernel module
\family typewriter
mars.ko
\family default
is loaded.
When communication is impossible due to network outages or bad firewall
rules, most commands will succeed, but other cluster nodes may take a long
time to notice your changes.
\end_layout
\begin_layout Standard
Instead of executing
\family typewriter
marsadm
\family default
commands serveral times for each resource argument, you may give the special
resource argument
\family typewriter
all
\family default
.
This work even when combined with
\family typewriter
--force
\family default
, but be cautious when giving dangerous command combinations like
\family typewriter
marsadm delete-resource --force all
\family default
.
\end_layout
\begin_layout Standard
In newer versions of
\family typewriter
marsadm
\family default
, you may give a comma-separated list of resource names in place of
\family typewriter
all
\family default
.
This way, you have more fine-grained control over the set of resource names
you want to use.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Beware when combining this with
\family typewriter
--host=somebody
\family default
.
In some very rare cases, like final destruction of a whole datacenter after
an earthquake, you might need a combination like
\family typewriter
marsadm --host=defective delete-resource --force all
\family default
.
Don't use such combinations if you don't need them
\emph on
really
\emph default
! You can easily shoot yourself in your head if you are not carefully operating
such commands!
\end_layout
\begin_layout Subsection
Resource Creation / Deletion / Modification
\begin_inset CommandInset label
LatexCommand label
name "subsec:Resource-Creation"
\end_inset
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
create-resource
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$disk_dev
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
[$mars_name]
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
[$size]
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the resource argument
\family typewriter
$res
\family default
must denote a
\emph on
new
\emph default
(not yet existing) resource name in the cluster.
The argument
\family typewriter
$disk_dev
\family default
must denote an absolute path to a usable local block device, its size must
be greater zero.
When the optional
\family typewriter
$mars_name
\family default
is given, that name must not already exist on the local node; when not
given,
\family typewriter
$mars_name
\family default
defaults to
\family typewriter
$res
\family default
.
When the optional
\family typewriter
$size
\family default
argument is given, it must be a number, optionally followed by a lowercase
suffix
\family typewriter
k
\family default
,
\family typewriter
m
\family default
,
\family typewriter
g
\family default
,
\family typewriter
t
\family default
, or
\family typewriter
p
\family default
(denoting size factors as multiples of 1000), or an uppercase suffix
\family typewriter
K
\family default
,
\family typewriter
M
\family default
,
\family typewriter
G
\family default
,
\family typewriter
T
\family default
or
\family typewriter
P
\family default
(denoting size factors as multiples of 1024).
The given size must not exceed the actual size of
\family typewriter
$disk_dev
\family default
.
It will specify the future resource size as shown by
\family typewriter
marsadm view-resource-size $res
\family default
.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the resource
\family typewriter
$res
\family default
is created, the inital role of the current node is primary.
The corresponding symlink tree information is asynchonously distributed
in the cluster (in the background).
The device
\family typewriter
/dev/mars/$mars_name
\family default
should appear after a while.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Notice: when
\family typewriter
$size
\family default
is strictly smaller than the size of
\family typewriter
$disk_dev
\family default
, you will unnecessarily waste some space..
\end_layout
\begin_layout Plain Layout
\size scriptsize
This must be called exactly once for any new resource.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
join-resource
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$disk_dev
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
[$mars_name]
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the resource argument
\family typewriter
$res
\family default
must denote an already existing resource in the whole cluster (i.e.
its symlink tree information must have been received; use
\family typewriter
marsadm wait-cluster
\family default
for achieving this).
The resource must have a designated primary, and it must no be in emergency
mode.
There must not exist a split brain in the cluster.
The local node must not be already member of that resource.
The argument
\family typewriter
$disk_dev
\family default
must denote an absolute path to a usable (but currently unused) local block
device, its size must be greater or equal to the logical size of the resource.
When the optional
\family typewriter
$mars_name
\family default
is given, that name must not already exist on the local node; when not
given,
\family typewriter
$mars_name
\family default
defaults to
\family typewriter
$res
\family default
.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the current node becomes a member of resource
\family typewriter
$res
\family default
, the inital role is secondary.
The initial full sync should start after a while.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Notice: when the size of $disk_dev is strictly greater than the size of
the resource, you will unnecessarily waste some space.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
After a while, state
\family typewriter
Orphan
\family default
should be left.
Don't forget to regularly monitor for longer occurrences of
\family typewriter
Orphan
\family default
!
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
leave-resource
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the local node must be a member of the resource
\family typewriter
$res
\family default
; its current role must be secondary.
It must be detached (see
\family typewriter
marsadm down
\family default
).
The kernel module should be loaded and the network should be operating
in order to also propogate the effect to the other cluster nodes.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the local node is no longer a member of
\family typewriter
$res
\family default
.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Notice: as a side effect for other nodes, their
\family typewriter
cron
\family default
(or historic
\family typewriter
log-delete
\family default
) may now become possible, since the current node does no longer count as
a candidate for logfile application.
As another side effect, split brain situation may be (partly) resolved
by this.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Please notice that this command
\emph on
may likely
\emph default
resolve split brain (but cannot guarantee in general).
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
The contents of the disk is not changed by this command.
Before issuing this command, check whether the disk appears to be locally
consistent (see
\family typewriter
view-is-consistent
\family default
)! After giving this command, any internal information indicating the consistenc
y state will be gone, and you will no longer be able to guess consistency
properties.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
When you are
\emph on
sure
\emph default
.that the disk was consistent before (or is now by manually checking it),
you may re-create a new resource out of it via
\family typewriter
create-resource
\family default
.
\end_layout
\begin_layout Plain Layout
\size scriptsize
In case of an eventual node loss (e.g.
fire, water, ...) this command needs to be used on another node $helper in
order to finally remove all the resources $damaged from the cluster via
the command
\family typewriter
marsadm leave-resource $res --host=$damaged --force
\family default
.
Details are in section
\begin_inset CommandInset ref
LatexCommand vref
reference "subsec:Final-Destroy-of"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
delete-resource
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the resource must be empty (i.e.
all cluster members must have left via
\family typewriter
leave-resource
\family default
).
This precondition is overridable by
\family typewriter
--force
\family default
, increasing the danger to maximum! It is even possible to combine
\family typewriter
--force
\family default
with an invalid resource argument and an invalid
\family typewriter
--host=somebodyelse
\family default
argument in order to desperately try to destroy remains of incomplete or
pysically damaged hardware.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: all cluster members will somewhen be forcefully removed from
\family typewriter
$res
\family default
.
In case of network interruptions, the forced removal may take place far
in the future.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
THIS COMMAND IS
\emph on
VERY
\emph default
DANGEROUS!
\end_layout
\begin_layout Plain Layout
\size scriptsize
Use this only in desperate situations, and only manually.
Don't call this from scripts.
You are forcefully using a sledgehammer, even without
\family typewriter
--force
\family default
! The danger is that the
\emph on
true
\emph default
state of other cluster nodes cannot be known in general, e.g.
network problems etc.
Even when it were known, it could be compromised by
\series bold
byzantine failures
\series default
.
\end_layout
\begin_layout Plain Layout
\size scriptsize
It is strongly advised to try this command with
\family typewriter
--dry-run
\family default
first.
\end_layout
\begin_layout Plain Layout
\size scriptsize
When combined with
\family typewriter
--force
\family default
, this command will definitely
\series bold
murder
\series default
other cluster nodes, possibly after a long while, and even when they are
operating in primary mode / having split brains / etc.
However, there is no guarantee that other cluster nodes will be
\emph on
really
\emph default
dead – it is (theoretically) possible that they remain only
\emph on
half
\emph default
\emph on
dead
\emph default
.
For example, a half dead node may continue to write data to
\family typewriter
/mars/
\family default
and thus lead to overflow somewhen.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
This command implies a forceful detach, possibly destroying consistency.
\end_layout
\begin_layout Plain Layout
\size scriptsize
It is similar in spirit to
\series bold
STONITH
\series default
, but on cluster level, affection all known resource members.
In particular, when a cluster node was operating in primary mode (
\family typewriter
/dev/mars/mydata
\family default
being continuously in use), the forceful detach cannot be carried out until
the device is completely unused.
In the meantime, the current transaction logfile will be appended to, but
the file
\emph on
might
\emph default
be already unlinked (orphan file filling up the disk).
After the forceful detach, the underlying disk need not be consistent (although
MARS does its best).
Since this command deletes any symlinks which normally would indicate the
consistency state, no guarantees about consistency can be given after this
\emph on
in general
\emph default
! Always check consistency by hand!
\end_layout
\begin_layout Plain Layout
\size scriptsize
When possible / as soon as possible, check the local state on the other
nodes in order to
\emph on
really
\emph default
shutdown the resource everywhere (e.g.
to
\emph on
really
\emph default
unuse the
\family typewriter
/dev/mars/mydata
\family default
device, etc).
\end_layout
\begin_layout Plain Layout
\size scriptsize
After this command, you
\emph on
should
\emph default
rebuild the resource under a different name, in order to avoid any clashes
caused by unexpected resurrection of
\begin_inset Quotes eld
\end_inset
dead
\begin_inset Quotes erd
\end_inset
or
\begin_inset Quotes eld
\end_inset
half-dead
\begin_inset Quotes erd
\end_inset
zombie nodes (beware of shapshot / restores on virtual machines!!).
MARS does its best to avoid problems even in case the new resource name
should equal the old one, but there can be
\emph on
no guarantee
\emph default
in all possible failure scenarios / usage scenarios.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Whenever possible, prefer
\family typewriter
leave-resource
\family default
over this kind of sledgehammer!
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
activate-guest
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the current host must be a cluster member (see commands
\family typewriter
join-cluster
\family default
and
\family typewriter
merge-cluster
\family default
), but need not (yet) be a resource member.
The resource must exist somewhere else in the cluster.
No additional storage is needed, except a few kilo or megabytes (typically)
for the symlink tree.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: symlink updates with other resource members and/or guests
are more frequently.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Consequently, marsadm commands and macros with the
\family typewriter
--host=
\family default
option may be used for remote state inspection, etc.
\end_layout
\begin_layout Plain Layout
\family typewriter
\size scriptsize
marsadm view all
\family default
will display the guest and its status.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
deactivate-guest
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the resource must exist.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: any previous pure
\family typewriter
activate-guest
\family default
is rolled back.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
After about a month,,
\family typewriter
marsadm cron
\family default
will also remove the guest relationship.
This is to protect you from long-term accumulation of unnecessary guest
relationships, which are intended only for
\emph on
temporary
\emph default
purposes (in constrast to
\emph on
full
\emph default
resource memberships requiring storage space for keeping
\emph on
persistent
\emph default
replicas).
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
wait-resource
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
{is-,}{attach,
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
primary,
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
device}{-off,}
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
See section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Waiting"
\end_inset
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsection
Operation of the Resource
\begin_inset CommandInset label
LatexCommand label
name "subsec:Operation-of-the"
\end_inset
\end_layout
\begin_layout Standard
Common preconditions are the preconditions from section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Resource-Operations"
\end_inset
, plus the respective resource
\family typewriter
$res
\family default
must exist, and the local node must be a member of it.
With the single exception of
\family typewriter
attach
\family default
itself, all other operations must be started in
\family typewriter
attached
\family default
state.
\end_layout
\begin_layout Standard
When
\family typewriter
$res
\family default
has the special reserved value
\family typewriter
all
\family default
, the following operations will work on all resources where the current
node is a member (analogously to DRBD).
\end_layout
\begin_layout Standard
With newer versions of
\family typewriter
marsadm
\family default
, you can also give a list of comma-separated resource names in place of
\family typewriter
all
\family default
.
\end_layout
\begin_layout Standard
\noindent
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
attach
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
yes
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the local disk belonging to $res is not in use by anyone else.
Its contents has not been altered in the meantime since the last
\family typewriter
detach
\family default
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Mounting
\emph on
read-only
\emph default
is allowed during the detached phase.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
However, be careful! If you
\emph on
accidentally
\emph default
forget to give the right readonly-mount flags, if you use
\family typewriter
fsck
\family default
in repair mode inbetween, or alter the disk content in any other way (beware
of LVM snapshots / restores etc), you will almost certainly produce an
\series bold
unnoticed inconsistency
\series default
(not reported by
\family typewriter
view-is-consistent
\family default
)! MARS has
\emph on
no chance
\emph default
to notice suchalike!
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: MARS uses the local disk and is able to work with it (e.g.
replay logfiles on it).
\end_layout
\begin_layout Plain Layout
\size scriptsize
Note: the local disk is opened in exclusive read-write mode.
This should protect against most common misuse, such as opening the disk
in parallel to MARS.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
However, this does not necessarily protect against non-exclusive openers.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
detach
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
yes
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the local
\family typewriter
/dev/mars/mydata
\family default
device (when present) is no longer opened by anybody.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the local disk belonging to $res is no longer in use.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
In contrast to DRBD, you need not explicitly pause syncing, fetching, or
replaying
\emph on
to
\emph default
(as apposed to
\emph on
from
\emph default
) the local disk.
These processes are automatically paused.
Another difference to DRBD: the fetch / replay processes etc will usually
\emph on
automatically
\emph default
resume after re-attach, as far as possible in the respective new situation.
This will usually work even over
\family typewriter
rmmod
\family default
or reboot cycles, since the internal symlink tree will automatically persist
all todo switches for you (c.f.
section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:The-State-of"
\end_inset
).
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
Notice: only
\emph on
local
\emph default
transfer operations
\emph on
to
\emph default
the local disk are paused by a detach.
When another node is remotely running a sync
\emph on
from
\emph default
your local disk, it will likely remain in use for remote reading.
The reason is that the server part of MARS is operating purely passively,
in order serve all remote requests as best as possible (similar to the
original Unix philosophy).
In order to really stop all accesses, do a
\family typewriter
pause-sync
\family default
on all other resource member where a sync is currently running.
You may also try
\family typewriter
pause-sync-global
\family default
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
WARNING! After this, and ather having paused any remote data access, you
might use the underlying disk for your own purposes, such as test-mounting
it in
\emph on
readonly
\emph default
mode.
\series bold
Don't modifiy
\series default
its contents in any way! Not even by an
\family typewriter
fsck
\family default
\begin_inset Foot
status open
\begin_layout Plain Layout
\size scriptsize
Some (but not all)
\family typewriter
fsck
\family default
tools for some filesystems have options to start only a test repair / verify
mode / dry run, without doing actual modifications to the data.
Of course, these modes
\emph on
can
\emph default
be used.
But be really sure! Double-check for the right options!
\end_layout
\end_inset
! Otherwise, you will have inconsistencies
\emph on
guaranteed
\emph default
.
MARS has no way for knowing of any modifications to your disk when bypassing
\family typewriter
/dev/mars/*
\family default
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
In case you accidentally modified the underlying disk at the
\emph on
primary
\emph default
side, you may choose to resolve the inconsistencies by
\family typewriter
marsadm invalide $res
\family default
on
\emph on
each
\emph default
secondary.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
pause-sync
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
pause-sync-local
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
pause-sync-local
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: none additionally.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: any sync operation targeting the local disk (when not yet
completed) is paused after a while (cf section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:The-State-of"
\end_inset
).
When successfully completed, this operation will remember the switch state
forever and automatically become relevant if a sync is needed again (e.g.
\family typewriter
invalidate
\family default
or
\family typewriter
resize
\family default
).
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
pause-sync-global
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Like
\family typewriter
*-local
\family default
, but operates on all members of the resource.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
resume-sync
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
resume-sync-local
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
resume-sync-local
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: additionally, a primary must be designated, and it must not
be in emergency mode.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: any sync operation targeting the local disk (when not yet
completed) is resumed after a while.
When completed, this operation will remember the switch state forever and
become relevant if a sync is needed again (e.g.
\family typewriter
invalidate
\family default
or
\family typewriter
resize
\family default
).
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
resume-sync-global
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Like
\family typewriter
*-local
\family default
, but operates on all members of the resource.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
pause-fetch
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
pause-fetch-local
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
pause-fetch-local
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: none additionally.
The resource
\emph on
should
\emph default
be in secondary role.
Otherwise the switch has
\emph on
no
\emph default
\emph on
immediate
\emph default
effect, but will come (possibly unexpectedly) into effect whenever secondary
role is entered later for whatever reason.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: any transfer of (parts of) transaction logfiles which are
present at another primary host to the local
\family typewriter
/mars/
\family default
storage are paused at their current stage.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
This switch works independently from
\family typewriter
{pause,resume}-replay
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
pause-fetch-global
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Like
\family typewriter
*-local
\family default
, but operates on all members of the resource.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
resume-fetch
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
resume-fetch-local
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
resume-fetch-local
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: none additionally.
The resource
\emph on
should
\emph default
be in secondary role.
Otherwise the switch has
\emph on
no
\emph default
\emph on
immediate
\emph default
effect, but will come (possibly unexpectedly) into effect whenever secondary
role is entered later for whatever reason.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: any (parts of) transaction logfiles which are present at
another primary host shouldl be transferred to the local
\family typewriter
/mars/
\family default
storage as far as not yet locally present.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
This works independently from
\family typewriter
{pause,resume}-replay
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
resume-fetch-global
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Like
\family typewriter
*-local
\family default
, but operates on all members of the resource.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
pause-replay
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
pause-replay-local
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
pause-replay-local
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: none additionally.
The resource
\emph on
should
\emph default
be in secondary role.
Otherwise the switch has
\emph on
no
\emph default
\emph on
immediate
\emph default
effect, but will come (possibly unexpectedly) into effect whenever secondary
role is entered later for whatever reason.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: any local replay operations of transaction logfiles to the
local disk are paused at their current stage.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
This works independently from
\family typewriter
{pause,resume}-fetch
\family default
resp.
\family typewriter
{dis,}connect
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
pause-replay-global
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Like
\family typewriter
*-local
\family default
, but operates on all members of the resource.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
resume-replay
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
pause-replay-local
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
resume-replay-local
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: must be in secondary role.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: any (parts of) locally existing transaction logfiles (whether
replicated from other hosts or produced locally) are started for replay
to the local disk, as far as they have not yet been applied.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
resume-replay-global
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Like
\family typewriter
*-local
\family default
, but operates on all members of the resource.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
connect
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
connect-local
\family default
and to
\family typewriter
resume-fetch-local
\family default
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Note: although this sounds similar to DRBD's
\family typewriter
drbdadm connect
\family default
, there are subtle differences.
DRBD has exactly one connection per resource, which is associated with
\emph on
pairs
\emph default
of nodes.
In contrast, MARS may create multiple connections per resource at runtime,
and these are associated with the
\emph on
target
\emph default
host (not with
\emph on
pairs
\emph default
of hosts).
As a consequence, the fetch may
\emph on
potentially
\emph default
occur from any other source host which happens to be reachable (although
the current implementation prefers the current designated primary, but
this may change in future).
In addition,
\family typewriter
marsadm disconnect
\family default
does not stop
\emph on
all
\emph default
communication.
It only stops fetching logfiles.
The symlink updates running in background (default port 7777) are
\emph on
not
\emph default
stopped, in order to always propagate as much metadata as possible throughout
the cluster.
In case of a later incident, chances will be higher for a better knowledge
of the
\emph on
real
\emph default
state of the cluster.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
connect-local
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
resume-fetch-local
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
connect-global
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
resume-fetch-global
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
disconnect
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
disconnect-local
\family default
and to
\family typewriter
pause-fetch-local
\family default
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
See above note at
\family typewriter
connect
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
disconnect-local
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
pause-fetch-local
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
disconnect-global
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
partly
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
pause-fetch-global
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
up
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
yes
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
attach
\family default
followed by
\family typewriter
resume-fetch
\family default
followed by
\family typewriter
resume-replay
\family default
followed by
\family typewriter
resume-sync
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
down
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
yes
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
pause-sync
\family default
followed by
\family typewriter
pause-fetch
\family default
followed by
\family typewriter
pause-replay
\family default
followed by
\family typewriter
detach
\family default
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Hint: consider to prefer plain
\family typewriter
detach
\family default
over this, because
\family typewriter
detach
\family default
will remember the last state of all switches, while
\family typewriter
down
\family default
will
\emph on
not
\emph default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
primary
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
almost
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
There are three variants:
\end_layout
\begin_layout Plain Layout
Variant 1: planned handover (no
\family typewriter
--force
\family default
)
\end_layout
\begin_layout Plain Layout
\size scriptsize
Precondition: sync must have finished at any resource member.
All relevant transaction logfiles must be either already locally present,
or be fetchable (see
\family typewriter
marsadm up
\family default
, or low-level commands
\family typewriter
resume-fetch
\family default
and
\family typewriter
resume-replay
\family default
).
When some logfile data is locally missing, there must be enough space on
\family typewriter
/mars/
\family default
to fetch it.
Any replay must not have been interrupted by a replay error (see macro
%replay-code{} or diskstate
\family typewriter
DefectiveLog
\family default
).
The current designated primary must be reachable over network.
When there is no designated primary (i.e.
\family typewriter
marsadm secondary
\family default
had been executed before, which is explicitly
\emph on
not recommended
\emph default
), at least the old primary must be reachable.
The (old) primarie's virutal device
\family typewriter
/dev/mars/mydata
\family default
must not be in use any more (see
\family typewriter
marsadm wait-umount
\family default
).
A split brain must not already exist.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the current host is in primary role;
\family typewriter
/dev/mars/$dev_name
\family default
appears locally and is usable; the equivalent of
\family typewriter
marsadm up $res
\family default
has been executed as a safeguard against any forgotten previous
\family typewriter
pause-*
\family default
operations.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Switches the
\series bold
designated primary
\series default
.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Description of the
\series bold
Handover
\series default
protocol (when
\family typewriter
--force
\family default
is not given): when another host is currently primary, it is first asked
to leave its primary role.
When systemd templates are active, this will be automatically triggered
via
\family typewriter
systemctl stop $stop_unit
\family default
.
Otherwise, you are resposible for stopping the load yourself, and you dhoulf
use
\family typewriter
marsadm wait-umount
\family default
in advance for checking.
Anyway, the handover procol s waiting until the former primary has actually
become secondary.
After that, the local host is requested to become primary.
Before actually becoming primary, all relevant logfiles are transferred
over the network and replayed, in order to avoid accidental creation of
split brain as best as possible
\begin_inset Foot
status open
\begin_layout Plain Layout
\size scriptsize
Note that split brain avoidance is
\series bold
best effort
\series default
and cannot be guaranteed in general.
For example, it may be impossible to avoid split brain in case of long-lasting
network outages.
\end_layout
\end_inset
.
Only after that,
\family typewriter
/dev/mars/$dev_name
\family default
will appear.
When network transfers of the symlink tree are very slow (or currently
impossible), this command may take a very long time.
\end_layout
\begin_layout Plain Layout
\size scriptsize
In case a split brain is already detected at the initial situation, the
local host will refuse to switch the designated primary without
\family typewriter
--force
\family default
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
In case of
\begin_inset Formula $k>2$
\end_inset
replicas: if you want to handover between host
\family typewriter
A
\family default
and
\family typewriter
B
\family default
while a sync is currently running at host
\family typewriter
C
\family default
, you have the following options:
\end_layout
\begin_layout Enumerate
\size scriptsize
wait until the sync has finished (see macro
\family typewriter
sync-rest
\family default
, or
\family typewriter
marsadm view
\family default
in general).
\end_layout
\begin_layout Enumerate
\size scriptsize
do a
\family typewriter
leave-resouce
\family default
on host
\family typewriter
C
\family default
, and later
\family typewriter
join-resource
\family default
after the handover completed successfully.
\end_layout
\begin_layout Enumerate
\size scriptsize
use the option
\family typewriter
--ignore-sync
\family default
, which leads to a restart of the running sync from position 0.
\end_layout
\begin_layout Plain Layout
Variant 2: planned handover (no
\family typewriter
--force
\family default
) with sync abort (
\family typewriter
--ignore-sync
\family default
)
\end_layout
\begin_layout Plain Layout
\size scriptsize
2)
\series bold
Handover ignoring running syncs,
\series default
by adding the option
\family typewriter
--ignore-sync
\family default
.
Any running syncs will restart from scratch, in order to ensure consistency.
Use this only when the planned handover is more important than the sync
time.
\end_layout
\begin_layout Plain Layout
Variant 3: unplanned failover (
\family typewriter
--force
\family default
)
\end_layout
\begin_layout Plain Layout
\size scriptsize
3)
\series bold
Forced switching
\series default
: by giving –force while
\family typewriter
pause-fetch
\family default
is active (but not
\family typewriter
pause-replay
\family default
), most preconditions are ignored, and MARS does its best to actually become
primary even if some logfiles are missing or incomplete or even defective.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\family typewriter
\size scriptsize
primary --force
\family default
is a potentially harmful variant, because it will provoke a split brain
in most cases, and therefore in turn will lead to
\series bold
data loss
\series default
because one of your split brain versions must be discarded later in order
to resolve the split brain (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Split-Brain-Resolution"
\end_inset
).
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\series bold
\size scriptsize
Never
\series default
call
\family typewriter
primary --force
\family default
when planned handover via
\family typewriter
primary
\family default
without
\family typewriter
--force
\family default
is sufficient! If
\family typewriter
primary
\family default
without
\family typewriter
--force
\family default
complains that the device is in use at the former primary side, take it
seriously! Don't override with
\family typewriter
--force
\family default
, but rather umount
\begin_inset Foot
status open
\begin_layout Plain Layout
\size scriptsize
A common misconception is when people think that they can keep their filesystem
mounted without provoking a split brain, because they have their application
stopped and thus don't write any data into the filesystem.
This is a wrong idea, because filesystems may write some metadata, like
booking information, even after hours or days of inactivity.
Therefore MARS insists that the device is no longer in use before any handover
can take place.
\end_layout
\end_inset
the device at the other side!
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Only use
\family typewriter
primary --force
\family default
when something is
\emph on
already broken
\emph default
, such as a network outage, or a node crash, etc.
During ordinary operations (network OK, nodes OK), you should never need
\family typewriter
primary --force
\family default
!
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
If you umount
\family typewriter
/dev/mars/mydata
\family default
on the old primary
\family typewriter
A
\family default
, and then wait until
\family typewriter
marsadm view
\family default
(or another suitable macro) on the target host
\family typewriter
B
\family default
shows that everything is
\family typewriter
UpToDate
\family default
, you have some
\emph on
chance
\emph default
for avoiding a split brain even with
\family typewriter
primary --force
\family default
.
However, there is no guarantee.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\family typewriter
\size scriptsize
primary --force
\family default
switches the
\emph on
designated
\emph default
primary.
In some extremely rare cases, when
\emph on
multiple
\emph default
faults have accumulated in a
\emph on
weird
\emph default
situation, it
\emph on
might
\emph default
be impossible becoming the / an actual primary.
Typically you may be
\emph on
already
\emph default
in a split brain situation.
This has not been observed for a long operations time on recent versions
of MARS, but in general becoming primary via
\family typewriter
--force
\family default
cannot be guaranteed always, although MARS does its best.
In split brain situations, or if you ever encounter such a problem, you
\emph on
must
\emph default
resolve the split brain immediately after giving this command (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Split-Brain-Resolution"
\end_inset
).
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Hint in case of
\begin_inset Formula $k>2$
\end_inset
replicas:
\family typewriter
marsadm invalidate
\family default
cannot resolve a split brain at
\emph on
other
\emph default
secondaries (which are neither the old nor the new designated primary).
Therefore, prefer the
\family typewriter
leave-resource
\family default
method described in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Split-Brain-Resolution"
\end_inset
, starting with a
\family typewriter
leave-resource
\family default
phase at the old primary, and proceeding to
\begin_inset Quotes eld
\end_inset
unrelated
\begin_inset Quotes erd
\end_inset
secondaries step by step, until the split brain is gone.
Don't
\family typewriter
join-resource
\family default
again before the split brain is gone! This way, all these replicas will
remain consistent for now, but of course outdated (or potentially even
a
\begin_inset Quotes eld
\end_inset
wrong
\begin_inset Quotes erd
\end_inset
split-brain version, but
\emph on
potentially usable
\emph default
in case you get under pressure in some way).
In the hopefully unlikely case that you should later discover that you
accidentally forced the
\emph on
wrong
\emph default
replica via
\family typewriter
primary --force
\family default
, you will have a chance for recovery by either forcing the
\begin_inset Quotes eld
\end_inset
correct
\begin_inset Quotes erd
\end_inset
host to primary (if it did not already leave the resource), or by creating
a completely fresh resource out of the
\begin_inset Quotes eld
\end_inset
correct
\begin_inset Quotes erd
\end_inset
local disk.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Generally: in case of
\family typewriter
primary --force
\family default
, the preconditions are different.
The fetch
\emph on
must
\emph default
be switched off (see
\family typewriter
pause-fetch
\family default
), in order to get stable logfile positions.
See section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Forced-Switching"
\end_inset
.
For your safety,
\family typewriter
--force
\family default
does not work in newer marsadm (after mars0.1stable52) when your replica
is a current sync target.
More explanations see section
\begin_inset CommandInset ref
LatexCommand vref
reference "subsec:Forced-Switching"
\end_inset
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
secondary
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
almost
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the local
\family typewriter
/dev/mars/$dev_name
\family default
is no longer in use (e.g.
umounted).
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: There exists no designated primary any more.
During split brain and when the network is OK (again), all actual primaries
(including the local host) will leave primary ASAP (i.e.
when their
\family typewriter
/dev/mars/mydata
\family default
is no longer in use).
Any secondary will start following (old) logfiles (even from backlogs)
by replaying transaction logs if it is
\emph on
uniquely
\emph default
possible (which is often violated during split brain).
On any secondary,
\family typewriter
/dev/mars/$dev_name
\family default
will have disappeared.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Notice: in difference to DRBD, you
\series bold
don't need
\series default
and you
\series bold
should not use
\series default
this command during normal operation, including handover.
Any resource member which is
\emph on
not
\emph default
designated as primary will
\emph on
automatically
\emph default
go into secondary role.
For example, if you have
\begin_inset Formula $k=4$
\end_inset
replicas, only
\emph on
one of them
\emph default
can be designated as a primary.
When the network is OK, all other 3 nodes will know this fact, and they
will
\emph on
automatically
\emph default
go into secondary mode, following the transaction logs from the (new) primary.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
Hint: avoid this command.
It turns off
\emph on
any
\emph default
primary,
\series bold
globally
\series default
\begin_inset Foot
status open
\begin_layout Plain Layout
\size scriptsize
A serious
\series bold
misconception
\series default
among some people is when they believe that they can switch
\begin_inset Quotes eld
\end_inset
a certain node to secondary
\begin_inset Quotes erd
\end_inset
.
It is not possible to switch individual nodes to secondary, without affecting
other nodes! The concept of
\begin_inset Quotes eld
\end_inset
designated primary
\begin_inset Quotes erd
\end_inset
is
\series bold
global
\series default
throughout a resource!
\end_layout
\end_inset
.
You cannot start a sync after that (e.g.
\family typewriter
invalidate
\family default
or
\family typewriter
join-resource
\family default
or
\family typewriter
resume-sync
\family default
), because it is
\emph on
not unique
\emph default
wherefrom the data shall be fetched.
In split brain situations (when the network is OK again), this may have
further drawbacks.
It is much better / easier to
\series bold
\emph on
directly
\emph default
switch the designated primary
\series default
from one node to another via the
\family typewriter
primary
\family default
command.
See also section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Forced-Switching"
\end_inset
.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
There is only one valid use case where you
\emph on
really
\emph default
need this command: before finally destroying a resouce via the
\emph on
last
\emph default
\family typewriter
leave-resource
\family default
(or before
\emph on
forcefully killing
\emph default
your resource via the dangerous
\family typewriter
delete-resource
\family default
).
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
wait-umount
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
See section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Waiting"
\end_inset
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
log-purge-all
\begin_inset CommandInset label
LatexCommand label
name "log-purge-all$res"
\end_inset
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: none additionally.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: all locally known logfiles and version links are removed,
whenever they are not / no longer reachable by any split brain version.
\end_layout
\begin_layout Plain Layout
Rationale: remove hindering split-brain /
\family typewriter
leave-resource
\family default
leftovers.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Usually, you don't need this.
\family typewriter
leave-resource
\family default
and
\family typewriter
invalidate
\family default
are already doing a similar logfile cleanup for you.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Use this only as a desperate last resort when split brain does not go away
by means of
\family typewriter
leave-resource
\family default
(which
\emph on
could
\emph default
happen in very weird scenarios such as MARS running on virtual machines
doing a restore of their snapshots, or otherwise unexpected resurrection
of dead or half-dead nodes).
\end_layout
\begin_layout Plain Layout
THIS IS
\emph on
POTENTIALLY
\emph default
DANGEROUS
\end_layout
\begin_layout Plain Layout
\size scriptsize
This command
\emph on
might
\emph default
destroy some valuable logfiles / other information in case the local informatio
n is outdated or otherwise incorrect, as could be the case during very awkward
disaster scenarios, such as corrupted
\family typewriter
/mars
\family default
filesystems.
MARS does its best for checking anything, but there cannot be an absolute
guarantee.
\end_layout
\begin_layout Plain Layout
That said, no single incident has been observed during millions of operation
hours.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Hint: use
\family typewriter
--dry-run
\family default
beforehand for checking!
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
err-purge-all
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: none additionally.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: errors reported by
\family typewriter
marsadm view $res --verbose
\family default
are deleted after a while.
However notice that some error reports may soon re-appear in case the error
condition is persisting.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
link-purge-all
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: none additionally.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: all deletable links withspeical value
\family typewriter
.deleted
\family default
, which have been fully replicated throughout the whole cluster, will be
deleted eventually.
This is necessary to prevent inode overflow on
\family typewriter
/mars
\family default
.
\end_layout
\begin_layout Plain Layout
Notice:
\family typewriter
marsadm cron
\family default
will do this also.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
resize
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
[$size]
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
almost
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: The local host must be primary.
All disks in the cluster participating in
\family typewriter
$res
\family default
must be physically larger than the logical resource size (e.g, by use of
\family typewriter
lvm
\family default
; can be checked by macros
\family typewriter
%disk-size{}
\family default
and
\family typewriter
%resource-size{}
\family default
).
When the optional
\family typewriter
$size
\family default
argument is present, it must be smaller than the minimum of all physical
sizes, but larger than the current logical size of the resource.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the logical size of
\family typewriter
/dev/mars/$dev_name
\family default
will reflect the new size after a while.
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsection
Logfile Operations
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
cron
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Do all necessary housekeeping tasks.
\end_layout
\begin_layout Plain Layout
\size scriptsize
This needs to be regularly called by an external cron job or similar.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
log-rotate
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Historic.
Please use
\family typewriter
cron
\family default
instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
log-delete
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Historic.
Please use
\family typewriter
cron
\family default
instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
log-delete-one
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Historic.
Please use
\family typewriter
cron
\family default
instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
log-delete-all
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Historic.
Please use
\family typewriter
cron
\family default
instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsection
Consistency Operations
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
invalidate
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the local node must be in secondary role at
\family typewriter
$res
\family default
.
A
\emph on
designated
\emph default
primary must exist, and it must be reachable over network.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: the local disk is marked as
\family typewriter
InConsistent
\family default
, and a fast fullsync from the designated primary will start after a while.
Any
\emph on
local
\emph default
split brain (deviation from the designated primary) will be resolved, but
any
\emph on
other
\emph default
split brain at other secondaries will
\emph on
not
\emph default
be affected.
When the fullsync has finished successfully, the local node will be consistent
again.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
After a while, state
\family typewriter
Orphan
\family default
should be left.
Don't forget to regularly monitor for longer occurrences of
\family typewriter
Orphan
\family default
!
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
fake-sync
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the local node must be in secondary role at
\family typewriter
$res
\family default
.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: when a fullsync is running, it will stop after a while, and
the local node will be
\emph on
marked
\emph default
as consistent as if it were consistent again.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
THIS IS HIGLY DANGEROUS FOR DATA CONSISTENCY!
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
ONLY USE THIS IF YOU REALLY KNOW WHAT YOU ARE DOING!
\begin_inset Newline newline
\end_inset
See the WARNING in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Creating-and-Maintaining"
\end_inset
\begin_inset Newline newline
\end_inset
Use this only
\emph on
before
\emph default
creating a fresh filesystem inside
\family typewriter
/dev/mars/$res
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
set-replay
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
ONLY FOR ADVANCED HACKERS WHO KNOW WHAT THEY ARE DOING!
\begin_inset Newline newline
\end_inset
This command is deliberately not documented.
You need the competence level RTFS (
\begin_inset Quotes eld
\end_inset
read the fucking sources
\begin_inset Quotes erd
\end_inset
).
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Section
Further
\family typewriter
marsadm
\family default
Operations
\begin_inset CommandInset label
LatexCommand label
name "sec:Further-marsadm-Operations"
\end_inset
\end_layout
\begin_layout Subsection
Inspection Commands
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
view-
\emph on
macroname
\begin_inset Newline newline
\end_inset
\emph default
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Display the output of a macro evaluation.
See section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Inspecting-the-State"
\end_inset
for a thorough description.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
view
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Equivalent to
\family typewriter
view-default
\family default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
role
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Deprectated, will vanish.
Use
\family typewriter
view-role
\family default
instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
state
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Deprectated, will vanish.
Use
\family typewriter
view-state
\family default
instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
cstate
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Deprectated, will vanish.
Use
\family typewriter
view-cstate
\family default
instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
dstate
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Deprectated, will vanish.
Use
\family typewriter
view-dstate
\family default
instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
status
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Deprectated.
Use
\family typewriter
view-status
\family default
instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
show-state
\end_layout
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Deprectated, will vanish.
Don't use it.
Use
\family typewriter
view-state
\family default
instead, or other macros.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
show-info
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Deprectated, will vanish.
Don't use it.
Use
\family typewriter
view-info
\family default
instead, or other macros.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
show
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Deprectated, will vanish.
Don't use it.
Implement your own macros instead.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
show-errors
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Deprectated, will vanish.
Use
\family typewriter
view-the-err-msg
\family default
or
\family typewriter
view-resource-err
\family default
similar macros.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
cat
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$file
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Write the file content to stdout, but replace all occurences of numeric
timestamps converted to a human-readable format.
Thus is most useful for inspection of status and log files, e.g.
\family typewriter
marsadm cat /mars/5.total.log
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsection
Setting Parameters
\begin_inset CommandInset label
LatexCommand label
name "subsec:Setting-Parameters"
\end_inset
\end_layout
\begin_layout Subsubsection
Per-Resource Parameters
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
set-emergency-limit $res
\emph on
n
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
The argument
\emph on
n
\emph default
must be percentage between 0 and 100 %.
When the remaining store space in
\family typewriter
/mars/
\family default
undershoots the given percentage, the resource will go
\emph on
earlier
\emph default
into emergency mode than by the global computation described in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Defending-Overflow"
\end_inset
.
0 means unlimited.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
get-emergency-limit $res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Inquiry of the preceding value.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
set-connect-pref-list $res host1,host2,hostn
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Provisionary and deprecated - this command should hopefully disappear somewhen
in future.
Avoid it.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Set the order of preferences for connections (in DRBD-like speak) when there
are more than 2 hosts participating in a resource (aka peers).
Of course, these peers need also to be cluster members.
The last argument must be a comma-separated list of node names (aka peer
names).
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
get-connect-pref-list $res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Provisionary and deprecated - this command should hopefully disappear somewhen
in future.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Inquiry of the preceding value.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsubsection
Global Parameters
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
set-global-sync-limit-value
\emph on
n
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Limit the concurrency of sync operations to some maximum number.
0 means unlimited.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
get-global-sync-limit-value
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Inquiry of the preceding value.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
set-global-enabled-log-compressions
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$features
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Tell the whole cluster which compression features to use globally for logfile
compression.
The effective value can be checked via
\family typewriter
marsadm view-enabled-log-compressions
\family default
.
See
\family typewriter
marsadm view-potential-features
\family default
and
\family typewriter
marsadm --help
\family default
for a list of compression feature names, which must be separated by
\family typewriter
|
\family default
symbols.
Details are described in section
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:Data-Compression-Checksumming"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
set-global-enabled-net-compressions
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$features
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Tell the whole cluster which compression features to use globally for network
transport compression.
The effective value can be checked via
\family typewriter
marsadm view-enabled-net-compressions
\family default
.
See
\family typewriter
marsadm view-potential-features
\family default
and
\family typewriter
marsadm --help
\family default
for a list of compression feature names, which must be separated by
\family typewriter
|
\family default
symbols.
Details are described in section
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:Data-Compression-Checksumming"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\end_inset
,
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
set-global-disabled-digests
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$features
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Tell the whole cluster which digests to disable globally for checksumming
of transaction logfile data.
The effective value can be checked via
\family typewriter
marsadm view-disabled-digests
\family default
.
See
\family typewriter
marsadm view-potential-features
\family default
and
\family typewriter
marsadm --help
\family default
for a list of compression feature names, which must be separated by
\family typewriter
|
\family default
symbols.
Details are described in section
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:Data-Compression-Checksumming"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\end_inset
,
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsection
Waiting
\begin_inset CommandInset label
LatexCommand label
name "subsec:Waiting"
\end_inset
\end_layout
\begin_layout Standard
For scripting, these commands are often needed for race avoidance.
MARS' symlink are not propagated
\emph on
immediately
\emph default
throughout the whole cluster, but will take some time (also called
\series bold
eventually consistent
\series default
using a so-called Lamport clock).
The following commands can be used for triggering a status update, and
then waiting until information is recent enough.
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
wait-cluster
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the
\family typewriter
/mars/
\family default
filesystem must be mounted and it must contain a valid MARS symlink tree
produced by the other
\family typewriter
marsadm
\family default
commands.
The kernel module must be loaded.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: none.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Wait until
\emph on
all relevant
\emph default
nodes in the cluster have sent a status update of their version of the symlink
tree, or until timeout.
The default timeout is 30 s (exceptionally) and may be changed by
\family typewriter
--timeout=$seconds
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Use this for avoidance of rance conditions in the cluster, for nodes pariticipa
ting in some of the local resources.
This command does its best to get the current status from the other cluster
members.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
This works only for resources which have been
\emph on
already
\emph default
joined.
It you want to do a
\family typewriter
join-resource
\family default
, use
\family typewriter
update-cluster
\family default
instead for fetching / updating the not-yet-joined symlink information
also.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
update-cluster
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the
\family typewriter
/mars/
\family default
filesystem must be mounted everywhere and it must contain a valid MARS
symlink tree produced by the other
\family typewriter
marsadm
\family default
commands.
The network must be healthy.
The kernel module must be loaded everywhere.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: none.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Wait until
\emph on
all
\emph default
nodes in the
\emph on
whole
\emph default
cluster have sent a status update of their
\emph on
full
\emph default
symlink tree, including any joined or non-joined information, or until
timeout.
The default timeout is 30 s (exceptionally) and may be changed by
\family typewriter
--timeout=$seconds
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Use this before join-resource to ensure that
\emph on
all
\emph default
symlink information is recent.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
wait-resource
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
{is-,}{attach,
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
primary,
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
device}{-off,}
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: the local node must be a member of the resource
\family typewriter
$res
\family default
.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition: none.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Wait until the local node reaches a specified condition on
\family typewriter
$res
\family default
, or until timeout.
The default timeout of 60 s may be changed by
\family typewriter
--timeout=$seconds
\family default
.
The last argument denotes the condition.
The condition is inverted if suffixed by
\family typewriter
-off
\family default
.
When preceded by
\family typewriter
is-
\family default
(which is the most useful case), it is checked whether the condition is
actually reached.
When the
\family typewriter
is-
\family default
prefix is left off, the check is whether another
\family typewriter
marsadm
\family default
command has been already given which
\emph on
tries
\emph default
to achieves the intended result (typicially, you may use this after the
\family typewriter
is-
\family default
variant has failed).
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
wait-connect
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
almost
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
This is an alias for
\family typewriter
wait-cluster
\family default
waiting until only those nodes are reachable which are particiapting at
\family typewriter
$res
\family default
(instead of waiting for
\emph on
all
\emph default
hosts participating in
\emph on
any
\emph default
of the locally joined resources).
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
wait-umount
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Precondition: none additionally.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Postcondition:
\family typewriter
/dev/mars/$dev_name
\family default
is no longer in use (e.g.
umounted).
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsection
\family typewriter
systemd
\family default
Control Commands
\begin_inset CommandInset label
LatexCommand label
name "subsec:systemd-Control-Commands"
\end_inset
\end_layout
\begin_layout Standard
These are optional commands when you want to use systemd for control of
your services running on top of MARS, and for more automated handover /
failover.
The concept is described in section
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:systemd-Templates"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
systemd-trigger
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Tell the macro processor engine of marsadm that some systemd templates and/or
configurations have changed.
This will automatically re-compute any necessary systemd units residing
in
\family typewriter
/run/systemd/system/
\family default
from template files provided in one of the directories from
\family typewriter
@MARS_PATH/$SYSTEMD_SUBDIR/
\family default
, and will automatically remove any
\emph on
instances
\emph default
(not templates) which are no longer needed.
Finally,
\family typewriter
systemctl reload-daemon
\family default
is executed, and any necessary units are started / stopped according to
the new situation.
\begin_inset Newline newline
\end_inset
The macro language behind the template engine is described in section
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:systemd-Templates"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\size default
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
When combined with
\family typewriter
--force
\family default
, this will forcefully re-compute any template instances, even when already
created before.
Without
\family typewriter
--force
\family default
, there is an internal check whether re-creation is necessary.
This check might be fooled by manual intervention into
\family typewriter
/run/systemd/system/
\family default
, so
\family typewriter
--force
\family default
will repair it.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
set-systemd-unit
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$start_unit
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$stop_unit
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Assign new start and unit names to a resource, or delete any existing names
when the empty string
\family typewriter
\begin_inset Quotes eld
\end_inset
\begin_inset Quotes erd
\end_inset
\family default
is provided as
\family typewriter
$start_unit
\family default
.
Afterwards, a
\family typewriter
systemd-trigger
\family default
is executed, which causes start / stop operations according to the new
situation.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
get-systemd-unit
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Report the current assignment of start and stop unit names to the given
resource.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
set-systemd-want
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$hostname
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Manually override the host where $start_unit should appear.
This is useful for a temporary stop of the applicatiom stack when $hostname
has the special value
\family typewriter
\begin_inset Quotes eld
\end_inset
(none)
\begin_inset Quotes erd
\end_inset
\family default
.
See the
\family typewriter
fsck
\family default
example in section
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:systemd-Templates"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\begin_inset Newline newline
\end_inset
In split brain situations, it
\emph on
might
\emph default
be useful for manual override, but notice that
\family typewriter
marsadm primary –force
\family default
should be preferred because it switches
\emph on
both
\emph default
the designated primary
\emph on
and
\emph default
the application stack.
Notice that the application stack won't actually start at a location where
\family typewriter
/dev/mars/$res
\family default
is not present.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
get-systemd-want
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$res
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Report the current systemd start location for the given resource.
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsection
Low-Level Expert Commands
\end_layout
\begin_layout Standard
These commands are for experts and advanced sysadmins only.
The interface is not stable, i.e.
the meaning may change at any time.
Use at your own risk!
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
set-link
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
RTFS.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
get-link
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
RTFS.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
delete-file
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
RTFS.
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Standard
The following commands are for manual setup / repair of cluster membership.
Only to be used by experts who know what they are doing! In general, cluster-wi
de operations on IP addresses needs to be repeated at all hosts in the cluster
iff the communication is not (yet) possible and/or not (yet) actually working
(e.g.
firewalling problems etc).
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "30col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
lowlevel-ls-host-ips
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "50col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
List all configured cluster members together with their currently configured
IP addresses, as known in
\family typewriter
/mars/ips/
\family default
\emph on
locally
\emph default
.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "30col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
lowlevel-set-host-ip
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$hostname
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$ip
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "50col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Change the assignment of IP addresses in
\family typewriter
/mars/ips/
\family default
at least
\emph on
locally
\emph default
, and
\emph on
try
\emph default
to push the information also to other known peers (which is
\emph on
unreliable
\emph default
in general).
This may be used when hosts are moved to different network locations, or
when different network interfaces are to be used for replication (e.g.
dedicated replication IPs).
Notice that the names of hosts must not change at all, only their IP addresses
may be changed, or new peers may be manually added this way.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Tip: check active connections with
\family typewriter
netstat
\family default
& friends.
Updates may need some time to proceed (socket timeouts etc).
\end_layout
\begin_layout Plain Layout
\size scriptsize
Hint: for safety, call this on
\emph on
all
\emph default
members of a cluster to ensure consistency.
Otherwise it may happen that some cluster members do not know the
\emph on
new
\emph default
IP address where to fetch the
\emph on
new
\emph default
information from.
See also the description of the
\family typewriter
--ip-$peer=$peer_ip
\family default
option.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
For creation of new cluster memberships, always prefer
\family typewriter
join-resource
\family default
.
It checks for any uuid mismatches and for any resource name clashes / violation
s of resource name uniqueness, which could be
\series bold
extremely dangerous
\series default
for your data.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "30col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
lowlevel-delete-host
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
$hostname
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "50col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Please prefer
\family typewriter
leave-resource
\family default
followed by
\family typewriter
leave-cluster
\family default
instead.
This is only a fallback for
\emph on
experts
\emph default
.
\end_layout
\begin_layout Plain Layout
\size scriptsize
Useful for decommissioning of dead / physically destroyed hosts after a
disaster.
Removes a host from the cluster membership in
\family typewriter
/mars/ips/
\family default
at least
\emph on
locally
\emph default
, together with its IP address assignment.
It also
\emph on
tries
\emph default
to push the deletion to other cluster members (which is
\emph on
unreliable
\emph default
in general).
This does not remove any further information.
In particular, resource memberships are untouched.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\size scriptsize
Please use
\family typewriter
leave-resource --host=$name --force
\family default
first.
Repeat this for
\emph on
all
\emph default
former resource memberships.
Otherwise you may produce left-over
\begin_inset Quotes eld
\end_inset
zombie resource memberships
\begin_inset Quotes erd
\end_inset
, which in turm may prevent
\family typewriter
marsadm cron
\family default
from deleting logfile data, and consequently filling up
\family typewriter
/mars/
\family default
forever.
When
\emph on
all
\emph default
replicas of any such resource are decommissioned eventually, also use
\family typewriter
delete-resource --force
\family default
and friends, and/or
\family typewriter
marsadm cron --autoclean
\family default
after a retention period of 1 month or more.
\end_layout
\begin_layout Plain Layout
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
\size scriptsize
Have a
\emph on
serious look
\emph default
at
\family typewriter
leave-resource --host=$hostname
\family default
, first without
\family typewriter
--force
\family default
, and also
\family typewriter
leave-cluster --host=$hostname
\family default
, first without
\family typewriter
--force
\family default
, which are checking for some common pitfalls.
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsection
Senseless Commands (from DRBD)
\end_layout
\begin_layout Standard
For completeness, here is a list of commands which do not make sense with
MARS.
Some of them are syntactically parsed for scrpting compatibility, but are
not doing anything.
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
syncer
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
new-current-uuid
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
create-md
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
dump-md
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
dump
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
get-gi
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
show-gi
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
outdate
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
adjust
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
yes
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
Implemented as NOP (not necessary with MARS).
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
hidden-commands
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsection
Forbidden Commands (from DRBD)
\end_layout
\begin_layout Standard
These commands are not implemented because they would be dangerous in MARS
context:
\end_layout
\begin_layout Standard
\size scriptsize
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Command / Params
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Cmp
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
Description
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
invalidate-remote
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
This would be dangerous in case you have multiple secondaries.
A similar effect can be achieved with the
\family typewriter
--host=
\family default
option.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\family typewriter
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "20col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\family typewriter
\size scriptsize
verify
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
no
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\size scriptsize
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
\size scriptsize
This would cause unintended side effects due to races between logfile transfer
/ application and block-wise comparison of the underlying disks.
However,
\family typewriter
marsadm join-resource
\family default
or
\family typewriter
invalidate
\family default
will do the same as DRBD verify followed by DRBD resync, i.e.
this will automatically correct any found errors;.
Note that the fast-fullsync algorithm of MARS will minimize network traffic.
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Chapter
Tuning, tips and tricks
\begin_inset CommandInset label
LatexCommand label
name "chap:Tuning,-tips-and"
\end_inset
\end_layout
\begin_layout Section
IO Performance Tuning
\begin_inset CommandInset label
LatexCommand label
name "sec:IO-Performance-Tuning"
\end_inset
\end_layout
\begin_layout Standard
There
\emph on
exist
\emph default
some use cases where MARS
\emph on
can
\emph default
deliver better IO performance than a raw block device.
However, this cannot be expected
\emph on
in general
\emph default
.
In some
\emph on
other
\emph default
cases the performance may be
\emph on
lower
\emph default
than with a
\emph on
single
\emph default
local raw device.
\end_layout
\begin_layout Standard
For demonstration, we use the
\family typewriter
blkreplay
\family default
tool from
\begin_inset Flex URL
status open
\begin_layout Plain Layout
http://blkreplay.org
\end_layout
\end_inset
and a load which has been captured from a
\series bold
real datacenter
\series default
(1&1 Ionos ShaHoLin = Shared Hosting Linux).
The load already contains a parallelism degree of 20 LXC containers running
in parallel at the same iron.
This corresponds to about 60,000 web spaces running on 20 Apache instances,
already in parallel.
In difference to artificial benchmarks (like pure random IO or pure sequential
IO), this benchmark is much more close to real server operations, while
artificial benchmarks are not meaningful for practice in general, because
they can deviate from real server operations by
\emph on
factors
\emph default
or even by
\series bold
orders of magnitude
\series default
.
\end_layout
\begin_layout Standard
In order to determine the limits of the test candidates, the timing of the
original workload was converted to a linear ramp-up, simulating an
\series bold
overloaded
\series default
system.
Otherwise benchmarking would not be possible.
\end_layout
\begin_layout Standard
The following
\family typewriter
blkreplay
\family default
benchmarks were executed on an otherwise unloaded Dell R630 with 40 CPU
threads on 2 sockets, 192 GB RAM, a Dell R730 hardware RAID controller
with 2 GB BBU cache, and 10 spindles Dell 1.8 TB 2.5 inch SAS disks configured
as RAID-6.
All data, including the
\family typewriter
/mars
\family default
directory, was located on the hardware RAID via LVM2.
\family typewriter
/dev/vginfong/lv-0
\family default
was assigned a size of 8 TiB.
For testing, vanilla kernel 4.9.x with the MARS pre-patch and
\family typewriter
mars0.1astable72
\family default
was used.
\end_layout
\begin_layout Standard
The
\family typewriter
blkreplay
\family default
parameters were as follows:
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
output_label="MARS"
\end_layout
\begin_layout Plain Layout
\end_layout
\begin_layout Plain Layout
# input description
\end_layout
\begin_layout Plain Layout
input_file_list="http://blkreplay.org/loads/natural/1and1/shared-hosting/2016/Sha
HoLin_from_bare_metal/x20/shaholin-x20-ramped/shaholin-x20.adjacent.ramped-100.load.
gz"
\end_layout
\begin_layout Plain Layout
replay_duration=110
\end_layout
\begin_layout Plain Layout
speedup=10
\end_layout
\begin_layout Plain Layout
threads=512
\end_layout
\begin_layout Plain Layout
cmode=with-conflicts
\end_layout
\begin_layout Plain Layout
scheduler="noop"
\end_layout
\begin_layout Plain Layout
\end_layout
\begin_layout Plain Layout
# hardware setup
\end_layout
\begin_layout Plain Layout
replay_host_list="icpu5133"
\end_layout
\begin_layout Plain Layout
replay_device_list="/dev/vginfong/lv-0"
\end_layout
\begin_layout Plain Layout
\end_layout
\begin_layout Plain Layout
# output description
\end_layout
\begin_layout Plain Layout
enable_graph=1
\end_layout
\begin_layout Plain Layout
graph_options="--no-static --dynamic"
\end_layout
\end_inset
\end_layout
\begin_layout Standard
We start with the
\series bold
raw
\series default
device
\family typewriter
/dev/vginfong/lv-0
\family default
which had a size of 8 TiB.
The throughput is about 1418 IOPS, and the latency diagram shows that the
system is overloaded, but can cope with that overload:
\end_layout
\begin_layout Standard
\noindent
\align center
\begin_inset Graphics
filename images/blkreplay/MARS.MARS.raw.iosched-noop.nr_request-128.icpu5133.vginfong.lv-0.g01.latency.realtime.png
width 100col%
\end_inset
\end_layout
\begin_layout Standard
\noindent
As you can see in the filename, the NOOP kernel IO scheduler was used, and
the kernel parameter
\family typewriter
nr_requests
\family default
was left at its default value of 128.
When you read the specs of the Dell R730 hardware RAID controller, you
will notice that it can handle a much higher IO request parallelism of
almost 1024 requests in parallel.
\end_layout
\begin_layout Standard
So the first natural tuning attempt is
\family typewriter
nr_requests=1020
\family default
, in order to release the
\begin_inset Quotes eld
\end_inset
kernel IO handbrake
\begin_inset Quotes erd
\end_inset
.
This results in an improved throughput of 1562 IOPS, and even the
\emph on
maximum
\emph default
latencies are improved, but the
\emph on
average
\emph default
latencies are becoming a little bit worse:
\end_layout
\begin_layout Standard
\noindent
\align center
\begin_inset Graphics
filename images/blkreplay/MARS.MARS.raw.iosched-noop.nr_request-1020.icpu5133.vginfong.lv-0.g01.latency.realtime.png
width 100col%
\end_inset
\end_layout
\begin_layout Standard
\noindent
It is well known since decades that there is a principal tradeoff between
throughput and latencies in IO systems.
Thus it is not a surprising result.
\end_layout
\begin_layout Standard
On servers, overload situations should be rare, and during overload throughput
is typically much more important than latencies, as long as latencies are
not exceedingly high.
Thus we can recommend
\family typewriter
nr_requests=1000
\family default
for production.
\end_layout
\begin_layout Standard
However, some sysadmins might be tempted to question why the NOOP scheduler
has been used.
On the internet, there are a ton of claims that other IO schedulers like
CFQ are much better.
\end_layout
\begin_layout Standard
Well, testing with CFQ instead of NOOP is no problem for
\family typewriter
blkreplay
\family default
.
However, the result is very surprising.
While the IOPS are 1539, which is only a slight decrease which could result
from measurement tolerances, the latencies are now turning almost into
a disaster:
\end_layout
\begin_layout Standard
\noindent
\align center
\begin_inset Graphics
filename images/blkreplay/MARS.MARS.raw.iosched-cfq.nr_request-1020.icpu5133.vginfong.lv-0.g01.latency.realtime.png
width 100col%
\end_inset
\end_layout
\begin_layout Standard
\noindent
In production, you should never encounter IO latencies of almost 15 seconds.
So what is going wrong here?
\end_layout
\begin_layout Standard
Here is an explanation.
A hardware RAID controller
\emph on
already
\emph default
has an
\emph on
internal
\emph default
IO scheduler.
This IO scheduler is hidden in a black box, such that many sysadmins don't
know of its existence.
If you add another IO scheduler at kernel level, you will have
\series bold
two different
\series default
IO schedulers running in parallel, and sometimes taking
\series bold
contradictory decisions
\series default
.
\end_layout
\begin_layout Standard
These contradictory IO scheduling decisions may lead to problems in certain
cases and scenarios.
\end_layout
\begin_layout Standard
There is another risk of interference with a third IO scheduler, which is
MARS' internal asymmetric writeback scheduler.
The latter is currently well-tuned for co-working with a BBU cache and
its internal scheduler, running on bare metal.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Never use MARS inside of VMs! There you will have
\emph on
several
\emph default
additional IO schedulers and further types of IO bottlenecks
\begin_inset Foot
status open
\begin_layout Plain Layout
Example: data container formats like
\family typewriter
qcow2
\family default
can act as serious bottlenecks.
Never place
\family typewriter
/mars
\family default
on top of them! Potential exceptions (after well-founded investigations)
are functional testing, and certain non-critical workstation-like workloads.
In general, never plan to place unknown or enterprise-critical workloads
on top of them!
\end_layout
\end_inset
inbetween, even if you try to disable some of them.
\end_layout
\begin_layout Standard
While kernel-level IO schedulers like CFQ certainly have their merits at
improving your workstation's IO behaviour, they are counter-productive
at servers with hardware RAID controllers.
\end_layout
\begin_layout Standard
So the advice is clear:
\series bold
switch them off
\series default
\emph on
in such a case
\emph default
.
\end_layout
\begin_layout Standard
Even if you have a software RAID, check with
\family typewriter
blkreplay
\family default
that any IO schedulers are
\emph on
really
\emph default
improving things.
Notice that device driver restrictions like
\family typewriter
nr_requests
\family default
may also work similarly to an IO scheduler.
When possible, use your real workload, captured with
\family typewriter
blktrace
\family default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Never use a benchmark which only delivers IOPS! As demonstrated, inappropriate
IOPS tuning (or choice of inappropriate components) can worsen latencies
so much that production can be endangered!
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Always look at
\emph on
both
\emph default
IOPS
\emph on
and
\emph default
latencies!
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
\emph on
Average
\emph default
latencies, even when enriched with
\emph on
standard deviation
\emph default
, are not enough.
Classical statistics does not clearly describe operational problems like
\series bold
hangs
\series default
and
\series bold
exceptionally high latency requests
\series default
, which may occur only rarely, but can then lead to
\series bold
serious incidents
\series default
.
Use a tool which can clearly display
\emph on
any
\emph default
faulty behaviour, such as
\family typewriter
blkreplay
\family default
's
\series bold
latency diagrams
\series default
!
\end_layout
\begin_layout Standard
Now we come to benchmarking
\family typewriter
/dev/mars/lv-0
\family default
placed on top of
\family typewriter
/dev/vginfong/lv-0
\family default
.
Notice that MARS needs to write all write requests twice: once into the
transaction logfile, and a second time by writeback into
\family typewriter
/dev/vginfong/lv-0
\family default
.
\end_layout
\begin_layout Standard
So you might expect that performace of
\family typewriter
/dev/mars/lv-0
\family default
could be worse than at the underlying raw device.
\end_layout
\begin_layout Standard
Nevertheless, the
\series bold
throughput
\series default
is now measured 4338 IOPS, which means that performance has
\series bold
more than doubled
\series default
.
You can also see it by the duration of the benchmark at the x axis.
Even the latencies have improved in many cases:
\end_layout
\begin_layout Standard
\noindent
\align center
\begin_inset Graphics
filename images/blkreplay/MARS.MARS.mars.iosched-noop.nr_request-1020.icpu5133.mars.lv-0.g01.latency.realtime.png
width 100col%
\end_inset
\end_layout
\begin_layout Standard
\noindent
How is it possible to be faster than a RAW device? How can this be explained?
\end_layout
\begin_layout Standard
Look at the graphics and at the explanations from section
\begin_inset CommandInset ref
LatexCommand vref
reference "sec:The-Transaction-Logger"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
The key to local IO performance is the
\series bold
re-ordering of writeback
\series default
according to ascending sector numbers.
This can reduce mechanical seek times of hard disks considerably, and even
by factors, such that it can over-compensate the doubled writes to the
transaction logfile, and even when both are residing at the same RAID set.
\end_layout
\begin_layout Standard
Since RAID-6 is has more expensive write operations due to its CRC computations
and updates, RAID-6 will much more profit from this effect.
Other RAID modes like RAID-10 may show a lower throughput improvement.
\end_layout
\begin_layout Standard
Notice: this effect is not only dependent from total RAM size and from the
maximum size of the MARS temporary memory buffer (tuning parameter
\family typewriter
/proc/sys/mars/mars_mem_percent
\family default
which defaults to a limit of 20%).
It is also highly dependent from the actual seek behaviour of the
\series bold
workload
\series default
.
\end_layout
\begin_layout Standard
For example, if you use
\family typewriter
dd
\family default
for sequentially overwriting /dev/mars/lv-0 with a parallelism degree of
1, the writeback optimization of MARS cannot be exploited.
However,
\family typewriter
dd
\family default
is no appropriate benchmarking tool, and has almost nothing to do with
real workloads occuring in datacenters, which typically are neither sequential,
nor do they have a parallelism degree of only 1.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Please don't try to lead any discussions about this: simply use
\family typewriter
blktrace
\family default
to capture your real server workload, and compare it to a run of dd.
Only if you encounter the same behaviour as
\family typewriter
dd
\family default
, only then you can really claim that your workload is like
\family typewriter
dd
\family default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Any
\series bold
assumptions about workloads
\series default
are very dangerous: they can deviate from practice not only by factors,
but sometimes even by
\emph on
orders of magnitude
\emph default
.
There no substitute for real measuments of
\series bold
actual workload behaviour
\series default
.
\end_layout
\begin_layout Standard
Notice: the writeback optimization of MARS can typically only improve performanc
e of HDDs, but not of SSDs.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
By placing
\family typewriter
/mars
\family default
onto its own physical device with appropriate speed, you can compensate
the doubled writes to some degree.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Depending on the workload and on RAID parameters,
\family typewriter
/mars
\family default
may be better placed onto SSDs, or better be placed on HDDs.
There is no general rule.
Just use
\family typewriter
blktrace
\family default
on your real workload, and check several configuration alternatives (also
different RAID levels etc) with
\family typewriter
blkreplay
\family default
.
\end_layout
\begin_layout Section
Data Compression and Checksumming (Digests)
\begin_inset CommandInset label
LatexCommand label
name "sec:Data-Compression-Checksumming"
\end_inset
\end_layout
\begin_layout Standard
Data compression can reduce the amount of data which needs to be piped through
long-distance or other network bottlenecks.
It is available in newer MARS versions, starting from mars0.1astable91.
You also need to install the corresponding new version of
\family typewriter
marsadm
\family default
across the whole cluster.
\end_layout
\begin_layout Standard
The locally compiled-in compression and checksumming features as compiled
into your currently running
\family typewriter
mars.ko
\family default
can be queried via
\end_layout
\begin_layout Quote
\family typewriter
marsadm view-implemented-features
\end_layout
\begin_layout Standard
The output may depend on your kernel compile options, such as the enabled
crypto algorithms of your kernel.
Typical output should look like
\end_layout
\begin_layout Quote
\begin_inset Flex URL
status open
\begin_layout Plain Layout
CHKSUM_MD5_OLD|CHKSUM_MD5|CHKSUM_CRC32C|CHKSUM_CRC32|CHKSUM_SHA1|COMPRESS_LZO|CO
MPRESS_LZ4|COMPRESS_ZLIB
\end_layout
\end_inset
\end_layout
\begin_layout Standard
In case you get less options, check your kernel
\family typewriter
.config
\family default
for the corresponding crypto algorithms, which can be compiled into your
kernel firmly, or as a module.
When necessary, re-compile your kernel with more crypto options enabled
(see build instructions in section
\begin_inset CommandInset ref
LatexCommand formatted
reference "sec:MARS-Kernel-Module"
plural "false"
caps "false"
noprefix "false"
\end_inset
).
\end_layout
\begin_layout Standard
When the compile-time option
\family typewriter
CONFIG_MARS_BENCHMARK=y
\family default
is enabled,
\family typewriter
modprobe mars
\family default
will show you a list of benchmark results for each enabled crypto algorithm,
in units of nanoseconds.
Smaller numbers are better.
Notice that results may depend on your processor model, and on availability
of hardware acceleration (as supported by the crypto infrastucture of your
kernel).
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Take the benchmark results with a grain of salt.
The performance of some crypto algorithms may heavily depend on the
\emph on
compressibility
\emph default
of the data to be compressed.
\family typewriter
CONFIG_MARS_BENCHMARK
\family default
uses a rather artifical test data pattern, which may deviate from the compressi
bility of your real productive data.
Take the results with similar caution than BOGOMIPS, which are also not
comparable with other benchmarks in general.
\end_layout
\begin_layout Standard
In order to work properly,
\emph on
all
\emph default
cluster members must have loaded a newer version of
\family typewriter
mars.ko
\family default
.
During rolling upgrade to newer MARS versions, mixed operation of different
MARS versions is supported, even in combination with some old versions
supporting only the traditional CHKSUM_MD5_OLD (which has some shortcomings
and should not be used anymore in future).
Only
\emph on
common
\emph default
features are actually usable.
You can query the commonly usable options via the commands
\end_layout
\begin_layout Quote
\family typewriter
marsadm view-usable-compressions
\end_layout
\begin_layout Standard
and
\end_layout
\begin_layout Quote
\family typewriter
marsadm view-usable-digests
\end_layout
\begin_layout Standard
These should should show you a (possibly empty) list of those options which
are really usable
\emph on
at the moment
\emph default
.
By installing newer / better versions of
\family typewriter
mars.ko
\family default
and
\family typewriter
marsadm
\family default
, the list may become longer.
\end_layout
\begin_layout Standard
An overview of currently usable options, as well as the actually used algorithms
, are displayed at the headings produced by
\family typewriter
marsadm view all
\family default
.
\end_layout
\begin_layout Subsection
Network Transport Compression
\begin_inset CommandInset label
LatexCommand label
name "subsec:Network-Transport-Compression"
\end_inset
\end_layout
\begin_layout Standard
By default, network transport compression is disabled, since it may worsen
the CPU consumption.
You can enabled it for the whole cluster via
\end_layout
\begin_layout Quote
\family typewriter
marsadm set-global-enabled-net-compressions
\backslash
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
\begin_inset Quotes eld
\end_inset
COMPRESS_LZO|COMPRESS_LZ4|COMPRESS_ZLIB
\begin_inset Quotes erd
\end_inset
\end_layout
\begin_layout Standard
(or a shorter list of compress options), and you can disable it globally
by supplying an empty list:
\end_layout
\begin_layout Quote
\family typewriter
marsadm set-global-enabled-net-compressions
\begin_inset Quotes eld
\end_inset
\begin_inset Quotes erd
\end_inset
\end_layout
\begin_layout Standard
Notice: this will compress the
\emph on
data payloads
\emph default
of network traffic, both for (incremental) logfile traffic (by default
on port 7778), and for sync traffic (by default on port 7779).
\end_layout
\begin_layout Subsection
Logfile Payload Compression
\begin_inset CommandInset label
LatexCommand label
name "subsec:Logfile-Payload-Compression"
\end_inset
\end_layout
\begin_layout Standard
By default, logfile data compression is disabled, since it may worsen the
CPU consumption, and may worsen local IO performance.
You can enable it for the whole cluster via
\end_layout
\begin_layout Quote
\family typewriter
marsadm set-global-enabled-log-compressions
\backslash
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
\begin_inset Quotes eld
\end_inset
COMPRESS_LZO|COMPRESS_LZ4|COMPRESS_ZLIB
\begin_inset Quotes erd
\end_inset
\end_layout
\begin_layout Standard
(or a shorter list of compress options), and you can disable it globally
by supplying an empty list:
\end_layout
\begin_layout Quote
\family typewriter
marsadm set-global-enabled-log-compressions
\begin_inset Quotes eld
\end_inset
\begin_inset Quotes erd
\end_inset
\end_layout
\begin_layout Standard
In difference to network compression, this does not apply to sync data.
It compresses the logfile payload
\emph on
before
\emph default
it is written to the transaction logfile.
As a side effect, it also reduces network traffic, because the logfiles
are usually smaller.
Additionally, your
\family typewriter
/mars
\family default
directory may run out of space less quickly.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
However, as a major drawback, this may slow down the IO latencies of writes
considerably, and thus may drastically reduce local IO performance (depending
on performance of your crypto hardware, and on compressibility of data,
etc).
In particular, ZLIB is known to be a very slow algorithm (but to compress
somewhat better than others), while LZO is a very old but very fast algorithm.
In many cases, LZO or LZ4 are preferable.
Do not enable this option blindly.
Always observe the performance of your system afterwards.
\end_layout
\begin_layout Subsection
Logfile Payload Digests
\begin_inset CommandInset label
LatexCommand label
name "subsec:Logfile-Payload-Digests"
\end_inset
\end_layout
\begin_layout Standard
By default, all of these options are
\emph on
enabled
\emph default
, because most users want to checksum the logfile data for detection of
hardware errors, such as BBU cache failures, or silent corruption during
the network transport of logfile data.
When your secondaries encounter a checksum mismatch, they will
\series bold
\emph on
refuse
\emph default
to apply the defective data
\series default
, and will report
\family typewriter
DefectiveLog
\family default
or similar message in the
\family typewriter
diskstate
\family default
part of
\family typewriter
marsadm view all
\family default
(see section
\begin_inset CommandInset ref
LatexCommand nameref
reference "subsec:Standard-marsadm-view"
plural "false"
caps "false"
noprefix "false"
\end_inset
).
\end_layout
\begin_layout Standard
Most people view this behaviour as a
\emph on
feature
\emph default
.
It protects you from some types of data corruption.
\end_layout
\begin_layout Standard
If you want to disable some or all of the logfile digest algorithms, you
can do via
\end_layout
\begin_layout Quote
\family typewriter
marsadm set-global-disabled-log-digests
\backslash
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
\begin_inset Quotes eld
\end_inset
CHKSUM_MD5_OLD|CHKSUM_MD5|CHKSUM_CRC32C|CHKSUM_CRC32|CHKSUM_SHA1
\begin_inset Quotes erd
\end_inset
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Disabling
\emph on
all
\emph default
of these options may improve local IO performance, but at the cost of less
reliability.
However, several compression algorithms are already doing some internal
checksumming upon decompression.
For maximum performance on weak hardware, it may pay off to enable compression,
while disabling separate digesting.
Please check what is the best combination for your hardware, your load,
etc.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
If you decide to keep the logfile digests, e.g.
when HA SLAs are more important than maximum performance: notice that checksumm
ing is done at the
\emph on
input
\emph default
data
\emph on
before
\emph default
any compression is applied.
This increases safety against (potential / theoretical) problems with compressi
on / decompression errors.
\end_layout
\begin_layout Subsection
Network Payload Digests
\begin_inset CommandInset label
LatexCommand label
name "subsec:Network-Payload-Digests"
\end_inset
\end_layout
\begin_layout Standard
By default, all of these options are
\emph on
enabled
\emph default
, because checksumming over the network at fast full-sync cannot be disabled
by concept.
At least one of the network digests must always remain enabled.
If you try to disable all of them, an automatic fallback to
\family typewriter
CHKSUM_MD5_OLD
\family default
will occur.
Since this a rather slow and non-optimum algorithm, disabling the faster
ones (such as
\family typewriter
CHKSUM_CRC32C
\family default
) is no good idea.
\end_layout
\begin_layout Standard
If you want to disable some of the network digest algorithms, you can do
similarly to
\end_layout
\begin_layout Quote
\family typewriter
marsadm set-global-disabled-net-digests
\backslash
\begin_inset Newline newline
\end_inset
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
strut
\backslash
hfill
\end_layout
\end_inset
\begin_inset Quotes eld
\end_inset
CHKSUM_MD5|CHKSUM_CRC32C|CHKSUM_CRC32|CHKSUM_SHA1
\begin_inset Quotes erd
\end_inset
\end_layout
\begin_layout Section
The
\family typewriter
/proc/sys/mars/
\family default
and other Expert Tweaks
\begin_inset CommandInset label
LatexCommand label
name "sec:The-/proc/sys/mars/-Expert"
\end_inset
\end_layout
\begin_layout Standard
In many cases, you will not need to deal with tweaks in
\family typewriter
/proc/sys/mars/
\family default
because everything should already default to reasonable predefined values.
This is not a
\begin_inset Quotes eld
\end_inset
stable
\begin_inset Quotes erd
\end_inset
interface.
It may change during development of MARS.
It allows access to some
\emph on
internal
\emph default
kernel variables of the
\family typewriter
mars.ko
\family default
kernel module at
\emph on
runtime
\emph default
.
\end_layout
\begin_layout Standard
This means, all values modified via /proc/ are not persistent.
They will be reset to default at
\family typewriter
rmmod mars
\family default
or at reboot.
If you need some persistence, implement it by yourself, e.g.
at startup scripts.
\end_layout
\begin_layout Standard
This section describes only those tweaks which could be helpful for sysadmins,
but not those for developers / very deep internals.
\end_layout
\begin_layout Subsection
Tuning Network Performance
\begin_inset CommandInset label
LatexCommand label
name "subsec:Tuning-Network-Performance"
\end_inset
\end_layout
\begin_layout Standard
Since a few years, a feature called
\begin_inset Quotes eld
\end_inset
socket bundling
\begin_inset Quotes erd
\end_inset
is available.
\end_layout
\begin_layout Standard
It is mostly intendend for lines showing high packet loss.
By using multiple TCP sockets in parallel for emulating a single logical
connection, throughput can be significantly increased.
\end_layout
\begin_layout Standard
Example for setting the socket parallelism to 4:
\end_layout
\begin_layout Itemize
\family typewriter
echo 4 > /proc/sys/mars/parallel_connections
\end_layout
\begin_layout Standard
The following graphics shows the throughput of a non-fast
\begin_inset Foot
status open
\begin_layout Plain Layout
The fast fullsync algorithm would not saturate the
\family typewriter
eth0
\family default
link with traffic from a single resource.
\end_layout
\end_inset
fullsync of a
\emph on
single
\emph default
100GiB resource over a loaded long-distance line between Europe/Germany
and USA/Midwest.
In order to compensate highly varying load at the line, all the experiments
were repeated more than 10 times and averaged.
Each bar shows the throughput for a particular socket parallelism.
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_layout Standard
\noindent
\align center
\begin_inset Graphics
filename images/socket-bundling-long-summary.png
width 70col%
\end_inset
\end_layout
\begin_layout Standard
\noindent
Notice that the uplinks of the two servers are only 1 GBit/s respectively.
When the uplink is saturated, about 100 MByte/s is the maximum possible
peak throughput in theory.
You can easily recognize that the peak throughput is almost reached with
a parallelism degree of 2, but using even more sockets appears to be slightly
counter-productive.
One of the reasons is that more sockets will increase contention on the
line, and thus increasing packet loss.
Another potential reason is that higher parallelism at sockets will lead
to higher parallelism in disk reads, in turn leading to more permutations
of disk read positions (more
\emph on
random
\emph default
reads instead of purely sequential reads), which is counter-productive
for disk readahead strategies.
\end_layout
\begin_layout Standard
The next graphics shows the same, but over a medium distance of about 50km.
This line is even more heavily loaded with respect to the number of TCP
connections running in parallel (probly some 10,000 or even 100,000 if
not more), and there is some kind of
\begin_inset Quotes eld
\end_inset
traffic shaping
\begin_inset Quotes erd
\end_inset
at some intermediate network gear which will
\begin_inset Quotes eld
\end_inset
punish
\begin_inset Quotes erd
\end_inset
those traffic sources disproportionally increasing overall packet loss.
This can explain the even higher counter-productive effect of using too
much sockets and thus injecting additional packet loss:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_layout Standard
\noindent
\align center
\begin_inset Graphics
filename images/socket-bundling-short-summary.png
width 70col%
\end_inset
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
In general, the optimum value for
\family typewriter
/proc/sys/mars/parallel_connections
\family default
may depend on many runtime factors such as other load running over some
(parts of) physical equipment.
You will need to determine optimum values yourself.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Notice that socket bundling is conceptually the
\begin_inset Quotes eld
\end_inset
opposite
\begin_inset Quotes erd
\end_inset
of traffic shaping.
You are trying to get
\emph on
more
\emph default
bandwidth, at the cost of
\emph on
other
\emph default
traffic competing for the same network resources.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
If you are operating masses of servers, don't set the MARS socket parallelism
\series bold
too high
\series default
everywhere.
You might
\begin_inset Quotes eld
\end_inset
steal
\begin_inset Quotes erd
\end_inset
too much bandwidth from other applications when starting masses of syncs
in parallel, e.g.
after an incident.
Best practice is to start with a default value of 1, and to increase it
only
\emph on
on demand
\emph default
, and/or preferably
\emph on
only
\emph default
at those servers where high load really occurs or where some urgent actions
need a
\emph on
temporary
\emph default
boost.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Experts in networking may try to load-balance the parallel TCP connections
over multiple physical paths, for example by hashing over the dynamic source
port numbers.
However, we currently have no experience with suchalike setups.
\end_layout
\begin_layout Subsection
Syslogging
\end_layout
\begin_layout Standard
All internal messages produced by the kernel module belong to one of the
following classes:
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
0 debug messages
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
1 info messages
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
2 warnings
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
3 error messages
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
4 fatal error messages
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
5 any message (summary of 0 to 4)
\end_layout
\begin_layout Subsubsection
Logging to Files
\end_layout
\begin_layout Standard
This feature will likely disappear when MARS goes to kernel upstream.
It was mostly intended for debugging during early beta phases and is no
longer needed for stable operation.
Developers may use it for spotting potential problems.
\end_layout
\begin_layout Standard
The classes may be used to produce status files
\family typewriter
$class.*.status
\family default
in the
\family typewriter
/mars/
\family default
and/or in the
\family typewriter
/mars/resource-
\emph on
mydata
\emph default
/
\family default
directory / directories.
\end_layout
\begin_layout Standard
When you create a file
\family typewriter
$class.*.log
\family default
in parallel to any
\family typewriter
$class.*.status
\family default
, the
\family typewriter
*.log
\family default
file will be appended forever with the same messages as in
\family typewriter
*.status
\family default
.
The difference is that *.status is regenerated anew from an empty starting
point, while *.log can (potentially) increase indefinitely unless you remove
it, or rename it to something else.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Beware, any permamently present
\family typewriter
*.log
\family default
file can easily fill up your
\family typewriter
/mars/
\family default
partition until the problems described in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Defending-Overflow"
\end_inset
will appear.
Use
\family typewriter
*.log
\family default
only for a
\series bold
limited time
\series default
, and
\series bold
only for debugging!
\end_layout
\begin_layout Subsubsection
Logging to Syslog
\end_layout
\begin_layout Standard
The classes also play a role in the following
\family typewriter
/proc/sys/mars/
\family default
tweaks:
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
syslog_min_class
\family default
(rw) The
\emph on
mimimum
\emph default
class number for
\emph on
permanent
\emph default
syslogging.
By default, this is set to -1 in order to switch off perment logging completely.
Permament logging can easily flood your syslog with such huge amounts of
messages (in particular when class=0), that your system as a whole may
become unusable (because vital kernel threads may be blocked too long or
too often by the userspace syslog daemon).
Instead, please use the flood-protected syslogging described below!
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
syslog_max_class
\family default
(rw) The
\emph on
maximum
\emph default
class number for
\emph on
permanent
\emph default
syslogging.
Please use the flood-protected version instead.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
syslog_flood_class
\family default
(rw) The mimimum class of flood-protected syslogging.
The maximum class is always 4.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
syslog_flood_limit
\family default
(rw) The maxmimum number of messages after which the flood protection will
start.
This is a hard limit for the the number of messages written to the syslog.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
syslog_flood_recovery_s
\family default
(rw) The number of seconds after which the internal flood counter is reset
(after flood protection state has been reached).
When no new messages appear after this time, the flood protection will
start over at count 0.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
The rationale behind flood protected syslogging: sysadmins are usually only
interested in the point in time where some problems / incidents / etc have
\emph on
started
\emph default
.
They are usually not interested in capturing
\emph on
each
\emph default
and
\emph on
every
\emph default
single error message (in particular when they are flooding the system logs).
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
If you
\emph on
really
\emph default
need complete error information, use the
\family typewriter
*.log
\family default
files described above, compress them and save them to somewhere else
\emph on
regularly
\emph default
by a cron job.
This bears much less overhead than filtering via the syslog daemon, or
even remote syslogging in real time which will almost surely screw up your
system in case of network problems co-inciding with flood messages, such
as caused in turn by those problems.
Don't rely on real-time concepts, just do it the old-fashioned batch job
way.
\end_layout
\begin_layout Subsubsection
Tuning Verbosity of Logging
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
show_debug_messages
\family default
Boolean switch, 0 or 1.
Mostly useful only for kernel developers.
This can easily flood your logs if our are not careful.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
show_log_messages
\family default
Boolean switch, 0 or 1.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
show_connections
\family default
Boolean switch, 0 or 1.
Show detailed internal statistics on sockets.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
show_statistics_local
\begin_inset space ~
\end_inset
/
\begin_inset space ~
\end_inset
show_statistics_global
\family default
Only useful for kernel developers.
Shows some internal information on internal brick instances, memory usage,
etc.
\end_layout
\begin_layout Subsection
Tuning the Sync
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
sync_flip_interval_sec
\family default
(rw) The sync process must not run in parallel to logfile replay, in order
to easily guarantee consistency of your disk.
If logfile replay would be paused for the full duration of very large or
long-lasting syncs (which could take some days over very slow networks),
your
\family typewriter
/mars/
\family default
filesystem could overflow because no replay would be possible in the meantime.
Therefore, MARS regulary flips between actually syncing and actually replaying,
if both is enabled.
You can set the time interval for flipping here.
\begin_inset Newline newline
\end_inset
Increasing this value may improve overall sync throughput, at the cost of
some more space required by
\family typewriter
/mars
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
sync_limit
\family default
(rw) When > 0, this limits the maximum number of sync processes actually
running parallel.
This is useful if you have a large number of resources, and you don't want
to overload the network and/or your local IO system with too many sync
processes running
\emph on
in parallel
\emph default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
sync_nr
\family default
(ro) Passive indicator for the number of sync processes currently running.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
sync_want
\family default
(ro) Passive indicator for the number of sync processes which
\emph on
demand
\emph default
running.
\end_layout
\begin_layout Subsection
Lowlevel TCP Tuning (Networking Experts Only)
\begin_inset CommandInset label
LatexCommand label
name "subsec:TCP-Tuning"
\end_inset
\end_layout
\begin_layout Standard
When
\family typewriter
CONFIG_MARS_SEPARATE_PORTS
\family default
and
\family typewriter
CONFIG_MARS_IPv4_TOS
\family default
are enabled, MARS uses the following types of traffic:
\end_layout
\begin_layout Description
\family typewriter
MARS_TRAFFIC_META
\family default
(by default on port 7777 with
\family typewriter
IPTOS_LOWDELAY
\family default
) This can be tuned in directory
\family typewriter
/proc/sys/mars/tcp_tuning_0_meta_traffic/
\family default
.
\end_layout
\begin_layout Description
\family typewriter
MARS_TRAFFIC_REPLICATION
\family default
(by default on port 7778 with
\family typewriter
IPTOS_RELIABILITY
\family default
) This can be tuned in directory
\family typewriter
/proc/sys/mars/tcp_tuning_1_replication_traffic/
\family default
.
\end_layout
\begin_layout Description
\family typewriter
MARS_TRAFFIC_SYNC
\family default
(by default on port 7779 with
\family typewriter
IPTOS_MINCOST
\family default
) This can be tuned in directory
\family typewriter
/proc/sys/mars/tcp_tuning_2_sync_traffic/
\family default
.
Attention: since the advent of
\family typewriter
DSCP
\family default
, this bit (hex
\family typewriter
0x2
\family default
in host byte order) is suppressed by the kernel, and yields
\family typewriter
DS0
\family default
.
\end_layout
\begin_layout Standard
In each of these directories, the following tunables are available (only
for networking experts who know what they are doing):
\end_layout
\begin_layout Description
\family typewriter
ip_tos
\family default
As explained above.
Notice: hex constants from
\family typewriter
/usr/include/linux/ip.h
\family default
must be converted to decimal before forwarding to the
\family typewriter
/proc
\family default
interface.
\end_layout
\begin_layout Description
\family typewriter
tcp_window_size
\family default
Current default is 8 * 1024 * 1024.
\end_layout
\begin_layout Description
\family typewriter
tcp_nodelay
\family default
Current default is 0.
\end_layout
\begin_layout Description
\family typewriter
tcp_timeout
\family default
Current default is 2.
\end_layout
\begin_layout Description
\family typewriter
tcp_keepcnt
\family default
Current default is 3.
\end_layout
\begin_layout Description
\family typewriter
tcp_keepintvl
\family default
Current default is 3.
\end_layout
\begin_layout Description
\family typewriter
tcp_keepidle
\family default
Current default is 4.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Further tuning parameters are in the standard Linux kernel.
Notice that
\family typewriter
IP_TOS
\family default
is internally converted to
\family typewriter
DSCP
\family default
, which in turn can be further manipulated by
\family typewriter
netfilter
\family default
/
\family typewriter
iptables
\family default
and/or by
\family typewriter
qdisc
\family default
(
\family typewriter
tc
\family default
) and/or by further (external) networking components.
The ancient TOS settings are meant as a default
\emph on
starting point
\emph default
for further customization to your needs.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Typically,
\emph on
public
\emph default
internet transports are flattening / ignoring or otherwise manipulating
\begin_inset Foot
status open
\begin_layout Plain Layout
DSCP markings can be only made reliable on private networks (possibly requiring
some effort).
Public Internet service and transit providers do not necessarily treat
the TOS values or DSCP markings with any form of priority and may also
remove or change them without any notice.
Some internet service or transit providers also do use specific DSCP markings
to mark packets for being dropped, which may result in hard to find transmissio
n errors.
\end_layout
\begin_layout Plain Layout
If want to use MARS on a public internet connection, you should use
\series bold
encrypted
\series default
\series bold
VPN
\series default
with different DSCP markings, and coordinate them with your network services
provider.
\end_layout
\end_inset
the TOS / DSCP fields.
There it will not work.
Anyway, you should never route unencrypted MARS traffic over public transports,
for obvious security reasons.
Notice: MARS replication is meant for company-
\emph on
internal
\emph default
networks like
\emph on
internal
\emph default
\series bold
replication networks
\series default
(or storage networks) where some networking department has control of.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Playing with the above settings can easily tear down your whole (replication)
network if you don't know exactly what you are doing.
Please test any changes in the lab first.
Mass rollout should be done in incremental phases, each in power of 10
units.
There might be unexpected effects like packet storms, or packet loss, etc.
Some of these effects may only show up when a certain number of hosts is
exceeded, or when certain load conditions are hammering the overall Distributed
System.
Some very old routers / switches are known to break down unexpectedly when
overloaded in certain ways.
Be careful in a production environment!
\end_layout
\begin_layout Chapter
Advanced users: automation and the macro processor
\begin_inset CommandInset label
LatexCommand label
name "chap:Advanced-users:-automation"
\end_inset
\end_layout
\begin_layout Section
The
\family typewriter
systemd
\family default
Template Generator
\begin_inset CommandInset label
LatexCommand label
name "sec:systemd-Templates"
\end_inset
\end_layout
\begin_layout Standard
Starting with
\family typewriter
mars0.1astable
\family default
79 (much better with
\family typewriter
mars0.1astable119
\family default
), you may use
\family typewriter
systemd
\family default
as a cluster manager at the Mechanics Layer.
MARS will replicate any
\family typewriter
systemd
\family default
-relevant state information across the (big) cluster, achieving some remote
control.
In particular,
\series bold
automated handover
\series default
triggered by
\family typewriter
marsadm primary $resource
\family default
is supported.
More features are likely to be added to future releases.
\end_layout
\begin_layout Subsection
Why
\family typewriter
systemd
\family default
?
\begin_inset CommandInset label
LatexCommand label
name "subsec:Why-systemd?"
\end_inset
\end_layout
\begin_layout Standard
All major Linux distributions are now
\family typewriter
systemd
\family default
based.
It is the new quasi standard.
Although there have been some discussions in the OpenSource community about
its merits and its shortcomings, now it appears to be accepted in large
parts of the Linux world.
\end_layout
\begin_layout Standard
Systemd has a few advantages:
\end_layout
\begin_layout Enumerate
It is running as
\family typewriter
init
\family default
process under the reserved
\family typewriter
pid=1
\family default
.
If it ever would die, then your system as a whole would die.
There is no need for adding yet another MARS clustermanager daemon
\family typewriter
marsd
\family default
or similar, which could fail
\emph on
independently
\emph default
from other parts of the system.
\end_layout
\begin_layout Enumerate
Although
\family typewriter
systemd
\family default
has been criticised as being
\begin_inset Quotes eld
\end_inset
monolithic
\begin_inset Quotes erd
\end_inset
(referring to its internal software architecture), its
\emph on
usage
\emph default
by sysadmins is easily decomposable into many plugins called
\series bold
\emph on
units
\series default
\emph default
.
\end_layout
\begin_layout Enumerate
Local LXC containers, local VMs,
\family typewriter
iSCSI
\family default
exports,
\family typewriter
nfs
\family default
exports and many other parts of the system are often already controlled
by
\family typewriter
systemd
\family default
.
Together with
\family typewriter
udev
\family default
and other parts, it already controls devices, LVM, mountpoints, etc.
Since MARS is only a particular
\emph on
component
\emph default
in a bigger complicated stack, it is an advantage to use the same (more
or less standardized and well-integrated) tools for managing the whole
stack.
\end_layout
\begin_layout Enumerate
Personal experience: the
\series bold
unit dependency engine
\series default
of systemd is extremely elaborated
\begin_inset Foot
status open
\begin_layout Plain Layout
The author misses only one feature: a new dependency type, or an object
type like a
\begin_inset Quotes eld
\end_inset
semaphore
\begin_inset Quotes erd
\end_inset
or
\begin_inset Quotes eld
\end_inset
mutex
\begin_inset Quotes erd
\end_inset
for expressing
\begin_inset Quotes eld
\end_inset
mutual exclusion
\begin_inset Quotes erd
\end_inset
, without any other side effects as for example caused by
\family typewriter
Conflicts=
\family default
.
\end_layout
\end_inset
and useful.
Management of complex transitive dependencies is relatively easy (though
not always fully intuitive).
Writing your own dependency engine would be a huge effort, which can be
saved by just using standard systemd and learning how to configure it properly
for your applications.
\end_layout
\begin_layout Standard
In the opinion of the author, systemd has a few disadvantages, such as:
\end_layout
\begin_layout Enumerate
It is not
\series bold
accepted
\series default
everywhere.
Therefore the
\family typewriter
systemd
\family default
template extensions of
\family typewriter
marsadm
\family default
are
\emph on
not mandatory
\emph default
for MARS operations.
You can use or implement your own alternatives when necessary.
\end_layout
\begin_layout Enumerate
Interfacing to
\series bold
third-party software
\series default
may become hairy.
systemd appears to assume that more or less
\emph on
everything
\emph default
is controlled by systemd.
Pre-existing software would sometimes need to be adapted to systemd, but
this isn't always possible in practice.
For example,
\family typewriter
systemd-notify
\family default
assumes that you can alter some third-party-controlled executables or complex
third-party systems, which often isn't easily possible in practice
\begin_inset Foot
status open
\begin_layout Plain Layout
The problem is that
\family typewriter
systemd-notify
\family default
needs to be inserted into the
\emph on
control flow
\emph default
of your third-party software.
This doesn't work if your third-party software doesn't have the right hooks
in the right places, or when there exists no local control flow at some
(failure) conditions.
Therefore, any status inquiry would need to be configurable at systemd
units, not by any modifications of third-party software.
Unfortunately, the current systemd does not have appropriate features like
\family typewriter
ExecCheckState=/my/state-reporting-script.pl
\family default
or
\family typewriter
.py
\family default
or similar.
\end_layout
\end_inset
.
\end_layout
\begin_layout Enumerate
Sometimes it can be
\series bold
messy
\series default
to deal with.
In particular, it can sometimes
\emph on
believe
\emph default
that some parts of the system
\emph on
were
\emph default
in a particular state, although in reality they aren't.
The current version of systemd lacks an important property called
\series bold
Idempotence
\series default
\begin_inset Foot
status open
\begin_layout Plain Layout
In industrial automation and control, it is quite standard that you specify
the
\series bold
desired target state
\series default
, without having to obey the current state.
For example, if a big fan or a big pump is already running, or if a valve
is already open, there will be no error if somebody tries to
\begin_inset Quotes eld
\end_inset
start
\begin_inset Quotes erd
\end_inset
it (for whatever reason, or when induced from a higher level in the control
hierarchy).
Unfortunately,
\family typewriter
systemctl
\family default
often reports an error code if you try to start a unit when it is currently
running, or when it
\emph on
believes
\emph default
that it
\emph on
were
\emph default
already running (whether this is actually true or not).
\emph on
Sometimes
\emph default
, there is a
\emph on
workaround
\emph default
by first stopping, and then restarting, or similar.
However, this is clearly an
\series bold
absolute no-go
\series default
for HA where uptime and interruption-free service is often a MUST.
For humans who have worked in complex industry plants, it is easy to become
\emph on
desperate
\emph default
about this confusing (and sometimes
\begin_inset Quotes eld
\end_inset
\emph on
unpredictable
\emph default
\begin_inset Quotes erd
\end_inset
) behaviour of systemd, with no easy chance to compensate these deficiencies.
\end_layout
\end_inset
, which is more or less standard in industrial automation and control (e.g.
big industry plants).
Compensation via native systemd units and dependencies may become hairy,
if possible at all
\begin_inset Foot
status open
\begin_layout Plain Layout
According to
\family typewriter
man sd_notify
\family default
, there exists a clearly defined message type
\family typewriter
STOPPING=1
\family default
, but I cannot find a clearly defined and reliable equivalent of STOPPED=1
for reporting that the unit has actually completed the stopping, and that
now it is actually (re-)startable (again).
Notice that some third-party software needs some external preconditions
to be met before it can be started.
From the
\family typewriter
sd_notify
\family default
docs, it is unclear to me whether
\family typewriter
ERRNO=0
\family default
could be
\emph on
misused
\emph default
for such a report.
By reading some systemd sourcecode, I cannot easily tell, because the internal
state model of systemd appears to be extremely complex, and the message
passing model looks even more complex, like a huge finite state automaton
with additional non-trivial transitional conditions.
Semantically unspecified generic messages like STATUS=
\begin_inset Quotes erd
\end_inset
freetext_message
\begin_inset Quotes erd
\end_inset
cannot not help me for achieving a clearly defined and reliable behaviour.
\end_layout
\begin_layout Plain Layout
Notice that some third-party software does not use long-running daemons
at all, or only in certain places.
Then messages like
\family typewriter
MAINPID=
\family default
are not useful at all.
There exist use cases where
\series bold
dynamic polling of actual state
\series default
would be a very simple and easy solution in place of a complex state-keeping
/ state transition / message passing model, for example a new unit directive
like
\family typewriter
ExecCheckState=/my/state-reporting-script.pl
\family default
or
\family typewriter
.py
\family default
or similar.
\end_layout
\end_inset
.
MARS can workaround these shortcomings via a pseudo unit type
\family typewriter
.script
\family default
which allows you to directly call some (wrapper) scripts, or to write some
\series bold
adaptors
\series default
to third-party software.
\end_layout
\begin_layout Enumerate
\series bold
Usability
\series default
/ reporting: in my experience it is less usable for getting an overview
over a bigger local system, and less usable (out-of-the-box) for managing
a bigger cluster at cluster level.
Monitoring needs to be done separately.
\end_layout
\begin_layout Subsection
Execution Model of systemd and marsadm
\begin_inset CommandInset label
LatexCommand label
name "subsec:Execution-Model-systemd"
\end_inset
\end_layout
\begin_layout Standard
marsadm and systemd are playing together and communicating with each other
in the following way:
\end_layout
\begin_layout Standard
\noindent
\align center
\begin_inset Graphics
filename images/systemd-template-generation.fig
width 100col%
\end_inset
\end_layout
\begin_layout Standard
\noindent
Communication between marsadm to systemd is done in the following ways:
\end_layout
\begin_layout Itemize
by instanting a template residing in /etc/marsadm/systemd-templates (or
in another configurable location) and generating an instantiated unit into
/run/systemd/system/ as documented in
\family typewriter
man systemd.unit
\family default
.
The method from
\family typewriter
man systemd.generator
\family default
is currently not yet supported (but possibly in a future release).
\end_layout
\begin_layout Itemize
by replicating the following triggers across the mars cluster:
\end_layout
\begin_layout Itemize
by touching the cluster-global file
\family typewriter
/mars/userspace/systemd-trigger
\family default
which in turn is watched at each cluster members by the systemd unit
\family typewriter
mars-trigger.path
\family default
, which in turn activates
\family typewriter
mars-trigger.service
\family default
, which in turn executes
\family typewriter
ExecStart=/usr/bin/marsadm systemd-trigger-extern
\family default
everywhere in the cluster.
\end_layout
\begin_layout Itemize
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
sloppy
\end_layout
\end_inset
similarly for multiple per-resource triggers, by touching any of the resource-s
pecific trigger files
\family typewriter
/mars/resource-$res/systemd-trigger
\family default
which is turn is watched by systemd units
\family typewriter
mars-$res-trigger.path
\family default
at each resource member, which then in turn activates
\family typewriter
mars-$res-trigger.service
\family default
, which finally executes
\family typewriter
ExecStart=/usr/bin/marsadm systemd-trigger-extern $res
\family default
everywhere in the cluster.
\end_layout
\begin_layout Itemize
In turn,
\family typewriter
marsadm systemd-trigger-extern $res
\family default
will start or stop the units as configured via
\family typewriter
marsadm set-systemd-unit $res $start_unit_name $stop_unit_name
\family default
, as described later.
\end_layout
\begin_layout Standard
This architecture looks somewhat complicated, but it was found to be necessary
to assure lockless parallel starting and stopping of multiple resources
without conflicts.
Apparently, systemd is not a fully asynchronous system, while a Distributed
System (like the MARS replication) is always a fully asynchronous system
by its very nature.
The above triggers are used to translate from the fully asynchronous Distribute
d System to the less asynchronous systemd execution model.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Fortunately, you don't need to deal too much with these details if you take
the example templates from
\family typewriter
systemd-icpu/
\family default
and adapt them to your application (see section
\begin_inset CommandInset ref
LatexCommand nameref
reference "subsec:Example-systemd-Templates"
plural "false"
caps "false"
noprefix "false"
\end_inset
).
\end_layout
\begin_layout Subsection
Working Principle of the Template Generator for
\family typewriter
systemd
\family default
\begin_inset CommandInset label
LatexCommand label
name "subsec:Working-Principle-of"
\end_inset
\end_layout
\begin_layout Standard
systemd already has some basic templating capabilities.
It is possible to create unit names containing the
\family typewriter
@
\family default
symbol, which can then be expanded under certain circumstances, e.g.
to tty names etc.
However, automatic expansion is only done when somebody knows the instance
name already
\emph on
in advance
\emph default
.
The author has not found any way for creating instance names out of
\begin_inset Quotes eld
\end_inset
thin air
\begin_inset Quotes erd
\end_inset
, such as from dynamically created MARS resource names.
Essentially, an
\emph on
inference machine
\emph default
for systemd template names does not yet exist.
\end_layout
\begin_layout Standard
This lacking functionality is completed with the following macro processing
capabilities of
\family typewriter
marsadm
\family default
(see section
\begin_inset CommandInset ref
LatexCommand vref
reference "sec:The-macro-processor"
plural "false"
caps "false"
noprefix "false"
\end_inset
):
\end_layout
\begin_layout Standard
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
sloppy
\end_layout
\end_inset
Some ordinary or templated
\family typewriter
systemd
\family default
unit files (see
\family typewriter
man systemd.unit
\family default
) can be installed into one of the following directories:
\family typewriter
./systemd-templates
\family default
,
\family typewriter
$HOME/.marsadm/systemd-templates/
\family default
,
\family typewriter
/etc/marsadm/systemd-templates/
\family default
,
\family typewriter
/usr/lib/marsadm/systemd-templates/
\family default
,
\family typewriter
/usr/local/lib/marsadm/systemd-templates/
\family default
.
Futher places can be defined by overriding the $
\family typewriter
MARS_PATH
\family default
environment variable.
\end_layout
\begin_layout Standard
From these directories, ordinary systemd unit files will be just copied
into
\family typewriter
/run/systemd/system/
\family default
(configurable via
\family typewriter
$SYSTEMD_TARGET_DIR
\family default
) and then picked up by
\family typewriter
systemd
\family default
as ordinary unit files.
\end_layout
\begin_layout Standard
Template unit files are nothing but unit files, optionally containing
\family typewriter
@{
\emph on
varname
\emph default
}
\family default
or
\family typewriter
@escvar{
\emph on
varname
\emph default
}
\family default
parts or other macro definitions in their filename, and possibly also in
their bodies, at arbitrary places.
These
\family typewriter
@{...}
\family default
parts are substituted by the
\family typewriter
marsadm
\family default
macro processing engine.
\end_layout
\begin_layout Standard
The following macro capabilities are currently defined:
\end_layout
\begin_layout Description
\family typewriter
@{
\emph on
varname
\emph default
}
\family default
Expands to the value of the variable.
This can be used both in template filenames and and in content of template
files.
Predefined are the following variables:
\end_layout
\begin_deeper
\begin_layout Description
\family typewriter
@{res}
\family default
The MARS resource name.
\end_layout
\begin_layout Description
\family typewriter
@{resdir}
\family default
The MARS resource directory
\family typewriter
/mars/resource-$res/
\family default
.
\end_layout
\begin_layout Description
\family typewriter
@{host}
\family default
The local host name as determined by
\family typewriter
marsadm
\family default
, or as overridden by the
\family typewriter
--host=
\family default
parameter.
\end_layout
\begin_layout Description
\family typewriter
@{cmd}
\family default
The
\family typewriter
marsadm
\family default
command as given on the command line (only reasonable for debugging or
for error messages).
\end_layout
\begin_layout Description
\family typewriter
@{
\emph on
varname
\emph default
}
\family default
Further variables as defined by the macro processor, see section
\begin_inset CommandInset ref
LatexCommand vref
reference "par:Predefined-Variables"
\end_inset
, and as definable by
\family typewriter
%let{
\emph on
varname
\emph default
}{...}
\family default
statements, see also section
\begin_inset CommandInset ref
LatexCommand vref
reference "subsec:Predefined-Trivial-Macros"
\end_inset
.
\end_layout
\end_deeper
\begin_layout Description
\family typewriter
@eval{
\emph on
text
\emph default
}
\family default
Calls the MARS macro processor as explained in section
\begin_inset CommandInset ref
LatexCommand vref
reference "sec:The-macro-processor"
plural "false"
caps "false"
noprefix "false"
\end_inset
, and substitutes its output.
Notice that systemd template variables occurring in the macro processor
\family typewriter
\emph on
text
\family default
\emph default
must be accessed via the macro processor syntax
\family typewriter
%{varname}
\family default
, because the macro processor uses
\family typewriter
%
\family default
as an escape symbol, while the systemd template engine uses
\family typewriter
@
\family default
instead.
This is necessary for distinction of both layers.
Notice that variables defined via the macro processor syntax
\family typewriter
%let{varname}{value}
\family default
can be afterwards accessed by the template engine via
\family typewriter
@{varname}
\family default
syntax, once the macro engine has finished working on
\family typewriter
\emph on
text
\family default
\emph default
.
\end_layout
\begin_layout Description
\family typewriter
^
\emph on
{varname
\emph default
}
\family default
This is a matching operator, binding a string to a variable.
It can be used in template filenames
\emph on
only
\emph default
.
First, any
\family typewriter
@{
\emph on
othername
\emph default
}
\family default
are substituted.
Finally, any
\family typewriter
^
\emph on
{varname
\emph default
}
\family default
are matched against the actual filename like a shell wildcard
\family typewriter
*
\family default
.
The matching part of the filename is assigned to
\family typewriter
\emph on
varname
\family default
\emph default
, and can be later used at
\family typewriter
@{
\emph on
varname
\emph default
}
\family default
substitutions occurring in the
\emph on
content
\emph default
of the file.
\end_layout
\begin_layout Description
\family typewriter
@esc{
\emph on
text
\emph default
}
\family default
Calls the
\family typewriter
systemd-escape
\family default
tool for conversion of pathnames following the
\family typewriter
systemd
\family default
naming conventions (see
\family typewriter
man systemd-escape
\family default
).
For example, a dash is converted to
\family typewriter
\backslash
x2d
\family default
.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Omission of
\family typewriter
systemd-escape
\family default
can lead to problems when your resource names are containing special characters
like dashes or other special symbols (in the sense of
\family typewriter
systemd
\family default
).
Bugs of this kind are hard to find and to debug.
Either forbid special characters in your installation, or don't forget
to test everything with some crude resource names!
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Example snippet from a
\family typewriter
.path
\family default
unit.
Please notice where escaping is needed and where it must not be used (also
notice that a dash is sometimes a legal part of the
\family typewriter
.mount
\family default
unit name, but except from the resource name part):
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
[Path]
\end_layout
\begin_layout Plain Layout
PathExists=/dev/mars/@{res}
\end_layout
\begin_layout Plain Layout
Unit=vol-@escvar{res}.mount
\end_layout
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Another source of crude bugs is the backslash character in the
\family typewriter
systemd-escape
\family default
substitution, such as from
\family typewriter
\backslash
x2d
\family default
.
When passed to a shell, such as in certain
\family typewriter
ExecStart=
\family default
statements like
\family typewriter
/bin/bash -c
\series bold
$args
\family default
\series default
, the backslash will be removed.
Therefore, don't forget to either replace any single backslash with two
backslashes, or to put the whole pathname in single quotes, or similar.
Always check the result of your substitutions! It depends on the
\emph on
target
\emph default
(such as
\family typewriter
bash
\family default
, as opposed to
\family typewriter
systemd
\family default
) whether further escaping of the escapes is needed, or whether it
\emph on
must not
\emph default
be applied.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Become a master of the escaping hell by inserting debug code into your scripts
(reporting to
\family typewriter
/dev/stderr
\family default
or to log files) and do thorough testing like a devil.
\end_layout
\begin_layout Description
\family typewriter
@escvar{
\emph on
varname
\emph default
}
\family default
Equivalent to
\family typewriter
@esc{@{
\emph on
varname
\emph default
}}
\family default
.
This is often used in template filenames to ensure that MARS resource names
containing special symbols like dashes, are properly converted to systemd
naming conventions where a dash has a different pre-defined meaning.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
When creating a new resource via
\family typewriter
marsadm create-resource
\family default
, or when adding a new replica via
\family typewriter
marsadm join-resource
\family default
or similar, the template system will automatically create new instances
for the new resource or its replicas.
Conversely,
\family typewriter
marsadm leave-resource
\family default
and its friends like
\family typewriter
delete-resource
\family default
etc will automatically remove the corresponding template instances from
\family typewriter
/run/systemd/system/
\family default
.
\end_layout
\begin_layout Subsection
Template Markers
\begin_inset CommandInset label
LatexCommand label
name "subsec:Template-Markers"
\end_inset
\end_layout
\begin_layout Standard
Starting with
\family typewriter
mars0.1astable119
\family default
, you may use some special markers in comments of systemd templates.
These comments are ignored by systemd, but interpreted by the marsadm template
engine.
The marker syntax is somewhat stricter than in usual comments:
\end_layout
\begin_layout Quote
Exactly one hash symbol exactly at the start of the line, optionally followed
by whitespace, followed by the marker in CAPITAL letters.
\end_layout
\begin_layout Standard
The requirement of exactly one hash symbol allows you to comment out markers
by using two hash symbols or more.
Here is a table of markers and their meaning:
\end_layout
\begin_layout Standard
\begin_inset Tabular
\begin_inset Text
\begin_layout Plain Layout
Marker
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
Meaning
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
# ALWAYS_DISABLED
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
The unit instance will be generated, but neither enabled nor started by
marsadm (except when exclicitly using it as an argument to
\family typewriter
set-systemd-unit
\family default
).
Useful for generation of units you want to control by some other tools.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
# ALWAYS_START
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
This is the opposite of ALWAYS_DISABLED: this unit will always be enabled
and started, regardless what
\family typewriter
marsadm get-systemd-want
\family default
is telling you.
If it is no longer in use after leave-resource, only then it will be stopped.
Useful for permanent tasks such as
\family typewriter
.path
\family default
path watcher units, etc.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
# KEEP_RUNNING
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
This unit will always be enabled and started.
If the unit is no longer in use after leave-resource, it will be only be
disabled (protection against accidental restart), but otherwise stay untouched
by marsadm.
In particular, it will
\emph on
not
\emph default
be stopped if it is currently running.
Useful for important HA-like services which need to be controlled by another
means.
Also useful for
\emph on
global
\emph default
units which are independent from any resources.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
# ${NAME}_START
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
This can be used for simplification of the
\family typewriter
set-systemd-unit
\family default
command.
In place of providing a full template name with all of its escape characters
and all of its risky typos, simply say
\family typewriter
marsadm set-systemd-unit mydata DEFAULT
\family default
.
This will search for templates marked with DEFAULT_START and DEFAULT_STOP,
and use the corresponding
\family typewriter
@escvar{res}
\family default
substitutions for starting and stopping.
\end_layout
\begin_layout Plain Layout
HINT: by inventing other marker ${NAME}s, you may ease discrimination of
multiple operation modes.
\end_layout
\begin_layout Plain Layout
Notice:
\family typewriter
^{...}
\family default
pattern matching is currently NYI, only
\family typewriter
@{res}
\family default
and variants like
\family typewriter
@escvar{res}
\family default
are currently implemented.
\end_layout
\end_inset
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
# ${NAME}_STOP
\end_layout
\end_inset
|
\begin_inset Text
\begin_layout Plain Layout
\begin_inset Box Frameless
position "t"
hor_pos "c"
has_inner_box 1
inner_pos "t"
use_parbox 0
use_makebox 0
width "60col%"
special "none"
height "1in"
height_special "totalheight"
thickness "0.4pt"
separation "3pt"
shadowsize "4pt"
framecolor "black"
backgroundcolor "none"
status open
\begin_layout Plain Layout
See description of # ${NAME}_START.
\end_layout
\end_inset
\end_layout
\end_inset
|
\end_inset
\end_layout
\begin_layout Subsection
Special
\family typewriter
.script
\family default
Pseudo Units
\begin_inset CommandInset label
LatexCommand label
name "subsec:Special-.script-Pseudo"
\end_inset
\end_layout
\begin_layout Paragraph
Howto use .script
\end_layout
\begin_layout Standard
When a template name ends in
\family typewriter
.script
\family default
and has execute permissions, the marsadm template generator will write
the instantiated script (with all
\family typewriter
@{...}
\family default
variables substituted) into the directory
\family typewriter
/etc/marsadm/systemd-generated/
\family default
directory in place of
\family typewriter
/run/systemd/systemd/
\family default
.
\end_layout
\begin_layout Standard
In place of
\family typewriter
systemctl start $unit
\family default
, the script
\family typewriter
/etc/marsadm/systemd-generated/$unit.script start
\family default
is called with single parameter
\family typewriter
start
\family default
, and similarly for
\family typewriter
stop
\family default
.
\end_layout
\begin_layout Standard
This way, the author found it easy to program idempotent scripts, like adaptors
to third-party software.
\end_layout
\begin_layout Paragraph
Motivation for .script
\end_layout
\begin_layout Standard
The author has spent a lot of time (several months) for getting standard
systemd units to work in a fully asynchronous Distributed System consisting
of hundreds of machines, where
\emph on
any
\emph default
type of event may appear at
\emph on
any
\emph default
time.
\end_layout
\begin_layout Standard
Although this big effort resulted in a somewhat working system, the result
is was not fully HA.
\end_layout
\begin_layout Standard
Notice that HA is defined by a single number like 99.99% (see mars-architecture-g
uide.pdf).
In practice, true HA
\emph on
typically
\emph default
means that the
\emph on
total system
\emph default
, including its controlling components, must be
\series bold
more reliable
\series default
than (some or any) of its worker sub-components.
Notice that systemd is one one of these components.
\end_layout
\begin_layout Standard
The problem with systemd was that it created failures on its own.
Compensation of these failures became very hairy with the current version,
as used for the experiments (Debian Buster).
\end_layout
\begin_layout Standard
Apparently, systemd does not tolerate certain types of parallelism.
For example, while
\family typewriter
systemd daemon-reload
\family default
is currently executing, a parallel
\family typewriter
systemctl start $other_unit
\family default
may fail, although it normally works without problems.
\end_layout
\begin_layout Standard
Even more unfortunate, sometimes systemd did no longer know the
\emph on
actual state
\emph default
of a unit, as the following example output snippet from
\family typewriter
systemctl status mnt-test-lv
\backslash
x2d0.mount
\family default
is demonstrating:
\end_layout
\begin_layout Standard
\family typewriter
\size scriptsize
Dec 24 17:00:48 c1 systemd[1]: Mounting MARS TESTING local mount on /mnt/test/lv
-0...
\end_layout
\begin_layout Standard
\family typewriter
\size scriptsize
Dec 24 17:00:58 c1 systemd[1]: mnt-test-lv
\backslash
x2d0.mount: Mount process finished, but there is no mount.
\end_layout
\begin_layout Standard
\family typewriter
\size scriptsize
Dec 24 17:00:58 c1 systemd[1]: mnt-test-lv
\backslash
x2d0.mount: Failed with result 'protocol'.
\end_layout
\begin_layout Standard
\family typewriter
\size scriptsize
Dec 24 17:00:58 c1 systemd[1]: Failed to mount MARS TESTING local mount
on /mnt/test/lv-0.
\end_layout
\begin_layout Standard
This failure report was wrong, because the mount had actually succeeded
in reality, but systemd wrongly assumed the opposite.
Neither
\family typewriter
start
\family default
nor
\family typewriter
stop
\family default
was possible afterwards, even after
\family typewriter
systemctl reset-failed
\family default
.
\end_layout
\begin_layout Standard
Possibly this may be a bug, which could be fixed.
However, HA systems are expected to even work in the presence of bugs,
as best as possible.
\end_layout
\begin_layout Standard
If you ever encounter a similar problem, you may get stuck in a dead end,
at least for a while.
Apparently, systemd is repairing the state of failed mount units after
some timeout, but in the meantime true HA with many nines is endangered.
Other unit types appear to show similar failure behaviour.
\end_layout
\begin_layout Standard
What is the reason for this behaviour?
\end_layout
\begin_layout Standard
The author is no systemd expert
\begin_inset Foot
status open
\begin_layout Plain Layout
The author might have overlooked further possibilities for solutions.
This rises the question how the
\series bold
usability
\series default
of systemd could be improved.
\end_layout
\end_inset
, but here is an
\emph on
attempt
\emph default
to analyze the problems at
\emph on
concept level
\emph default
, and to suggest some solutions.
\end_layout
\begin_layout Standard
The following may be of interest for systemd developers, and for very advanced
users of systemd.
All others may skip the rest of this paragraph, and just use the
\family typewriter
.script
\family default
workaround as explained before.
\end_layout
\begin_layout Standard
From observation, and from
\family typewriter
man systemctl
\family default
it appears to me that a
\family typewriter
systemctl
\family default
command invocation (aka job) is not fully equivalent to an
\family typewriter
ExecStart=
\family default
directive.
According to the docs,
\family typewriter
Exec=
\family default
and some sister directives are obeying dependencies to any queued or already
running jobs.
However, I found no obvious way for obeying dependencies when starting
jobs via
\family typewriter
systemctl
\family default
commands
\emph on
manually
\emph default
.
There is an option
\family typewriter
--job-mode=
\family default
which defaults to the value
\family typewriter
replace
\family default
, documenting the bad behaviour I have observed: it may
\series bold
\emph on
disturb
\series default
\emph default
a currently running or conflicting job.
\end_layout
\begin_layout Standard
In worst case, the conflicting unit may fail
\begin_inset Quotes eld
\end_inset
unexpectedly
\begin_inset Quotes erd
\end_inset
from a user's viewpoint due to the default
\family typewriter
--job-mode=replace
\family default
, and I have observed cases where it was neither startable nor stoppable
immediately afterwards (maybe this could depend on further properties of
called
\family typewriter
Exec=
\family default
scripts, which may stem from a third party, and are not constructed for
being called by systemd: eventually I got desperate after investing a lot
of time).
\end_layout
\begin_layout Standard
Conclusions: there appear multiple non-trivial HA problems with the current
version of systemd.
While some of them may be bugs which could be fixed, others appear to reside
at
\emph on
concept level
\emph default
:
\end_layout
\begin_layout Enumerate
Jobs seem to be
\emph on
uniquely identified
\emph default
by unit names.
Thus it is not possible to
\emph on
address
\emph default
multiple different jobs belonging to the
\emph on
same
\emph default
unit.
\begin_inset Newline newline
\end_inset
An example:
\family typewriter
systemctl start unitA
\family default
is currently running, taking a long time to execute.
During this, another command
\family typewriter
systemctl stop unitA
\family default
is started
\emph on
in parallel
\emph default
(e.g.
from another commandline shell).
According to the documented default behaviour
\family typewriter
--job-mode=replace
\family default
, the old job may be
\emph on
interrupted
\emph default
in favour of the new one.
However, interruption of a job may be interpreted as a job failure, possibly
leading to state
\family typewriter
failed
\family default
.
However, a failed unit can no longer be stopped, it seems to be treated
like if it were
\emph on
already stopped
\emph default
.
It is possible to reset a failed unit via
\family typewriter
systemctl reset-failed unitA
\family default
, but then I found that it is also treated as if it were already stopped,
such that
\family typewriter
systemctl stop unitA
\family default
just reports
\begin_inset Quotes eld
\end_inset
success
\begin_inset Quotes erd
\end_inset
without doing anything.
This may lead to
\emph on
serious
\emph default
problems in a HA world.
\begin_inset Newline newline
\end_inset
An example: unitA was executing a script
\family typewriter
scriptA.sh
\family default
in oneshot mode.
Unit failure typically meant that the script was killed by a signal.
Even if
\family typewriter
scriptA.sh
\family default
had a signal handler doing proper application cleanup, and even if there
were no final SIGKILL which eventually killed the running signal handler,
the
\emph on
application
\emph default
may get
\emph on
stuck
\emph default
in some
\series bold
undefined application state
\series default
.
But afterwards, one is unable to queue a stop job for cleanup
\begin_inset Foot
status open
\begin_layout Plain Layout
Possibly, a new directive
\family typewriter
ExecCleanup=
\family default
could help.
However, this could mean that a new command variant
\family typewriter
systemctl cleanup unitA
\family default
would need to be introduced.
This would complicate the user interface.
Instead, the author would prefer Idempotence, because Idempotences allows
to use
\family typewriter
systemctl stop unitA
\family default
for cleanup.
This results in a much simpler end-user interface.
\end_layout
\end_inset
, as explained before.
Notice that queuing a start job in place of a cleanup job is no option
in general, at least in a HA world.
\begin_inset Newline newline
\end_inset
According to the docs, there exists no
\family typewriter
--job-mode=append
\family default
or similar option, which would just queue / delay
\emph on
any
\emph default
new job for
\emph on
any
\emph default
unit, until all conflicting previous jobs are gone.
Notice that this would be always mathematically possible (e.g.
resulting in a strictly sequential job order).
An implementation should be technically possible, but currently it seems
not implemented in systemd according to the docs.
This lack of full dependency awareness for entering new jobs causes numerous
other problems, not only the previously described ones.
\begin_inset Newline newline
\end_inset
Possibly (the author has checked
\begin_inset Foot
status open
\begin_layout Plain Layout
The documentation
\family typewriter
man systemd
\family default
explains a subtle difference.
The conflicts causing
\family typewriter
--job-mode=fail
\family default
to fail seem to be different from general conflicts in unit dependencies.
Although not precisely documented, the observed behaviour luckily appears
to make HA more likely.
There remains some uncertainity caused by the documented failure possibility.
A new option called
\family typewriter
--job-mode=append
\family default
or
\family typewriter
--job-mode=wait
\family default
could resolve this, for example by resulting in strict sequential operations
in place of
\begin_inset Quotes eld
\end_inset
unnecessary
\begin_inset Quotes erd
\end_inset
failures.
\end_layout
\end_inset
, which resulted in some behavioural improvements) the
\family typewriter
--job-mode=fail
\family default
option can be used for a self-programmed busy-wait submission loop, in
order to
\emph on
approach
\emph default
(but not to
\emph on
guarantee
\emph default
in HA sense) disturbance-free addition of new systemctl jobs obeying all
specified dependencies, and without causing side effects on already queued
/ running jobs.
However, this trick did not always help in the presence of the above mount
unit failure example, triggered by
\emph on
transitive
\emph default
dependencies.
Another remaining problem is the exit code: there is no documented difference
showing the
\emph on
reason
\emph default
of the failure.
Was it a conflict with another queued job caused by
\family typewriter
--job-mode=fail
\family default
, or did the unit
\emph on
itself
\emph default
fail?
\end_layout
\begin_layout Enumerate
Not only in the presence of multiple jobs for the same unit (possibly submitted
in parallel to each other), query operations like
\family typewriter
systemctl is-active unitA
\family default
(or
\family typewriter
is-failed
\family default
etc) are prone to races.
A potential future solution could be externally visible job IDs for identifying
jobs.
Similar concepts are for example used in printer job spoolers for decades.
Of course, information about terminated jobs have to be kept for some time,
or until some maximum job entries are exhausted.
In addition, true asynchronous invocation via
\family typewriter
--no-block
\family default
and later polling the job ID would also become possible.
\end_layout
\begin_layout Enumerate
Systemd lacks an important property called Idempotence.
Idempotence is a very common feature in big industry plants, where hundreds
of human workers may act on controlling hundrets of facilities.
Each alarm call may cause a different person to try to
\begin_inset Quotes eld
\end_inset
fix
\begin_inset Quotes erd
\end_inset
a problem.
Idempotence is a
\emph on
must
\emph default
in such an industry environment.
Idempotence means that
\begin_inset Quotes eld
\end_inset
start
\begin_inset Quotes erd
\end_inset
and
\begin_inset Quotes eld
\end_inset
stop
\begin_inset Quotes erd
\end_inset
are always working when possible at all,
\series bold
regardless of the previous state
\series default
of the
\emph on
machinery
\emph default
(
\emph on
not
\emph default
of some
\emph on
software
\emph default
state).
For operations stuff, there is no need to obey any previous state.
When pressing a
\begin_inset Quotes eld
\end_inset
start
\begin_inset Quotes erd
\end_inset
button, it means
\begin_inset Quotes eld
\end_inset
ensure that the machine including all of of its sub-components will be running
\begin_inset Quotes erd
\end_inset
, regardless whether it was running before, or not, or only half-running,
or only an arbitrary subset of sub-components was running before.
So the button press does not declare an operation, it declares a
\series bold
target state
\series default
.
\begin_inset Newline newline
\end_inset
It is the task of the Idempotence controller software to ensure that the
target state is being reached
\emph on
somehow
\emph default
.
This does not specify a particular way for reaching the target state.
In general, there might be multiple ways.
Very sophisticated controller software may even try multiple ways, until
one of them succeeds in reaching the specified target state.
\end_layout
\begin_layout Standard
A future Idempotence feature of systemd could be implemented as follows:
\end_layout
\begin_layout Enumerate
In the unit file, an option for declaration of the Idempotence property
could be added.
Backwards compatibility: the semantics of conventional non-idempotent units
should not be changed unless idempotence is declared explicitly.
\end_layout
\begin_layout Enumerate
When Idempotence is declared,
\family typewriter
systemctl start
\family default
or
\family typewriter
systemctl stop
\family default
will
\emph on
always
\emph default
execute a start/stop job somewhen later, obeying all dependencies.
Optionally, this could also mean that in
\emph on
worst case
\emph default
all conflicting previous jobs might need to terminate first.
More sophisticated variants might provide mechanisms for
\series bold
controlled abortion
\series default
of startup operations, provided that they usually do not lead to failure
at all.
Care must be taken that failures caused by aborts will not occur too frequently
for HA.
When failures caused by aborts are occuring too frequently, the concept
of abort should be disabled.
\end_layout
\begin_layout Enumerate
When
\family typewriter
ExecStart=
\family default
or
\family typewriter
ExecStop=
\family default
is declared in an Idempotent unit, the script will be
\emph on
always
\emph default
executed, regardess of the previous internal systemd state of the unit.
It is up to the script writer to ensure idempotence at his/her script code.
This means, the
\emph on
script
\emph default
has to approach the application's target state independently from the previous
application state, and has to report in its exit code whether the
\emph on
target state
\emph default
has been actually reached.
\end_layout
\begin_layout Enumerate
A very helpful addition to
\emph on
any
\emph default
systemd unit (not only to Idempotent ones) would be a new directive
\family typewriter
ExecCheck=
\family default
.
In place of keeping a copy of the application state inside of systemd,
it would allow to directly
\series bold
poll
\series default
the actual
\emph on
application
\emph default
state via callback, whenever it becomes necessary.
The user could provide a state-checking script which has no side effects,
other than querying the actual state of the application.
This feature would be extremely helpful for turning
\emph on
any
\emph default
conventional unit into an idempotent one, likely without need for changing
anything else (e.g.
in third-party software, even when it lacks idempotence).
Only when actual state checking is available and when it does not fail,
Idempotent units may be allowed to skip the execution of other
\family typewriter
ExecStartOrStop=
\family default
actions.
\end_layout
\begin_layout Standard
In ideal case,
\family typewriter
ExecCheck=
\family default
or another measure for achieving true HA idempotence might make the above
\family typewriter
*.script
\family default
workaround superfluous.
\end_layout
\begin_layout Subsection
Example
\family typewriter
systemd
\family default
Templates
\begin_inset CommandInset label
LatexCommand label
name "subsec:Example-systemd-Templates"
\end_inset
\end_layout
\begin_layout Standard
These can be found in the MARS repo in the
\family typewriter
systemd-testing/
\family default
and the
\family typewriter
systemd-icpu/
\family default
subdirectories.
Until systemd is supporting idempotence natively, any newbee is advised
to take one of the examples
\family typewriter
systemd-testing/mnt-test-@escvar{res}-testload.script
\family default
and
\family typewriter
systemd-icpu/nodeagent-@escvar{res}.script
\family default
as a basis for own modifications.
\end_layout
\begin_layout Standard
At the moment, the following templates are available (subject to further
extension and improvements without notice):
\end_layout
\begin_layout Description
\family typewriter
daemon-reload.service
\family default
A helper unit which ensures that
\family typewriter
systemctl daemon-reload
\family default
is not triggered in parallel to itself.
It also reduces the risk for parallel execution with some other units,
but unfortunately cannot provide full mutual exclusion with everything
else.
Hopefully a future version of systemd will allow specification of full
mutual exclusion.
\end_layout
\begin_layout Description
\family typewriter
mars.path
\family default
This ensures that the mountpoint
\family typewriter
/mars/
\family default
is already mounted before
\family typewriter
mars.service
\family default
is started.
\end_layout
\begin_layout Description
\family typewriter
mars.service
\family default
This starts and stops the MARS kernel module, provided that
\family typewriter
/mars
\family default
is (somehow) mounted.
The latter can be ensured by classical
\family typewriter
/etc/fstab
\family default
methods, or by
\family typewriter
.mount
\family default
units like your own hand-crafted
\family typewriter
mars.mount
\family default
unit.
\end_layout
\begin_layout Description
\family typewriter
mars-trigger.path
\family default
This is used for remote triggering of the marsadm template engine from
another MARS cluster member, e.g.
when executing
\family typewriter
marsadm join-resource
\family default
or
\family typewriter
leave-resource
\family default
or
\family typewriter
set-systemd-unit
\family default
.
Local triggering is also possible via
\family typewriter
touch /mars/userspace/systemd-trigger
\family default
.
When triggered, the command
\family typewriter
marsadm systemd-trigger-extern
\family default
(without
\family typewriter
--force
\family default
) will be executed.
In turn, this will re-compute all
\family typewriter
systemd
\family default
templates when necessary.
\end_layout
\begin_layout Description
\family typewriter
mars-trigger.service
\family default
An intermediate helper unit, sitting inbetween
\family typewriter
mars-trigger.path
\family default
and
\family typewriter
marsadm systemd-trigger-extern
\family default
.
It also ensures that the marsadm command is never called in parallel to
itself.
\end_layout
\begin_layout Description
\family typewriter
mnt-test-@escvar{res}.path
\family default
This path unit is used for generic triggering of any
\family typewriter
resource-specific systemd
\family default
unit as set by
\family typewriter
marsadm set-systemd-unit $res $unit
\family default
(see below in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Handover-using-systemd"
\end_inset
).
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Pitfall: systemd's path unit watchers are based on the
\family typewriter
inotify
\family default
infrastructure of the kernel.
By default, many kernels are configured to a rather low number of inotify
watches.
When using more than 20 MARS resources, or when userspace also consumes
inotify watches, some of the path watches may not start up (typical
\family typewriter
systemctl status
\family default
messages are hinting at
\begin_inset Quotes eld
\end_inset
resource
\begin_inset Quotes erd
\end_inset
or similar).
You may need some kernel tweaks, such as
\family typewriter
echo 4096 > /proc/sys/fs/inotify/max_user_instances
\family default
and/or relatives.
\end_layout
\begin_layout Description
\family typewriter
mnt-test-@escvar{res}.service
\family default
Similarly to
\family typewriter
mars-trigger.service
\family default
, this sits inbetween the per-resource trigger and the executed command
\family typewriter
marsadm systemd-trigger-extern @{res}
\family default
, which in turn either calls
\family typewriter
systemctl
\family default
for actually starting / stopping the per-resource units, or in turn it
directly calls any
\family typewriter
.script
\family default
workaround.
See the overview picture in section
\begin_inset CommandInset ref
LatexCommand nameref
reference "subsec:Execution-Model-systemd"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Description
\family typewriter
\series bold
mnt-test-@escvar{res}-testload.script
\family default
\series default
This is an academic example for testing and for inspection, not intended
for production.
It shows the currently recommended script workaround for achieving idempotence.
Fully automatic activation / deactivation of this target during handover
via
\family typewriter
marsadm primary $res
\family default
can be configured via one of the following commands:
\family typewriter
marsadm set-systemd-unit mydata DEFAULT
\family default
or by the long form
\family typewriter
marsadm set-systemd-unit mydata mnt-test-mydata.script.
\begin_inset Newline newline
\end_inset
\family default
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Note that the
\emph on
previous
\emph default
\family typewriter
*trigger*{path,service}
\family default
native units remain necessary for getting
\family typewriter
*.script
\family default
to work.
Any potential races in
\emph on
their
\emph default
activation are automatically healed by idempotent re-triggering of this
.script workaround.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
The following native templates might be used in place of this workaround,
but I have to warn that the following native systemd units are not fully
passing various stress tests, while the corresponding .script workaround
has passed them.
\end_layout
\begin_layout Description
\family typewriter
mnt-test-@escvar{res}.mount
\family default
\begin_inset space ~
\end_inset
or
\begin_inset space ~
\end_inset
\family typewriter
^{mntname}-@escvar{res}.mount
\family default
This is one of the possible native systemd execution targets configurable
by
\family typewriter
marsadm set-systemd-unit
\family default
.
For fully automatic activation / deactivation of this alternative target
during handover via
\family typewriter
marsadm primary $res
\family default
, you can configure a very basic test with something like
\family typewriter
marsadm set-systemd-unit mydata vol-mydata.mount
\family default
or similar.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Notice: the template notation
\family typewriter
^{mntname}
\family default
can be used for mounting to an
\emph on
arbitrary
\emph default
mountpoint, such as
\family typewriter
/another/mountdir/mydata
\family default
, by using the corresponding systemd template syntax in
\family typewriter
marsadm set-systemd-unit mydata another-mountdir-mydata.mount
\family default
.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Look into the template file
\family typewriter
^{mntname}-@escvar{res}.mount
\family default
.
In the first line, there is the following macro call:
\begin_inset Newline newline
\end_inset
\family typewriter
@eval{%let{mntpath}{%subst{%{mntname}}{-}{/}}}
\family default
\begin_inset Newline newline
\end_inset
This is a trick for conversion of any systemd template name
\family typewriter
mntname
\family default
into into an ordinary filesystem pathname
\family typewriter
mntpath
\family default
.
While subdirectories in a path are separated by slashes, the systemd unit
naming conventions (as required by systemd) are using dashes in place of
slashes.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Do not confuse
\family typewriter
@{mntname}
\family default
with
\family typewriter
@{mntpath}
\family default
.
Depending on the
\emph on
type
\emph default
of argument to be substituted, you may need either systemd unit naming
conventions, or classical Unix pathname conventions.
\end_layout
\begin_layout Description
\family typewriter
mnt-test-@escvar{res}-testload.service
\family default
This is an academic example for testing and for inspection, not intended
for production.
Here you can see in comments how a
\series bold
transitive dependency chain
\series default
could be configured.
In its body, this template contains a
\family typewriter
BindsTo=
\family default
plus
\family typewriter
After=
\family default
reference to another template
\family typewriter
^{mntname}-@escvar{res}-delay.service
\family default
, which in turn contains a
\family typewriter
BindsTo=
\family default
plus
\family typewriter
After=
\family default
reference to
\family typewriter
mnt-test-@escvar{res}.mount
\family default
.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Do not confuse
\family typewriter
Requires=
\family default
with
\family typewriter
BindsTo=
\family default
(see
\family typewriter
man systemd.unit
\family default
).
If you want to automatically stop your
\emph on
entire
\emph default
unit stack via a
\emph on
single
\emph default
command
\family typewriter
systemctl stop vol-mydata.mount
\family default
, then you most likely need the stronger
\family typewriter
BindsTo=
\family default
directive plus
\family typewriter
After=
\family default
in place of weaker ones like
\family typewriter
Requires=
\family default
or similar.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
In most cases (but not always), you also need an
\family typewriter
After=
\family default
directive.
Otherwise you will unintentionally program a hard to debug
\series bold
race condition
\series default
, which can extinct your last hair.
Be sure to understand the corresponding details in the systemd documentation.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
In general, it is good practice to have a
\emph on
consistent
\emph default
name scheme.
Always use the
\emph on
logically same name
\emph default
(modulo some escaping conventions for special characters), e.g.
for the underlying LV (called disk in MARS terminology), equal to the MARS
resource name, equal to the last part of the mountpoint, equal to the IQN
of an iSCSI export, equal to the NFS share name, equal to the LXC container
name, equal to the KVM/qemu virtual machine name, and so on.
Messing around with non-systematic naming conventions can easily result
in a hell.
\end_layout
\begin_layout Subsection
Fully Automatic Handover using
\family typewriter
systemd
\begin_inset CommandInset label
LatexCommand label
name "subsec:Handover-using-systemd"
\end_inset
\end_layout
\begin_layout Standard
First, you need to install your systemd templates into one of the template
directories mentioned in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Working-Principle-of"
\end_inset
.
In case you have never used the template engine before, you can create
the first instantiation via
\family typewriter
marsadm systemd-trigger
\family default
.
Afterwards, inspect
\family typewriter
/run/systemd/system/
\family default
for newly created template instances (and
\family typewriter
/etc/marsadm/systemd-generated/
\family default
for any .script workarounds) and check them.
\end_layout
\begin_layout Standard
For each resource
\family typewriter
$res
\family default
, you should set systemd targets in one of the following variants:
\end_layout
\begin_layout Itemize
short form:
\family typewriter
marsadm set-systemd-unit $res DEFAULT
\end_layout
\begin_layout Itemize
long form, using the .script workaround:
\family typewriter
marsadm set-systemd-unit $res mnt-test-$res-testload.script
\family default
\end_layout
\begin_layout Itemize
most general form:
\family typewriter
marsadm set-systemd-unit $res
\begin_inset Quotes eld
\end_inset
$start_unit
\begin_inset Quotes erd
\end_inset
\begin_inset Quotes eld
\end_inset
$stop_unit
\family default
\begin_inset Quotes erd
\end_inset
.
\end_layout
\begin_layout Standard
Except for .script workarounds,
\family typewriter
$start_unit
\family default
and
\family typewriter
$stop_unit
\family default
will typically denote
\emph on
different
\emph default
targets for start and stop (with few exceptions) for the following reason:
\end_layout
\begin_layout Description
Example: assume your native systemd-controlled stack consists of
\family typewriter
vol-@escvar{res}.mount
\family default
and
\family typewriter
nfs-export-@escvar{res}.service
\family default
.
Before the filesystem can be exported via
\family typewriter
nfs
\family default
, it
\emph on
first
\emph default
needs to be mounted.
At startup,
\family typewriter
systemd
\family default
can do this automatically for you: just add a
\family typewriter
Requires=
\family default
or
\family typewriter
BindsTo=
\family default
dependency between both targets, or similar.
Then, simply use
\family typewriter
nfs-export-mydata.service
\family default
as your start unit.
Whenever it (thinks that it) needs to be started, systemd will automatically
analyze its dependencies and automatically start
\family typewriter
vol-mydata.mount
\family default
.
However, stopping is different.
Theoretically,
\family typewriter
systemctl stop nfs-export-mydata.service
\family default
\emph on
could
\emph default
work in some cases, but in general it doesn't work this way.
Reason: there might be other
\emph on
sister
\emph default
units which
\emph on
also
\emph default
depend on the mount.
In some cases, you may not necessarily notice any sisters, because systemd
can add further (internal) targets
\emph on
automatically
\emph default
.
The problem is easily solvable by using
\family typewriter
BindsTo=
\family default
and/or
\family typewriter
PartOf=
\family default
dependencies, peferably augmented with
\family typewriter
After=
\family default
, and then
\family typewriter
systemctl stop vol-mydata.mount
\family default
will automatically tear down
\emph on
all
\emph default
dependencies in reverse order.
Therefore, use the
\emph on
bottom
\emph default
of the stack (usually a mount unit) as your stop unit.
\end_layout
\begin_layout Standard
For maximum safety,
\family typewriter
$start_unit
\family default
should always point at the
\emph on
tip
\emph default
of your stack, while
\family typewriter
$stop_unit
\family default
should always point at the
\emph on
bottom
\emph default
(but one level higher than
\family typewriter
/dev/mars/$res
\family default
).
\end_layout
\begin_layout Standard
Removing any systemd targets is also possible via
\family typewriter
marsadm set-systemd-unit $res
\begin_inset Quotes eld
\end_inset
\begin_inset Quotes erd
\end_inset
\family default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Tip: groups of units can be controlled via .target units, see
\family typewriter
man systemd.target
\family default
.
\end_layout
\begin_layout Standard
\noindent
When everything is set up properly, the following should work:
\end_layout
\begin_layout Enumerate
Issue
\family typewriter
marsadm primary $res
\family default
on another node which is currently in secondary role.
\end_layout
\begin_layout Enumerate
As a consequence,
\family typewriter
systemctl stop
\begin_inset Quotes eld
\end_inset
$stop_unit
\begin_inset Quotes erd
\end_inset
\family default
should be automatically executed at the old primary side.
\end_layout
\begin_layout Enumerate
After a while, the MARS kernel module will notice that
\family typewriter
/dev/mars/$res
\family default
is no longer opened.
You can check this manually via
\family typewriter
marsadm view-device-opened $res
\family default
which will tell you a boolean result.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
In case the device is not closed for any reason, ordinary handover
\emph on
cannot
\emph default
proceed, because somebody could (at least potentially) write some data
into it, even after the handover, which would lead to a split brain.
Therefore MARS
\emph on
must
\emph default
insist that the device is closed before
\emph on
ordinary
\emph default
handover can proceed.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
In order to not leave you with a failed service, umount failures will be
detected after a timeout.
Handover by marsadm will then
\emph on
automatically
\emph default
restart the old start unit at the old primary side where the the device
was not released.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
In case an ordinary handover is not possible due to hanging device openings,
you have the following options:
\end_layout
\begin_deeper
\begin_layout Enumerate
Check your
\family typewriter
systemd
\family default
configuration or other sources of error why the device is not closed.
Possible reasons could be hanging processes or hanging sessions which might
need a
\family typewriter
kill
\family default
or a
\family typewriter
kill -9
\family default
or similar.
Notice that
\family typewriter
lsof
\family default
does not catch
\emph on
all
\emph default
possible sources like (recursive or bind-) mounts occupied by foreign kernel
namespaces.
\end_layout
\begin_layout Enumerate
Do a failover via
\family typewriter
primary --force
\family default
, which will likely provoke a split brain.
\end_layout
\end_deeper
\begin_layout Enumerate
Once
\family typewriter
/dev/mars/$res
\family default
has disappeared, the ordinary MARS handover from the old primary to the
new site should proceed as usual.
\end_layout
\begin_layout Enumerate
After
\family typewriter
/dev/mars/$res
\family default
has appeared at the new site,
\family typewriter
systemctl start
\begin_inset Quotes eld
\end_inset
$start_unit
\begin_inset Quotes erd
\end_inset
\family default
should be executed automaticy.
In turn, this should bring up your configured services.
\end_layout
\begin_layout Standard
Details depend on your
\family typewriter
systemd
\family default
configuration / templates.
For example, you can configure systemd targets for activation of VMs, or
for
\family typewriter
LXC
\family default
containers, or for
\family typewriter
iSCSI
\family default
exports, or for
\family typewriter
nfs
\family default
exports, or for
\family typewriter
glusterfs
\family default
exports, or for whatever you need.
For true geo-redundancy, you will likely have to include some
\family typewriter
quagga
\family default
or
\family typewriter
bird
\family default
or other BGP configurations into your systemd unit stack.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
In general, marsadm tries to keep your services running whenever a handover
failure occurs, or when you re-attach after a detach, or when your machine
reloads
\family typewriter
mars.ko
\family default
after a crash reboot, etc.
This is regarded as a
\emph on
feature
\emph default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
However, this feature could become boring if you
\emph on
intentionally(!)
\emph default
want to stop your services, for example when you need to run an
\family typewriter
fsck
\family default
.
Do not use
\family typewriter
marsadm secondary
\family default
, because this would make
\family typewriter
/dev/mars/mydata
\family default
to disappear.
Although
\family typewriter
marsadm set-systemd-unit mydata
\begin_inset Quotes eld
\end_inset
\begin_inset Quotes erd
\end_inset
\family default
would solve the problem, this could make you forget the old start and stop
unit names (if you don't use markers like DEFAULT etc).
You could workaround by some wrapper script remembering the old names via
\family typewriter
marsadm get-systemd-unit
\family default
, but this is not necessary:
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
There is a simple solution:
\family typewriter
marsadm set-systemd-want
\begin_inset Quotes eld
\end_inset
(none)
\begin_inset Quotes erd
\end_inset
\family default
will
\emph on
temporarily
\emph default
stop the whole systemd unit stack, while keeping
\family typewriter
/dev/mars/mydata
\family default
accessible.
After your
\family typewriter
fsck /dev/mars/mydata
\family default
has finished, simply use an idempotent
\family typewriter
marsadm primary mydata
\family default
for restart of your services.
\end_layout
\begin_layout Section
The macro processor
\begin_inset CommandInset label
LatexCommand label
name "sec:The-macro-processor"
\end_inset
\end_layout
\begin_layout Standard
The macro processor is a very flexible and versatile tool for
\series bold
customizing
\series default
.
Conceptually, two levels of macros are discriminated:
\end_layout
\begin_layout Enumerate
primitive macros: these are firmly built into
\family typewriter
marsadm
\family default
.
\end_layout
\begin_layout Enumerate
complex macros: these can be defined via the
\series bold
macro language
\series default
of
\family typewriter
marsadm
\family default
.
\end_layout
\begin_layout Standard
Some complex macros are already pre-defined, for example the standard
\family typewriter
marsadm view all
\family default
(see section
\begin_inset CommandInset ref
LatexCommand vref
reference "subsec:Standard-marsadm-view"
plural "false"
caps "false"
noprefix "false"
\end_inset
).
\end_layout
\begin_layout Standard
From the commandline, any macro can be called via
\family typewriter
marsadm view-
\emph on
$macroname
\emph default
mydata
\family default
.
The short form
\family typewriter
marsadm view mydata
\family default
is equivalent to
\family typewriter
marsadm view-default mydata
\family default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
In general, the command
\family typewriter
marsadm view-
\emph on
$macroname
\emph default
all
\family default
will first call the macro
\family typewriter
\emph on
$macroname
\family default
\emph default
in a loop for
\emph on
all
\emph default
resources we are a
\emph on
member locally
\emph default
.
Finally, a trailing macro
\family typewriter
\emph on
$macroname
\emph default
-global
\family default
will be called with an empty
\family typewriter
%{res}
\family default
argument, provided that such a macro is defined.
This way, you can produce per-resource output followed by global output
which does not depend on a particular resource.
\end_layout
\begin_layout Subsection
Predefined Primitive Macros
\begin_inset CommandInset label
LatexCommand label
name "subsec:Predefined-Trivial-Macros"
\end_inset
\end_layout
\begin_layout Subsubsection
Intended for Humans
\end_layout
\begin_layout Standard
In the following, shell glob notation
\family typewriter
{a,b}
\family default
is used to document similar variants of similar macros in a single place.
When you actually call the macro, you must choose one of the possible variants
(excluding the braces).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
the-err-msg
\family default
Show reported errors for a resource.
When the resource argument is missing or empty, show global error information.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
all-err-msg
\family default
Like before, but show all information including those which are
\family typewriter
OK
\family default
.
This way, you get a list
\begin_inset Foot
status open
\begin_layout Plain Layout
The list may be extended in future versions of MARS.
\end_layout
\end_inset
of
\emph on
all
\emph default
potential error information present in the system.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{all,the}-wrn-msg
\family default
Show all / reported warnings in the system.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{all,the}-inf-msg
\family default
Show all / reported informational messages in the system.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{all,the}-msg
\family default
Show all / reported messages regardless of its classification.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{all,the}-global-msg
\family default
Show global messages not associated with any resource (the resource argument
of the
\family typewriter
marsadm
\family default
command is ignored in this case).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{all,the}-global-{inf,wrn,err}-msg
\family default
Dito, but more specific.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{all,the}-pretty-{global-,}{inf-,wrn-,err-,}msg
\family default
Dito, but show numerical timestamps in a human readable form.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{all,the}-{global-,}{inf-,wrn-,err-,}count
\family default
Instead of showing the messages, show their count (number of lines).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
errno-text
\family default
This macro takes 1 argument, which must represent a Linux
\family typewriter
errno
\family default
number, and converts it to human readable form (similar to the C
\family typewriter
strerror()
\family default
function).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
todo-{attach,sync,fetch,replay,primary,secondary}
\family default
Shows a boolean value (0 or 1) indicating the current state of the correspondin
g todo switch (whether on or off).
The meaning of todo switches is illustrated in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:The-State-of"
\end_inset
.
Exceptions:
\family typewriter
todo-primary
\family default
is not reporting the boolean value of a switch, but means that the designated
primary string as reported by
\family typewriter
get-primary
\family default
is equal to the current host.
Similary,
\family typewriter
todo-secondary
\family default
means that no designated primary exists throughout the cluster, indicating
that
\family typewriter
get-primary
\family default
equals to the special string value
\family typewriter
(none)
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
get-resource-{fat,err,wrn}
\family default
Access to the internal error status files.
This is not an official interface and may thus change at any time without
notice.
Use this only for human inspection, not for scripting!
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
These macros, as well as the error status files, are likely to disappear
in future versions of MARS.
They should be used for debugging only.
At least when merging into the upstream Linux kernel, only the
\family typewriter
*-msg
\family default
macros will likely survive.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
get-resource-{fat,err,wrn}-count
\family default
Dito, but get the number of lines instead of the text.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
replay-code
\family default
Indicate the current state of logfile replay / recovery:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
(empty) Unknown.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
0 No replay is currently running.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
1 Replay is currently running.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
2 Replay has successfully stopped.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
<
\begin_inset space ~
\end_inset
0 See Linux
\family typewriter
errno
\family default
code.
Typically this indicates a damaged logfile, or another filesystem error
at
\family typewriter
/mars
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
<=
\begin_inset space ~
\end_inset
-10000 See the Perl hash from the
\family typewriter
marsadm
\family default
script, describing some MARS-specific error codes.
\end_layout
\end_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
is-{attach,sync,fetch,replay,primary,secondary,module-loaded}
\family default
Shows a boolean value (0 or 1) indicating the
\emph on
actual
\emph default
state, whether the corresponding action has been actually carried out,
or not (yet).
Notice that the values indicated by
\family typewriter
is-*
\family default
may differ from the
\family typewriter
todo-*
\family default
values when something is not (yet) working.
Notice:
\family typewriter
is-primary
\family default
(or its negation
\family typewriter
is-secondary
\family default
) means that the transaction logger has (resp.
not) reached a working state, but the corresponding
\family typewriter
/dev/mars/mydata
\family default
prosumer device need not (yet) have appeared (somewhere else).
More explanations can be found in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:The-State-of"
\end_inset
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
is-split-brain
\family default
Shows whether split brain (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Split-Brain-Resolution"
\end_inset
) has been detected, or not.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
is-consistent
\family default
Shows whether the
\emph on
underlying disk
\emph default
is in a locally consistent state, i.e.
whether it
\emph on
could
\emph default
be (potentially) detached and then used for read-only test-mounting
\begin_inset Foot
status open
\begin_layout Plain Layout
Notice that the
\emph on
writeback
\emph default
at the primary side is out-of-order by default, for performance reasons.
Therefore, the underlying disk is only guaranteed to be consistent when
there is no data left to be written back.
Notice that this condition is racy by construction.
When your primary node crashes during writeback and then comes up again,
you must do a
\family typewriter
modprobe mars
\family default
first in order to automatically replay the transaction logfiles, which
will automatically heal such temporary inconsistencies.
\end_layout
\end_inset
.
Don't confuse this with the consistency of
\family typewriter
/dev/mars/mydata
\family default
, which is by construction
\emph on
always
\emph default
locally consistent once it has appeared
\begin_inset Foot
status open
\begin_layout Plain Layout
Exceptions are possible when using
\family typewriter
marsadm fake-sync
\family default
.
Even in split brain situations,
\family typewriter
marsadm primary --force
\family default
tries to prevent any further potential exception as best as it can, by
not letting
\family typewriter
/dev/mars/mydata
\family default
to appear and by insisting on split brain resolution first.
In future implementations, this might change if more pressure is put on
the developer to sacrifice consistency in preference to not waiting for
a full logfile replay.
\end_layout
\end_inset
.
By construction of MARS, the disk of secondaries will
\emph on
always
\emph default
remain in a locally consistent state once the initial sync has finished
as well as the initial logfile replay.
Notice that local consistency does not necessarily imply actuality.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
is-emergency
\family default
Shows whether emergency mode (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Emergency-Mode"
\end_inset
) has been entered for the named resource, or not.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
nr-{attach,sync,fetch,replay,primary,secondary}
\family default
Show the
\emph on
total number
\emph default
of resource members which are in corresponding state
\family typewriter
%is-
\emph on
$something
\emph default
{}
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
rest-space
\family default
(global, no resource argument necessary) Shows the
\emph on
logically
\emph default
available space in
\family typewriter
/mars/
\family default
measured and rounded down in GiB, which may deviate from the physically
available space as indicated by the
\family typewriter
df
\family default
command.
The difference to
\family typewriter
df
\family default
is intended for safeguarding.
Computational details may change in future MARS releases.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
total-space
\family default
(available since mars0.1astable140, global, no resource argument necessary)
Shows the
\emph on
logically present
\emph default
space in
\family typewriter
/mars/
\family default
, which may deviate from the physically available space as indicated by
the
\family typewriter
df
\family default
command.
Similarly to
\family typewriter
rest-space
\family default
but independently from it, this is also safeguarded and rounded down in
units of GiB.
Computational details may change in future MARS releases.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
get-{disk,device}
\family default
Show the name of the underlying disk, or of the
\family typewriter
/dev/mars/mydata
\family default
device (if it is available).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{disk,device}-present
\family default
Show (as a boolean value) whether the underlying disk, or the
\family typewriter
/dev/mars/mydata
\family default
device, is available.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-opened
\family default
Show (as a number) how often
\family typewriter
/dev/mars/mydata
\family default
has been actually openend, e.g.
by
\family typewriter
mount
\family default
or by some processes like
\family typewriter
dd
\family default
, or by iSCSI, etc.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-{ops,amount}-rate
\family default
Show the number of current IOPS, esp.
the current throughput in KiB/s.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-nrflying
\family default
Show the number of currently flying IO requests.
This is an indicator of queueing at the low-level device.
When it is permenantly very high, it may point at IO problems, such as
RAID degradation.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
disk-error
\family default
Show a negative Linux errno code, or a mars-specific code when lower than
-10000.
In addition to some explanation text, it shows the first
\emph on
known
\emph default
IO error, as reported upwards to applications, and before it was resetted
for whatever reason.
For example, it may be the last open() error on the underlying disk, or
something else may have occured during operations, and sometimes it may
have corrected itself.
Normally, this should be always zero.
When < 0 according to return-code conventions as explained at
\family typewriter
%replay-code{}
\family default
, this typically indicates a hardware or LVM problem, etc.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-error
\family default
Show a negative Linux errno code, or a mars-specific code when lower than
-10000.
In addition to some explanation text, it shows the first
\emph on
known
\emph default
IO error, as reported upwards to applications, and before it was resetted
for whatever reason.
Normally, this should be always zero.
When < 0 according to return-code conventions as explained at
\family typewriter
%replay-code{}
\family default
, this typically indicates a hardware (or network) problem.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
{potential,implemented,usable}-features Show a list of flag names, indicating
the compression / digest features (see description in section
\begin_inset CommandInset ref
LatexCommand formatted
reference "sec:Data-Compression-Checksumming"
plural "false"
caps "false"
noprefix "false"
\end_inset
) as either as known to the current version of marsadm, or as implemented
in the currently running kernel module, or as the minimum feature set currently
available in the whole cluster.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
{implemented,usable}-{digests,compressions} Same as before, but more specificall
y related to either compressions or digests.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
enabled-{log|net}-compressions Show which compression features have been
set by
\family typewriter
marsadm set-global-enabled-*-compressions
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
disabled-{log|net}-digests Show which digest features have been disabled
by
\family typewriter
marsadm set-global-disabled-*-digests
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
used-{log,net}-{digest,compression} Show which digest or compression features
are currently actually used by $host, either for logfile or for network
purposes.
\end_layout
\begin_layout Subsubsection
Intended for Scripting
\end_layout
\begin_layout Standard
While complex macros may output a whole bunch of information, the following
primitive macros are outputting exactly one value.
They are intended for script usage (cf.
section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Scripting-HOWTO"
\end_inset
).
Of course, curious humans may also use them :)
\end_layout
\begin_layout Standard
In the following, shell glob notation
\family typewriter
{a,b}
\family default
is used to document similar variants of similar macros in a single place.
When you actually call the macro, you must choose one of the possible variants
(excluding the braces).
\end_layout
\begin_layout Paragraph
Memberships, Name Querying and their Counts
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
is-member
\family default
Boolean, indicating whether
\family typewriter
%{host}
\family default
is a storage member of the resource
\family typewriter
%{res}.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
is-guest
\family default
Boolean, indicating whether
\family typewriter
%{host}
\family default
is currently a
\emph on
dynamic guest
\emph default
of resource
\family typewriter
%{res}.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
cluster-peers
\family default
Show a newline-separated list of all host names appearing in
\family typewriter
/mars/ips/ip-$peername
\family default
.
Please prefer this macro in place of direct access to filesystem data:
future MARS features might need some changes in the low-level naming convention
s, and/or in the hierarchical filesystem layout, or even the replacement
of the
\family typewriter
/mars/
\family default
filesystem by different data container formats, etc.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
resource-peers
\family default
Show a newline-separated list of all host names participating in the particular
resource
\family typewriter
%{res}
\family default
.
Notice that this is typically a subset of
\family typewriter
%cluster-peers{}
\family default
.
\begin_inset Newline newline
\end_inset
Note: stray data, e.g.
as produced by forgotten / interrupted
\family typewriter
leave-resource
\family default
& co may lead to some mismatches.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
guest-peers
\family default
Show a newline-separated list of all host names which are currently dynamically
added as
\emph on
guests
\emph default
to resource
\family typewriter
%{res}
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
count-{cluster,resource,guest}-peers
\family default
Show the corresponding
\emph on
number
\emph default
of hosts, accordingly.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{my,all}-resources
\family default
Show a newline-separated list of either all resource names
\emph on
existing
\emph default
in the cluster, or only those where the current host
\family typewriter
%{host}
\family default
is a storage member.
Optionally, you may specify the hostname as a parameter, e.g.
\family typewriter
%my-resources{
\emph on
otherhost
\emph default
}
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{my,all}-members
\family default
Show a newline-separated list of storage members existing in the cluster.
There is a very subtle difference to
\family typewriter
*-resources
\family default
: there may exist resources which have no storage members.
This may for example occur when all storage members have left via leave-resourc
e, but delete-resource has not yet been executed.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{my,all}-guests
\family default
Show a newline-separated list of currently dynamically added guests.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
count-{my,all}-{resources,members,guests}
\family default
Show the corresponding
\emph on
number
\emph default
of resources or storage members or guests, accordingly.
\end_layout
\begin_layout Paragraph
Amounts of Data Inquiry
\end_layout
\begin_layout Standard
\begin_inset Float figure
placement h
wide false
sideways false
status open
\begin_layout Plain Layout
\noindent
\align center
\begin_inset Graphics
filename images/fetch-replay-total.fig
width 80col%
\end_inset
\end_layout
\begin_layout Plain Layout
\begin_inset Caption Standard
\begin_layout Plain Layout
overview on amounts / cursors
\begin_inset CommandInset label
LatexCommand label
name "fig:overview-on-amounts"
\end_inset
\end_layout
\end_inset
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\noindent
The following macros are meaningful for both primary and secondary nodes:
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
deletable-size
\family default
Show the total amount of
\emph on
locally present
\emph default
logfile data which
\emph on
could
\emph default
be deleted by
\family typewriter
marsadm cron
\family default
.
This differs almost always from both
\family typewriter
replay-pos
\family default
and
\family typewriter
occupied-size
\family default
due to granularity reasons (only whole logfiles can be deleted).
Units are
\emph on
bytes
\emph default
, not kilobytes.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
occupied-size
\family default
Show the total amount of
\emph on
locally present
\emph default
logfile data (sum of all file sizes).
This is often roughly approximate to
\family typewriter
fetch-pos
\family default
, but it may differ vastly (in both directions) when logfiles are not completely
transferred, when some are damaged, during split brain, after a
\family typewriter
join-resource
\family default
/
\family typewriter
invalidate
\family default
, or when the resource is in emergency mode (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Emergency-Mode"
\end_inset
).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
disk-size
\family default
Show the size of the underlying local disk in bytes.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
resource-size
\family default
Show the logical size of the resource in bytes.
When this value is lower than
\family typewriter
disk-size
\family default
, you are wasting space.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-size
\family default
At a primary node, this may differ from
\family typewriter
resource-size
\family default
only for a very short time during the
\family typewriter
resize
\family default
operation.
At secondaries, there will be no difference.
\end_layout
\begin_layout Standard
\noindent
The following macros are only meaningful for resources in primary mode:
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
writeback-rest
\family default
Show the amount of data which is already in the transaction logfile, but
has not yet been written back to the underlying disk.
This may be used for estimation of recovery time after a potential primary
crash.
The writeback buffer is explained by the graphics at
\begin_inset CommandInset ref
LatexCommand vref
reference "sec:The-Transaction-Logger"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Standard
\noindent
The following macros are only meaningful for resources in secondary mode.
By information theoretic limits, they can only tell what is
\emph on
locally known
\emph default
.
They
\series bold
cannot
\series default
reflect the
\begin_inset Quotes eld
\end_inset
true (global) state
\begin_inset Foot
status open
\begin_layout Plain Layout
Notice that according to Einstein's law, and according to observations by
Lamport, the concept of
\begin_inset Quotes eld
\end_inset
true state
\begin_inset Quotes erd
\end_inset
does not exist at all in a distributed system.
Anything you can know in a distributed system is always local knowlege,
which races with other (remote) knowlege, and may be outdated at
\emph on
any
\emph default
time.
\end_layout
\end_inset
\begin_inset Quotes erd
\end_inset
of a cluster, in particular during network partitions.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{sync,fetch,replay,work}-size
\family default
Show the total amount of data which is / was to be processed by either
sync, fetch, or replay.
\family typewriter
work-size
\family default
is equivalent to
\family typewriter
fetch-size
\family default
.
\family typewriter
replay-size
\family default
is equivalent to
\family typewriter
fetch-pos
\family default
(see below).
Units are
\emph on
bytes
\emph default
, not kilobytes.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{sync,fetch,replay,work}-pos
\family default
Show the total amount of data which is already processed (current
\begin_inset Quotes eld
\end_inset
cursor
\begin_inset Quotes erd
\end_inset
position).
\family typewriter
work-pos
\family default
is equivalent to
\family typewriter
replay-pos
\family default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
The 0% point is the
\emph on
locally contiguous
\emph default
amount of data since the last
\family typewriter
create-resource
\family default
,
\family typewriter
join-resource
\family default
, or
\family typewriter
invalidate
\family default
, or since the last emergency mode, but possibly shortened by
\family typewriter
cron
\family default
.
Notice that the 0% point may be different on different cluster nodes, because
their resource history may be different or non-contiguous during split
brain, or after a
\family typewriter
join-resource
\family default
, or after
\family typewriter
invalidate
\family default
, or during / after emergency mode.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{sync,fetch,replay,work}-rest
\family default
Shows the difference between
\family typewriter
*-size
\family default
and
\family typewriter
*-pos
\family default
(amount of work to do).
\family typewriter
work-rest
\family default
is therefore the difference between
\family typewriter
fetch-size
\family default
and
\family typewriter
replay-pos
\family default
, which is the
\emph on
total
\emph default
amount of work to do (regardless whether to be fetched and/or to be replayed).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{sync,fetch,replay,work}-reached
\family default
Boolean value indicating whether
\family typewriter
*-rest
\family default
dropped down to zero
\begin_inset Foot
status open
\begin_layout Plain Layout
MARS can only guarantee local consistency, but cannot guarantee actuality
in all imaginable situations.
Notice that a general notion of
\begin_inset Quotes eld
\end_inset
actuality
\begin_inset Quotes erd
\end_inset
is
\emph on
undefinable
\emph default
in a widely distributed system at all, according to Einstein's laws.
\end_layout
\begin_layout Plain Layout
Let's look at an example.
In case of a node crash, and after the node is up again, a
\family typewriter
modprobe mars
\family default
has to occur, in order to replay the transaction logs of MARS again.
However, at the recovery phase before, the journalling
\family typewriter
ext4
\family default
filesystem
\family typewriter
/mars/
\family default
\emph on
may
\emph default
have rolled back some internal symlink updates which have occurred immediately
before the crash.
MARS is relying on the fact that journalling filesystems like
\family typewriter
ext4
\family default
should do their recovery in a consistent way, possibly by sacrifycing actuality
a little bit.
Therefore, the above macros cannot guarantee to deliver true information
about what is persisted at the moment.
\end_layout
\begin_layout Plain Layout
Notice that there are further potential caveats.
\end_layout
\begin_layout Plain Layout
In case of
\family typewriter
{sync,fetch}-reached
\family default
, MARS uses
\family typewriter
bio
\family default
callbacks resp.
\family typewriter
fdatasync()
\family default
by default, thus the underlying storage layer has
\emph on
told
\emph default
us that it
\emph on
believes
\emph default
it has commited the data in a reboot-safe way.
Whether this is
\emph on
really
\emph default
true does not depend on MARS, but on the lower layers of the storage hierarchy.
There exists hardware where this claim is known to be wrong under certain
circumstances, such as certain hard disk drives in certain modes of operation.
Please check the hardware for any violations of storage semantics under
certain circumstances such as power loss, and check information sources
like magazines about the problem area.
Please notice that such a problem, if it exists at all, is independent
from MARS.
It would also exist if you wouldn't use MARS on the same system.
\end_layout
\end_inset
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{fetch,replay,work}-threshold-reached
\family default
Boolean value indicating whether
\family typewriter
*-rest
\family default
dropped down to
\family typewriter
%{threshold}
\family default
, which is pre-settable by the
\family typewriter
--threshold=
\emph on
size
\family default
\emph default
command line option (default is 10 MiB).
In asynchronous use cases of MARS, this should be preferred over
\family typewriter
*-reached
\family default
for
\emph on
human display
\emph default
, because it produces less flickering by the inevitable replication delay.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{fetch,replay,work}-almost-reached
\family default
Boolean value indicating whether
\family typewriter
*-rest
\family default
\emph on
almost
\emph default
/
\emph on
approximately
\emph default
dropped down to zero.
The default is that at lease 990 permille are reached.
In asynchronous use cases of MARS, this can be preferred over
\family typewriter
*-reached
\family default
for
\emph on
human display
\emph default
only, because it produces less flickering by the inevitable replication
delay.
However, don't base any decisions on this!
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{sync,fetch,replay,work}-percent
\family default
The cursor position
\family typewriter
*-pos
\family default
as a percentage of
\family typewriter
*-size
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{sync,fetch,replay,work}-permille
\family default
The cursor position
\family typewriter
*-pos
\family default
as permille of
\family typewriter
*-size
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{sync,fetch,replay,work}-rate
\family default
Show the current throughput in bytes
\begin_inset Foot
status open
\begin_layout Plain Layout
Notice that the internal granularity reported by the kernel may be coarser,
such as KiB.
This interfaces abstracts away from kernel internals and thus presents
everything in byte units.
\end_layout
\end_inset
per second.
\family typewriter
work-rate
\family default
is the
\emph on
maximum
\emph default
of
\family typewriter
fetch-rate
\family default
and
\family typewriter
replay-rate
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{sync,fetch,replay,work}-remain
\family default
Show the
\emph on
estimated
\emph default
remaining time for completion of the respective operation.
This is just a very raw guess.
Units are seconds.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{sync,fetch,replay}-{ops,amount}-rate
\family default
Show the current IOPS of sync / fetch / replay, or its corresponding throughput
in KiB/s.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
summary-vector
\family default
Show the colon-separated CSV value
\family typewriter
%replay-pos{}:%fetch-pos{}:%fetch-size{}
\family default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
replay-basenr
\family default
Get currently first reachable logfile number (see figure
\begin_inset CommandInset ref
LatexCommand vref
reference "fig:overview-on-amounts"
\end_inset
).
Only for curious humans or for debugging / monitoring - don't base any
decisions on this.
Use the
\family typewriter
*-{pos,size}
\family default
macros instead.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{replay,fetch,work}-lognr
\family default
Get current logfile number of replay or fetch position, or of the currently
known last reachable number (see figure
\begin_inset CommandInset ref
LatexCommand vref
reference "fig:overview-on-amounts"
\end_inset
).
Only for curious humans or for debugging / monitoring - don't base any
decisions on this.
Use the
\family typewriter
*-{pos,size}
\family default
macros instead.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{replay,fetch,work}-logcount
\family default
Get current number of logfiles which are already replayed, or are already
fetched, or are to be applied in total (see figure
\begin_inset CommandInset ref
LatexCommand vref
reference "fig:overview-on-amounts"
\end_inset
).
Only for curious humans or for debugging / monitoring - don't base any
decisions on this.
Use the
\family typewriter
*-{rest}
\family default
macros instead.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
alive-timestamp
\family default
Tell the Lamport Unix timestamp (seconds since 1970) of the last metadata
communication to the designated primary (or to any other host given by
the first argument).
Returns
\begin_inset Formula $-1$
\end_inset
if no such host exists.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{fetch,replay,work}-timestamp
\family default
Tell the Lamport Unix timestamp (seconds since 1970) when the last progress
has been made.
When no such action exists,
\begin_inset Formula $-1$
\end_inset
is returned.
\family typewriter
%work-timestamp{
\emph on
hostname
\emph default
}
\family default
is the maximum of
\family typewriter
%fetch-timestamp{
\emph on
hostname
\emph default
}
\family default
and
\family typewriter
%replay-timestamp{
\emph on
hostname
\emph default
}
\family default
.
When the parameter
\family typewriter
\emph on
hostname
\family default
\emph default
is empty, the local host will be reported (default).
Example usage:
\family typewriter
marsadm view all --macro=
\begin_inset Quotes erd
\end_inset
%replay-timestamp{%todo-primary{}}
\begin_inset Quotes erd
\end_inset
\family default
shows the timestamp of the last reported
\begin_inset Foot
status open
\begin_layout Plain Layout
Updates of this information are occurring with lower frequency than actual
writebacks, for performance reasons.
The metadata network update protocol will add further delays.
Therefore, the accuracy is only in the range of minutes.
\end_layout
\end_inset
writeback action at the designated primary.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{alive,fetch,replay,work}-age
\family default
Tell the number of seconds since the last respective action, or
\begin_inset Formula $-1$
\end_inset
if none exists.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
{alive,fetch,replay,work}-lag
\family default
Report the time difference (in seconds) between the last
\emph on
known
\emph default
action at the local host and at the designated primary (or between any
other hosts when 2 parameters are given).
Returns
\begin_inset Formula $-1$
\end_inset
if no such action exists at any of the two hosts.
Attention! This need not reflect the
\emph on
actual
\emph default
state in case of networking problems.
Don't draw wrong conclusions from a high
\family typewriter
{fetch,replay}-lag
\family default
value: it could also mean that simply no write operation at all has occurred
at the primary side for a long time.
Conversely, a low lag value does not imply that the replication is recent:
it may refer to
\emph on
different
\emph default
write operations at each of the hosts; therefore it only tells that
\emph on
some
\emph default
progress has been made, but says nothing about the amount of the progress.
\end_layout
\begin_layout Paragraph
Device Information
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
get-device
\family default
Tell the device name, which is
\family typewriter
/dev/mars/%{res}
\family default
in the current MARS implementation.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-present
\family default
Boolean, telling whether
\family typewriter
/dev/mars/%{res}
\family default
is currently appearing at
\family typewriter
%{host}
\family default
or not.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-opened
\family default
Tell the number of times
\family typewriter
/dev/mars/%{res}
\family default
is currently opened (e.g.
mounted) at
\family typewriter
%{host}
\family default
.
Upon non-exclusive access by multiple readers / writers in parallel (which
is potentially very dangerous), the number may grow greater than 1.
You may exploit this for monitoring / supervision.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-ops-rate
\family default
Tell the current request throughput, aka IOPS.
This is actually changing much more frequently than can be reported by
the kernel, but anyway may be useful for getting some impression on what
is going on.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-error
\family default
Tell the Unix error code when any IO error has occurred in the past, or
0 when no error is known.
Useful for debugging and fault analysis.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-nrflying
\family default
Tell the number of currently flying IO requests (i.e.
submitted, but not yet completed).
This is changing in much higher frequency that can be ever reported by
the kernel, but may be useful for bottleneck analysis, and when the system
is stuck (e.g.
defective RAID).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-completion-stamp
\family default
Tell the realtime timestamp of the last completed IO request.
Useful for detection of a hanging system (e.g.
defective disks, etc).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
device-completion-age
\family default
Similar to before, but report the
\emph on
relative
\emph default
age (compared to the current time) in seconds.
\end_layout
\begin_layout Paragraph
Misc Informational Status
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
get-primary
\family default
Return the name of the current designated primary node as locally known.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
actual-primary
\family default
(deprecated) try to determine the name of the node which
\emph on
appears
\emph default
to be the actual primary.
This only a
\series bold
\emph on
guess
\series default
\emph default
, because it is not generally unique in split brain situations! Don't use
this macro.
Instead, use
\family typewriter
is-primary
\family default
on those nodes you are interested in.
The explanations from section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:The-State-of"
\end_inset
also apply to
\family typewriter
get-primary
\family default
versus
\family typewriter
actual-primary
\family default
analogously.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
is-alive
\family default
Boolean value indicating whether all other nodes participating in
\family typewriter
mydata
\family default
are reachable / healthy.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
uuid
\family default
(global) Show the unique identifier created by
\family typewriter
create-cluster
\family default
or by
\family typewriter
create-uuid
\family default
.
Hint: this is immutable, and it is firmly bound to the
\family typewriter
/mars/
\family default
filesystem.
It can only be destroyed by deleting the whole filesystem (see section
\begin_inset CommandInset ref
LatexCommand ref
reference "leave-cluster"
\end_inset
).
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
tree
\family default
(global) Indicate symlink tree version (see
\family typewriter
mars-for-kernel-developers.pdf
\family default
).
\end_layout
\begin_layout Paragraph
Experts Only
\end_layout
\begin_layout Standard
The following is for hackers who know what they are doing.
The following is not officially supported.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
\family typewriter
wait-{is,todo}-{attach,sync,fetch,replay,primary,secondary}-{on,off}
\family default
This may be used to program some useful waiting conditions in advanced
macro scripts.
It works via busy wait, and does not support disjoint waiting conditions.
Use at your own risk! Hint: for disjoint and/or more complex waiting conditions
, and/or for programming your own finite state transition machines etc,
please prefer the non-blocking
\family typewriter
{is,todo}-*
\family default
and sisters, and program any busy wait yourself (or try to avoid busy-wait
at all).
\end_layout
\begin_layout Section
Creating your own Macros
\begin_inset CommandInset label
LatexCommand label
name "subsec:Creating-your-own"
\end_inset
\end_layout
\begin_layout Standard
In order to create your own macros, you could start writing them from scratch
with your favorite ASCII text editor.
However, it is much easier to take an existing macro and to customize it
to your needs.
In addition, you can learn something about macro programming by looking
at the existing macro code.
\end_layout
\begin_layout Standard
Go to a new empty directory and say
\end_layout
\begin_layout Itemize
\family typewriter
marsadm dump-macros
\end_layout
\begin_layout Standard
in order to get the most interesting complex macros, or say
\end_layout
\begin_layout Itemize
\family typewriter
marsadm dump-all-macros
\end_layout
\begin_layout Standard
in order to additionally get some primitive macros which could be customized
if needed.
This will write lots of files
\family typewriter
*.tpl
\family default
into your current working directory.
\end_layout
\begin_layout Standard
Any modfied or new macro file should be placed either into the current working
directory
\family typewriter
./
\family default
, or into
\family typewriter
$HOME/.marsadm/
\family default
, or into
\family typewriter
/etc/marsadm/
\family default
.
They will be searched in this order, and the first match will win.
When no macro file is found, the built-in version will be used if it exists.
This way, you may override builtin macros.
\end_layout
\begin_layout Standard
Example: if you have a file
\family typewriter
./mymacro.tpl
\family default
you just need to say
\family typewriter
marsadm view-mymacro mydata
\family default
in order to invoke it in the resource context
\family typewriter
mydata
\family default
.
\end_layout
\begin_layout Subsection
General Macro Syntax
\end_layout
\begin_layout Standard
Macros are simple ASCII text, enriched with calls to other macros.
\end_layout
\begin_layout Standard
ASCII text outside of comments are copied to the output verbatim.
Comments are skipped.
Comments may have one of the following well-known forms:
\end_layout
\begin_layout Itemize
\family typewriter
# skipped text until / including next newline character
\end_layout
\begin_layout Itemize
\family typewriter
// skipped text until / including next newline character
\end_layout
\begin_layout Itemize
\family typewriter
/* skipped text including any newline characters */
\end_layout
\begin_layout Itemize
denoted as Perl regex:
\family typewriter
\backslash
\backslash
\backslash
n
\backslash
s*
\family default
(single backslash directly followed by a newline character, and eating up
any whitespace characters at the beginning of the next line) Hint: this
may be fruitfully used to structure macros in a more readable form / indentatio
n.
\end_layout
\begin_layout Standard
Special characters are always initiated by a backslash.
The following pre-defined special character sequences are recognized:
\end_layout
\begin_layout Itemize
\family typewriter
\backslash
n
\family default
newline
\end_layout
\begin_layout Itemize
\family typewriter
\backslash
r
\family default
return (useful for DOS compatibility)
\end_layout
\begin_layout Itemize
\family typewriter
\backslash
t
\family default
tab
\end_layout
\begin_layout Itemize
\family typewriter
\backslash
f
\family default
formfeed
\end_layout
\begin_layout Itemize
\family typewriter
\backslash
b
\family default
backspace
\end_layout
\begin_layout Itemize
\family typewriter
\backslash
a
\family default
alarm (bell)
\end_layout
\begin_layout Itemize
\family typewriter
\backslash
e
\family default
escape (e.g.
for generating ANSI escape sequences)
\end_layout
\begin_layout Itemize
\family typewriter
\backslash
\family default
followed by anything else: assure that the next character is taken verbatim.
Although possible, please don't use this for escaping letters, because
further escape sequences might be pre-defined in future.
Best practice is to use this only for escaping the backslash itself, or
for escaping the percent sign when you don't want to call a macro (protect
against evaluation), or to escape a brace directly after a macro call (verbatim
brace not to be interpreted as a macro parameter).
\end_layout
\begin_layout Itemize
All other characters stand for their own.
If you like, you should be able to produce XML, HTML, JSON and other ASCII-base
d output formats this way.
\end_layout
\begin_layout Standard
Macro calls have the following syntax:
\end_layout
\begin_layout Itemize
\family typewriter
%
\emph on
macroname
\emph default
{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}{
\emph on
argn
\emph default
}
\end_layout
\begin_layout Itemize
Of course, arguments may be empty, denoted as
\family typewriter
{}
\end_layout
\begin_layout Itemize
It is possible to supply more arguments than required.
These are simply ignored.
\end_layout
\begin_layout Itemize
There must be always at least 1 argument, even for parameterless macros.
In such a case, it is good style to leave it empty (even if it is actually
ignored).
Just write
\family typewriter
%parameterlessmacro{}
\family default
in such a case.
\end_layout
\begin_layout Itemize
\family typewriter
%{
\emph on
varname
\emph default
}
\family default
syntax: As a special case, the macro name may be empty, but then the first
argument must denote a previously defined variable (such as assigned via
\family typewriter
%let{varname}{myvalue}
\family default
, or a pre-defined standard variable like
\family typewriter
%{res}
\family default
for the current resource name, see later paragraph
\begin_inset CommandInset ref
LatexCommand ref
reference "par:Predefined-Variables"
\end_inset
).
\end_layout
\begin_layout Itemize
Of course, parameter calls may be (almost) arbitrarily nested.
\end_layout
\begin_layout Itemize
Of course, the
\emph on
correctness
\emph default
of nesting of braces must be generally obeyed, as usual in any other macro
processor language.
General rule: for each opening brace, there must be exactly one closing
brace somewhere afterwards.
\end_layout
\begin_layout Standard
These rules are hopefully simple and intuitive.
There are currently no exceptions.
In particular, there is no special infix operator syntax for arithmetic
expressions, and therefore no operator precedence rules are necessary.
You have to write nested arithmetic expressions always in the above prefix
syntax, like
\family typewriter
%*{7}{%+{2}{3}}
\family default
(similar to non-inverse polish notation).
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
When deeply nesting macros and their braces, you may easily find yourself
in a feeling like in the good old days of Lisp.
Use the above backslash-newline syntax to indent your macros in a readable
and structured way.
Fortunately, modern text editors like (x)emacs or vim have modes for dealing
with the correctness of nested braces.
\end_layout
\begin_layout Subsection
Calling Builtin / Primitive Macros
\end_layout
\begin_layout Standard
Primitive macros can be called in two alternate forms:
\end_layout
\begin_layout Itemize
\family typewriter
%primitive-
\emph on
macroname
\emph default
{
\emph on
something
\emph default
}
\end_layout
\begin_layout Itemize
\family typewriter
%
\emph on
macroname
\emph default
{
\emph on
something
\emph default
}
\end_layout
\begin_layout Standard
When using the
\family typewriter
%primitive-*{}
\family default
form, you
\emph on
explicitly disallow
\emph default
interception of the call by a
\family typewriter
*.tpl
\family default
file.
Otherwise, you may override the standard definition even of primitive macros
by your own template files.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Notice that
\family typewriter
%call{}
\family default
conventions are used in such a case.
The parameters are passed via
\family typewriter
%{0}
\family default
\begin_inset Formula $\ldots$
\end_inset
\family typewriter
%{n}
\family default
variables (see description below).
\end_layout
\begin_layout Paragraph
Standard MARS State Inspection Macros
\end_layout
\begin_layout Standard
These are already described in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Predefined-Trivial-Macros"
\end_inset
.
When calling one of them, the call will simply expand to the corresponding
value.
\end_layout
\begin_layout Standard
Example:
\family typewriter
%get-primary{}
\family default
will expand to the hostname of the current designated primary node.
\end_layout
\begin_layout Paragraph
Further MARS State Inspection Macros
\end_layout
\begin_layout Paragraph
Variable Access Macros
\end_layout
\begin_layout Itemize
\family typewriter
%let{
\emph on
varname
\emph default
}{
\emph on
expression
\emph default
}
\family default
Evaluates both
\family typewriter
\emph on
varname
\family default
\emph default
and the
\family typewriter
\emph on
expression
\family default
\emph default
.
The
\family typewriter
\emph on
expression
\family default
\emph default
is then assigned to
\family typewriter
varname
\family default
.
\end_layout
\begin_layout Itemize
\family typewriter
%let{
\emph on
varname
\emph default
}{
\emph on
expression
\emph default
}
\family default
Evaluates both
\family typewriter
\emph on
varname
\family default
\emph default
and the
\family typewriter
\emph on
expression
\family default
\emph default
.
The
\family typewriter
\emph on
expression
\family default
\emph default
is then appended to
\family typewriter
varname
\family default
(concatenation).
\end_layout
\begin_layout Itemize
\family typewriter
%{
\emph on
varname
\emph default
}
\family default
Evaluates
\family typewriter
\emph on
varname
\family default
\emph default
, and outputs the value of the corresponding variable.
When the variable does not exist, the empty string is returned.
\end_layout
\begin_layout Itemize
\family typewriter
%{++}{
\emph on
varname
\emph default
}
\family default
or
\family typewriter
%{
\emph on
varname
\emph default
}{++}
\family default
Has the obvious well-known side effect e.g.
from C or Java.
You may also use
\family typewriter
--
\family default
instead of
\family typewriter
++
\family default
.
This is handy for programming loops (see below).
\end_layout
\begin_layout Itemize
\family typewriter
%dump-vars{}
\family default
Writes all currently defined variables (from the currently active scope)
to
\family typewriter
stderr
\family default
.
This is handy for debugging.
\end_layout
\begin_layout Paragraph
CSV Array Macros
\end_layout
\begin_layout Itemize
\family typewriter
%{
\emph on
varname
\emph default
}{
\emph on
delimiter
\emph default
}{
\emph on
index
\emph default
}
\family default
Evaluates all arguments.
The contents of
\family typewriter
\emph on
varname
\family default
\emph default
is interpreted as a comma-separated list, delimited by
\family typewriter
\emph on
delimiter
\family default
\emph default
.
The
\family typewriter
\emph on
index
\family default
\emph default
'th list element is returned.
\end_layout
\begin_layout Itemize
\family typewriter
%set{
\emph on
varname
\emph default
}{
\emph on
delimiter
\emph default
}{
\emph on
index
\emph default
}{
\emph on
expression
\emph default
}
\family default
Evaluates all arguments.
The contents of the old
\family typewriter
\emph on
varname
\family default
\emph default
is interpreted as a comma-separated list, delimited by
\family typewriter
\emph on
delimiter
\family default
\emph default
.
The
\family typewriter
\emph on
index
\family default
\emph default
'th list element is the assigend to, or substituted by,
\family typewriter
\emph on
expression
\family default
\emph default
.
\end_layout
\begin_layout Paragraph
Arithmetic Expression Macros
\end_layout
\begin_layout Standard
The following macros can also take more than two arguments, carrying out
the corresponding arithmetic operation in sequence (it depends on the operator
whether this accords to the associative law).
\end_layout
\begin_layout Itemize
\family typewriter
%+{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Evaluates the arguments, inteprets them as numbers, and adds them together.
\end_layout
\begin_layout Itemize
\family typewriter
%-{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Subtraction.
\end_layout
\begin_layout Itemize
\family typewriter
%*{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Multiplication.
\end_layout
\begin_layout Itemize
\family typewriter
%/{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Division.
\end_layout
\begin_layout Itemize
\family typewriter
%%{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Modulus.
\end_layout
\begin_layout Itemize
\family typewriter
%&{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Bitwise Binary And.
\end_layout
\begin_layout Itemize
\family typewriter
%|{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Bitwise Binary Or.
\end_layout
\begin_layout Itemize
\family typewriter
%^{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Bitwise Binary Exclusive Or.
\end_layout
\begin_layout Itemize
\family typewriter
%<<{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Binary Shift Left.
\end_layout
\begin_layout Itemize
\family typewriter
%>>{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Binary Shift Right.
\end_layout
\begin_layout Itemize
\family typewriter
%min{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Compute the arithmetic minimum of the arguments.
\end_layout
\begin_layout Itemize
\family typewriter
%max{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Compute the arithmetic maximum of the arguments.
\end_layout
\begin_layout Paragraph
Boolean Condition Macros
\end_layout
\begin_layout Itemize
\family typewriter
%=={
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Numeral Equality.
\end_layout
\begin_layout Itemize
\family typewriter
%!={
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Numeral Inequality.
\end_layout
\begin_layout Itemize
\family typewriter
%<{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Numeral Less Then.
\end_layout
\begin_layout Itemize
\family typewriter
%<={
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Numeral Less or Equal.
\end_layout
\begin_layout Itemize
\family typewriter
%>{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Numeral Greater Then.
\end_layout
\begin_layout Itemize
\family typewriter
%>={
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Numeral Greater or Equal.
\end_layout
\begin_layout Itemize
\family typewriter
%eq{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
\begin_inset space ~
\end_inset
String Equality.
\end_layout
\begin_layout Itemize
\family typewriter
%ne{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
String Inequality.
\end_layout
\begin_layout Itemize
\family typewriter
%lt{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
String Less Then.
\end_layout
\begin_layout Itemize
\family typewriter
%le{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
String Less or Equal.
\end_layout
\begin_layout Itemize
\family typewriter
%gt{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
String Greater Then.
\end_layout
\begin_layout Itemize
\family typewriter
%ge{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
String Greater or Equal.
\end_layout
\begin_layout Itemize
\family typewriter
%=~{
\emph on
string
\emph default
}{
\emph on
regex
\emph default
}{
\emph on
opts
\emph default
}
\family default
or
\family typewriter
%match{
\emph on
string
\emph default
}{
\emph on
regex
\emph default
}{
\emph on
opts
\emph default
}
\family default
Checks whether
\family typewriter
\emph on
string
\family default
\emph default
matches the Perl regular expression
\family typewriter
\emph on
regex
\family default
\emph default
.
Modifiers can be given via
\family typewriter
\emph on
opts
\family default
\emph default
.
\end_layout
\begin_layout Paragraph
Shortcut Evaluation Operators
\end_layout
\begin_layout Standard
The following operators evaluate their arguments only when needed (like
in C).
\end_layout
\begin_layout Itemize
\family typewriter
%&&{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Logical And.
\end_layout
\begin_layout Itemize
\family typewriter
%and{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Alias for
\family typewriter
%&&{}
\family default
.
\end_layout
\begin_layout Itemize
\family typewriter
%||{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Logical Or.
\end_layout
\begin_layout Itemize
\family typewriter
%or{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}
\family default
Alias for
\family typewriter
%||{}
\family default
.
\end_layout
\begin_layout Paragraph
Unary Operators
\end_layout
\begin_layout Itemize
\family typewriter
%!{
\emph on
arg
\emph default
}
\family default
Logical Not.
\end_layout
\begin_layout Itemize
\family typewriter
%not{
\emph on
arg
\emph default
}
\family default
Alias for
\family typewriter
%!{}
\family default
.
\end_layout
\begin_layout Itemize
\family typewriter
%~{
\emph on
arg
\emph default
}
\family default
Bitwise Ńegation.
\end_layout
\begin_layout Paragraph
String Functions
\end_layout
\begin_layout Itemize
\family typewriter
%length{
\emph on
string
\emph default
}
\family default
Return the number of ASCII characters present in
\family typewriter
\emph on
string
\family default
\emph default
.
\end_layout
\begin_layout Itemize
\family typewriter
%toupper{
\emph on
string
\emph default
}
\family default
Return all ASCII characters converted to uppercase.
\end_layout
\begin_layout Itemize
\family typewriter
%tolower{
\emph on
string
\emph default
}
\family default
Return all ASCII characters converted to lowercase.
\end_layout
\begin_layout Itemize
\family typewriter
%append{
\emph on
varname
\emph default
}{
\emph on
string
\emph default
}
\family default
Equivalent to
\family typewriter
%let{
\emph on
varname
\emph default
}{%{
\emph on
varname
\emph default
}
\emph on
string
\emph default
}
\family default
.
\end_layout
\begin_layout Itemize
\family typewriter
%subst{
\emph on
string
\emph default
}{
\emph on
regex
\emph default
}{
\emph on
subst
\emph default
}{
\emph on
opts
\emph default
}
\family default
Perl regex substitution.
\end_layout
\begin_layout Itemize
\family typewriter
%sprintf{
\emph on
fmt
\emph default
}{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}{
\emph on
argn
\emph default
}
\family default
Perl
\family typewriter
sprintf()
\family default
operator.
Details see Perl manual.
\end_layout
\begin_layout Itemize
\family typewriter
%human-number{
\emph on
unit
\emph default
}{
\emph on
delim
\emph default
}{
\emph on
unit-sep
\emph default
}{
\emph on
number
\emph default
1}{
\emph on
number
\emph default
2}
\begin_inset Formula $\ldots$
\end_inset
\family default
Convert a number or a list of numbers into human-readable
\family typewriter
B
\family default
,
\family typewriter
KiB
\family default
,
\family typewriter
MiB
\family default
,
\family typewriter
GiB
\family default
,
\family typewriter
TiB
\family default
, as given by
\family typewriter
\emph on
unit
\family default
\emph default
.
When
\family typewriter
\emph on
unit
\family default
\emph default
is empty, a reasonable unit will be guessed automatically from the maximum
of all given numbers.
A single result string is produced, where multiple numbers are separated
by
\family typewriter
\emph on
delim
\family default
\emph default
when necessary.
When
\family typewriter
\emph on
delim
\family default
\emph default
is empty, the slash symbol
\family typewriter
/
\family default
is used by default (the most obvious use case is result strings like
\family typewriter
\begin_inset Quotes eld
\end_inset
17/32 KiB
\begin_inset Quotes erd
\end_inset
\family default
).
The final unit text is separated from the previous number(s) by
\family typewriter
\emph on
unit-sep
\family default
\emph default
.
When
\family typewriter
\emph on
unit-sep
\family default
\emph default
is empty, a single blank is used by default.
\end_layout
\begin_layout Itemize
\family typewriter
%human-seconds{
\emph on
number
\emph default
}
\family default
Convert the given number of seconds into
\family typewriter
hh:mm:ss
\family default
format.
\end_layout
\begin_layout Paragraph
Complex Helper Macros
\end_layout
\begin_layout Itemize
\family typewriter
%progress{20}
\family default
Return a string containing a progress bar showing the values from
\family typewriter
%summary-vector{}
\family default
.
The default width is 20 characters plus two braces.
\end_layout
\begin_layout Itemize
\family typewriter
%progress{20}{
\emph on
minvalue
\emph default
}{
\emph on
midvalue
\emph default
}{
\emph on
maxvalue
\emph default
}
\family default
Instead of taking the values from
\family typewriter
%summary-vector{}
\family default
, use the supplied values.
\family typewriter
minvalue
\family default
and
\family typewriter
midvalue
\family default
indicate two different intermediate points, while
\family typewriter
maxvalue
\family default
will determine the 100% point.
\end_layout
\begin_layout Paragraph
Control Flow Macros
\end_layout
\begin_layout Itemize
\family typewriter
%if{
\emph on
expression
\emph default
}{
\emph on
then-part
\emph default
}
\family default
or
\family typewriter
%if{
\emph on
expression
\emph default
}{
\emph on
then-part
\emph default
}{
\emph on
else-part
\emph default
}
\family default
Like in any other macro or programming language, this evaluates the
\family typewriter
expression
\family default
once, not copying its outcome to the output.
If the result is non-empty and is not a string denoting the number
\family typewriter
0
\family default
, the
\family typewriter
\emph on
then-part
\family default
\emph default
is evaluated and copied to the output.
Otherwise, the
\family typewriter
else-part
\family default
is evaluated and copied, provided that one exists.
\end_layout
\begin_layout Itemize
\family typewriter
%unless{
\emph on
expression
\emph default
}{
\emph on
then-part
\emph default
}
\family default
or
\family typewriter
%unless{
\emph on
expression
\emph default
}{
\emph on
then-part
\emph default
}{
\emph on
else-part
\emph default
}
\family default
Like
\family typewriter
%if{}
\family default
, but the expression is logically negated.
Essentially, this is a shorthand for
\family typewriter
%if{%not{expression}}{...}
\family default
or similar.
\end_layout
\begin_layout Itemize
\family typewriter
%elsif{
\emph on
expr1
\emph default
}{
\emph on
then1
\emph default
}{
\emph on
expr2
\emph default
}{
\emph on
then2
\emph default
}
\family default
\begin_inset Formula $\ldots$
\end_inset
or
\family typewriter
%elsif{
\emph on
expr1
\emph default
}{
\emph on
then1
\emph default
}{
\emph on
expr2
\emph default
}{
\emph on
then2
\emph default
}
\family default
\begin_inset Formula $\ldots$
\end_inset
\family typewriter
{
\emph on
odd-else-part
\emph default
}
\family default
This is for simplification of boring if-else-if chains.
The classical if-syntax (as shown above) has the drawback that inner if-parts
need to be nested into outer else-parts, so rather deep nestings may occur
when you are programming longer chains.
This is an alternate syntax for avoidance of deep nesting.
When giving an odd number of arguments, the last argument is taken as final
else-part.
\end_layout
\begin_layout Itemize
\family typewriter
%elsunless
\family default
\begin_inset Formula $\ldots$
\end_inset
Like
\family typewriter
%elsif
\family default
, but
\emph on
all
\emph default
conditions are negated.
\end_layout
\begin_layout Itemize
\family typewriter
%while{
\emph on
expression
\emph default
}{
\emph on
body
\emph default
}
\family default
Evaluates the
\family typewriter
\emph on
expression
\family default
\emph default
in a while loop, like in any other macro or programming language.
The
\family typewriter
\emph on
body
\family default
\emph default
is evaluated exactly as many times as the
\family typewriter
\emph on
expression
\family default
\emph default
holds.
Notice that endless loops can be only avoided by a calling a non-pure macro
inspecting external state information, or by creating (and checking) another
side effect somewhere, like assigning to a variable somewhere.
\end_layout
\begin_layout Itemize
\family typewriter
%until{
\emph on
expression
\emph default
}{
\emph on
body
\emph default
}
\family default
Like
\family typewriter
%while{
\emph on
expression
\emph default
}{
\emph on
body
\emph default
}
\family default
, but negate the expression.
\end_layout
\begin_layout Itemize
\family typewriter
%for{
\emph on
exp
\emph default
r1}{
\emph on
exp
\emph default
r2}{
\emph on
exp
\emph default
r3}{
\emph on
body
\emph default
}
\family default
As you will expect from the corresponding C, Perl, Java, or (add your favorite
language) construct.
Only the syntactic sugar is a little bit different.
\end_layout
\begin_layout Itemize
\family typewriter
%foreach{
\emph on
varname
\emph default
}{
\emph on
CSV-delimited-string
\emph default
}{
\emph on
delimiter
\emph default
}{
\emph on
body
\emph default
}
\family default
As you can expect from similar
\family typewriter
foreach
\family default
constructs in other languages like Perl.
Currently, the macro processor has no arrays, but can use comma-separated
strings as a substitute.
\end_layout
\begin_layout Itemize
\family typewriter
%eval{
\emph on
count
\emph default
}{
\emph on
body
\emph default
}
\family default
Evaluates the
\family typewriter
\emph on
body
\family default
\emph default
exactly as many times as indicated by the numeric argument
\family typewriter
\emph on
count
\family default
\emph default
.
This may be used to re-evaluate the output of other macros once again.
\end_layout
\begin_layout Itemize
\family typewriter
%protect{
\emph on
body
\emph default
}
\family default
Equivalent to
\family typewriter
%eval{0}{
\emph on
body
\emph default
}
\family default
, which means that the body is not evaluated at all, but copied to the output
verbatim
\begin_inset Foot
status open
\begin_layout Plain Layout
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
TeX
\end_layout
\end_inset
\begin_inset space ~
\end_inset
or
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
LaTeX
\end_layout
\end_inset
\begin_inset space ~
\end_inset
fans usually know what this is good for ;)
\end_layout
\end_inset
.
\end_layout
\begin_layout Itemize
\family typewriter
%eval-down{
\emph on
body
\emph default
}
\family default
Evaluates the
\family typewriter
\emph on
body
\family default
\emph default
in a loop until the result does not change any more
\begin_inset Foot
status open
\begin_layout Plain Layout
Mathematicians knowing Banach's fixedpoint theorem will know what this is
good for ;)
\end_layout
\end_inset
.
\end_layout
\begin_layout Itemize
\family typewriter
%tmp{
\emph on
body
\emph default
}
\family default
Evaluates the
\family typewriter
\emph on
body
\family default
\emph default
once in a temporary scope which is thrown away afterwards.
\end_layout
\begin_layout Itemize
\family typewriter
%call{
\emph on
macroname
\emph default
}{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}{
\emph on
argn
\emph default
}
\family default
Like in many other macro languages, this evaluates the named macro in the
a new scope.
This means that any side effects produced by the called macro, such as
variable assignments, will be reverted after the call, and therefore not
influence the old scope.
However notice that the arguments
\family typewriter
\emph on
arg1
\family default
\emph default
to
\family typewriter
\emph on
argn
\family default
\emph default
are evaluted in the
\emph on
old
\emph default
scope before the call actually happens (possibly producing side effects
if they contain some), and their result is respectively assigned to
\family typewriter
%{1}
\family default
until
\family typewriter
%{
\emph on
n
\emph default
}
\family default
in the new scope, analogously to the Shell or to Perl.
In addition, the new
\family typewriter
%{0}
\family default
gets the
\family typewriter
\emph on
macroname
\family default
\emph default
.
Notice that the argument evaluation happens non-lazily in the old scope
and therefore differs from other macro processors like
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
TeX
\end_layout
\end_inset
.
\end_layout
\begin_layout Itemize
\family typewriter
%include{
\emph on
macroname
\emph default
}{
\emph on
arg1
\emph default
}{
\emph on
arg2
\emph default
}{
\emph on
argn
\emph default
}
\family default
Like
\family typewriter
%call{}
\family default
, but evaluates the named macro in the
\emph on
current
\emph default
scope (similar to the
\family typewriter
source
\family default
command of the bourne shell).
This means that any side effects produced by the called macro, such as
variable assignments, will
\emph on
not
\emph default
be reverted after the call.
Even the
\family typewriter
%{0}
\family default
until
\family typewriter
%{
\emph on
n
\emph default
}
\family default
variables will continue to exist (and may lead to confusion if you aren't
aware of that).
\end_layout
\begin_layout Itemize
\family typewriter
%callstack{}
\family default
Useful for debugging: show the current chain of macro invocations.
\end_layout
\begin_layout Paragraph
Time Handling Macros
\end_layout
\begin_layout Itemize
\family typewriter
%time{}
\family default
Return the current Lamport timestamp (see
\family typewriter
mars-for-kernel-developers.pdf
\family default
), in units of seconds since the Unix epoch.
\end_layout
\begin_layout Itemize
\family typewriter
%real-time{}
\family default
Return the current system clock timestamp, in units of seconds since the
Unix epoch.
\end_layout
\begin_layout Itemize
\family typewriter
%sleep{
\emph on
seconds
\emph default
}
\family default
Pause the given number of seconds.
\end_layout
\begin_layout Itemize
\family typewriter
%timeout{
\emph on
seconds
\emph default
}
\family default
Like
\family typewriter
%sleep{
\emph on
seconds
\emph default
}
\family default
, but abort the
\family typewriter
marsadm
\family default
command after the total waiting time has exceeded the timeout given by
the
\family typewriter
--timeout=
\family default
parameter.
\end_layout
\begin_layout Paragraph
Misc Macros
\end_layout
\begin_layout Itemize
\family typewriter
%warn{
\emph on
text
\emph default
}
\family default
Show a WARNING:
\end_layout
\begin_layout Itemize
\family typewriter
%die{
\emph on
text
\emph default
}
\family default
Abort execution with an error message.
\end_layout
\begin_layout Paragraph
Experts Only - Risky
\end_layout
\begin_layout Standard
The following macros are unstable and may change at any time without notice.
\end_layout
\begin_layout Itemize
\family typewriter
%get-msg{
\emph on
name
\emph default
}
\family default
Low-level access to system messages.
You should not use this, since this is not extensible (you must know the
name in advance).
\end_layout
\begin_layout Itemize
\family typewriter
%readlink{
\emph on
path
\emph default
}
\family default
Low-level access to symlinks.
Don't misuse this for circumvention of the abstraction macros from the
symlink tree!
\end_layout
\begin_layout Itemize
\family typewriter
%setlink{
\emph on
value
\emph default
}{
\emph on
path
\emph default
}
\family default
Low-level creation of symlinks.
Don't misuse this for circumvention of the abstraction macros for the symlink
tree!
\end_layout
\begin_layout Itemize
\family typewriter
%fetch-info{}
\family default
etc.
Low-level access to internal symlink formats.
Don't use this in scripts! Only for curious humans.
\end_layout
\begin_layout Itemize
\family typewriter
%is-almost-consistent{}
\family default
Whatever you guess what this could mean, don't use it, at least never in
place of
\family typewriter
%is-consistent{}
\family default
- it is risky to base decisions on this.
Mostly for historical reasons.
\end_layout
\begin_layout Itemize
\family typewriter
%does{
\emph on
name
\emph default
}
\family default
Equivalent to
\family typewriter
%is-
\emph on
name
\emph default
{}
\family default
(just more handy for computing the macro name).
Use with care!
\end_layout
\begin_layout Subsection
Predefined Variables
\begin_inset CommandInset label
LatexCommand label
name "par:Predefined-Variables"
\end_inset
\end_layout
\begin_layout Itemize
\family typewriter
%{cmd}
\family default
The command argument of the invoked
\family typewriter
marsadm
\family default
command.
\end_layout
\begin_layout Itemize
\family typewriter
%{res}
\family default
The resource name given to the
\family typewriter
marsadm
\family default
command as a command line parameter (or, possibly expanded from
\family typewriter
all
\family default
).
\end_layout
\begin_layout Itemize
\family typewriter
%{resdir}
\family default
The corresponding resource directory.
The current version of MARS uses
\family typewriter
/mars/resource-%{res}/
\family default
, but this may change in future.
Normally, you should not need this, since anything should be already abstracted
for you.
In case you
\emph on
really
\emph default
need low-level access to something, please prefer this variable over
\family typewriter
%{mars}/resource-%{res}
\family default
because it is a bit more abstracted.
\end_layout
\begin_layout Itemize
\family typewriter
%{mars}
\family default
Currently the fixed string
\family typewriter
/mars
\family default
.
This may change in future, probably with the advent of MARS Full.
\end_layout
\begin_layout Itemize
\family typewriter
%{host}
\family default
The hostname of the local node.
\end_layout
\begin_layout Itemize
\family typewriter
%{ip}
\family default
The IP address of the local node.
\end_layout
\begin_layout Itemize
\family typewriter
%{timeout}
\family default
The value given by the
\family typewriter
--timeout=
\family default
option, or the corresonding default value.
\end_layout
\begin_layout Itemize
\family typewriter
%{threshold}
\family default
The value given by the
\family typewriter
--threshold=
\family default
option, or the corresonding default value.
\end_layout
\begin_layout Itemize
\family typewriter
%{window}
\family default
The value given by the
\family typewriter
--window=
\family default
option, or the corresonding default value (60s).
\end_layout
\begin_layout Itemize
\family typewriter
%{force}
\family default
The number of times the
\family typewriter
--force
\family default
option has been given.
\end_layout
\begin_layout Itemize
\family typewriter
%{dry-run}
\family default
The number of times the
\family typewriter
--dry-run
\family default
option has been given.
\end_layout
\begin_layout Itemize
\family typewriter
%{verbose}
\family default
The number of times the
\family typewriter
--verbose
\family default
option has been given.
\end_layout
\begin_layout Itemize
\family typewriter
%{callstack}
\family default
Same as the
\family typewriter
%callstack{}
\family default
macro.
The latter gives you an opportunity for overriding, while the former is
firmly built in.
\end_layout
\begin_layout Section
Scripting Advice
\begin_inset CommandInset label
LatexCommand label
name "sec:Scripting-HOWTO"
\end_inset
\end_layout
\begin_layout Standard
Both the
\series bold
asynchronous communication model
\series default
of MARS including the Lamport clock, and the
\series bold
state model
\series default
(cf section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:The-State-of"
\end_inset
) is something you
\emph on
definitely
\emph default
should have in mind when you want to do some scripting.
Here is some advice:
\end_layout
\begin_layout Itemize
Don't access anything on
\family typewriter
/mars/
\family default
directly, except for debugging purposes.
Use
\family typewriter
marsadm
\family default
.
\end_layout
\begin_layout Itemize
Avoid running scripts in parallel, other than for inspection / monitoring
purposes.
When you give two
\family typewriter
marsadm
\family default
commands in parallel (whether on the same host, or on different hosts belonging
to the same cluster), it is possible to produce a mess.
\family typewriter
marsadm
\family default
has no internal locking.
There is no cluster-wide locking at all, because if would cause trouble
during long-distance network outages.
Unfortunately, some systems like Pacemaker are violating this in many cases
(depending on their configuration).
Best is if you have a dedicated / more or less centralized
\series bold
control machine
\series default
which controls masses of your georedundant working servers.
This reduces the risk of running interfering actions in parallel.
Of course, you need backup machines for your control machines, and in different
locations.
Not obeying this advice can easily lead to problems such as complex races
which are very difficult to solve in long-distance distributed systems,
even in general (not limited to MARS).
\end_layout
\begin_layout Itemize
\family typewriter
marsadm wait-cluster
\family default
is your friend.
Whenever your (near-)central script has to switch between different hosts
\family typewriter
A
\family default
and
\family typewriter
B
\family default
(of the same cluster), use it in the following way:
\begin_inset Newline newline
\end_inset
\family typewriter
ssh A
\begin_inset Quotes eld
\end_inset
marsadm action1
\begin_inset Quotes erd
\end_inset
; ssh B
\begin_inset Quotes eld
\end_inset
marsadm wait-cluster; marsadm action2
\begin_inset Quotes erd
\end_inset
\begin_inset Newline newline
\end_inset
\family default
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Don't ignore this advice! Interference is almost
\emph on
sure
\emph default
! As a rule of thumb, precede almost any action command with some appropriate
waiting command!
\end_layout
\begin_layout Itemize
Further friends are any
\family typewriter
marsadm wait-*
\family default
commands, such as
\family typewriter
wait-umount
\family default
.
\end_layout
\begin_layout Itemize
In some places, busy-wait loops might be needed, e.g.
for waiting until a specific resource is
\family typewriter
UpToDate
\family default
or matches some other condition.
Examples of waiting conditions can be found under
\family typewriter
github.com/schoebel/test-suite
\family default
in subdirectory
\family typewriter
mars/modules/
\family default
, specifically
\family typewriter
02_predicates.sh
\family default
or similar.
\end_layout
\begin_layout Itemize
In case of network problems, some command may hang (forever), if you don't
set the
\family typewriter
--timeout=
\family default
option.
Don't forget the check the return state of any failed / timeouted commands,
and to take appropriate measures!
\end_layout
\begin_layout Itemize
Test your scripts in failure scenarios!
\end_layout
\begin_layout Chapter
\start_of_appendix
FAQ
\begin_inset CommandInset label
LatexCommand label
name "chap:FAQ"
\end_inset
\end_layout
\begin_layout Standard
Following answers are from Thomas Schöbel-Theuer, the inventor of the MARS
components and the responsible maintainer of the out-of-tree OpenSource
project under GPL.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
Q: Why are the units of
\family typewriter
marsdm view-rest-space
\family default
or
\family typewriter
marsdm view-total-space
\family default
in GiB?
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
A: This is for your protection.
Contemporary servers have RAM up to TiB, not only GiB.
In worst case, e.g.
certain types of userspace bugs / attacks / intrusions, large parts of
this RAM can be filled via the
\emph on
page cache of the kernel
\emph default
by (masses of) wild-running user processes
\emph on
like hell
\emph default
, e.g.
\begin_inset space ~
\end_inset
GiB/ms.
Exceptional RAM usage / rates can trigger the
\series bold
OOM killer
\series default
, which in turn may
\series bold
\emph on
randomly
\emph default
kill
\series default
almost anything,
\series bold
including daemons
\series default
\begin_inset Foot
status open
\begin_layout Plain Layout
Exceptional fill rates are dangerous by itself.
Neither the kernel nor MARS can
\emph on
reliably
\emph default
prevent such
\begin_inset Quotes eld
\end_inset
use cases
\begin_inset Quotes erd
\end_inset
.
We altogether can only
\emph on
try
\emph default
to
\emph on
deal with it
\emph default
and to protect us
\emph on
as best as possible
\emph default
under certain conditions.
Detailed high-frequency monitoring would be difficult in practice.
Via units of GiB, I try to
\emph on
hint
\emph default
you on this large problem field.
\end_layout
\end_inset
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
Q: Why isn't
\family typewriter
marsadm
\family default
a daemon, but follows the process paradigm from UNIX?
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
A: Same story: reasonable protection against whoever kills processes for
whatever reasons.
Daemons can
\series bold
loose their runtime state
\series default
, and this may happen even in
\emph on
critical sections
\emph default
.
Thus your
\series bold
(distributed) system(s) may get (widely) stuck
\series default
.
More explanations are in section
\begin_inset CommandInset ref
LatexCommand nameref
reference "subsec:Why-systemd?"
plural "false"
caps "false"
noprefix "false"
\end_inset
\begin_inset CommandInset ref
LatexCommand vpageref
reference "subsec:Why-systemd?"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
This can become
\emph on
evil
\emph default
when it happens just during an operational incident, requiring a (mass)
failover, and just when you
\emph on
desperately
\emph default
want to
\emph on
rely
\emph default
on MARS (see also the CAP theorem).
In contrast,
\family typewriter
marsadm
\family default
(as a component) is
\series bold
stateless
\begin_inset Foot
status open
\begin_layout Plain Layout
\family typewriter
marsadm
\family default
does not
\emph on
functionally
\emph default
depend on network traffic, at least for non-network operations.
The
\emph on
kernel(!) and its GPLed code
\emph default
will
\emph on
automatically
\emph default
cleanup most remains upon process kill.
\series bold
Repeatability
\series default
: afterwards, the next
\family typewriter
marsadm
\family default
invocation should not depend on former (OOM-like) problems.
\end_layout
\end_inset
\series default
\emph on
between
\emph default
invocations.
Thus your system(s) can
\series bold
recover more easily
\series default
.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
Q: Can I create a fork of MARS?
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
A: Yes, given that you
\series bold
conform to the license
\series default
.
Please read the GPL, and follow it.
This is not only about kernel code.
\family typewriter
marsadm
\family default
will remain under GPL.
I have
\emph on
created
\emph default
it under European personal rights, and even during my precious spare time.
Personally, I will
\emph on
not
\emph default
publish anything which is
\emph on
not
\emph default
under an OSI and/or OIN-compliant license.
\begin_inset Newline newline
\end_inset
In addition, it is
\emph on
wise
\emph default
to obey the customs of the OpenSource
\series bold
community
\series default
.
I
\series bold
firmly recommend
\series default
to take the time to read
\family sans
\series bold
Homesteading the Noosphere
\family default
\series default
(a ground-breaking essay from Eric Raymond, see original web document at
\begin_inset Flex URL
status open
\begin_layout Plain Layout
http://catb.org/~esr/writings/homesteading/homesteading/
\end_layout
\end_inset
), and to think about its consequences.
Just stating the obvious, do not break important basics from there.
Finally, keep in mind that it is mandatory to follow the written and unwritten
rules from the Linux kernel community.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
Q: Will MARS become part of the official Linux kernel as published at
\begin_inset Flex URL
status open
\begin_layout Plain Layout
www.kernel.org
\end_layout
\end_inset
?
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
A: Hopefully.
The decision is up to Linus Torvalds and the kernel community.
If possible, I will try to do my best, in order to get it there
\begin_inset Foot
status open
\begin_layout Plain Layout
Hopefully, the
\emph on
out-of-tree
\emph default
kernel part of MARS will no longer be needed by anyone in the long term.
Any (professional) support for the MARS kernel module, and also for
\family typewriter
marsadm
\family default
, should hopefully migrate to the official Linux kernel and/or to the OpenSource
community of all interested Linux distros, in a reasonable timeframe.
\end_layout
\end_inset
.
After acceptance, I am willing to support it further as a member of the
community, up to my death, under my personal constraints after my retirement.
I am also planning to continuously support the community, and to consent
to passing over the baton to somebody
\emph on
from the Linux kernel community
\emph default
.
My current problem is lack of time.
I estimate that I will need more than 70% of my precious working hours
for getting it into the kernel.
Please help me.
Please talk
\emph on
directly
\emph default
with me about perspectives.
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
Q: What is the
\series bold
business value
\series default
of any
\family typewriter
OpenSource
\family default
for my company?
\end_layout
\begin_layout Labeling
\labelwidthstring 00.00.0000
A: Short story for managers / controllers / consultants: talk with
\series bold
\size large
experts from the Linux Foundation
\series default
\size default
.
\begin_inset Newline newline
\end_inset
Some recommended details top-down via checklist:
\end_layout
\begin_deeper
\begin_layout Enumerate
Consider
\begin_inset Flex URL
status open
\begin_layout Plain Layout
http://catb.org/~esr/writings/homesteading/homesteading/
\end_layout
\end_inset
a
\emph on
successful
\emph default
management strategy for
\emph on
creation
\emph default
of
\emph on
globally shared commons
\emph default
value
\series bold
\begin_inset Foot
status open
\begin_layout Plain Layout
Recommendation: do not follow a common misbelief that something would not
deliver any value because it is
\emph on
for free
\emph default
.
Also, do not mix up English meanings of
\begin_inset Quotes eld
\end_inset
free
\begin_inset Quotes erd
\end_inset
.
When unsure, please consult the well-known publications from Richard Stallman,
who explained the fundamentals.
\end_layout
\end_inset
\series default
.
\end_layout
\begin_layout Enumerate
Understand the fundamental differences between commons
\emph on
cultures
\emph default
and company
\emph on
cultures
\emph default
, and their relationships to management
\emph on
cultures
\emph default
.
\end_layout
\begin_layout Enumerate
Map typical
\emph on
usage patterns
\emph default
of
\family typewriter
OpenSource
\family default
down to your company, like follows.
Cross-compare your
\series bold
savings
\series default
(if you would need to
\emph on
develop
\emph default
and to
\emph on
maintain
\emph default
the software
\emph on
fully yourself
\emph default
, and/or to
\emph on
buy
\emph default
and
\emph on
integrate
\emph default
and operate comparable products on non-
\family typewriter
OpenSource
\family default
markets), and compute the corresponding
\series bold
earnings
\begin_inset Foot
status open
\begin_layout Plain Layout
Optionally, further effects like
\series bold
scaling effects
\series default
may be also relevant.
\end_layout
\end_inset
\series default
via best-practice management methods.
\end_layout
\begin_layout Enumerate
Finally, take the
\series bold
future
\series default
of business value alternatives, spread over the
\series bold
actual lifetime
\series default
, into account.
\end_layout
\begin_layout Enumerate
Ultimately, take the long-term
\series bold
ecosystem effects
\series default
of
\emph on
all
\emph default
your downloaded and/or contributed
\family typewriter
OpenSource
\family default
into account, without overlooking so-called
\emph on
hidden champions
\emph default
.
\end_layout
\end_deeper
\begin_layout Labeling
\labelwidthstring 00.00.0000
\begin_inset space ~
\end_inset
Obviously, delegate OpenSource (strategy) only to persons who have
\emph on
proven
\begin_inset Foot
status open
\begin_layout Plain Layout
Recommendations: do not forget to take the
\emph on
actual
\emph default
OpenSource
\series bold
affinity
\series default
of people into account, in which
\series bold
culture
\series default
they have
\series bold
grown up
\series default
.
Just believing some personal claims is not enough.
Check for any people who
\emph on
grew up during their youth
\emph default
in a non-affine culture, and do not trust a counter-culture where fighting
\emph on
against
\emph default
OpenSource is or was a fashion.
Beware of (hidden)
\series bold
\emph on
clash of cultures
\series default
\emph default
.
Check for contradictions.
Guard your company against hidden agendas and against
\emph on
fakes
\emph default
.
Valuable OpenSource is
\emph on
not
\emph default
created by management affinity, but
\emph on
only
\emph default
by
\emph on
certain hand-selected
\emph default
\series bold
individuals
\series default
.
Carefully select the
\emph on
right
\emph default
individual(s) for your company.
Do not forget to ask for
\series bold
personal references
\series default
, best on
\emph on
actual individual creations
\emph default
, and
\emph on
check
\emph default
them.
\end_layout
\end_inset
\emph default
that they
\emph on
actually master
\emph default
the OpenSource playgrounds according to its intrinsic rules.
Do not put the fox in charge of the henhouse
\begin_inset Foot
status open
\begin_layout Plain Layout
Similar saying: do not trust the cat to keep the cream.
\end_layout
\end_inset
.
\end_layout
\begin_layout Standard
This FAQ will be continued / updated only when necessary, and according
to my time constraints.
\end_layout
\begin_layout Chapter
Technical Data MARS
\begin_inset CommandInset label
LatexCommand label
name "chap:Technical-Data-MARS"
\end_inset
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Do not use MARS inside of VMs.
Only use at bare metal!
\end_layout
\begin_layout Standard
MARS has some built-in limitations which should be overcome
\begin_inset Foot
status open
\begin_layout Plain Layout
Some internal algorithms are quadratic.
The reason is that MARS evolved from a lab prototype which wasn't originally
intended for enterprise grade usage, but should have been succeeded by
the fully instance-oriented MARS Full much earlier.
\end_layout
\end_inset
by future MARS versions.
Please don't exceed the following limits:
\end_layout
\begin_layout Itemize
maximum 10 nodes per cluster
\end_layout
\begin_layout Itemize
maximum 30 resources per cluster
\end_layout
\begin_layout Itemize
maximum 100 logfiles per resource
\end_layout
\begin_layout Chapter
HISTORIC Guide for Midnight Problem Solving
\begin_inset CommandInset label
LatexCommand label
name "chap:Handout-for-Midnight"
\end_inset
\end_layout
\begin_layout Standard
Here is a
\emph on
generic
\emph default
\emph on
guide
\emph default
(
\series bold
not to be treated as instructions
\series default
) for the
\emph on
generic
\emph default
\family typewriter
marsadm
\family default
and command\SpecialChar softhyphen
line level.
Do not forget the terms and conditions from the GPL.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
This is
\series bold
\emph on
not
\emph default
an operational documentation
\series default
.
There are too many other application-dependent components in a real production
system.
Any other levels / layers (e.g.
different types of cluster managers, PaceMaker, control scripts /
\family typewriter
rc
\family default
scripts /
\family typewriter
upstart
\family default
or
\family typewriter
systemd
\family default
scripts, etc)
\emph on
need
\emph default
to be described elsewhere.
Midnight problem solving means to engage sysadmins familiar with (1)
\emph on
all
\emph default
of these components, and (2) with any
\emph on
potential interferences
\emph default
between them.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Aristoteles taught us that a system is more than the sum of its components.
You need your own
\emph on
maintained
\emph default
handout for problem solving at
\emph on
full-system
\emph default
level.
\end_layout
\begin_layout Section
Inspecting the State of MARS
\end_layout
\begin_layout Standard
For manual inspection, please prefer the new
\family typewriter
marsadm view all
\family default
over the old
\family typewriter
marsadm view-1and1 all
\family default
.
It shows more appropriate / detailed information.
\end_layout
\begin_layout Quotation
\family typewriter
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
# watch marsadm view all
\end_layout
\end_inset
\end_layout
\begin_layout Standard
Checking the low-level network connections at runtime:
\end_layout
\begin_layout Quotation
\family typewriter
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
# watch "netstat --tcp | grep 777"
\end_layout
\end_inset
\end_layout
\begin_layout Standard
Meaning of the port numbers (current
\emph on
default
\emph default
as configured into the kernel module, may change in future):
\end_layout
\begin_layout Itemize
7776 = prosumer device traffic (realtime requirements, only at new MARS
versions)
\end_layout
\begin_layout Itemize
7777 = metadata / symlink propagation (low traffic)
\end_layout
\begin_layout Itemize
7778 = transfer of transaction logfiles (load dependent)
\end_layout
\begin_layout Itemize
7779 = transfer of fast-fullsync traffic (only when fast-fullsync is running)
\end_layout
\begin_layout Standard
7777 must be always active on a healthy cluster.
All others will appear only on demand, when resources are configured accordingl
y and/or when some data is transferred.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Hint: when one of the columns Send-Q or Recv-Q are constantly at high values,
you might have a network bottleneck.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
When unsure or desperate: check that at least the
\emph on
server-part
\emph default
sockets 7777 to 7779 are
\emph on
always
\emph default
present after modprobe mars and in state LISTEN, e.g.
via
\family typewriter
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
# netstat -lp --tcp | grep 777
\end_layout
\end_inset
\end_layout
\begin_layout Standard
Hint: I have seen strange incidents where somebody else had
\emph on
occupied
\emph default
some of these server sockets via some bugs in some userspace scripts.
There might be other network-level problems, e.g.
network hardware has firmware bugs, or when network devices are misconfigured,
or when some strange firewalling rules are kicking in, etc.
Or even
\emph on
trivial
\emph default
problems, like electrical problems, faulty cables or contacts, bad temperatures
, humidity, etc.
\end_layout
\begin_layout Section
Replication is unexpectedly Stuck
\end_layout
\begin_layout Standard
Indications for a stuck:
\end_layout
\begin_layout Itemize
\family typewriter
marsadm view all
\family default
displays some human-readable
\emph on
warnings
\emph default
containing the keywords
\family typewriter
age
\family default
or
\family typewriter
hint
\family default
and some hours:minutes:seconds numbers.
\end_layout
\begin_layout Itemize
Other warnings containing the keyword error and some errno code / text (see
\family typewriter
man errno
\family default
but notice that the Linux kernel uses negative numbers in place of positives).
You need to read and understand the meaning of these
\family typewriter
errno
\family default
numbers in the context of you Linux version and
\family typewriter
mars.ko
\family default
.
\end_layout
\begin_layout Itemize
One of the flags shown by
\family typewriter
marsadm view all
\family default
or
\family typewriter
marsadm view-flags all
\family default
contain a symbol
\family typewriter
"-"
\family default
(dash).
This means that some switch is currently switched off (deliberately).
Please check whether there is a valid reason why somebody else switched
it off.
If the switch-off is just by accident, use the following command to fix
the stuck:
\family typewriter
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
# marsadm up all
\end_layout
\end_inset
\family default
(or replace
\family typewriter
all
\family default
by a particular resource name if you want to start only a specific one).
\begin_inset Newline newline
\end_inset
Note:
\family typewriter
up
\family default
is equivalent to the sequence
\family typewriter
attach; resume-fetch; resume-replay; resume-sync
\family default
.
Instead of switching each individual knob, use
\family typewriter
up
\family default
as a shortcut for switching on anything which is currently off.
\end_layout
\begin_layout Itemize
\family typewriter
netstat --tcp | grep 777
\family default
does not show anything.
Please check the following:
\begin_inset Separator latexpar
\end_inset
\end_layout
\begin_deeper
\begin_layout Itemize
Is the kernel module loaded? Check
\family typewriter
lsmod | grep mars
\family default
.
When necessary, run
\family typewriter
modprobe mars
\family default
.
\end_layout
\begin_layout Itemize
Is the network interface down? Check
\family typewriter
ifconfig
\family default
, and/or
\family typewriter
ethtool
\family default
and friends, and fix it when necessary.
Use
\family typewriter
journalctl -k
\family default
to detect any potential kernel messages, such as network driver problems.
\end_layout
\begin_layout Itemize
Is a
\family typewriter
ping
\family default
possible? If not, fix the network / routing / firewall / etc.
When fixed, the MARS connections should automatically appear after about
1 minute.
\end_layout
\begin_layout Itemize
When
\family typewriter
ping
\family default
is possible, but a MARS connection to port 7777 does not appear after a
few minutes, try to connect to remote port 7777 by hand via
\family typewriter
telnet
\family default
.
But don't type anything, just abort the connection immediately when it
works! Typing anything will almost certainly throw a harsh error message
at the other server, which could unnecessarily alert other people.
\end_layout
\end_deeper
\begin_layout Itemize
Check whether
\family typewriter
marsadm view all
\family default
shows some progress bars somewhere.
Example:
\family typewriter
\size scriptsize
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
istore-test-bap1:~# marsadm view all
\end_layout
\begin_layout Plain Layout
--------- resource lv-0
\end_layout
\begin_layout Plain Layout
lv-0 OutDated[F] PausedReplay dCAS-R Secondary istore-test-bs1
\end_layout
\begin_layout Plain Layout
replaying: [>...................] 1.21% (12/1020)MiB logs: [2..3]
\end_layout
\begin_layout Plain Layout
> fetch: 1008.198 MiB rate: 0 B/sec remaining: --:--:-- hrs
\end_layout
\begin_layout Plain Layout
> replay: 0 B rate: 0 B/sec remaining: 00:00:00 hrs
\end_layout
\end_inset
\family default
\size default
At least one of the
\family typewriter
rate:
\family default
values should be greater than 0.
When none of the
\family typewriter
rate:
\family default
values indicate any progress for a longer time, try
\family typewriter
marsadm up all
\family default
again.
If it doesn't help, check and repair the network.
If even this does not help, check the hardware for any IO hangups, or kernel
hangups via
\family typewriter
journalctl
\family default
and sisters.
Check the RAID controllers.
Often (but not certainly), a stuck kernel can be recognized when many processes
are
\emph on
permanently
\emph default
in state "D", for a long time:
\family typewriter
ps ax | grep " D" | grep -v grep
\family default
or similar.
Please check whether there is just an overload, or
\emph on
really
\emph default
a true kernel problem.
Discrimination is not easy, and requires experience (as with any other
system; not limited to MARS).
A truly stuck kernel can only be resurrected by rebooting.
The same holds for many hardware problems.
\end_layout
\begin_layout Itemize
Check whether
\family typewriter
marsadm view all
\family default
reports any lines like
\family typewriter
WARNING: SPLIT BRAIN at '' detected
\family default
.
In such a case, check that there is
\emph on
really
\emph default
a split brain, before obeying the instructions in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Resolution-of-Split"
\end_inset
.
Notice that network outages or missing
\family typewriter
marsadm cron
\family default
may continue to report an old split brain which has gone in the meantime.
\end_layout
\begin_layout Itemize
Check whether
\family typewriter
/mars/
\family default
is too full.
For a rough impression,
\family typewriter
df /mars/
\family default
may be used.
For getting authoritative values as internally used by the MARS emergency-mode
computations, use
\family typewriter
marsadm view-rest-space
\family default
(the unit is GiB).
In practice, the differences are only marginal, at least on bigger
\family typewriter
/mars/
\family default
partitions.
When there is only few rest space (or none at all), please obey the instruction
s in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Resolution-of-Emergency"
\end_inset
.
\end_layout
\begin_layout Itemize
Check
\family typewriter
journalctl -k
\family default
specifically for any kernel-level problems.
\end_layout
\begin_layout Section
Standard Resolution of Emergency Mode and Split Brain
\begin_inset CommandInset label
LatexCommand label
name "sec:Resolution-of-Emergency"
\end_inset
\end_layout
\begin_layout Standard
Emergency mode occurs when
\family typewriter
/mars/
\family default
runs out of space, such that no new logfile data can be written anymore.
\end_layout
\begin_layout Standard
In emergency mode, the primary will write any write requests
\emph on
directly
\emph default
to the underlying disk, as if MARS were not present at all.
Thus, your application will continue to run.
Only the
\emph on
replication
\emph default
as such is stopped.
\end_layout
\begin_layout Standard
\begin_inset Note Greyedout
status open
\begin_layout Plain Layout
Notice: emergency mode means that your secondary nodes are usually in a
\emph on
consistent
\emph default
, but
\emph on
outdated
\emph default
state (exception: when a sync was running in parallel to the emergency
mode, then the sync will be automatically started over again).
You can check consistency via
\family typewriter
marsadm view-flags all
\family default
.
Only when a local disk shows a lower-case letter
\family typewriter
"d"
\family default
instead of an uppercase
\family typewriter
"D"
\family default
, it is known to be inconsistent (e.g.
during a sync).
When there is a dash instead, it usually means that the disk is detatched
or misconfigured or the kernel module is not started.
Please fix these problems first before believing that your local disk is
unusable.
Even if it is really inconsistent (which is very unlikely, typically occurring
only as a consequence of hardware failures, or of the above-mentioned exception
), you have a big chance to recover most of the data via
\family typewriter
fsck
\family default
and friends.
\end_layout
\end_inset
\end_layout
\begin_layout Standard
A currently existing emergency mode can be detected by
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
primary:~# marsadm view-is-emergency all
\end_layout
\begin_layout Plain Layout
secondary:~# marsadm view-is-emergency all
\end_layout
\end_inset
Notice: this delivers the current state, telling nothing about the past.
\end_layout
\begin_layout Standard
Emergency mode
\emph on
may
\emph default
also show something like
\family typewriter
WARNING: SPLIT BRAIN at '' detected
\family default
because both problems may sometimes appear in combination.
Anyway, the standard resolution process is equal.
\end_layout
\begin_layout Standard
Preconditions:
\end_layout
\begin_layout Itemize
The network
\series bold
must
\series default
be working.
Check that the following gives an entry for each secondary:
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
primary:~# netstat --tcp | grep 7777
\end_layout
\end_inset
When necessary, fix the network first (see instructions above).
\end_layout
\begin_layout Itemize
The hardware must be healthy, and any RAID subsystems
\emph on
should not
\emph default
be in any degraded state
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
It is your
\emph on
operational decision
\emph default
whether to prefer relatively fast RAID rebuild after handover of any primary
to some secondary and/or pausing some secondary-side IO for some time,
or whether you drastically increase the TTR = Time To Repair by loading
your RAID
\emph on
unnecessarily
\emph default
.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
MARS is constructed for working
\begin_inset Quotes eld
\end_inset
almost as best as possible
\begin_inset Quotes erd
\end_inset
even on slow IO systems and over slow networks, but
\emph on
do not expect miracles
\emph default
.
The laws of physics are stronger than any human expectations!
\end_layout
\begin_layout Standard
Emergency mode should now be resolved, e.g.
by checking
\family typewriter
marsadm view all
\family default
, and/or via commands like
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
primary:~# marsadm view-is-emergency all
\end_layout
\begin_layout Plain Layout
primary:~# du -s /mars/resource-* | sort -n
\end_layout
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Remember the affected resource names and their
\emph on
logfile storage s
\emph default
ize.
Do
\emph on
not
\emph default
invalidate on
\emph on
any
\emph default
non-SPLIT_BRAIN or non-Emergency resources.
Do
\emph on
not
\emph default
invalidate at the target where you
\series bold
might need to failover
\series default
somewhen in the next time! It is your
\emph on
responsible operational decision
\emph default
which resource on which secondary host you want to repair via
\family typewriter
invalidate
\family default
at a certain point in time!
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Be aware of the
\emph on
officially documented fact
\emph default
that
\family typewriter
marsadm invalidate
\family default
(similarly to
\family typewriter
drbdadm invalidate
\family default
) will make your secondary replica
\family typewriter
Inconsistent
\family default
until the following fast-fullsync has successfully finished!
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Depending on operational strategies for certain use cases and/or hardware
defects and/or load situations etc, it
\emph on
might
\emph default
be better to wait some (relatively short) time to start
\family typewriter
marsadm invalidate
\family default
\emph on
later
\emph default
.
\end_layout
\begin_layout Standard
Once you have decided to use
\family typewriter
invalidate
\family default
on certain resources, best practice is to start with the
\emph on
biggest
\emph default
resource as shown by
\family typewriter
du -s /mars/resource-* | sort -n
\family default
in reverse order:
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
secondary1:~# marsadm invalidate
\end_layout
\begin_layout Plain Layout
secondary1:~# marsadm view
\end_layout
\begin_layout Plain Layout
primary:~# marsadm cron
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Typical non-overloaded servers allow you to invalidate about 3 to 5 (or
\emph on
sometimes(!)
\emph default
even tens of) resources in parallel, but highly overloaded machines may
require
\family typewriter
marsadm pause-sync $some_resource
\family default
for load reduction.
When more resources are affected by SPLIT BRAIN, regularly check whether
\family typewriter
df /mars/
\family default
shows enough space to wait some time until you need to invalidate more
resources according to
\family typewriter
du -s /mars/resource-* | sort -n
\family default
.
\end_layout
\begin_layout Standard
Hint: during the resolution process, some other resources might have gone
into emergency mode concurrently.
In addition, it is possible that some secondaries are stuck at particular
resources while the corresponding primary has
\emph on
not yet
\emph default
entered emergency mode.
Please repeat the steps in such a case, and look for any emergency modes
at secondaries additionally.
When necessary, extend your list of
\emph on
affected
\emph default
resources and/or secondary hosts.
\end_layout
\begin_layout Standard
Hint: be patient.
Deleting large bulks of logfile data may take a long time, at least on
highly loaded systems.
You should give the cleanup processes at least 5 minutes before concluding
that
\family typewriter
marsadm invalidate
\family default
followed by primary-side
\family typewriter
marsadm cron
\family default
had no effect! When unsure, use
\family typewriter
marsadm cron
\family default
at
\emph on
all
\emph default
cluster nodes, even when seemingly unaffected.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Notice: neither a secondary-side
\family typewriter
marsadm invalidate
\family default
can be noticed by the current primary side, nor
\family typewriter
marsadm cron
\family default
can work
\emph on
fully
\emph default
when the metadata update over port 7777 is extremely slow, or when it does
not work for whatever reason.
Check your replication speed!
\end_layout
\begin_layout Standard
In very complex scenarios, when the primary roles of different resources
are spread over diffent hosts (aka mixed operation), you may need to repeat
the whole cycle iteratively for a few cycles until the complex jam is fully
resolved in the full Distributed System.
\end_layout
\begin_layout Standard
If it does not disappear fully, you have another chance by the following
split-brain and emergency-mode resolution process:
\end_layout
\begin_layout Section
Alternative Resolution of Split Brain / Emergency Mode / Defective Hardware
\begin_inset CommandInset label
LatexCommand label
name "sec:Resolution-of-Split"
\end_inset
\end_layout
\begin_layout Standard
Hint: in most cases, the resolution of emergency mode and/or split brain
via
\family typewriter
marsadm invalidate
\family default
(plus some additional
\family typewriter
marsadm cron
\family default
) should resolve practically almost everything, at least when done in the
right order and on the right hosts / their resources.
However, it cannot always work miracles on certain types of
\series bold
defective hardware
\series default
.
\end_layout
\begin_layout Standard
Here is a more capable but more complex alternative, typically useful in
\series bold
complex failure scenarios
\series default
, e.g.
after
\series bold
cascading disasters
\series default
& co and after the hardware + software + network had been
\series bold
repaired
\series default
successfully.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
The following can only work when the
\emph on
original content
\emph default
of
\family typewriter
/mars/
\family default
has survived your incident.
Otherwise, you may need a
\emph on
variant
\emph default
of this method as explained later, and probably you should not do this
at midnight.
Read this
\emph on
completely
\emph default
and understand it, before starting any action!
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
Never run MARS inside of VMs, see
\family typewriter
architecture-guide-geo-redundancy.pdf
\family default
.
If you do so anyway, or if you place MARS
\emph on
on top of
\emph default
some LV snapshot(s) or similar, you are running a
\series bold
high risk
\series default
: any restore of an
\emph on
old snapshot
\emph default
affecting the content of
\family typewriter
/mars/
\family default
and/or of some underly resource disk /
\emph on
underlying
\emph default
LV and/or its content can
\series bold
provoke a disaster!
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
That said, the following method often works when the underlying resource
data had been somewhat damaged or even lost at
\emph on
some(!)
\emph default
of the replicas (due to the incident), but
\family typewriter
/mars/
\family default
has survived and the storage is operational again.
For exampley, any defective RAID disks have been already replaced and the
underlaying RAID is now
\emph on
rebuilt
\emph default
and
\emph on
no longer
\emph default
is in
\series bold
degraded RAID
\series default
mode – check your RAID first!
\end_layout
\begin_layout Standard
Precondition: the hardware + software + network must be working, and any
RAID is no longer degraded.
Check that the following gives an entry for each secondary:
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
primary:~# netstat --tcp | grep 7777
\end_layout
\end_inset
When necessary, fix the network first (see instructions above).
Be sure the hardware and any RAID is fully operational.
\end_layout
\begin_layout Standard
Inspect the split brain situation:
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
primary:~# marsadm view all
\end_layout
\begin_layout Plain Layout
primary:~# du -s /mars/resource-* | sort -n
\end_layout
\end_inset
Remember those resources where a message like
\family typewriter
WARNING: SPLIT BRAIN at '' detected
\family default
appears.
Do the following only for
\emph on
affected
\emph default
resources, starting with the biggest one (before proceeding to the next
one).
\end_layout
\begin_layout Standard
Do the following with only
\emph on
one
\emph default
resource at a time (before proceeding to the next one), and repeat the
actions on that resource at every secondary (if there are multiple secondaries)
:
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
secondary1:~# marsadm leave-resource $res1
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
ONLY WHEN some secondaries are FINALLY LOST FOREVER and WILL NEVER RE-APPEAR
like a
\begin_inset Quotes eld
\end_inset
zombie
\begin_inset Quotes erd
\end_inset
, try the following instead:
\end_layout
\begin_layout Standard
\family typewriter
\size small
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
alternative-secondory-or-primary:~# marsadm leave-resource $res1
\backslash
\end_layout
\begin_layout Plain Layout
--force --host=$defective_secondary1
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\noindent
Check whether the split brain has vanished everywhere, and the replication
is actually working on any non-stucked secondary.
Startover with other resources at their secondaries when necessary.
\end_layout
\begin_layout Standard
Finally, when no split brain is reported at any (former) secondary, do the
following on the primary:
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
primary:~# marsadm cron
\end_layout
\begin_layout Plain Layout
primary:~# sleep 30
\end_layout
\begin_layout Plain Layout
primary:~# marsadm view all
\end_layout
\end_inset
Now, any split brain and/or emergency mode should be gone even at the primary.
If not, repeat this step (and some of the previous ones).
\end_layout
\begin_layout Standard
In case even this should fail on some
\family typewriter
$res
\family default
(which is very unlikely), read the PDF manual before using
\family typewriter
marsadm log-purge-all $res
\family default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
ONLY WHEN some secondary had been FINALLY LOST FOREVER: before running
\family typewriter
marsadm join-cluster
\family default
on any new replacement hardware where
\family typewriter
/mars/
\family default
is initially empty, you should first remove the old hardware from the cluster:
\end_layout
\begin_layout Standard
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
alternative-secondary-or-primary:~# marsadm leave-cluster
\backslash
\end_layout
\begin_layout Plain Layout
--force --host=$defective_secondary1
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
ONLY WHEN a former primary had been LOST FOREVER: before you can forcibly
remove a defective primary as described above, you must first
\series bold
decide
\series default
which surving secondary will be the surviving new primary, and you
\emph on
need
\emph default
a
\series bold
successful failover
\series default
as described in section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Failover-Emergency-Switch"
plural "false"
caps "false"
noprefix "false"
\end_inset
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:Failover-Emergency-Switch"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Do not forget to
\emph on
ensure
\emph default
that suchalike zombies cannot
\begin_inset Quotes eld
\end_inset
resurrect
\begin_inset Quotes erd
\end_inset
by itself! Read
\emph on
all
\emph default
relevant parts of this manual!
\end_layout
\begin_layout Standard
Finally, when the split brain + emergency mode is gone everywhere, rebuild
the redundancy at every (newly deployed
\emph on
fully
\emph default
, including
\family typewriter
marsadm join-cluster
\family default
) secondary host via
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
secondary1:~# marsadm join-resource $res1 /dev//$res1
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Here is the LAST RESORT if you are
\emph on
completely desperate
\emph default
, and if even the previous methods did not help after
\emph on
multiple attempts
\emph default
, and when you are
\emph on
sure
\emph default
that a hardware / software / kernel / etc upgrade / downgrade cannot help:
setup the whole cluster afresh by
\family typewriter
rmmod mars
\family default
everywhere, and creating a fresh
\family typewriter
/mars/
\family default
filesystem everywhere, followed by the same procedure as installing MARS
for the first time (which is outside the scope of this guide).
\end_layout
\begin_layout Section
Handover of Primary Role
\end_layout
\begin_layout Standard
When there exists a
\emph on
reliable
\emph default
method for primary handover in higher layers such as cluster managers,
please prefer that method (e.g.
\family typewriter
cm3
\family default
or other tools).
\end_layout
\begin_layout Standard
If suchalike doesn't work, or if you need to handover some resource
\family typewriter
$res1
\family default
by hand, do the following:
\end_layout
\begin_layout Itemize
Stop the any
\emph on
customer
\emph default
network traffic first.
This is important for overload prevention, and for security reasons, and
for minimization of any potential split brain data in case of any failures
(see also the famous CAP theorem).
\end_layout
\begin_layout Itemize
Stop the load / application processes corresponding to
\family typewriter
$res1
\family default
on the old primary side.
\end_layout
\begin_layout Itemize
\family typewriter
umount /dev/mars/$res1
\family default
, or otherwise close any openers such as iSCSI.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Do not skip this step: otherwise a
\emph on
handover
\emph default
(not to be confused with
\emph on
failover
\emph default
) is
\emph on
not possible
\emph default
.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
When
\family typewriter
umount
\family default
& co does not work for whatever reason: then it is your
\emph on
responsible operational decision
\emph default
whether you want to (a) restart the full application stack again at the
old primary side (via whatever method, including reboot), or (b) accept
a
\emph on
potential
\emph default
split brain and its potential redundancy loss, and proceed with section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Failover-Emergency-Switch"
plural "false"
caps "false"
noprefix "false"
\end_inset
\begin_inset CommandInset ref
LatexCommand nameref
reference "sec:Failover-Emergency-Switch"
plural "false"
caps "false"
noprefix "false"
\end_inset
.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Informed operational decisions can be supported by familiarity with the
famous CAP theorem.
\end_layout
\begin_layout Itemize
At the new primary:
\family typewriter
marsadm primary $res1
\end_layout
\begin_layout Itemize
Restart the application at the new site (in reverse order to above).
In case you want to switch
\emph on
all
\emph default
resources which are not yet at the new side, you
\emph on
cautiously may
\emph default
use
\family typewriter
marsadm primary all
\family default
.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
When overload of the new primary side is possible, e.g.
when the
\series bold
kernel caches are cold
\series default
, it is
\emph on
your operational decision
\emph default
whether to (a) handover all resources
\emph on
in parallel
\emph default
(which is a tested functionality of MARS), or (b) to avoid overload caused
by applications, initiate a
\emph on
sequential
\emph default
handover resource-by-resource, obeying that the new primary side often
needs to have
\series bold
warmed its kernel caches
\series default
sufficiently in order to meet your SLAs.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Important: by definition,
\emph on
handover
\emph default
is
\emph on
not
\emph default
an emergency operation like
\emph on
failover
\emph default
is.
It is
\emph on
your operational decision
\emph default
how many resources you want to handover from any location X to any other
location Y in whatever parallelism degree.
Do not blame MARS if doesn't run faster than a local reboot and its inevitable
cache warming phases.
\end_layout
\begin_layout Itemize
Finally, check that the network is up again (e.g.
BGP) and that everything is running fine at the new location (from a customer's
perspective).
\end_layout
\begin_layout Section
Failover = Emergency Switch of Primary Role
\begin_inset CommandInset label
LatexCommand label
name "sec:Failover-Emergency-Switch"
\end_inset
\end_layout
\begin_layout Standard
Failover = emergency switching is necessary when your primary is no longer
reachable over the network for a
\emph on
longer
\emph default
time, or when the hardware is defective.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Do not blame MARS for anything which is outside its scope residing at kernel
level.
Wheter and when a failover is needed for whatever reason, and in which
parallelism degree, is clearly outside the scope of a
\emph on
component
\emph default
like MARS is.
The same would be true for DRBD in place of MARS.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Failover = emergency switching will often lead to a split brain, see the
famous CAP theorem.
It
\emph on
may
\emph default
require manual actions to resolve (see above), depending on your type of
automation and its automation degree, and depending on the
\series bold
management-level risks
\series default
caused by improper automation and/or bugs / misinformation / influences
from the famous CAP theorem in whatever higher-level component.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Therefore, try to avoid failover = emergency switching when possible!
\end_layout
\begin_layout Standard
\noindent
Hint: MARS can automatically recover after a primary crash / reboot, as
well as after secondary crashes, just by executing
\family typewriter
modprobe mars
\family default
after
\family typewriter
/mars/
\family default
had been mounted.
Please
\emph on
consider
\emph default
to wait until your system comes up again, instead of risking a split brain.
\end_layout
\begin_layout Standard
The decision between failover = emergency switching and continuing operation
at the same primary side is an operational one.
MARS can support your decision by the following information at the potentially
new primary side (which was in secondary mode before):
\family typewriter
\size scriptsize
\begin_inset listings
inline false
status open
\begin_layout Plain Layout
istore-test-bap1:~# marsadm view all
\end_layout
\begin_layout Plain Layout
--------- resource lv-0
\end_layout
\begin_layout Plain Layout
lv-0 InConsistent Syncing dcAsFr Secondary istore-test-bs1
\end_layout
\begin_layout Plain Layout
syncing: [====>..............] 27.84% (567/2048)MiB rate: 72583.00 KiB/sec remaining: 00:00:20
hrs
\end_layout
\begin_layout Plain Layout
> sync: 567.293/2048 MiB rate: 72583 KiB/sec remaining: 00:00:20 hrs
\end_layout
\begin_layout Plain Layout
replaying: [>:::::::::::::::::::] 0.00% (0/12902)KiB logs: [1..1]
\end_layout
\begin_layout Plain Layout
> fetch: 0 B rate: 38 KiB/s remaining: 00:00:00
\end_layout
\begin_layout Plain Layout
> replay: 12902.047 KiB rate: 0 B/s remaining: --:--:--
\end_layout
\end_inset
\family default
\size default
When your target is syncing (like in this example), you cannot switch to
it (same as with DRBD).
When you had an emergency mode before, you should first resolve that (whenever
possible).
When a split brain is reported, try to resolve it first (same as with DRBD).
Only in case you
\emph on
know
\emph default
that the primary is
\emph on
really
\emph default
damaged, or it is
\emph on
really
\emph default
impossible to the run the application there for some reason, failover =
emergency switching is desirable for typical use cases like webhosting
or cloud computing (see
\family typewriter
architecture-guide-geo-redundancy.pdf
\family default
).
\end_layout
\begin_layout Standard
Hint: in case the secondary is inconsistent for some reason, e.g.
because of an incremental fast full-sync, you have a last chance to recover
most data after forceful switching by using a filesystem check or suchalike.
This might be even faster than restoring data from the backup.
But use suchalike only if you are
\emph on
really
\emph default
desperate and
\emph on
have no other chance
\emph default
!
\end_layout
\begin_layout Standard
The amount of data which is
\emph on
known
\emph default
to be missing at your secondary is displayed by
\family typewriter
marsadm view all
\family default
after the
\family typewriter
> fetch:
\family default
in human-readable form.
However, in cases of networking problems this information may be
\emph on
outdated
\emph default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
You
\emph on
always
\emph default
need to consider further facts which cannot be known by MARS.
\end_layout
\begin_layout Standard
When there exists a method for failover = emergency switching of the primary
in higher layers such as cluster managers, please prefer that method in
front of the following one.
\end_layout
\begin_layout Standard
If suchalike doesn't work, or when a handover attempt has failed several
times, or if you
\emph on
really need
\emph default
forceful switching of some resource
\family typewriter
$res1
\family default
by hand, you can do the following:
\end_layout
\begin_layout Itemize
When possible, stop the
\emph on
customer
\emph default
network traffic + application corresponding to
\family typewriter
$res1
\family default
on the old primary side.
\end_layout
\begin_layout Itemize
When possible,
\family typewriter
umount /dev/mars/$res1
\family default
, or otherwise close any openers such as iSCSI.
\end_layout
\begin_layout Itemize
When possible (if you have some time), wait until as much data has been
propagated to the new primary as possible (watch the
\family typewriter
fetch:
\family default
indicator).
\end_layout
\begin_layout Itemize
At the new primary:
\family typewriter
marsadm pause-fetch $res1; marsadm primary --force $res1
\end_layout
\begin_layout Itemize
Restart the application at the new site (in reverse order to above).
\end_layout
\begin_layout Itemize
Check that everything is up again (e.g.
BGP and customer traffic etc) and that everything is running fine at the
new location (from a customer's perspective).
\end_layout
\begin_layout Itemize
After the application is known to run reliably, check for split brains at
MARS level and cleanup them when necessary.
\end_layout
\begin_layout Chapter
HISTORICAL Methods for Split Brain Resolution
\begin_inset CommandInset label
LatexCommand label
name "chap:Alternative-Methods-for"
\end_inset
\end_layout
\begin_layout Standard
HISTORICAL / DO NOT USE ANYMORE: Instead of
\family typewriter
marsadm invalidate
\family default
, the following steps may be used.
In preference, start with the old
\begin_inset Quotes eld
\end_inset
wrong
\begin_inset Quotes erd
\end_inset
primaries first:
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm leave-resource mydata
\end_layout
\begin_layout Enumerate
After having done this on one cluster node, check whether the split brain
is already gone (e.g.
by saying
\family typewriter
marsadm view mydata
\family default
).
There are chances that you don't need this on all of your nodes.
Only in very rare
\begin_inset Foot
status open
\begin_layout Plain Layout
When your network had partitioned in a very awkward way for a long time,
and when your partitioned primaries did several
\family typewriter
cron
\family default
operations indendently from each other, there is a small chance that
\family typewriter
leave-resource
\family default
does not clean up
\emph on
all
\emph default
remains of such an awkward situation.
Only in such a case, try
\family typewriter
log-purge-all
\family default
.
\end_layout
\end_inset
cases, it might happen that the preceding l
\family typewriter
eave-resource
\family default
operations were not able to clean up all logfiles produced in parallel
by the split brain situation.
\end_layout
\begin_layout Enumerate
Read the documentation about
\family typewriter
log-purge-all
\family default
(see page
\begin_inset CommandInset ref
LatexCommand pageref
reference "log-purge-all$res"
\end_inset
) and use it.
\end_layout
\begin_layout Enumerate
If you want to restore redundancy, you can follow-up a
\family typewriter
join-resource
\family default
phase to the old resource name (using the correct device name, double-check
it!) This will restore your redundancy by overwriting your bad split brain
version with the correct one.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
It is important to resolve the split brain
\emph on
before
\emph default
you can start the
\family typewriter
join-resource
\family default
reconstruction phase! In order to keep as many
\begin_inset Quotes eld
\end_inset
good
\begin_inset Quotes erd
\end_inset
versions as possible (e.g.
for emergency cases), don't re-join them all in parallel, but rather start
with the oldest / most outdated / worst / inconsistent version first.
It is recommended to start the next one only when the previous one has
sucessfully finished.
\end_layout
\begin_layout Chapter
Alternative De- and Reconstruction of a Damaged Resource
\begin_inset CommandInset label
LatexCommand label
name "chap:Alternative-De--and"
\end_inset
\end_layout
\begin_layout Standard
In case
\family typewriter
leave-resource --host=
\family default
does not work, you may use the following fallback.
On the surviving new designated primary, give the following commands:
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm disconnect-all mydata
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm down mydata
\end_layout
\begin_layout Enumerate
Check by hand whether your local disk is consistent, e.g.
by test-mounting it readonly,
\family typewriter
fsck
\family default
, etc.
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm delete-resource mydata
\end_layout
\begin_layout Enumerate
Check whether the other vital cluster nodes don't report the dead resource
any more, e.g.
\family typewriter
marsadm view all
\family default
at
\emph on
each
\emph default
of them.
In case the resource has not disappeared anywhere (which may happen during
network problems), do the
\family typewriter
down ; delete-resource
\family default
steps also there (optionally again with
\family typewriter
--force
\family default
).
\end_layout
\begin_layout Enumerate
Be sure that the resource has disappeared
\emph on
everywhere
\emph default
.
When necessary, repeat the
\family typewriter
delete-resource
\family default
with
\family typewriter
--force
\family default
.
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm create-resource newmydata ...
\family default
at the
\emph on
correct
\emph default
node using the
\emph on
correct
\emph default
disk device containing the
\emph on
correct
\emph default
version, and further steps to setup your resource from scratch, preferably
under a different name to minimize any risk.
\end_layout
\begin_layout Standard
\noindent
In any case,
\series bold
manually check
\series default
whether a split brain is reported for any resource on any of your
\emph on
surviving
\emph default
cluster nodes.
If you find one there (and only then), please (re-)execute the split brain
resolution steps on the affected node(s).
\end_layout
\begin_layout Chapter
Cleanup in case of Complicated Cascading Failures
\begin_inset CommandInset label
LatexCommand label
name "subsec:Cleanup-in-case"
\end_inset
\end_layout
\begin_layout Standard
MARS does its best to recover even from multiple failures (e.g.
\series bold
rolling disasters
\series default
).
Chances are high that the instructions from sections
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Split-Brain-Resolution"
\end_inset
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Final-Destroy-of"
\end_inset
or appendix
\begin_inset CommandInset ref
LatexCommand ref
reference "chap:Alternative-Methods-for"
\end_inset
\begin_inset CommandInset ref
LatexCommand ref
reference "chap:Alternative-De--and"
\end_inset
will work even in case of multiple failures, such as a network failure
plus local node failure at only 1 node (even if that node is the former
primary node).
\end_layout
\begin_layout Standard
However, in general (e.g.
when more than 1 node is damaged and/or when the filesystem
\family typewriter
/mars/
\family default
is badly damaged) there is no general guarantee that recovery will
\emph on
always
\emph default
succeed under
\emph on
any
\emph default
(weird) circumstances.
That said, your chances for recovery are
\emph on
very
\emph default
high when some disk remains usable at least at one of your surviving secondarie
s.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
It should be very hard to finally trash a secondary, because the transaction
logfiles are containing
\family typewriter
md5
\family default
checksums for all data records.
Any attempt to replay currupted logfiles is refused by MARS.
In addition, the sequence numbers of rotated logfiles (e.g.
via
\family typewriter
cron
\family default
) are checked for contiguity.
Finally, the
\emph on
sequence path
\emph default
of logfile applications (consisting of logfile names plus their respective
length) is additionally secured by a
\family typewriter
git
\family default
-like incremental checksum over the whole path history (so-called
\begin_inset Quotes eld
\end_inset
version links
\begin_inset Quotes erd
\end_inset
).
This should detect split brains even if logfiles are appended / modified
\emph on
after
\emph default
a (forceful) switchover has already taken place.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresToxiques.png
lyxscale 50
scale 17
\end_inset
That said, your risk of final data loss is very high if you remove the
\series bold
BBU
\series default
from your hardware RAID controller before all hot data has been flushed
to the physical disks.
Therefore, never try to
\begin_inset Quotes eld
\end_inset
repair
\begin_inset Quotes erd
\end_inset
a seemingly dead node before your replication is up again somewhere else!
Only unplug the network cables when advised, but never try to repair the
hardware instantly!
\end_layout
\begin_layout Standard
In case of desperate situations where none of the previous instructions
have succeeded, your last chance is rebuilding all your resources from
intact disks as follows:
\end_layout
\begin_layout Enumerate
Do
\family typewriter
rmmod mars
\family default
on all your cluster nodes and/or reboot them.
Note: if you are less desperate, chances are high that the following will
also work when the kernel module remains active and everywhere a
\family typewriter
marsadm down
\family default
is given instead, but for an
\emph on
ultimate
\emph default
instruction you should eliminate
\emph on
potential
\emph default
kernel problems by
\family typewriter
rmmod
\family default
/
\family typewriter
reboot
\family default
, at least if you can afford the downtime on concurrently operating resources.
\end_layout
\begin_layout Enumerate
For safety, physically remove the storage network cables on
\emph on
all
\emph default
your cluster nodes.
Note: the same disclaimer holds.
MARS really does its best, even when
\family typewriter
delete-resource
\family default
is given while the network is fully active and multiple split-brain primaries
are actively using their local device in parallel (approved by some testcases
from the automatic test suite, but note that it is impossible to catch
all possible failure scenarios).
Don't challenge your fate if you are desperate! Don't
\emph on
rely
\emph default
on this! Nothing is absolutely fail-safe!
\end_layout
\begin_layout Enumerate
\series bold
Manually
\series default
check which surviving disk is usable, and which is the
\begin_inset Quotes eld
\end_inset
best
\begin_inset Quotes erd
\end_inset
one for your purpose.
\end_layout
\begin_layout Enumerate
Do
\family typewriter
modprobe mars
\family default
\emph on
only
\emph default
on that node.
If that fails,
\family typewriter
rmmod
\family default
and/or reboot again, and start over with a completely fresh
\family typewriter
/mars/
\family default
partition (
\family typewriter
mkfs.ext4 /mars/
\family default
or similar)
\emph on
everywhere
\emph default
on
\emph on
all
\emph default
cluster nodes, and continue with step 7.
\end_layout
\begin_layout Enumerate
If your old
\family typewriter
/mars/
\family default
works, and you did not already (forcefully) switch your designated primary
to the final destination, do it now (see description in section
\begin_inset CommandInset ref
LatexCommand ref
reference "subsec:Forced-Switching"
\end_inset
).
Wait until any old logfile data has been replayed.
\end_layout
\begin_layout Enumerate
Say
\family typewriter
marsadm delete-resource mydata --force
\family default
.
This will cleanup all internal symlink tree information for the resource,
but will leave your disk data intact.
\end_layout
\begin_layout Enumerate
Locally build up the new resource(s) as usual, out of the underlying disks.
\end_layout
\begin_layout Enumerate
Check whether the new resource(s) work in standalone mode.
\end_layout
\begin_layout Enumerate
When necessary, repeat these steps with other resources.
\end_layout
\begin_layout Standard
Now you can choose how the rebuild your cluster.
If you rebuilt
\family typewriter
/mars/
\family default
anywhere, you
\emph on
must
\emph default
rebuild it on
\emph on
all
\emph default
new cluster nodes and start over with a fresh
\family typewriter
join-cluster
\family default
on each of them, from scratch.
It is not possible to mix the old cluster with the new one.
\end_layout
\begin_layout Standard
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
begin{enumerate}
\backslash
setcounter{enumi}{9}
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
item
\end_layout
\end_inset
Finally, do all the necessary
\family typewriter
join-resource
\family default
s on the respective cluster nodes, according to your new redundancy scenario
after the failures (e.g.
after activating spare nodes, etc).
If you have
\begin_inset Formula $k>2$
\end_inset
replicas, start
\family typewriter
join-resource
\family default
on the worst / most damaged version first, and start the next preferably
only after the previous sync has completed successfully.
This way, you will be permanently retaining some (old and outdated, but
hopefully potentially usable) replicas while a sync is running.
Don't start too many syncs in parallel.
\end_layout
\begin_layout Standard
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
end{enumerate}
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Never use
\family typewriter
delete-resource
\family default
twice on the same resource name, after you have already a working standalone
primary
\begin_inset Foot
status open
\begin_layout Plain Layout
Of course, when you don't have created the
\emph on
same
\emph default
resource anew, you may repeat
\family typewriter
delete-resource
\family default
on other cluster nodes in order to get rid of local files / symlinks which
had not been propagated to other nodes before.
\end_layout
\end_inset
.
You might accidentally destroy your again-working copy! You
\emph on
can
\emph default
issue
\family typewriter
delete-resource
\family default
multiple times on different nodes, e.g.
when the network has problems, but doing so
\emph on
after
\emph default
re-establishment of the initial primary bears some risk.
Therefore, the safest way is first deleting the resources everywhere, and
then starting over afresh.
\end_layout
\begin_layout Standard
Before re-connecting any network cable on any non-primary (new secondaries),
ensure that all
\family typewriter
/dev/mars/mydata
\family default
devices are no longer in use (e.g.
from an old primary role before the incident happened), and that each local
disk is detached.
Only after that, you should be able to safely re-connect the network.
The
\family typewriter
delete-resource
\family default
given at the new primary should propagate now to each of your secondaries,
and your local disk should be usable for a re-
\family typewriter
join-resource
\family default
.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
When you did not rebuild your cluster from scratch with fresh
\family typewriter
/mars/
\family default
filesystems, and one of the old cluster nodes is supposed to be removed
permanently, use
\family typewriter
leave-resource
\family default
(optionally with
\family typewriter
--host=
\family default
and/or
\family typewriter
--force
\family default
) and finally
\family typewriter
leave-cluster
\family default
.
After
\family typewriter
leave-cluster
\family default
, you
\emph on
must
\emph default
re-create the
\family typewriter
/mars
\family default
filesystem.
\end_layout
\begin_layout Chapter
Experts only: Special Trick Switching and Rebuild
\begin_inset CommandInset label
LatexCommand label
name "chap:Experts-only:-Special"
\end_inset
\end_layout
\begin_layout Standard
The following is a further alternative for
\series bold
experts
\series default
who really know what they are doing.
The method is very simple and therefore well-suited for coping with mass
failures, e.g.
\series bold
power blackout of whole datacenters
\series default
.
\end_layout
\begin_layout Standard
In case a primary datacenter fails as a whole for whatever reason and you
have a backup datacenter, do the following steps in the backup datacenter:
\end_layout
\begin_layout Enumerate
Fencing step: by means of firewalling,
\series bold
ensure
\series default
that the (virtually) damaged datacenter nodes
\series bold
cannot
\series default
be reached over the network.
For example, you may place REJECT rules into all of your local iptables
firewalls at the backup datacenter.
Alternatively / additionally, you may block the routes at the appropriate
central router(s) in your network.
\end_layout
\begin_layout Enumerate
Run the sequence
\family typewriter
marsadm disconnect all; marsadm primary --force all
\family default
on all nodes in the backup datacenter.
\end_layout
\begin_layout Enumerate
Restart your services in the backup datacenter (as far as necessary).
Depending on your network setup, further steps like switching BGP routes
etc may be necessary.
\end_layout
\begin_layout Enumerate
Check that
\emph on
all
\emph default
your services are
\emph on
really
\emph default
up and running, before you try to repair anything! Failing to do so may
result in data loss when you execute the following restore method for
\emph on
experts
\emph default
.
\end_layout
\begin_layout Standard
Now your backup datacenter should continue servicing your clients.
The final reconstruction of the originally primary datacenter works as
follows:
\end_layout
\begin_layout Enumerate
At the damaged primary datacenter, ensure that nowhere the MARS kernel module
is running.
In case of a power blackout, you shouldn't have executed an automatic
\family typewriter
modprobe mars
\family default
anywhere during reboot, so you should be already done when all your nodes
are up again.
In case some nodes had no reboot, execute
\family typewriter
rmmod mars
\family default
everywhere.
If
\family typewriter
rmmod
\family default
refuses to run, you may need to umount the
\family typewriter
/dev/mars/mydata
\family default
device first.
When nothing else helps, you may just mass reboot your hanging nodes.
\end_layout
\begin_layout Enumerate
At the failed side, do
\family typewriter
rm -rf /mars/resource-$mydata/
\family default
for all those resources which had been primary before the blackout.
Do this
\emph on
only
\emph default
for those cases, otherwise you will need unnecessary
\family typewriter
leave-resource
\family default
s or
\family typewriter
invalidate
\family default
s later (e.g.
when half of your nodes were already running at the surving side).
In order to avoid unnecessary traffic, please do this only as far as really
necessary.
Don't remove any other directories.
In particular,
\family typewriter
/mars/ips/
\family default
\emph on
must
\emph default
remain intact.
In case you accidentally deleted them, or you had to re-create
\family typewriter
/mars/
\family default
from scratch, try
\family typewriter
rsync
\family default
with the correct options.
\begin_inset Newline newline
\end_inset
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Caution! before doing this, check that the corresponding directory exists
at the backup datacenter, and that it is
\emph on
really
\emph default
healthy!
\end_layout
\begin_layout Enumerate
Un-Fencing: restore your network firewall / routes and check that they work
(
\family typewriter
ping
\family default
etc).
\end_layout
\begin_layout Enumerate
Do
\family typewriter
modprobe mars
\family default
everywhere.
All missing directories and their missing symlinks should be automatically
fetched from the backup datacenter.
\end_layout
\begin_layout Enumerate
Run
\family typewriter
marsadm join-resource $res
\family default
, but only at those places where the directory was removed previously, while
using the same disk devices as before.
This will minimize actual traffic thanks to the fast full sync algorithm.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
It is
\series bold
crucial
\series default
that the fencing step
\series bold
must
\series default
be executed
\emph on
before
\emph default
any
\family typewriter
primary --force
\family default
! This way, no split brain will be
\emph on
visible
\emph default
at the backup datacenter side, because there is simply no chance for transferri
ng different versions over the network.
It is also crucial to remove any (potentially diverging) resource directories
\emph on
before
\emph default
the
\family typewriter
modprobe
\family default
! This way, the backup datacenter never runs into split brain.
This saves you a lot of detail work for split brain resolution when you
have to restore bulks of nodes in a short time.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
In case the repair of a full datacenter should take so extremely long that
some
\family typewriter
/mars/
\family default
partitions are about to run out of space at the surviving side, you may
use the
\family typewriter
leave-resource --host=failed-node
\family default
trick described earlier, followed by
\family typewriter
cron
\family default
.
Best if you have prepared a fully automatic script long before the incident,
which executes suchalike only as far as necessary in each individual case.
\end_layout
\begin_layout Standard
\noindent
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Even better: train such scenarios in advance, and prepare scripts for mass
automation.
Look into section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Scripting-HOWTO"
\end_inset
.
\end_layout
\begin_layout Chapter
Creating Backups via Pseudo Snapshots
\begin_inset CommandInset label
LatexCommand label
name "chap:Creating-Backups-via"
\end_inset
\end_layout
\begin_layout Standard
When all your secondaries are all homogenously located in a standby datacenter,
they will be almost idle all the time.
This is a waste of computing resources.
\end_layout
\begin_layout Standard
Since MARS is no substitute for a full-fledged backup system, and since
backups may put high system load onto your active side, you may want to
utilize your passive hardware resources in a better way.
\end_layout
\begin_layout Standard
MARS supports this thanks to its ability to switch the
\family typewriter
pause-replay
\family default
\emph on
independently
\emph default
from
\family typewriter
pause-fetch
\family default
.
\end_layout
\begin_layout Standard
The basic idea is simple: just use
\family typewriter
pause-replay
\family default
at your secondary site, but leave the replication of transaction logfiles
intact by deliberately
\emph on
not
\emph default
saying
\family typewriter
pause-fetch
\family default
.
This way, your secondary replica (block device) will stay frozen for a
limited time, without loosing your redundancy: since the transaction logs
will continue to replicate in the meantime, you can start
\family typewriter
resume-replay
\family default
at any time, in particular when a primary-side incident should happen unexpecte
dly.
The former secondary will just catch up by replaying the outstanding parts
of the transaction logs in order to become recent.
\end_layout
\begin_layout Standard
However, some
\emph on
details
\emph default
have to be obeyed.
In particular, the current version of MARS needs an additional
\family typewriter
detach
\family default
operation, in order to release exclusive access to the underlying disk
\family typewriter
/dev/lv/$res
\family default
.
Future versions of MARS are planned to support this more directly, without
need for an intermediate
\family typewriter
detach
\family default
operation.
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/MatieresCorrosives.png
lyxscale 50
scale 17
\end_inset
Beware:
\family typewriter
mount -o ro /dev/vg/$res
\family default
can lead to
\series bold
unnoticed write operations
\series default
if you are not careful! Some journalling filesystems like
\family typewriter
xfs
\family default
or
\family typewriter
ext4
\family default
may replay their journals onto the disk, leading to
\emph on
binary
\emph default
differences and thus
\series bold
destroying your consistency
\series default
later when you re-enable
\family typewriter
resume-replay
\family default
!
\end_layout
\begin_layout Standard
\begin_inset Graphics
filename images/lightbulb_brightlit_benj_.png
lyxscale 9
scale 5
\end_inset
Therefore, you may use small LVM snapshots (only in such cases).
Typically,
\family typewriter
xfs
\family default
journal replay will require only a few megabytes.
Therefore you typically don't need much temporary space for this.
Here is a more detailed description of steps:
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm pause-replay $res
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm detach $res
\end_layout
\begin_layout Enumerate
\family typewriter
lvcreate --size 100m --snapshot --name ro-$res /dev/vg/$res
\end_layout
\begin_layout Enumerate
\family typewriter
mount -o ro /dev/vg/ro-$res /mnt/tmp
\end_layout
\begin_layout Enumerate
Now draw your backup from
\family typewriter
/mnt/tmp/
\end_layout
\begin_layout Enumerate
\family typewriter
umount /mnt/tmp
\end_layout
\begin_layout Enumerate
\family typewriter
lvremove -f /dev/vg/ro-$res
\end_layout
\begin_layout Enumerate
\family typewriter
marsadm up $res
\end_layout
\begin_layout Standard
Hint: during the backup, the transaction logs will accumulate on
\family typewriter
/mars/
\family default
.
In order to avoid overflow of
\family typewriter
/mars/
\family default
(c.f.
section
\begin_inset CommandInset ref
LatexCommand ref
reference "sec:Defending-Overflow"
\end_inset
), don't unnecessarily prolong the backup duration.
\end_layout
\begin_layout Chapter
Command Documentation for Userspace Tools
\begin_inset CommandInset label
LatexCommand label
name "chap:Command-Documentation-for"
\end_inset
\end_layout
\begin_layout Section
\family typewriter
marsadm --help
\begin_inset CommandInset label
LatexCommand label
name "sec:marsadm-–help"
\end_inset
\end_layout
\begin_layout Standard
\begin_inset ERT
status open
\begin_layout Plain Layout
\backslash
input{marsadm.help}
\end_layout
\end_inset
\end_layout
\begin_layout Standard
\begin_inset CommandInset include
LatexCommand input
preview true
filename "common-back-matter.lyx"
\end_inset
\end_layout
\end_body
\end_document