2016-03-10 14:18:13 +00:00
|
|
|
#!/bin/sh
|
2016-03-14 14:47:04 +00:00
|
|
|
#
|
|
|
|
# rbd_mirror.sh - test rbd-mirror daemon
|
|
|
|
#
|
|
|
|
# The script starts two ("local" and "remote") clusters using the mstart.sh script,
|
|
|
|
# creates a temporary directory, used for cluster configs, daemon logs, admin
|
|
|
|
# socket, temporary files, and launches rbd-mirror daemon.
|
|
|
|
#
|
|
|
|
# There are several env variables useful when troubleshooting a test failure:
|
|
|
|
#
|
|
|
|
# RBD_MIRROR_NOCLEANUP - if not empty, don't run the cleanup (stop processes,
|
|
|
|
# destroy the clusters and remove the temp directory)
|
|
|
|
# on exit, so it is possible to check the test state
|
|
|
|
# after failure.
|
|
|
|
# RBD_MIRROR_TEMDIR - use this path when creating the temporary directory
|
|
|
|
# (should not exist) instead of running mktemp(1).
|
|
|
|
#
|
|
|
|
# The cleanup can be done as a separate step, running the script with
|
|
|
|
# `cleanup ${RBD_MIRROR_TEMDIR}' arguments.
|
|
|
|
#
|
|
|
|
# Note, as other workunits tests, rbd_mirror.sh expects to find ceph binaries
|
|
|
|
# in PATH.
|
|
|
|
#
|
|
|
|
# Thus a typical troubleshooting session:
|
|
|
|
#
|
|
|
|
# From Ceph src dir (CEPH_SRC_PATH), start the test in NOCLEANUP mode and with
|
|
|
|
# TEMPDIR pointing to a known location:
|
|
|
|
#
|
|
|
|
# cd $CEPH_SRC_PATH
|
|
|
|
# PATH=$CEPH_SRC_PATH:$PATH
|
|
|
|
# RBD_MIRROR_NOCLEANUP=1 RBD_MIRROR_TEMDIR=/tmp/tmp.rbd_mirror \
|
|
|
|
# ../qa/workunits/rbd/rbd_mirror.sh
|
|
|
|
#
|
|
|
|
# After the test failure cd to TEMPDIR and check the current state:
|
|
|
|
#
|
|
|
|
# cd /tmp/tmp.rbd_mirror
|
|
|
|
# ls
|
2016-04-07 23:57:14 +00:00
|
|
|
# less rbd-mirror.cluster1_daemon.cluster1.$pid.log
|
2016-03-31 10:57:17 +00:00
|
|
|
# ceph --cluster cluster1 -s
|
|
|
|
# ceph --cluster cluster2 -s
|
|
|
|
# rbd --cluster cluster2 -p mirror ls
|
|
|
|
# rbd --cluster cluster2 -p mirror journal status --image test
|
2016-04-07 23:57:14 +00:00
|
|
|
# ceph --admin-daemon rbd-mirror.cluster1_daemon.cluster1.asok help
|
2016-03-31 08:42:13 +00:00
|
|
|
# ...
|
|
|
|
#
|
|
|
|
# Also you can execute commands (functions) from the script:
|
|
|
|
#
|
|
|
|
# cd $CEPH_SRC_PATH
|
|
|
|
# export RBD_MIRROR_TEMDIR=/tmp/tmp.rbd_mirror
|
|
|
|
# ../qa/workunits/rbd/rbd_mirror.sh status
|
2016-04-07 23:57:14 +00:00
|
|
|
# ../qa/workunits/rbd/rbd_mirror.sh stop_mirror cluster1
|
|
|
|
# ../qa/workunits/rbd/rbd_mirror.sh start_mirror cluster2
|
|
|
|
# ../qa/workunits/rbd/rbd_mirror.sh flush cluster2
|
2016-03-14 14:47:04 +00:00
|
|
|
# ...
|
|
|
|
#
|
|
|
|
# Eventually, run the cleanup:
|
|
|
|
#
|
|
|
|
# cd $CEPH_SRC_PATH
|
2016-03-31 08:42:13 +00:00
|
|
|
# RBD_MIRROR_TEMDIR=/tmp/tmp.rbd_mirror \
|
|
|
|
# ../qa/workunits/rbd/rbd_mirror.sh cleanup
|
2016-03-14 14:47:04 +00:00
|
|
|
#
|
2016-03-10 14:18:13 +00:00
|
|
|
|
2016-03-31 10:57:17 +00:00
|
|
|
# Names of the two clusters under test and of the pool mirrored between them.
CLUSTER1=cluster1
CLUSTER2=cluster2
POOL=mirror
# Ceph "src" directory, resolved relative to the location of this script;
# setup() and cleanup() run mstart.sh / mstop.sh from there.
# Quoted so that a checkout path containing whitespace still resolves.
SRC_DIR=$(readlink -f "$(dirname "$0")/../../../src")
# Working directory for cluster configs, logs, sockets and temporary files.
# Filled in by setup() or, in command mode, from RBD_MIRROR_TEMDIR.
TEMPDIR=
|
|
|
|
|
2016-04-02 01:15:33 +00:00
|
|
|
# These vars facilitate running this script in an environment with
|
|
|
|
# ceph installed from packages, like teuthology. These are not defined
|
|
|
|
# by default.
|
|
|
|
#
|
|
|
|
# RBD_MIRROR_USE_EXISTING_CLUSTER - if set, do not start and stop ceph clusters
|
|
|
|
# RBD_MIRROR_USE_RBD_MIRROR - if set, use an existing instance of rbd-mirror
|
|
|
|
# running as ceph client $CEPH_ID. If empty,
|
|
|
|
# this script will start and stop rbd-mirror
|
|
|
|
|
2016-03-10 14:18:13 +00:00
|
|
|
#
|
|
|
|
# Functions
|
|
|
|
#
|
|
|
|
|
2016-03-28 19:57:58 +00:00
|
|
|
# Print the path of an rbd-mirror daemon admin socket.
#   $1 - cluster the daemon was started for
#   $2 - cluster name used as the last component of the socket file name
# When RBD_MIRROR_USE_RBD_MIRROR is set, the path is taken from the
# 'admin socket' option reported by ceph-conf for client.${CEPH_ID};
# otherwise it is a file below ${TEMPDIR}.
daemon_asok_file()
{
    local local_cluster="$1"
    local cluster="$2"

    if [ -n "${RBD_MIRROR_USE_RBD_MIRROR}" ]; then
        # Run ceph-conf directly: wrapping it in `echo $(...)` would
        # word-split and glob-expand the reported path.
        ceph-conf --cluster "${local_cluster}" --name "client.${CEPH_ID}" \
            'admin socket'
    else
        printf '%s\n' \
            "${TEMPDIR}/rbd-mirror.${local_cluster}_daemon.${cluster}.asok"
    fi
}
|
|
|
|
|
|
|
|
# Print the path of the pid file of the rbd-mirror daemon for a cluster.
#   $1 - cluster the daemon was started for
# When RBD_MIRROR_USE_RBD_MIRROR is set, the path is taken from the
# 'pid file' option reported by ceph-conf for client.${CEPH_ID};
# otherwise it is a file below ${TEMPDIR}.
daemon_pid_file()
{
    local cluster="$1"

    if [ -n "${RBD_MIRROR_USE_RBD_MIRROR}" ]; then
        # Run ceph-conf directly: wrapping it in `echo $(...)` would
        # word-split and glob-expand the reported path.
        ceph-conf --cluster "${cluster}" --name "client.${CEPH_ID}" 'pid file'
    else
        printf '%s\n' "${TEMPDIR}/rbd-mirror.${cluster}_daemon.pid"
    fi
}
|
|
|
|
|
2016-04-28 06:32:33 +00:00
|
|
|
# Print a timestamped message to stdout and append it to
# ${TEMPDIR}/rbd-mirror.test.log.
#   $@ - words of the message
testlog()
{
    # "$@" is quoted so that characters such as `*` in a message are logged
    # literally instead of being expanded against the current directory.
    echo "$(date '+%F %T')" "$@" | tee -a "${TEMPDIR}/rbd-mirror.test.log"
}
|
|
|
|
|
2016-03-10 14:18:13 +00:00
|
|
|
# Prepare the test environment:
#   - install cleanup() as the handler for INT, TERM and EXIT;
#   - create the working directory (RBD_MIRROR_TEMDIR if set, which must not
#     exist yet, otherwise a fresh mktemp directory) and store it in TEMPDIR;
#   - unless RBD_MIRROR_USE_EXISTING_CLUSTER is set, start both clusters with
#     mstart.sh from ${SRC_DIR}, link their ceph.conf files into TEMPDIR as
#     <cluster>.conf and change into TEMPDIR;
#   - create ${POOL} on both clusters, enable pool-mode mirroring on it and
#     register each cluster as the peer of the other.
setup()
{
    trap cleanup INT TERM EXIT

    if [ -n "${RBD_MIRROR_TEMDIR}" ]; then
        mkdir "${RBD_MIRROR_TEMDIR}"
        TEMPDIR="${RBD_MIRROR_TEMDIR}"
    else
        TEMPDIR=$(mktemp -d)
    fi

    if [ -z "${RBD_MIRROR_USE_EXISTING_CLUSTER}" ]; then
        cd "${SRC_DIR}"
        ./mstart.sh "${CLUSTER1}" -n
        ./mstart.sh "${CLUSTER2}" -n

        ln -s "$(readlink -f "run/${CLUSTER1}/ceph.conf")" \
            "${TEMPDIR}/${CLUSTER1}.conf"
        ln -s "$(readlink -f "run/${CLUSTER2}/ceph.conf")" \
            "${TEMPDIR}/${CLUSTER2}.conf"

        cd "${TEMPDIR}"
    fi

    ceph --cluster "${CLUSTER1}" osd pool create "${POOL}" 64 64
    ceph --cluster "${CLUSTER2}" osd pool create "${POOL}" 64 64

    rbd --cluster "${CLUSTER1}" mirror pool enable "${POOL}" pool
    rbd --cluster "${CLUSTER2}" mirror pool enable "${POOL}" pool

    rbd --cluster "${CLUSTER1}" mirror pool peer add "${POOL}" "${CLUSTER2}"
    rbd --cluster "${CLUSTER2}" mirror pool peer add "${POOL}" "${CLUSTER1}"
}
|
|
|
|
|
|
|
|
# Tear down the test environment (also installed as a trap handler by
# setup()).  Does nothing when RBD_MIRROR_NOCLEANUP is set.  Otherwise:
# stops both rbd-mirror daemons, then either stops the clusters with
# mstop.sh from ${SRC_DIR} or, with RBD_MIRROR_USE_EXISTING_CLUSTER set,
# removes ${POOL} from both clusters, and finally removes ${TEMPDIR}.
cleanup()
{
    if [ -n "${RBD_MIRROR_NOCLEANUP}" ]; then
        return 0
    fi

    # Best effort from here on: keep going even if a step fails.
    set +e

    stop_mirror "${CLUSTER1}"
    stop_mirror "${CLUSTER2}"

    if [ -z "${RBD_MIRROR_USE_EXISTING_CLUSTER}" ]; then
        cd "${SRC_DIR}"
        ./mstop.sh "${CLUSTER1}"
        ./mstop.sh "${CLUSTER2}"
    else
        ceph --cluster "${CLUSTER1}" osd pool rm "${POOL}" "${POOL}" \
            --yes-i-really-really-mean-it
        ceph --cluster "${CLUSTER2}" osd pool rm "${POOL}" "${POOL}" \
            --yes-i-really-really-mean-it
    fi

    # Quoted so that a TEMPDIR containing whitespace removes exactly that
    # directory; skipped entirely when TEMPDIR was never set.
    if [ -n "${TEMPDIR}" ]; then
        rm -Rf -- "${TEMPDIR}"
    fi
}
|
|
|
|
|
|
|
|
# Start a daemonized rbd-mirror for the given cluster.
#   $1 - cluster to run the daemon against
# Does nothing when RBD_MIRROR_USE_RBD_MIRROR is set (an existing daemon is
# used instead).  The pid file comes from daemon_pid_file(); the log file
# and admin socket live in ${TEMPDIR}.  "\$cluster" and "\$pid" are passed
# through literally so that the daemon, not the shell, substitutes them.
start_mirror()
{
    local cluster="$1"

    if [ -n "${RBD_MIRROR_USE_RBD_MIRROR}" ]; then
        return 0
    fi

    rbd-mirror \
        --cluster "${cluster}" \
        --pid-file="$(daemon_pid_file "${cluster}")" \
        --log-file="${TEMPDIR}/rbd-mirror.${cluster}_daemon.\$cluster.\$pid.log" \
        --admin-socket="${TEMPDIR}/rbd-mirror.${cluster}_daemon.\$cluster.asok" \
        --debug-rbd=30 --debug-journaler=30 \
        --debug-rbd_mirror=30 \
        --daemonize=true
}
|
|
|
|
|
|
|
|
# Stop the rbd-mirror daemon started by start_mirror() for a cluster.
#   $1 - cluster the daemon was started for
# Does nothing when RBD_MIRROR_USE_RBD_MIRROR is set.  Otherwise, if the pid
# file yields a pid, the process is sent the default kill signal and polled
# in `ps` output with increasing delays (1..32s) until it is gone; a final
# check fails (and prints the ps line) if it is still there.  The admin
# socket files and the pid file are removed afterwards.
stop_mirror()
{
    local cluster="$1"
    # `s` is declared local so the loop variable does not leak to callers.
    local pid s

    if [ -n "${RBD_MIRROR_USE_RBD_MIRROR}" ]; then
        return 0
    fi

    # A missing or unreadable pid file just means there is nothing to kill.
    pid=$(cat "$(daemon_pid_file "${cluster}")" 2>/dev/null) || :
    if [ -n "${pid}" ]; then
        kill "${pid}"
        for s in 1 2 4 8 16 32; do
            sleep "${s}"
            # awk exits 1 while the pid is still listed, 0 once it is gone.
            ps auxww | awk -v pid="${pid}" '$2 == pid {print; exit 1}' && break
        done
        ps auxww | awk -v pid="${pid}" '$2 == pid {print; exit 1}'
    fi
    rm -f "$(daemon_asok_file "${cluster}" "${CLUSTER1}")"
    rm -f "$(daemon_asok_file "${cluster}" "${CLUSTER2}")"
    rm -f "$(daemon_pid_file "${cluster}")"
}
|
|
|
|
|
2016-04-28 06:32:33 +00:00
|
|
|
# Send a command to the admin socket of a cluster's rbd-mirror daemon.
#   $1   - cluster the daemon was started for
#   $2.. - admin socket command and its arguments
# Returns non-zero without calling ceph when the socket path cannot be
# determined or is not a socket; otherwise returns the status of
# `ceph --admin-daemon`.
admin_daemon()
{
    local cluster="$1" ; shift
    local asok_file

    asok_file=$(daemon_asok_file "${cluster}" "${cluster}") || return 1

    # Checked explicitly: a bare `test -S` only stops the script under
    # `set -e`, and not at all inside pipelines or && lists.
    if [ ! -S "${asok_file}" ]; then
        echo "admin_daemon: ${asok_file} is not a socket" >&2
        return 1
    fi

    ceph --admin-daemon "${asok_file}" "$@"
}
|
|
|
|
|
2016-03-31 08:42:13 +00:00
|
|
|
# Print a troubleshooting report for both clusters and both rbd-mirror
# daemons.
# For each cluster: `ceph -s`, the images in ${POOL}, the verbose mirror
# pool status, and for every image its info and journal status.
# For each daemon: the matching `ps` line and the `rbd mirror status`
# output of its admin socket.
# Returns 1 if a daemon's pid cannot be read from its pid file, its process
# is not in the ps output, or its admin socket is missing; 0 otherwise
# (a missing pid file is reported but does not change the result).
status()
{
    local cluster image
    local pid_file pid asok_file
    local ret=0

    for cluster in "${CLUSTER1}" "${CLUSTER2}"; do
        echo "${cluster} status"
        ceph --cluster "${cluster}" -s
        echo

        echo "${cluster} ${POOL} images"
        rbd --cluster "${cluster}" -p "${POOL}" ls
        echo

        echo "${cluster} ${POOL} mirror pool status"
        rbd --cluster "${cluster}" -p "${POOL}" mirror pool status --verbose
        echo

        # Deliberately unquoted: one image name per word of the listing.
        for image in $(rbd --cluster "${cluster}" -p "${POOL}" ls 2>/dev/null); do
            echo "image ${image} info"
            rbd --cluster "${cluster}" -p "${POOL}" info "${image}"
            echo
            echo "image ${image} journal status"
            rbd --cluster "${cluster}" -p "${POOL}" journal status --image "${image}"
            echo
        done
    done

    for cluster in "${CLUSTER1}" "${CLUSTER2}"; do
        pid_file=$(daemon_pid_file "${cluster}")
        if [ ! -e "${pid_file}" ]; then
            echo "${cluster} rbd-mirror not running or unknown" \
                 "(${pid_file} not exist)"
            continue
        fi

        pid=$(cat "${pid_file}" 2>/dev/null) || :
        if [ -z "${pid}" ]; then
            echo "${cluster} rbd-mirror not running or unknown" \
                 "(can't find pid using ${pid_file})"
            ret=1
            continue
        fi

        # Label the ps output with the cluster being inspected.
        echo "${cluster} rbd-mirror process in ps output:"
        # awk prints the ps header plus the matching line and exits 1 when
        # the pid is found; exit status 0 therefore means "not running".
        if ps auxww |
            awk -v pid="${pid}" 'NR == 1 {print} $2 == pid {print; exit 1}'
        then
            echo
            echo "${cluster} rbd-mirror not running" \
                 "(can't find pid $pid in ps output)"
            ret=1
            continue
        fi
        echo

        asok_file=$(daemon_asok_file "${cluster}" "${cluster}")
        if [ ! -S "${asok_file}" ]; then
            echo "${cluster} rbd-mirror asok is unknown (${asok_file} not exits)"
            ret=1
            continue
        fi

        echo "${cluster} rbd-mirror status"
        ceph --admin-daemon "${asok_file}" rbd mirror status
        echo
    done

    return "${ret}"
}
|
|
|
|
|
2016-03-10 14:18:13 +00:00
|
|
|
# Ask a cluster's rbd-mirror daemon to flush via its admin socket.
#   $1 - cluster the daemon was started for
#   $2 - optional image name; when given only ${POOL}/<image> is flushed,
#        otherwise the plain "rbd mirror flush" command is sent
flush()
{
    local cluster="$1"
    local image="$2"

    # Build the command in the positional parameters rather than in a string
    # so that an image name is passed on as a single word.
    set -- rbd mirror flush
    if [ -n "${image}" ]; then
        set -- "$@" "${POOL}/${image}"
    fi

    admin_daemon "${cluster}" "$@"
}
|
|
|
|
|
2016-03-14 14:47:04 +00:00
|
|
|
# Check whether replay of an image is in the expected state.
#   $1 - cluster whose rbd-mirror daemon is queried
#   $2 - image name (in ${POOL})
#   $3 - expected state: "started" or "stopped"
# The image counts as "started" only if the daemon's admin socket help lists
# a "rbd mirror status ${POOL}/<image>" command AND that command reports a
# state matching "Replaying"; otherwise it counts as "stopped".
# Returns 0 when the detected state equals $3.  Matching lines are printed.
test_image_replay_state()
{
    local cluster="$1"
    local image="$2"
    local test_state="$3"
    local current_state=stopped

    # grep -F replaces the obsolescent fgrep.
    admin_daemon "${cluster}" help |
        grep -F "\"rbd mirror status ${POOL}/${image}\"" &&
    admin_daemon "${cluster}" rbd mirror status "${POOL}/${image}" |
        grep -i 'state.*Replaying' &&
    current_state=started

    test "${test_state}" = "${current_state}"
}
|
|
|
|
|
|
|
|
# Poll until replay of an image reaches the expected state.
#   $1 - cluster whose rbd-mirror daemon is queried
#   $2 - image name
#   $3 - expected state, as understood by test_image_replay_state()
# Sleeps before each of up to 13 checks (1, 2, 4, then 8 x 8, then 2 x 16
# seconds).  Returns 0 as soon as the state matches, 1 if it never does.
wait_for_image_replay_state()
{
    local cluster="$1"
    local image="$2"
    local state="$3"
    local s

    # TODO: add a way to force rbd-mirror to update replayers
    for s in 1 2 4 8 8 8 8 8 8 8 8 16 16; do
        sleep "${s}"
        if test_image_replay_state "${cluster}" "${image}" "${state}"; then
            return 0
        fi
    done
    return 1
}
|
|
|
|
|
2016-03-14 14:47:04 +00:00
|
|
|
# Wait until replay of an image is reported as started.
#   $1 - cluster whose rbd-mirror daemon is queried
#   $2 - image name
# Returns the result of wait_for_image_replay_state() for state "started".
wait_for_image_replay_started()
{
    local cluster="$1"
    local image="$2"

    wait_for_image_replay_state "${cluster}" "${image}" started
}
|
|
|
|
|
|
|
|
# Wait until replay of an image is reported as stopped.
#   $1 - cluster whose rbd-mirror daemon is queried
#   $2 - image name
# Returns the result of wait_for_image_replay_state() for state "stopped".
wait_for_image_replay_stopped()
{
    local cluster="$1"
    local image="$2"

    wait_for_image_replay_state "${cluster}" "${image}" stopped
}
|
|
|
|
|
2016-03-10 14:18:13 +00:00
|
|
|
# Print the first commit position of a journal client of an image.
#   $1 - cluster to query
#   $2 - image name (in ${POOL})
#   $3 - regular expression the client id must match ('' selects the client
#        with an empty id)
# The `rbd journal status` output is saved to
# ${TEMPDIR}/<cluster>-${POOL}-<image>.status and echoed to stderr; stdout
# carries only the extracted position, or nothing if no client matches.
get_position()
{
    local cluster="$1"
    local image="$2"
    local id_regexp="$3"

    # Parse line like below, looking for the first position
    # [id=, commit_position=[positions=[[object_number=1, tag_tid=3, entry_tid=9], [object_number=0, tag_tid=3, entry_tid=8], [object_number=3, tag_tid=3, entry_tid=7], [object_number=2, tag_tid=3, entry_tid=6]]]]

    # Named after the cluster actually queried, so that a saved status file
    # is not attributed to the wrong cluster.
    local status_log="${TEMPDIR}/${cluster}-${POOL}-${image}.status"

    rbd --cluster "${cluster}" -p "${POOL}" journal status --image "${image}" |
        tee "${status_log}" >&2
    sed -nEe 's/^.*\[id='"${id_regexp}"',.*positions=\[\[([^]]*)\],.*$/\1/p' \
        "${status_log}"
}
|
|
|
|
|
|
|
|
# Print the first commit position of the journal client with an empty id.
#   $1 - cluster to query
#   $2 - image name
get_master_position()
{
    local cluster="$1"
    local image="$2"

    get_position "${cluster}" "${image}" ''
}
|
|
|
|
|
|
|
|
# Print the first commit position of a journal client with a non-empty id.
#   $1 - cluster to query
#   $2 - image name
get_mirror_position()
{
    local cluster="$1"
    local image="$2"

    get_position "${cluster}" "${image}" '..*'
}
|
|
|
|
|
|
|
|
# Wait until the mirror has caught up with the master for an image.
#   $1 - cluster whose rbd-mirror daemon is asked to flush
#   $2 - cluster whose journal status is inspected
#   $3 - image name
# Each round sleeps (0.2s growing to 16s, 12 rounds), flushes the image on
# the daemon, then compares the master and mirror commit positions.
# Returns 0 once the master position is non-empty and equal to the mirror
# position, 1 if that never happens.
wait_for_replay_complete()
{
    local local_cluster="$1"
    local cluster="$2"
    local image="$3"
    local s master_pos mirror_pos

    for s in 0.2 0.4 0.8 1.6 2 2 4 4 8 8 16 16; do
        sleep "${s}"
        flush "${local_cluster}" "${image}"
        master_pos=$(get_master_position "${cluster}" "${image}")
        mirror_pos=$(get_mirror_position "${cluster}" "${image}")
        # Two separate tests instead of the obsolescent `test ... -a ...`.
        if [ -n "${master_pos}" ] && [ "${master_pos}" = "${mirror_pos}" ]; then
            return 0
        fi
    done
    return 1
}
|
|
|
|
|
2016-04-24 16:39:40 +00:00
|
|
|
# Check the mirror image status reported by `rbd mirror image status`.
#   $1 - cluster to query
#   $2 - image name (in ${POOL})
#   $3 - pattern expected on the "state: " line
#   $4 - pattern expected on the "description: " line (may be omitted)
# The status output is printed and saved to
# ${TEMPDIR}/<cluster>-<image>.mirror_status.  Returns 0 only if both the
# state and the description lines match.
test_status_in_pool_dir()
{
    local cluster="$1"
    local image="$2"
    local state_pattern="$3"
    local description_pattern="$4"

    local status_log="${TEMPDIR}/${cluster}-${image}.mirror_status"

    rbd --cluster "${cluster}" -p "${POOL}" mirror image status "${image}" |
        tee "${status_log}"

    # Chained with && so a state mismatch fails the function even when the
    # caller is not running under `set -e`.
    grep "state: .*${state_pattern}" "${status_log}" &&
    grep "description: .*${description_pattern}" "${status_log}"
}
|
|
|
|
|
2016-03-10 14:18:13 +00:00
|
|
|
# Create a 128 (rbd --size units) image in ${POOL} with the exclusive-lock
# and journaling features enabled.
#   $1 - cluster to create the image on
#   $2 - image name
create_image()
{
    local cluster="$1"
    local image="$2"

    rbd --cluster "${cluster}" -p "${POOL}" create --size 128 \
        --image-feature exclusive-lock --image-feature journaling "${image}"
}
|
|
|
|
|
|
|
|
# Write random data to an image with `rbd bench-write`.
#   $1 - cluster holding the image
#   $2 - image name (in ${POOL})
#   $3 - number of 4096-byte writes; the total written is 4096 * $3 bytes,
#        issued by a single I/O thread in a random pattern
write_image()
{
    local cluster="$1"
    local image="$2"
    local count="$3"

    rbd --cluster "${cluster}" -p "${POOL}" bench-write "${image}" \
        --io-size 4096 --io-threads 1 --io-total $((4096 * count)) \
        --io-pattern rand
}
|
|
|
|
|
|
|
|
# Compare the contents of an image on both clusters.
#   $1 - image name (in ${POOL})
# Exports the image from ${CLUSTER2} and ${CLUSTER1} into
# ${TEMPDIR}/<cluster>-${POOL}-<image>.export (stale exports are removed
# first) and returns the result of cmp(1) on the two files.
compare_images()
{
    local image="$1"

    local rmt_export="${TEMPDIR}/${CLUSTER2}-${POOL}-${image}.export"
    local loc_export="${TEMPDIR}/${CLUSTER1}-${POOL}-${image}.export"

    rm -f "${rmt_export}" "${loc_export}"
    rbd --cluster "${CLUSTER2}" -p "${POOL}" export "${image}" "${rmt_export}"
    rbd --cluster "${CLUSTER1}" -p "${POOL}" export "${image}" "${loc_export}"
    cmp "${rmt_export}" "${loc_export}"
}
|
|
|
|
|
2016-03-28 19:57:58 +00:00
|
|
|
# Demote an image with `rbd mirror image demote`.
#   $1 - cluster on which the image is demoted
#   $2 - image name (in ${POOL})
demote_image()
{
    local cluster="$1"
    local image="$2"

    rbd --cluster="${cluster}" mirror image demote "${POOL}/${image}"
}
|
|
|
|
|
|
|
|
# Promote an image with `rbd mirror image promote`.
#   $1 - cluster on which the image is promoted
#   $2 - image name (in ${POOL})
promote_image()
{
    local cluster="$1"
    local image="$2"

    rbd --cluster="${cluster}" mirror image promote "${POOL}/${image}"
}
|
|
|
|
|
2016-03-10 14:18:13 +00:00
|
|
|
#
|
|
|
|
# Main
|
|
|
|
#
|
|
|
|
|
2016-03-31 08:42:13 +00:00
|
|
|
# Command mode: when the script is given arguments, treat them as a function
# name plus its arguments, run that function against the existing test
# directory named by RBD_MIRROR_TEMDIR, and exit with its status.
if [ "$#" -gt 0 ]; then
    if [ -z "${RBD_MIRROR_TEMDIR}" ]; then
        echo "RBD_MIRROR_TEMDIR is not set" >&2
        exit 1
    fi

    TEMPDIR="${RBD_MIRROR_TEMDIR}"
    cd "${TEMPDIR}"
    # Quoted so that each command-line argument reaches the function intact.
    "$@"
    exit $?
fi
|
|
|
|
|
|
|
|
# From here on: trace every command and abort on the first failure.
set -xe

setup

# An image created on CLUSTER2 while the CLUSTER1 daemon is running must be
# picked up, replayed, and end up identical on both clusters.
testlog "TEST: add image and test replay"
start_mirror "${CLUSTER1}"
image=test
create_image "${CLUSTER2}" "${image}"
wait_for_image_replay_started "${CLUSTER1}" "${image}"
write_image "${CLUSTER2}" "${image}" 100
wait_for_replay_complete "${CLUSTER1}" "${CLUSTER2}" "${image}"
test_status_in_pool_dir "${CLUSTER1}" "${image}" 'up+replaying' 'master_position'
test_status_in_pool_dir "${CLUSTER2}" "${image}" 'down+unknown'
compare_images "${image}"
|
|
|
|
|
2016-04-28 06:32:33 +00:00
|
|
|
# An image created and written while the daemon is stopped must be replayed
# once the daemon is started again.
testlog "TEST: stop mirror, add image, start mirror and test replay"
stop_mirror "${CLUSTER1}"
image1=test1
create_image "${CLUSTER2}" "${image1}"
write_image "${CLUSTER2}" "${image1}" 100
start_mirror "${CLUSTER1}"
wait_for_image_replay_started "${CLUSTER1}" "${image1}"
wait_for_replay_complete "${CLUSTER1}" "${CLUSTER2}" "${image1}"
test_status_in_pool_dir "${CLUSTER1}" "${image1}" 'up+replaying' 'master_position'
test_status_in_pool_dir "${CLUSTER2}" "${image1}" 'down+unknown'
compare_images "${image1}"
|
|
|
|
|
2016-04-28 06:32:33 +00:00
|
|
|
# The image from the first scenario must still replay after the daemon
# restart performed in the previous scenario.
testlog "TEST: test the first image is replaying after restart"
write_image "${CLUSTER2}" "${image}" 100
wait_for_replay_complete "${CLUSTER1}" "${CLUSTER2}" "${image}"
test_status_in_pool_dir "${CLUSTER1}" "${image}" 'up+replaying' 'master_position'
compare_images "${image}"
|
|
|
|
|
2016-04-28 06:32:33 +00:00
|
|
|
# Drive replay through the daemon's admin socket: global stop/start/restart,
# then the same commands addressed to a peer cluster or a single image,
# checking the replay state of both images after each step.
testlog "TEST: stop/start/restart mirror via admin socket"
admin_daemon "${CLUSTER1}" rbd mirror stop
wait_for_image_replay_stopped "${CLUSTER1}" "${image}"
wait_for_image_replay_stopped "${CLUSTER1}" "${image1}"

admin_daemon "${CLUSTER1}" rbd mirror start
wait_for_image_replay_started "${CLUSTER1}" "${image}"
wait_for_image_replay_started "${CLUSTER1}" "${image1}"

admin_daemon "${CLUSTER1}" rbd mirror restart
wait_for_image_replay_started "${CLUSTER1}" "${image}"
wait_for_image_replay_started "${CLUSTER1}" "${image1}"

admin_daemon "${CLUSTER1}" rbd mirror stop
wait_for_image_replay_stopped "${CLUSTER1}" "${image}"
wait_for_image_replay_stopped "${CLUSTER1}" "${image1}"

admin_daemon "${CLUSTER1}" rbd mirror restart
wait_for_image_replay_started "${CLUSTER1}" "${image}"
wait_for_image_replay_started "${CLUSTER1}" "${image1}"

admin_daemon "${CLUSTER1}" rbd mirror stop "${CLUSTER2}"
wait_for_image_replay_stopped "${CLUSTER1}" "${image}"
wait_for_image_replay_stopped "${CLUSTER1}" "${image1}"

admin_daemon "${CLUSTER1}" rbd mirror start "${POOL}/${image}"
wait_for_image_replay_started "${CLUSTER1}" "${image}"

admin_daemon "${CLUSTER1}" rbd mirror start
wait_for_image_replay_started "${CLUSTER1}" "${image1}"

admin_daemon "${CLUSTER1}" rbd mirror start "${CLUSTER2}"

admin_daemon "${CLUSTER1}" rbd mirror restart "${POOL}/${image}"
wait_for_image_replay_started "${CLUSTER1}" "${image}"

admin_daemon "${CLUSTER1}" rbd mirror restart "${CLUSTER2}"
wait_for_image_replay_started "${CLUSTER1}" "${image}"
wait_for_image_replay_started "${CLUSTER1}" "${image1}"

admin_daemon "${CLUSTER1}" rbd mirror flush
admin_daemon "${CLUSTER1}" rbd mirror status
|
|
|
|
|
|
|
|
# Swap the primary role of the first image between the clusters and back,
# checking after each swap that replay runs in the new direction and that
# the image contents match.
testlog "TEST: failover and failback"
start_mirror "${CLUSTER2}"

# failover
demote_image "${CLUSTER2}" "${image}"
wait_for_image_replay_stopped "${CLUSTER1}" "${image}"
test_status_in_pool_dir "${CLUSTER1}" "${image}" 'up+stopped'
test_status_in_pool_dir "${CLUSTER2}" "${image}" 'up+stopped'
promote_image "${CLUSTER1}" "${image}"
wait_for_image_replay_started "${CLUSTER2}" "${image}"
write_image "${CLUSTER1}" "${image}" 100
wait_for_replay_complete "${CLUSTER2}" "${CLUSTER1}" "${image}"
test_status_in_pool_dir "${CLUSTER1}" "${image}" 'up+stopped'
test_status_in_pool_dir "${CLUSTER2}" "${image}" 'up+replaying' 'master_position'
compare_images "${image}"

# failback
demote_image "${CLUSTER1}" "${image}"
wait_for_image_replay_stopped "${CLUSTER2}" "${image}"
test_status_in_pool_dir "${CLUSTER2}" "${image}" 'up+stopped'
promote_image "${CLUSTER2}" "${image}"
wait_for_image_replay_started "${CLUSTER1}" "${image}"
write_image "${CLUSTER2}" "${image}" 100
wait_for_replay_complete "${CLUSTER1}" "${CLUSTER2}" "${image}"
test_status_in_pool_dir "${CLUSTER1}" "${image}" 'up+replaying' 'master_position'
test_status_in_pool_dir "${CLUSTER2}" "${image}" 'up+stopped'
compare_images "${image}"

echo OK
|