2020-11-18 10:28:39 +00:00
|
|
|
import errno
|
2018-01-02 09:14:14 +00:00
|
|
|
import logging
|
2019-02-25 19:10:01 +00:00
|
|
|
import signal
|
2018-01-02 09:14:14 +00:00
|
|
|
from textwrap import dedent
|
|
|
|
from tasks.cephfs.fuse_mount import FuseMount
|
|
|
|
from tasks.cephfs.cephfs_test_case import CephFSTestCase
|
2021-06-15 12:55:22 +00:00
|
|
|
from teuthology.orchestra.run import Raw
|
|
|
|
from teuthology.exceptions import CommandFailedError
|
2018-01-02 09:14:14 +00:00
|
|
|
|
|
|
|
# Module-level logger, named after this module.
log = logging.getLogger(__name__)

# Value passed as `timeout=` to the wait_for_state()/wait_for_daemons() calls
# that follow an MDS restart in the tests below.
# NOTE(review): presumably seconds -- confirm against the wait helpers.
MDS_RESTART_GRACE = 60
|
|
|
|
|
2018-01-02 09:14:14 +00:00
|
|
|
class TestSnapshots(CephFSTestCase):
    """
    Snapshot tests for CephFS: snapshot table transactions under injected
    MDS kills, snapclient cache syncing, multi-MDS snapshots and the
    mds_max_snaps_per_dir limit.
    """
    # NOTE(review): presumably the number of MDS daemons the framework must
    # provide; the tests here use up to max_mds=3 -- confirm in CephFSTestCase.
    MDSS_REQUIRED = 3
    # NOTE(review): presumably makes the named config option available as
    # self.mds_max_snaps_per_dir (read by the limit tests) -- confirm in
    # CephFSTestCase.
    LOAD_SETTINGS = ["mds_max_snaps_per_dir"]
|
2018-01-02 09:14:14 +00:00
|
|
|
|
2019-02-25 19:10:01 +00:00
|
|
|
def _check_subtree(self, rank, path, status=None):
    """
    Return True if the `get subtrees` output of `rank` contains an entry
    whose dir path equals `path` and whose `auth_first` equals `rank`;
    return False otherwise.
    """
    subtrees = self.fs.rank_asok(["get", "subtrees"], rank=rank, status=status)
    return any(
        entry['dir']['path'] == path and entry['auth_first'] == rank
        for entry in subtrees
    )
|
|
|
|
|
2019-02-25 19:10:01 +00:00
|
|
|
def _get_snapclient_dump(self, rank=0, status=None):
    """
    Run `dump snaps` against `rank` through self.fs.rank_asok and return
    whatever that call returns.
    """
    command = ["dump", "snaps"]
    return self.fs.rank_asok(command, rank=rank, status=status)
|
2018-01-06 02:54:48 +00:00
|
|
|
|
2019-02-25 19:10:01 +00:00
|
|
|
def _get_snapserver_dump(self, rank=0, status=None):
    """
    Run `dump snaps --server` against `rank` through self.fs.rank_asok and
    return whatever that call returns.
    """
    command = ["dump", "snaps", "--server"]
    return self.fs.rank_asok(command, rank=rank, status=status)
|
2018-02-01 05:47:48 +00:00
|
|
|
|
2019-02-25 19:10:01 +00:00
|
|
|
def _get_last_created_snap(self, rank=0, status=None):
    """
    Return the `last_created` field of the snapserver dump for `rank`,
    converted to int.
    """
    server_dump = self._get_snapserver_dump(rank, status=status)
    return int(server_dump["last_created"])
|
2018-01-06 02:54:48 +00:00
|
|
|
|
2019-02-25 19:10:01 +00:00
|
|
|
def _get_last_destroyed_snap(self, rank=0, status=None):
    """
    Return the `last_destroyed` field of the snapserver dump for `rank`,
    converted to int.
    """
    server_dump = self._get_snapserver_dump(rank, status=status)
    return int(server_dump["last_destroyed"])
|
2018-01-06 02:54:48 +00:00
|
|
|
|
2019-02-25 19:10:01 +00:00
|
|
|
def _get_pending_snap_update(self, rank=0, status=None):
    """
    Return the `pending_update` field of the snapserver dump for `rank`.
    Callers in this file take len() of the result.
    """
    server_dump = self._get_snapserver_dump(rank, status=status)
    return server_dump["pending_update"]
|
2018-02-01 05:47:48 +00:00
|
|
|
|
2019-02-25 19:10:01 +00:00
|
|
|
def _get_pending_snap_destroy(self, rank=0, status=None):
    """
    Return the `pending_destroy` field of the snapserver dump for `rank`.
    Callers in this file take len() of the result.
    """
    server_dump = self._get_snapserver_dump(rank, status=status)
    return server_dump["pending_destroy"]
|
2018-02-01 05:47:48 +00:00
|
|
|
|
2020-11-18 10:28:39 +00:00
|
|
|
def test_allow_new_snaps_config(self):
    """
    Check whether 'allow_new_snaps' setting works

    With snapshots disallowed, creating a snapshot must fail with EPERM;
    after allowing them again the same mkdir must succeed.
    """
    self.mount_a.run_shell(["mkdir", "test-allow-snaps"])

    self.fs.set_allow_new_snaps(False)
    try:
        self.mount_a.run_shell(["mkdir", "test-allow-snaps/.snap/snap00"])
    except CommandFailedError as ce:
        self.assertEqual(ce.exitstatus, errno.EPERM, "expected EPERM")
    else:
        # mkdir succeeded although new snapshots are disallowed
        self.fail("expected snap creation to fail")

    self.fs.set_allow_new_snaps(True)
    self.mount_a.run_shell(["mkdir", "test-allow-snaps/.snap/snap00"])
    # clean up: the snapshot has to go before its directory can be removed
    self.mount_a.run_shell(["rmdir", "test-allow-snaps/.snap/snap00"])
    self.mount_a.run_shell(["rmdir", "test-allow-snaps"])
|
|
|
|
|
2018-01-06 02:54:48 +00:00
|
|
|
def test_kill_mdstable(self):
    """
    check snaptable transaction

    Sets `mds_kill_mdstable_at` on rank 0 and/or rank 1, triggers a
    snapshot mkdir, waits for the affected rank to turn laggy, restarts it
    and then checks the snapserver's `last_created` / `pending_update`.
    """
    if not isinstance(self.mount_a, FuseMount):
        self.skipTest("Require FUSE client to forcibly kill mount")

    def arm_kill_point(point, rank, status):
        # set the mds_kill_mdstable_at injection point on `rank`
        self.fs.rank_asok(['config', 'set', "mds_kill_mdstable_at", "{0}".format(point)], rank=rank, status=status)

    def wait_for_crash(rank, info):
        # wait until `rank` is reported laggy, then remove its coredump
        self.wait_until_true(lambda: "laggy_since" in self.fs.get_rank(rank=rank), timeout=self.fs.beacon_timeout)
        self.delete_mds_coredump(info['name'])

    def fail_and_restart(rank, info):
        # mark `rank` failed and bring the same daemon back
        self.fs.rank_fail(rank=rank)
        self.fs.mds_restart(info['name'])
        self.wait_for_daemon_start([info['name']])

    def kill_client():
        self.mount_a.kill()
        self.mount_a.kill_cleanup()

    def wait_no_pending_update():
        self.wait_until_true(lambda: len(self._get_pending_snap_update(rank=0)) == 0, timeout=30)

    self.fs.set_allow_new_snaps(True)
    self.fs.set_max_mds(2)
    status = self.fs.wait_for_daemons()

    # setup subtrees
    self.mount_a.run_shell(["mkdir", "-p", "d1/dir"])
    self.mount_a.setfattr("d1", "ceph.dir.pin", "1")
    self._wait_subtrees([("/d1", 1)], rank=1, path="/d1")

    last_created = self._get_last_created_snap(rank=0, status=status)

    # mds_kill_mdstable_at:
    #  1: MDSTableServer::handle_prepare
    #  2: MDSTableServer::_prepare_logged
    #  5: MDSTableServer::handle_commit
    #  6: MDSTableServer::_commit_logged
    for kill_at in [1, 2, 5, 6]:
        log.info("testing snapserver mds_kill_mdstable_at={0}".format(kill_at))

        status = self.fs.status()
        rank0 = self.fs.get_rank(rank=0, status=status)
        self.fs.rank_freeze(True, rank=0)
        arm_kill_point(kill_at, 0, status)
        proc = self.mount_a.run_shell(["mkdir", "d1/dir/.snap/s1{0}".format(kill_at)], wait=False)
        wait_for_crash(0, rank0)

        fail_and_restart(0, rank0)
        status = self.fs.wait_for_daemons()

        # the mkdir is expected to complete once rank 0 is back
        proc.wait()
        last_created += 1
        self.wait_until_true(lambda: self._get_last_created_snap(rank=0) == last_created, timeout=30)

    self.set_conf("mds", "mds_reconnect_timeout", "5")

    self.mount_a.run_shell(["rmdir", Raw("d1/dir/.snap/*")])

    # set mds_kill_mdstable_at, also kill snapclient
    for kill_at in [2, 5, 6]:
        log.info("testing snapserver mds_kill_mdstable_at={0}, also kill snapclient".format(kill_at))
        status = self.fs.status()
        last_created = self._get_last_created_snap(rank=0, status=status)

        rank0 = self.fs.get_rank(rank=0, status=status)
        rank1 = self.fs.get_rank(rank=1, status=status)
        self.fs.rank_freeze(True, rank=0)  # prevent failover...
        self.fs.rank_freeze(True, rank=1)  # prevent failover...
        arm_kill_point(kill_at, 0, status)
        proc = self.mount_a.run_shell(["mkdir", "d1/dir/.snap/s2{0}".format(kill_at)], wait=False)
        wait_for_crash(0, rank0)

        self.fs.rank_signal(signal.SIGKILL, rank=1)

        kill_client()

        fail_and_restart(0, rank0)

        self.fs.wait_for_state('up:resolve', rank=0, timeout=MDS_RESTART_GRACE)
        if kill_at in [2, 5]:
            self.assertEqual(len(self._get_pending_snap_update(rank=0)), 1)
        elif kill_at == 6:
            self.assertEqual(len(self._get_pending_snap_update(rank=0)), 0)
            self.assertGreater(self._get_last_created_snap(rank=0), last_created)

        fail_and_restart(1, rank1)
        self.fs.wait_for_state('up:active', rank=0, timeout=MDS_RESTART_GRACE)

        if kill_at in [2, 5]:
            wait_no_pending_update()
            if kill_at == 2:
                self.assertEqual(self._get_last_created_snap(rank=0), last_created)
            else:
                self.assertGreater(self._get_last_created_snap(rank=0), last_created)

        self.mount_a.mount_wait()

    self.mount_a.run_shell(["rmdir", Raw("d1/dir/.snap/*")])

    # mds_kill_mdstable_at:
    #  3: MDSTableClient::handle_request (got agree)
    #  4: MDSTableClient::commit
    #  7: MDSTableClient::handle_request (got ack)
    for kill_at in [3, 4, 7]:
        log.info("testing snapclient mds_kill_mdstable_at={0}".format(kill_at))
        last_created = self._get_last_created_snap(rank=0)

        status = self.fs.status()
        rank1 = self.fs.get_rank(rank=1, status=status)
        self.fs.rank_freeze(True, rank=1)  # prevent failover...
        arm_kill_point(kill_at, 1, status)
        proc = self.mount_a.run_shell(["mkdir", "d1/dir/.snap/s3{0}".format(kill_at)], wait=False)
        wait_for_crash(1, rank1)

        kill_client()

        if kill_at in [3, 4]:
            self.assertEqual(len(self._get_pending_snap_update(rank=0)), 1)
        elif kill_at == 7:
            self.assertEqual(len(self._get_pending_snap_update(rank=0)), 0)
            self.assertGreater(self._get_last_created_snap(rank=0), last_created)

        fail_and_restart(1, rank1)
        status = self.fs.wait_for_daemons(timeout=MDS_RESTART_GRACE)

        if kill_at in [3, 4]:
            wait_no_pending_update()
            if kill_at == 3:
                self.assertEqual(self._get_last_created_snap(rank=0), last_created)
            else:
                self.assertGreater(self._get_last_created_snap(rank=0), last_created)

        self.mount_a.mount_wait()

    self.mount_a.run_shell(["rmdir", Raw("d1/dir/.snap/*")])

    # mds_kill_mdstable_at:
    #  3: MDSTableClient::handle_request (got agree)
    #  8: MDSTableServer::handle_rollback
    log.info("testing snapclient mds_kill_mdstable_at=3, snapserver mds_kill_mdstable_at=8")
    last_created = self._get_last_created_snap(rank=0)

    status = self.fs.status()
    rank0 = self.fs.get_rank(rank=0, status=status)
    rank1 = self.fs.get_rank(rank=1, status=status)
    self.fs.rank_freeze(True, rank=0)
    self.fs.rank_freeze(True, rank=1)
    arm_kill_point("8", 0, status)
    arm_kill_point("3", 1, status)
    proc = self.mount_a.run_shell(["mkdir", "d1/dir/.snap/s4"], wait=False)
    wait_for_crash(1, rank1)

    kill_client()

    self.assertEqual(len(self._get_pending_snap_update(rank=0)), 1)

    fail_and_restart(1, rank1)

    # rollback triggers assertion
    wait_for_crash(0, rank0)
    fail_and_restart(0, rank0)
    self.fs.wait_for_state('up:active', rank=0, timeout=MDS_RESTART_GRACE)

    # mds.1 should re-send rollback message
    wait_no_pending_update()
    self.assertEqual(self._get_last_created_snap(rank=0), last_created)

    self.mount_a.mount_wait()
|
2018-01-06 02:54:48 +00:00
|
|
|
|
2018-02-01 05:47:48 +00:00
|
|
|
def test_snapclient_cache(self):
    """
    check if snapclient cache gets synced properly

    Compares every rank's snapclient dump with rank 0's snapserver dump
    after mksnap, after rmsnap, after rank failures, and after killing
    rank 2 at mds_kill_mdstable_at 9 and 4.
    """
    all_ranks = (0, 1, 2)

    def _check_snapclient_cache(snaps_dump, cache_dump=None, rank=0):
        # True when every key of the client cache matches the server dump
        if cache_dump is None:
            cache_dump = self._get_snapclient_dump(rank=rank)
        return not any(value != snaps_dump[key] for key, value in cache_dump.items())

    def assert_caches_match(snaps_dump, ranks):
        for rank in ranks:
            self.assertTrue(_check_snapclient_cache(snaps_dump, rank=rank))

    def wait_rank2_crash(info):
        # wait until rank 2 is reported laggy, then remove its coredump
        self.wait_until_true(lambda: "laggy_since" in self.fs.get_rank(rank=2), timeout=self.fs.beacon_timeout)
        self.delete_mds_coredump(info['name'])

    self.fs.set_allow_new_snaps(True)
    self.fs.set_max_mds(3)
    status = self.fs.wait_for_daemons()

    self.mount_a.run_shell(["mkdir", "-p", "d0/d1/dir"])
    self.mount_a.run_shell(["mkdir", "-p", "d0/d2/dir"])
    self.mount_a.setfattr("d0", "ceph.dir.pin", "0")
    self.mount_a.setfattr("d0/d1", "ceph.dir.pin", "1")
    self.mount_a.setfattr("d0/d2", "ceph.dir.pin", "2")
    self._wait_subtrees([("/d0", 0), ("/d0/d1", 1), ("/d0/d2", 2)], rank="all", status=status, path="/d0")

    # sync after mksnap
    last_created = self._get_last_created_snap(rank=0)
    self.mount_a.run_shell(["mkdir", "d0/d1/dir/.snap/s1", "d0/d1/dir/.snap/s2"])
    self.wait_until_true(lambda: len(self._get_pending_snap_update(rank=0)) == 0, timeout=30)
    self.assertGreater(self._get_last_created_snap(rank=0), last_created)

    snaps_dump = self._get_snapserver_dump(rank=0)
    assert_caches_match(snaps_dump, all_ranks)

    # sync after rmsnap
    last_destroyed = self._get_last_destroyed_snap(rank=0)
    self.mount_a.run_shell(["rmdir", "d0/d1/dir/.snap/s1"])
    self.wait_until_true(lambda: len(self._get_pending_snap_destroy(rank=0)) == 0, timeout=30)
    self.assertGreater(self._get_last_destroyed_snap(rank=0), last_destroyed)

    snaps_dump = self._get_snapserver_dump(rank=0)
    assert_caches_match(snaps_dump, all_ranks)

    # sync during mds recovers
    self.fs.rank_fail(rank=2)
    status = self.fs.wait_for_daemons(timeout=MDS_RESTART_GRACE)
    assert_caches_match(snaps_dump, (2,))

    self.fs.rank_fail(rank=0)
    self.fs.rank_fail(rank=1)
    status = self.fs.wait_for_daemons()
    self.fs.wait_for_state('up:active', rank=0, timeout=MDS_RESTART_GRACE)
    assert_caches_match(snaps_dump, all_ranks)

    # kill at MDSTableClient::handle_notify_prep
    status = self.fs.status()
    rank2 = self.fs.get_rank(rank=2, status=status)
    self.fs.rank_freeze(True, rank=2)
    self.fs.rank_asok(['config', 'set', "mds_kill_mdstable_at", "9"], rank=2, status=status)
    proc = self.mount_a.run_shell(["mkdir", "d0/d1/dir/.snap/s3"], wait=False)
    wait_rank2_crash(rank2)

    # mksnap should wait for notify ack from mds.2
    self.assertFalse(proc.finished)

    # mksnap should proceed after mds.2 fails
    self.fs.rank_fail(rank=2)
    self.wait_until_true(lambda: proc.finished, timeout=30)

    self.fs.mds_restart(rank2['name'])
    self.wait_for_daemon_start([rank2['name']])
    status = self.fs.wait_for_daemons(timeout=MDS_RESTART_GRACE)

    self.mount_a.run_shell(["rmdir", Raw("d0/d1/dir/.snap/*")])

    # kill at MDSTableClient::commit
    # the recovering mds should sync all mds' cache when it enters resolve stage
    self.set_conf("mds", "mds_reconnect_timeout", "5")
    # NOTE(review): range(1, 4) never yields 4, so the "fail both rank 0 and
    # rank 1" combination tested for below (i == 4) is never exercised.
    for i in range(1, 4):
        status = self.fs.status()
        rank2 = self.fs.get_rank(rank=2, status=status)
        self.fs.rank_freeze(True, rank=2)
        self.fs.rank_asok(['config', 'set', "mds_kill_mdstable_at", "4"], rank=2, status=status)
        last_created = self._get_last_created_snap(rank=0)
        proc = self.mount_a.run_shell(["mkdir", "d0/d2/dir/.snap/s{0}".format(i)], wait=False)
        wait_rank2_crash(rank2)

        self.mount_a.kill()
        self.mount_a.kill_cleanup()

        self.assertEqual(len(self._get_pending_snap_update(rank=0)), 1)

        if i in [2, 4]:
            self.fs.rank_fail(rank=0)
        if i in [3, 4]:
            self.fs.rank_fail(rank=1)

        self.fs.rank_fail(rank=2)
        self.fs.mds_restart(rank2['name'])
        self.wait_for_daemon_start([rank2['name']])
        status = self.fs.wait_for_daemons(timeout=MDS_RESTART_GRACE)

        # fetch the caches in rank order 0, 1, 2
        caches = [self._get_snapclient_dump(rank=rank) for rank in all_ranks]
        rank0_cache = caches[0]

        self.assertGreater(int(rank0_cache["last_created"]), last_created)
        self.assertEqual(rank0_cache, caches[1])
        self.assertEqual(rank0_cache, caches[2])

        self.wait_until_true(lambda: len(self._get_pending_snap_update(rank=0)) == 0, timeout=30)

        snaps_dump = self._get_snapserver_dump(rank=0)
        self.assertEqual(snaps_dump["last_created"], rank0_cache["last_created"])
        self.assertTrue(_check_snapclient_cache(snaps_dump, cache_dump=rank0_cache))

        self.mount_a.mount_wait()

    self.mount_a.run_shell(["rmdir", Raw("d0/d2/dir/.snap/*")])
|
|
|
|
|
2018-01-02 09:14:14 +00:00
|
|
|
def test_multimds_mksnap(self):
    """
    check if snapshot takes effect across authority subtrees

    d0 is pinned to rank 0 and d0/d1 to rank 1; a file written under d0/d1
    must still validate through a snapshot taken on d0 after the file is
    removed.
    """
    pattern_size = 8 * 1024 * 1024

    self.fs.set_allow_new_snaps(True)
    self.fs.set_max_mds(2)
    status = self.fs.wait_for_daemons()

    self.mount_a.run_shell(["mkdir", "-p", "d0/d1/empty"])
    for directory, pin in (("d0", "0"), ("d0/d1", "1")):
        self.mount_a.setfattr(directory, "ceph.dir.pin", pin)
    self._wait_subtrees([("/d0", 0), ("/d0/d1", 1)], rank="all", status=status, path="/d0")

    self.mount_a.write_test_pattern("d0/d1/file_a", pattern_size)
    self.mount_a.run_shell(["mkdir", "d0/.snap/s1"])
    self.mount_a.run_shell(["rm", "-f", "d0/d1/file_a"])
    # the removed file must still be readable through the snapshot
    self.mount_a.validate_test_pattern("d0/.snap/s1/d1/file_a", pattern_size)

    self.mount_a.run_shell(["rmdir", "d0/.snap/s1"])
    self.mount_a.run_shell(["rm", "-rf", "d0"])
|
|
|
|
|
|
|
|
def test_multimds_past_parents(self):
    """
    check if past parents are properly recorded during across authority rename

    d0/d3 is snapshotted via d0, then moved under d1 (pinned to another
    rank); its .snap listing must stay the same after the move and become
    empty once the snapshot on d0 is removed.
    """
    def list_snaps(snap_dir):
        # raw stdout of `ls` on the given .snap directory
        return self.mount_a.run_shell(["ls", snap_dir]).stdout.getvalue()

    self.fs.set_allow_new_snaps(True)
    self.fs.set_max_mds(2)
    status = self.fs.wait_for_daemons()

    self.mount_a.run_shell_payload("mkdir -p {d0,d1}/empty")
    for directory, pin in (("d0", "0"), ("d1", "1")):
        self.mount_a.setfattr(directory, "ceph.dir.pin", pin)
    self._wait_subtrees([("/d0", 0), ("/d1", 1)], rank=0, status=status)

    self.mount_a.run_shell(["mkdir", "d0/d3"])
    self.mount_a.run_shell(["mkdir", "d0/.snap/s1"])
    before_move = list_snaps("d0/d3/.snap")

    self.mount_a.run_shell(["mv", "d0/d3", "d1/d3"])
    after_move = list_snaps("d1/d3/.snap")
    self.assertEqual(after_move, before_move)

    self.mount_a.run_shell(["rmdir", "d0/.snap/s1"])
    after_rmsnap = list_snaps("d1/d3/.snap")
    self.assertEqual(after_rmsnap, "")

    self.mount_a.run_shell(["rm", "-rf", "d0", "d1"])
|
|
|
|
|
|
|
|
def test_multimds_hardlink(self):
    """
    check if hardlink snapshot works in multimds setup

    Files created in d0 (rank 0) are hard-linked into d1 (rank 1); a
    snapshot of d1 must keep the original content after the file is
    rewritten through d0 and after both links are removed.
    """
    self.fs.set_allow_new_snaps(True)
    self.fs.set_max_mds(2)
    status = self.fs.wait_for_daemons()

    self.mount_a.run_shell_payload("mkdir -p {d0,d1}/empty")

    for directory, pin in (("d0", "0"), ("d1", "1")):
        self.mount_a.setfattr(directory, "ceph.dir.pin", pin)
    self._wait_subtrees([("/d0", 0), ("/d1", 1)], rank=0, status=status)

    create_files = dedent("""
        import os
        open(os.path.join("{path}", "d0/file1"), 'w').write("asdf")
        open(os.path.join("{path}", "d0/file2"), 'w').write("asdf")
        """.format(path=self.mount_a.mountpoint))
    self.mount_a.run_python(create_files)

    for name in ("file1", "file2"):
        self.mount_a.run_shell(["ln", "d0/" + name, "d1/" + name])

    self.mount_a.run_shell(["mkdir", "d1/.snap/s1"])

    overwrite_file1 = dedent("""
        import os
        open(os.path.join("{path}", "d0/file1"), 'w').write("qwer")
        """.format(path=self.mount_a.mountpoint))
    self.mount_a.run_python(overwrite_file1)

    # the snapshot must still show the content from before the overwrite
    self.mount_a.run_shell(["grep", "asdf", "d1/.snap/s1/file1"])

    # dropping the link in d0 must not affect the snapshot
    self.mount_a.run_shell(["rm", "-f", "d0/file2"])
    self.mount_a.run_shell(["grep", "asdf", "d1/.snap/s1/file2"])

    # ...and neither must dropping the last link in d1
    self.mount_a.run_shell(["rm", "-f", "d1/file2"])
    self.mount_a.run_shell(["grep", "asdf", "d1/.snap/s1/file2"])

    self.mount_a.run_shell(["rmdir", "d1/.snap/s1"])
    self.mount_a.run_shell(["rm", "-rf", "d0", "d1"])
|
2019-10-17 06:15:00 +00:00
|
|
|
|
|
|
|
class SnapLimitViolationException(Exception):
    """
    Raised by create_dir_and_snaps() when the final requested snapshot
    could not be created.
    """
    # Class-level default; overwritten per instance in __init__ with the
    # number of the snapshot whose creation failed.
    failed_snapshot_number = -1

    def __init__(self, num):
        # Chain to Exception so the base class is initialised explicitly;
        # `args` stays (num,) and str() stays str(num), as before.
        super().__init__(num)
        self.failed_snapshot_number = num
|
|
|
|
|
|
|
|
def get_snap_name(self, dir_name, sno):
    """
    Return the snapshot path for snapshot number `sno` of `dir_name`, in
    the form `<dir_name>/.snap/s_<sno>`.
    """
    return "{dir_name}/.snap/s_{sno}".format(dir_name=dir_name, sno=sno)
|
|
|
|
|
|
|
|
def create_snap_dir(self, sname):
    """
    Create the snapshot `sname` by running `mkdir` on it via mount_a.
    """
    mkdir_cmd = ["mkdir", sname]
    self.mount_a.run_shell(mkdir_cmd)
|
|
|
|
|
|
|
|
def delete_dir_and_snaps(self, dir_name, snaps):
    """
    Remove snapshots 1..`snaps` of `dir_name` (named by get_snap_name)
    with `rmdir`, then `rmdir` the directory itself.
    """
    for number in range(1, snaps + 1):
        snap_path = self.get_snap_name(dir_name, number)
        self.mount_a.run_shell(["rmdir", snap_path])
    self.mount_a.run_shell(["rmdir", dir_name])
|
|
|
|
|
|
|
|
def create_dir_and_snaps(self, dir_name, snaps):
    """
    Create `dir_name` and then snapshots 1..`snaps` of it.

    Raises TestSnapshots.SnapLimitViolationException (carrying the snapshot
    number) when creating the last requested snapshot fails. A failure on
    any earlier snapshot is not expected and is re-raised as the original
    CommandFailedError instead of being silently ignored.
    """
    self.mount_a.run_shell(["mkdir", dir_name])

    for sno in range(1, snaps + 1):
        sname = self.get_snap_name(dir_name, sno)
        try:
            self.create_snap_dir(sname)
        except CommandFailedError as e:
            if sno != snaps:
                # Only the final mkdir may legitimately hit the limit;
                # surface anything earlier rather than hiding it.
                raise
            # failing at the last mkdir beyond the limit is expected
            log.info("failed while creating snap #{}: {}".format(sno, repr(e)))
            raise TestSnapshots.SnapLimitViolationException(sno) from e
|
|
|
|
|
|
|
|
def test_mds_max_snaps_per_dir_default_limit(self):
    """
    Test the newly introduced option named mds_max_snaps_per_dir
    Default snaps limit is 100
    Test if the default number of snapshot directories can be created
    """
    dir_name = "accounts"
    self.create_dir_and_snaps(dir_name, int(self.mds_max_snaps_per_dir))
    self.delete_dir_and_snaps(dir_name, int(self.mds_max_snaps_per_dir))
|
|
|
|
|
|
|
|
def test_mds_max_snaps_per_dir_with_increased_limit(self):
    """
    Test the newly introduced option named mds_max_snaps_per_dir
    First create 101 directories and ensure that the 101st directory
    creation fails. Then increase the default by one and see if the
    additional directory creation succeeds
    """
    # first test the default limit
    new_limit = int(self.mds_max_snaps_per_dir)
    self.fs.rank_asok(['config', 'set', 'mds_max_snaps_per_dir', repr(new_limit)])
    try:
        self.create_dir_and_snaps("accounts", new_limit + 1)
    except TestSnapshots.SnapLimitViolationException as e:
        # the snapshot just beyond the limit is the one that must fail
        self.assertEqual(e.failed_snapshot_number, new_limit + 1)
    else:
        self.fail("expected creation of snapshot #{} to fail".format(new_limit + 1))
    # then increase the limit by one and test
    new_limit = new_limit + 1
    self.fs.rank_asok(['config', 'set', 'mds_max_snaps_per_dir', repr(new_limit)])
    sname = self.get_snap_name("accounts", new_limit)
    self.create_snap_dir(sname)
    self.delete_dir_and_snaps("accounts", new_limit)
|
|
|
|
|
|
|
|
def test_mds_max_snaps_per_dir_with_reduced_limit(self):
    """
    Test the newly introduced option named mds_max_snaps_per_dir
    First create 99 directories. Then reduce the limit to 98. Then try
    creating another directory and ensure that additional directory
    creation fails.
    """
    # first test the new limit
    new_limit = int(self.mds_max_snaps_per_dir) - 1
    self.create_dir_and_snaps("accounts", new_limit)
    sname = self.get_snap_name("accounts", new_limit + 1)
    # then reduce the limit by one and test
    new_limit = new_limit - 1
    self.fs.rank_asok(['config', 'set', 'mds_max_snaps_per_dir', repr(new_limit)])
    try:
        self.create_snap_dir(sname)
    except CommandFailedError:
        # after reducing limit we expect the new snapshot creation to fail
        pass
    else:
        self.fail("expected creation of {} to fail after reducing the limit".format(sname))
    # new_limit + 1 is the number of snapshots created above
    self.delete_dir_and_snaps("accounts", new_limit + 1)
|