2020-07-01 02:20:38 +00:00
|
|
|
import logging
|
|
|
|
import errno
|
|
|
|
from tasks.cephfs.cephfs_test_case import CephFSTestCase
|
2020-08-25 13:33:47 +00:00
|
|
|
from teuthology.contextutil import safe_while
|
2021-06-15 12:55:22 +00:00
|
|
|
from teuthology.exceptions import CommandFailedError
|
2020-07-01 02:20:38 +00:00
|
|
|
|
|
|
|
log = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
class TestScrub2(CephFSTestCase):
|
|
|
|
MDSS_REQUIRED = 3
|
|
|
|
CLIENTS_REQUIRED = 1
|
|
|
|
|
2020-12-31 02:25:20 +00:00
|
|
|
def _check_scrub_status(self, result=None, reverse=False):
|
|
|
|
self.assertEqual(self.fs.wait_until_scrub_complete(result=result, rank=1,
|
|
|
|
sleep=5, timeout=30,
|
|
|
|
reverse=reverse), True)
|
|
|
|
self.assertEqual(self.fs.wait_until_scrub_complete(result=result, rank=2,
|
|
|
|
sleep=5, timeout=30,
|
|
|
|
reverse=reverse), True)
|
|
|
|
self.assertEqual(self.fs.wait_until_scrub_complete(result=result, rank=0,
|
|
|
|
sleep=5, timeout=30,
|
|
|
|
reverse=reverse), True)
|
|
|
|
|
2020-08-25 13:33:47 +00:00
|
|
|
def _check_task_status_na(self, timo=120):
|
|
|
|
""" check absence of scrub status in ceph status """
|
|
|
|
with safe_while(sleep=1, tries=120, action='wait for task status') as proceed:
|
|
|
|
while proceed():
|
|
|
|
active = self.fs.get_active_names()
|
|
|
|
log.debug("current active={0}".format(active))
|
|
|
|
task_status = self.fs.get_task_status("scrub status")
|
|
|
|
if not active[0] in task_status:
|
|
|
|
return True
|
|
|
|
|
|
|
|
def _check_task_status(self, expected_status, timo=120):
|
|
|
|
""" check scrub status for current active mds in ceph status """
|
|
|
|
with safe_while(sleep=1, tries=120, action='wait for task status') as proceed:
|
|
|
|
while proceed():
|
|
|
|
active = self.fs.get_active_names()
|
|
|
|
log.debug("current active={0}".format(active))
|
|
|
|
task_status = self.fs.get_task_status("scrub status")
|
|
|
|
try:
|
|
|
|
if task_status[active[0]].startswith(expected_status):
|
|
|
|
return True
|
|
|
|
except KeyError:
|
|
|
|
pass
|
|
|
|
|
2020-07-01 02:20:38 +00:00
|
|
|
def _find_path_inos(self, root_path):
|
|
|
|
inos = []
|
|
|
|
p = self.mount_a.run_shell(["find", root_path])
|
|
|
|
paths = p.stdout.getvalue().strip().split()
|
|
|
|
for path in paths:
|
|
|
|
inos.append(self.mount_a.path_to_ino(path))
|
|
|
|
return inos
|
|
|
|
|
|
|
|
def _setup_subtrees(self):
|
|
|
|
self.fs.set_max_mds(3)
|
|
|
|
self.fs.wait_for_daemons()
|
|
|
|
status = self.fs.status()
|
|
|
|
|
|
|
|
path = 'd1/d2/d3/d4/d5/d6/d7/d8'
|
|
|
|
self.mount_a.run_shell(['mkdir', '-p', path])
|
|
|
|
self.mount_a.run_shell(['sync', path])
|
|
|
|
|
2020-08-25 13:33:47 +00:00
|
|
|
self.mount_a.setfattr("d1/d2", "ceph.dir.pin", "0")
|
|
|
|
self.mount_a.setfattr("d1/d2/d3/d4", "ceph.dir.pin", "1")
|
|
|
|
self.mount_a.setfattr("d1/d2/d3/d4/d5/d6", "ceph.dir.pin", "2")
|
|
|
|
|
|
|
|
self._wait_subtrees([('/d1/d2', 0), ('/d1/d2/d3/d4', 1)], status, 0)
|
|
|
|
self._wait_subtrees([('/d1/d2/d3/d4', 1), ('/d1/d2/d3/d4/d5/d6', 2)], status, 1)
|
|
|
|
self._wait_subtrees([('/d1/d2/d3/d4', 1), ('/d1/d2/d3/d4/d5/d6', 2)], status, 2)
|
2020-07-01 02:20:38 +00:00
|
|
|
|
|
|
|
for rank in range(3):
|
|
|
|
self.fs.rank_tell(["flush", "journal"], rank)
|
|
|
|
|
|
|
|
def test_apply_tag(self):
|
|
|
|
self._setup_subtrees()
|
|
|
|
inos = self._find_path_inos('d1/d2/d3/')
|
|
|
|
|
|
|
|
tag = "tag123"
|
2020-12-23 01:54:52 +00:00
|
|
|
out_json = self.fs.rank_tell(["tag", "path", "/d1/d2/d3", tag], 0)
|
|
|
|
self.assertNotEqual(out_json, None)
|
|
|
|
self.assertEqual(out_json["return_code"], 0)
|
|
|
|
self.assertEqual(self.fs.wait_until_scrub_complete(tag=out_json["scrub_tag"]), True)
|
2020-07-01 02:20:38 +00:00
|
|
|
|
|
|
|
def assertTagged(ino):
|
|
|
|
file_obj_name = "{0:x}.00000000".format(ino)
|
2021-03-10 22:46:27 +00:00
|
|
|
self.fs.radosm(["getxattr", file_obj_name, "scrub_tag"])
|
2020-07-01 02:20:38 +00:00
|
|
|
|
|
|
|
for ino in inos:
|
|
|
|
assertTagged(ino)
|
|
|
|
|
|
|
|
def test_scrub_backtrace(self):
|
|
|
|
self._setup_subtrees()
|
|
|
|
inos = self._find_path_inos('d1/d2/d3/')
|
|
|
|
|
|
|
|
for ino in inos:
|
|
|
|
file_obj_name = "{0:x}.00000000".format(ino)
|
2021-03-10 22:46:27 +00:00
|
|
|
self.fs.radosm(["rmxattr", file_obj_name, "parent"])
|
2020-07-01 02:20:38 +00:00
|
|
|
|
2021-06-09 02:37:16 +00:00
|
|
|
out_json = self.fs.run_scrub(["start", "/d1/d2/d3", "recursive,force"], 0)
|
2020-12-23 01:54:52 +00:00
|
|
|
self.assertNotEqual(out_json, None)
|
|
|
|
self.assertEqual(out_json["return_code"], 0)
|
|
|
|
self.assertEqual(self.fs.wait_until_scrub_complete(tag=out_json["scrub_tag"]), True)
|
2020-07-01 02:20:38 +00:00
|
|
|
|
|
|
|
def _check_damage(mds_rank, inos):
|
|
|
|
all_damage = self.fs.rank_tell(["damage", "ls"], mds_rank)
|
|
|
|
damage = [d for d in all_damage if d['ino'] in inos and d['damage_type'] == "backtrace"]
|
|
|
|
return len(damage) >= len(inos)
|
|
|
|
|
2020-08-25 13:33:47 +00:00
|
|
|
self.assertTrue(_check_damage(0, inos[0:2]))
|
|
|
|
self.assertTrue(_check_damage(1, inos[2:4]))
|
|
|
|
self.assertTrue(_check_damage(2, inos[4:6]))
|
2020-07-01 02:20:38 +00:00
|
|
|
|
|
|
|
def test_scrub_non_mds0(self):
|
|
|
|
self._setup_subtrees()
|
|
|
|
|
|
|
|
def expect_exdev(cmd, mds):
|
|
|
|
try:
|
|
|
|
self.fs.mon_manager.raw_cluster_cmd('tell', 'mds.{0}'.format(mds), *cmd)
|
|
|
|
except CommandFailedError as e:
|
|
|
|
if e.exitstatus == errno.EXDEV:
|
|
|
|
pass
|
|
|
|
else:
|
|
|
|
raise
|
|
|
|
else:
|
|
|
|
raise RuntimeError("expected failure")
|
|
|
|
|
|
|
|
rank1 = self.fs.get_rank(rank=1)
|
|
|
|
expect_exdev(["scrub", "start", "/d1/d2/d3"], rank1["name"])
|
|
|
|
expect_exdev(["scrub", "abort"], rank1["name"])
|
|
|
|
expect_exdev(["scrub", "pause"], rank1["name"])
|
|
|
|
expect_exdev(["scrub", "resume"], rank1["name"])
|
2020-08-25 13:33:47 +00:00
|
|
|
|
|
|
|
def test_scrub_abort_mds0(self):
|
|
|
|
self._setup_subtrees()
|
|
|
|
|
|
|
|
inos = self._find_path_inos('d1/d2/d3/')
|
|
|
|
|
|
|
|
for ino in inos:
|
|
|
|
file_obj_name = "{0:x}.00000000".format(ino)
|
2021-03-10 22:46:27 +00:00
|
|
|
self.fs.radosm(["rmxattr", file_obj_name, "parent"])
|
2020-08-25 13:33:47 +00:00
|
|
|
|
2021-06-09 02:37:16 +00:00
|
|
|
out_json = self.fs.run_scrub(["start", "/d1/d2/d3", "recursive,force"], 0)
|
2020-08-25 13:33:47 +00:00
|
|
|
self.assertNotEqual(out_json, None)
|
|
|
|
|
2020-12-23 03:31:09 +00:00
|
|
|
res = self.fs.run_scrub(["abort"])
|
2020-08-25 13:33:47 +00:00
|
|
|
self.assertEqual(res['return_code'], 0)
|
|
|
|
|
|
|
|
# Abort and verify in both mdss. We also check the status in rank 0 mds because
|
|
|
|
# it is supposed to gather the scrub status from other mdss.
|
2020-12-31 02:25:20 +00:00
|
|
|
self._check_scrub_status()
|
2020-08-25 13:33:47 +00:00
|
|
|
|
|
|
|
# sleep enough to fetch updated task status
|
|
|
|
checked = self._check_task_status_na()
|
|
|
|
self.assertTrue(checked)
|
|
|
|
|
|
|
|
def test_scrub_pause_and_resume_mds0(self):
|
|
|
|
self._setup_subtrees()
|
|
|
|
|
|
|
|
inos = self._find_path_inos('d1/d2/d3/')
|
|
|
|
|
|
|
|
for ino in inos:
|
|
|
|
file_obj_name = "{0:x}.00000000".format(ino)
|
2021-03-10 22:46:27 +00:00
|
|
|
self.fs.radosm(["rmxattr", file_obj_name, "parent"])
|
2020-08-25 13:33:47 +00:00
|
|
|
|
2021-06-09 02:37:16 +00:00
|
|
|
out_json = self.fs.run_scrub(["start", "/d1/d2/d3", "recursive,force"], 0)
|
2020-08-25 13:33:47 +00:00
|
|
|
self.assertNotEqual(out_json, None)
|
|
|
|
|
2020-12-23 03:31:09 +00:00
|
|
|
res = self.fs.run_scrub(["pause"])
|
2020-08-25 13:33:47 +00:00
|
|
|
self.assertEqual(res['return_code'], 0)
|
|
|
|
|
2020-12-31 02:25:20 +00:00
|
|
|
self._check_scrub_status(result="PAUSED")
|
2020-08-25 13:33:47 +00:00
|
|
|
|
|
|
|
checked = self._check_task_status("paused")
|
|
|
|
self.assertTrue(checked)
|
|
|
|
|
|
|
|
# resume and verify
|
2020-12-23 03:31:09 +00:00
|
|
|
res = self.fs.run_scrub(["resume"])
|
2020-08-25 13:33:47 +00:00
|
|
|
self.assertEqual(res['return_code'], 0)
|
|
|
|
|
2020-12-31 02:25:20 +00:00
|
|
|
self._check_scrub_status(result="PAUSED", reverse=True)
|
2020-08-25 13:33:47 +00:00
|
|
|
|
|
|
|
checked = self._check_task_status_na()
|
|
|
|
self.assertTrue(checked)
|
|
|
|
|
|
|
|
def test_scrub_pause_and_resume_with_abort_mds0(self):
|
|
|
|
self._setup_subtrees()
|
|
|
|
|
|
|
|
inos = self._find_path_inos('d1/d2/d3/')
|
|
|
|
|
|
|
|
for ino in inos:
|
|
|
|
file_obj_name = "{0:x}.00000000".format(ino)
|
2021-03-10 22:46:27 +00:00
|
|
|
self.fs.radosm(["rmxattr", file_obj_name, "parent"])
|
2020-08-25 13:33:47 +00:00
|
|
|
|
2021-06-09 02:37:16 +00:00
|
|
|
out_json = self.fs.run_scrub(["start", "/d1/d2/d3", "recursive,force"], 0)
|
2020-08-25 13:33:47 +00:00
|
|
|
self.assertNotEqual(out_json, None)
|
|
|
|
|
2020-12-23 03:31:09 +00:00
|
|
|
res = self.fs.run_scrub(["pause"])
|
2020-08-25 13:33:47 +00:00
|
|
|
self.assertEqual(res['return_code'], 0)
|
|
|
|
|
2020-12-31 02:25:20 +00:00
|
|
|
self._check_scrub_status(result="PAUSED")
|
2020-08-25 13:33:47 +00:00
|
|
|
|
|
|
|
checked = self._check_task_status("paused")
|
|
|
|
self.assertTrue(checked)
|
|
|
|
|
2020-12-23 03:31:09 +00:00
|
|
|
res = self.fs.run_scrub(["abort"])
|
2020-08-25 13:33:47 +00:00
|
|
|
self.assertEqual(res['return_code'], 0)
|
|
|
|
|
2020-12-31 02:25:20 +00:00
|
|
|
self._check_scrub_status(result="PAUSED")
|
|
|
|
self._check_scrub_status(result="0 inodes")
|
2020-08-25 13:33:47 +00:00
|
|
|
|
|
|
|
# scrub status should still be paused...
|
|
|
|
checked = self._check_task_status("paused")
|
|
|
|
self.assertTrue(checked)
|
|
|
|
|
|
|
|
# resume and verify
|
2020-12-23 03:31:09 +00:00
|
|
|
res = self.fs.run_scrub(["resume"])
|
2020-08-25 13:33:47 +00:00
|
|
|
self.assertEqual(res['return_code'], 0)
|
|
|
|
|
2020-12-31 02:25:20 +00:00
|
|
|
self._check_scrub_status(result="PAUSED", reverse=True)
|
2020-08-25 13:33:47 +00:00
|
|
|
|
|
|
|
checked = self._check_task_status_na()
|
|
|
|
self.assertTrue(checked)
|