ceph/qa/tasks/cephfs/test_sessionmap.py

from StringIO import StringIO
import json
import logging
from unittest import SkipTest

from tasks.cephfs.fuse_mount import FuseMount
from teuthology.exceptions import CommandFailedError
from tasks.cephfs.cephfs_test_case import CephFSTestCase

log = logging.getLogger(__name__)


class TestSessionMap(CephFSTestCase):
    """
    Tests of MDS session handling: that sessions and connections are torn
    down when clients go away, that the SessionMap is persisted correctly,
    and that clients claiming a root outside their caps are rejected.
    """
    # Two client mounts (mount_a, mount_b) and two MDS daemons are used by
    # the tests below (test_version_splitting needs ranks 0 and 1).
    # NOTE(review): presumably consumed by CephFSTestCase during setup --
    # confirm against the base class.
    CLIENTS_REQUIRED = 2
    MDSS_REQUIRED = 2

    def test_tell_session_drop(self):
        """
        That when a `tell` command is sent using the python CLI,
        its MDS session is gone after it terminates
        """
        # Unmount both clients so that no client sessions remain
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        mds_id = self.fs.get_lone_mds_id()
        self.fs.mon_manager.raw_cluster_cmd("tell", "mds.{0}".format(mds_id), "session", "ls")

        # The CLI that issued the `tell` has exited, so it must not have
        # left a session behind.
        ls_data = self.fs.mds_asok(['session', 'ls'])
        self.assertEqual(len(ls_data), 0)

    def _get_thread_count(self, mds_id):
        """
        Return the thread count (the ``nlwp`` column of ``ps``) of the
        ceph-mds process that was started with ``-i <mds_id>``.

        :param mds_id: ID of the MDS daemon to look for.
        :raises RuntimeError: if no matching process appears in the ps output.
        """
        remote = self.fs.mds_daemons[mds_id].remote

        # "-ww" stops ps from truncating long daemon command lines
        ps_txt = remote.run(
            args=["ps", "-ww", "axo", "nlwp,cmd"],
            stdout=StringIO()
        ).stdout.getvalue().strip()
        # Drop the first line of output (the ps column header)
        lines = ps_txt.split("\n")[1:]

        wanted_id = "{0}".format(mds_id)
        for line in lines:
            # Only the daemon itself is of interest, not the daemon-helper
            # wrapper whose command line also mentions ceph-mds.
            if "ceph-mds" not in line or "daemon-helper" in line:
                continue

            fields = line.split()
            # Compare "-i" and the ID as whole arguments: a substring search
            # for "-i a" would also match a daemon started with "-i ab".
            has_id = any(
                flag == "-i" and value == wanted_id
                for flag, value in zip(fields, fields[1:])
            )
            if has_id:
                log.info("Found ps line for daemon: {0}".format(line))
                return int(fields[0])

        raise RuntimeError("No process found in ps output for MDS {0}: {1}".format(
            mds_id, ps_txt
        ))

    def test_tell_conn_close(self):
        """
        That when a `tell` command is sent using the python CLI,
        the thread count goes back to where it started (i.e. we aren't
        leaving connections open)
        """
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        mds_id = self.fs.get_lone_mds_id()

        initial_thread_count = self._get_thread_count(mds_id)
        self.fs.mon_manager.raw_cluster_cmd("tell", "mds.{0}".format(mds_id), "session", "ls")
        final_thread_count = self._get_thread_count(mds_id)

        self.assertEqual(initial_thread_count, final_thread_count)

    def test_mount_conn_close(self):
        """
        That when a client unmounts, the thread count on the MDS goes back
        to what it was before the client mounted
        """
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        mds_id = self.fs.get_lone_mds_id()

        initial_thread_count = self._get_thread_count(mds_id)
        self.mount_a.mount()
        self.mount_a.wait_until_mounted()
        # While the client is mounted the MDS must be using more threads
        self.assertGreater(self._get_thread_count(mds_id), initial_thread_count)
        self.mount_a.umount_wait()
        final_thread_count = self._get_thread_count(mds_id)

        self.assertEqual(initial_thread_count, final_thread_count)

    def test_version_splitting(self):
        """
        That when many sessions are updated, they are correctly
        split into multiple versions to obey mds_sessionmap_keys_per_op
        """

        # Start umounted
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        # Configure MDS to write one OMAP key at once
        self.set_conf('mds', 'mds_sessionmap_keys_per_op', 1)
        self.fs.mds_fail_restart()
        self.fs.wait_for_daemons()

        # I would like two MDSs, so that I can do an export dir later
        self.fs.set_max_mds(2)
        self.fs.wait_for_daemons()

        active_mds_names = self.fs.get_active_names()
        rank_0_id = active_mds_names[0]
        rank_1_id = active_mds_names[1]
        log.info("Ranks 0 and 1 are {0} and {1}".format(
            rank_0_id, rank_1_id))

        # Bring the clients back, waiting for each mount to complete before
        # doing IO on it (as the other tests in this class do)
        self.mount_a.mount()
        self.mount_a.wait_until_mounted()
        self.mount_b.mount()
        self.mount_b.wait_until_mounted()
        self.mount_a.create_files()  # Kick the client into opening sessions
        self.mount_b.create_files()

        # See that they've got sessions
        self.assert_session_count(2, mds_id=rank_0_id)

        # See that we persist their sessions
        self.fs.mds_asok(["flush", "journal"], rank_0_id)
        table_json = json.loads(self.fs.table_tool(["0", "show", "session"]))
        log.info("SessionMap: {0}".format(json.dumps(table_json, indent=2)))
        self.assertEqual(table_json['0']['result'], 0)
        self.assertEqual(len(table_json['0']['data']['Sessions']), 2)

        # Now, induce a "force_open_sessions" event by exporting a dir
        self.mount_a.run_shell(["mkdir", "bravo"])
        self.mount_a.run_shell(["touch", "bravo/file"])
        self.mount_b.run_shell(["ls", "-l", "bravo/file"])

        def get_omap_wrs():
            # Current value of rank 1's objecter 'omap_wr' perf counter
            return self.fs.mds_asok(['perf', 'dump', 'objecter'], rank_1_id)['objecter']['omap_wr']

        # Flush so that there are no dirty sessions on rank 1
        self.fs.mds_asok(["flush", "journal"], rank_1_id)

        # Export so that we get a force_open to rank 1 for the two sessions from rank 0
        initial_omap_wrs = get_omap_wrs()
        self.fs.mds_asok(['export', 'dir', '/bravo', '1'], rank_0_id)

        # This is the critical (if rather subtle) check: that in the process of doing an export dir,
        # we hit force_open_sessions, and as a result we end up writing out the sessionmap.  There
        # will be two sessions dirtied here, and because we have set keys_per_op to 1, we should see
        # a single session get written out (the first of the two, triggered by the second getting marked
        # dirty)
        # The number of writes is two per session, because the header (sessionmap version) update and
        # KV write both count. Also, multiply by 2 for each openfile table update.
        self.wait_until_true(
            lambda: get_omap_wrs() - initial_omap_wrs == 2*2,
            timeout=30  # Long enough for an export to get acked
        )

        # Now end our sessions and check the backing sessionmap is updated correctly
        self.mount_a.umount_wait()
        self.mount_b.umount_wait()

        # In-memory sessionmap check
        self.assert_session_count(0, mds_id=rank_0_id)

        # On-disk sessionmap check
        self.fs.mds_asok(["flush", "journal"], rank_0_id)
        table_json = json.loads(self.fs.table_tool(["0", "show", "session"]))
        log.info("SessionMap: {0}".format(json.dumps(table_json, indent=2)))
        self.assertEqual(table_json['0']['result'], 0)
        self.assertEqual(len(table_json['0']['data']['Sessions']), 0)

    def _sudo_write_file(self, remote, path, data):
        """
        Write data to a remote file as super user

        :param remote: Remote site.
        :param path: Path on the remote being written to.
        :param data: Data to be written.
        """
        remote.run(
            args=[
                'sudo',
                'python',
                '-c',
                # open() rather than file(): the latter does not exist on
                # Python 3.  The destination is opened in binary mode, so
                # read from the binary stdin buffer where there is one
                # (Python 3) and from sys.stdin itself otherwise (Python 2).
                'import shutil, sys; shutil.copyfileobj('
                'getattr(sys.stdin, "buffer", sys.stdin), open(sys.argv[1], "wb"))',
                path,
            ],
            stdin=data,
        )

    def _configure_auth(self, mount, id_name, mds_caps, osd_caps=None, mon_caps=None):
        """
        Set up auth credentials for a client mount, and write out the keyring
        for the client to use.

        :param mount: Client mount that will use the credentials; its
                      client_id is set to id_name.
        :param id_name: Name of the client entity, without the "client." prefix.
        :param mds_caps: MDS capability string for the entity.
        :param osd_caps: OSD capability string, "allow rw" if None.
        :param mon_caps: Mon capability string, "allow r" if None.
        """

        if osd_caps is None:
            osd_caps = "allow rw"

        if mon_caps is None:
            mon_caps = "allow r"

        # The command output is what gets written out as the keyring file
        out = self.fs.mon_manager.raw_cluster_cmd(
            "auth", "get-or-create", "client.{name}".format(name=id_name),
            "mds", mds_caps,
            "osd", osd_caps,
            "mon", mon_caps
        )
        mount.client_id = id_name
        self._sudo_write_file(mount.client_remote, mount.get_keyring_path(), out)
        self.set_conf("client.{name}".format(name=id_name), "keyring", mount.get_keyring_path())

    def test_session_reject(self):
        """
        That a client whose claimed root in its client metadata (/baz) is
        not covered by its MDS caps (path=/foo/bar) fails to mount, and that
        the denial is reported in the cluster log
        """
        if not isinstance(self.mount_a, FuseMount):
            raise SkipTest("Requires FUSE client to inject client metadata")

        self.mount_a.run_shell(["mkdir", "foo"])
        self.mount_a.run_shell(["mkdir", "foo/bar"])
        self.mount_a.umount_wait()

        # Mount B will be my rejected client
        self.mount_b.umount_wait()

        # Configure a client that is limited to /foo/bar
        self._configure_auth(self.mount_b, "badguy", "allow rw path=/foo/bar")
        # Check he can mount that dir and do IO
        self.mount_b.mount(mount_path="/foo/bar")
        self.mount_b.wait_until_mounted()
        self.mount_b.create_destroy()
        self.mount_b.umount_wait()

        # Configure the client to claim that its mount point metadata is /baz
        self.set_conf("client.badguy", "client_metadata", "root=/baz")
        # Try to mount the client, see that it fails
        with self.assert_cluster_log("client session with non-allowable root '/baz' denied"):
            with self.assertRaises(CommandFailedError):
                self.mount_b.mount(mount_path="/foo/bar")
tasks: add TestSessionMap.test_[mount\|tell]_conn_close To check that teardown is happening correctly when sending commands to an MDS. Fixes: #14048 Signed-off-by: John Spray <john.spray@redhat.com> 2015-12-14 22:16:46 +00:00			`from StringIO import StringIO`
tasks/cephfs: add test_sessionmap Tests for the persistence behaviour of SessionMap. Signed-off-by: John Spray <john.spray@redhat.com> 2015-03-26 17:50:23 +00:00			`import json`
			`import logging`
tasks/cephfs: skip test_session_reject cleanly Instead of asserting in configure_auth (which in fact works fine with KernelMount.write_secret_file), raise a SkipTest in test_session_reject (because the kernel client cannot handle the client_metadata setting to inject bogus data) Signed-off-by: John Spray <john.spray@redhat.com> 2016-09-01 17:33:50 +00:00			`from unittest import SkipTest`

tasks/cephfs: add TestSessionMap.test_session_reject Signed-off-by: John Spray <john.spray@redhat.com> 2015-11-27 15:52:27 +00:00			`from tasks.cephfs.fuse_mount import FuseMount`
			`from teuthology.exceptions import CommandFailedError`
tasks/cephfs: add test_sessionmap Tests for the persistence behaviour of SessionMap. Signed-off-by: John Spray <john.spray@redhat.com> 2015-03-26 17:50:23 +00:00			`from tasks.cephfs.cephfs_test_case import CephFSTestCase`

			`log = logging.getLogger(__name__)`


			`class TestSessionMap(CephFSTestCase):`
			`CLIENTS_REQUIRED = 2`
			`MDSS_REQUIRED = 2`

tasks/cephfs: quick test for `tell`... ...specifically that we don't have lingering MDS sessions after running it. This is testing that Client::shutdown is doing the right thing and closing sessions. Signed-off-by: John Spray <john.spray@redhat.com> 2015-10-28 05:28:42 +00:00			`def test_tell_session_drop(self):`
			`"""`
			That when a `tell` command is sent using the python CLI,
			`its MDS session is gone after it terminates`
			`"""`
			`self.mount_a.umount_wait()`
			`self.mount_b.umount_wait()`

			`mds_id = self.fs.get_lone_mds_id()`
			`self.fs.mon_manager.raw_cluster_cmd("tell", "mds.{0}".format(mds_id), "session", "ls")`

			`ls_data = self.fs.mds_asok(['session', 'ls'])`
			`self.assertEqual(len(ls_data), 0)`

tasks: add TestSessionMap.test_[mount\|tell]_conn_close To check that teardown is happening correctly when sending commands to an MDS. Fixes: #14048 Signed-off-by: John Spray <john.spray@redhat.com> 2015-12-14 22:16:46 +00:00			`def _get_thread_count(self, mds_id):`
			`remote = self.fs.mds_daemons[mds_id].remote`

			`ps_txt = remote.run(`
tasks/cephfs: fix ps usage to not truncate cmds Now that daemon commandlines include "--cluster" they easily overflow ps's default behaviour. Fixes: http://tracker.ceph.com/issues/15857 Signed-off-by: John Spray <john.spray@redhat.com> 2016-05-12 10:16:56 +00:00			`args=["ps", "-ww", "axo", "nlwp,cmd"],`
tasks: add TestSessionMap.test_[mount\|tell]_conn_close To check that teardown is happening correctly when sending commands to an MDS. Fixes: #14048 Signed-off-by: John Spray <john.spray@redhat.com> 2015-12-14 22:16:46 +00:00			`stdout=StringIO()`
			`).stdout.getvalue().strip()`
			`lines = ps_txt.split("\n")[1:]`

			`for line in lines:`
tasks/cephfs: find processes correctly Don't mistake the daemon-helper line for the actual daemon process. Fixes: http://tracker.ceph.com/issues/15900 Signed-off-by: John Spray <john.spray@redhat.com> 2016-05-23 18:52:21 +00:00			`if "ceph-mds" in line and not "daemon-helper" in line:`
tasks: add TestSessionMap.test_[mount\|tell]_conn_close To check that teardown is happening correctly when sending commands to an MDS. Fixes: #14048 Signed-off-by: John Spray <john.spray@redhat.com> 2015-12-14 22:16:46 +00:00			`if line.find("-i {0}".format(mds_id)) != -1:`
			`log.info("Found ps line for daemon: {0}".format(line))`
tasks/cephfs: fix ps usage to not truncate cmds Now that daemon commandlines include "--cluster" they easily overflow ps's default behaviour. Fixes: http://tracker.ceph.com/issues/15857 Signed-off-by: John Spray <john.spray@redhat.com> 2016-05-12 10:16:56 +00:00			`return int(line.split()[0])`
tasks: add TestSessionMap.test_[mount\|tell]_conn_close To check that teardown is happening correctly when sending commands to an MDS. Fixes: #14048 Signed-off-by: John Spray <john.spray@redhat.com> 2015-12-14 22:16:46 +00:00
			`raise RuntimeError("No process found in ps output for MDS {0}: {1}".format(`
			`mds_id, ps_txt`
			`))`

			`def test_tell_conn_close(self):`
			`"""`
			That when a `tell` command is sent using the python CLI,
			`the thread count goes back to where it started (i.e. we aren't`
			`leaving connections open)`
			`"""`
			`self.mount_a.umount_wait()`
			`self.mount_b.umount_wait()`

			`mds_id = self.fs.get_lone_mds_id()`

			`initial_thread_count = self._get_thread_count(mds_id)`
			`self.fs.mon_manager.raw_cluster_cmd("tell", "mds.{0}".format(mds_id), "session", "ls")`
			`final_thread_count = self._get_thread_count(mds_id)`

			`self.assertEqual(initial_thread_count, final_thread_count)`

			`def test_mount_conn_close(self):`
			`"""`
			`That when a client unmounts, the thread count on the MDS goes back`
			`to what it was before the client mounted`
			`"""`
			`self.mount_a.umount_wait()`
			`self.mount_b.umount_wait()`

			`mds_id = self.fs.get_lone_mds_id()`

			`initial_thread_count = self._get_thread_count(mds_id)`
			`self.mount_a.mount()`
tasks/cephfs: fix mount wait in test_mount_conn_close Fixes: http://tracker.ceph.com/issues/15900 Signed-off-by: John Spray <john.spray@redhat.com> 2016-05-23 15:00:37 +00:00			`self.mount_a.wait_until_mounted()`
tasks: add TestSessionMap.test_[mount\|tell]_conn_close To check that teardown is happening correctly when sending commands to an MDS. Fixes: #14048 Signed-off-by: John Spray <john.spray@redhat.com> 2015-12-14 22:16:46 +00:00			`self.assertGreater(self._get_thread_count(mds_id), initial_thread_count)`
			`self.mount_a.umount_wait()`
			`final_thread_count = self._get_thread_count(mds_id)`

			`self.assertEqual(initial_thread_count, final_thread_count)`

tasks/cephfs: add test_sessionmap Tests for the persistence behaviour of SessionMap. Signed-off-by: John Spray <john.spray@redhat.com> 2015-03-26 17:50:23 +00:00			`def test_version_splitting(self):`
			`"""`
			`That when many sessions are updated, they are correctly`
			`split into multiple versions to obey mds_sessionmap_keys_per_op`
			`"""`

			`# Start umounted`
			`self.mount_a.umount_wait()`
			`self.mount_b.umount_wait()`

			`# Configure MDS to write one OMAP key at once`
			`self.set_conf('mds', 'mds_sessionmap_keys_per_op', 1)`
			`self.fs.mds_fail_restart()`
			`self.fs.wait_for_daemons()`

			`# I would like two MDSs, so that I can do an export dir later`
qa: use fs methods for setting configs Signed-off-by: Patrick Donnelly <pdonnell@redhat.com> 2017-02-01 21:42:16 +00:00			`self.fs.set_max_mds(2)`
tasks/cephfs: add test_sessionmap Tests for the persistence behaviour of SessionMap. Signed-off-by: John Spray <john.spray@redhat.com> 2015-03-26 17:50:23 +00:00			`self.fs.wait_for_daemons()`

			`active_mds_names = self.fs.get_active_names()`
			`rank_0_id = active_mds_names[0]`
			`rank_1_id = active_mds_names[1]`
			`log.info("Ranks 0 and 1 are {0} and {1}".format(`
			`rank_0_id, rank_1_id))`

			`# Bring the clients back`
			`self.mount_a.mount()`
			`self.mount_b.mount()`
			`self.mount_a.create_files() # Kick the client into opening sessions`
			`self.mount_b.create_files()`

			`# See that they've got sessions`
			`self.assert_session_count(2, mds_id=rank_0_id)`

			`# See that we persist their sessions`
			`self.fs.mds_asok(["flush", "journal"], rank_0_id)`
			`table_json = json.loads(self.fs.table_tool(["0", "show", "session"]))`
			`log.info("SessionMap: {0}".format(json.dumps(table_json, indent=2)))`
			`self.assertEqual(table_json['0']['result'], 0)`
			`self.assertEqual(len(table_json['0']['data']['Sessions']), 2)`

			`# Now, induce a "force_open_sessions" event by exporting a dir`
			`self.mount_a.run_shell(["mkdir", "bravo"])`
			`self.mount_a.run_shell(["touch", "bravo/file"])`
			`self.mount_b.run_shell(["ls", "-l", "bravo/file"])`

			`def get_omap_wrs():`
			`return self.fs.mds_asok(['perf', 'dump', 'objecter'], rank_1_id)['objecter']['omap_wr']`

			`# Flush so that there are no dirty sessions on rank 1`
			`self.fs.mds_asok(["flush", "journal"], rank_1_id)`

			`# Export so that we get a force_open to rank 1 for the two sessions from rank 0`
			`initial_omap_wrs = get_omap_wrs()`
			`self.fs.mds_asok(['export', 'dir', '/bravo', '1'], rank_0_id)`

			`# This is the critical (if rather subtle) check: that in the process of doing an export dir,`
			`# we hit force_open_sessions, and as a result we end up writing out the sessionmap. There`
			`# will be two sessions dirtied here, and because we have set keys_per_op to 1, we should see`
			`# a single session get written out (the first of the two, triggered by the second getting marked`
			`# dirty)`
			`# The number of writes is two per session, because the header (sessionmap version) update and`
qa: extend timeout for SessionMap flush Fixes: https://tracker.ceph.com/issues/24129 Signed-off-by: Patrick Donnelly <pdonnell@redhat.com> 2018-05-14 22:19:51 +00:00			`# KV write both count. Also, multiply by 2 for each openfile table update.`
tasks/cephfs: fix race in test_sessionmap Fixes: #13698 Signed-off-by: John Spray <john.spray@redhat.com> 2015-11-05 01:15:57 +00:00			`self.wait_until_true(`
qa: extend timeout for SessionMap flush Fixes: https://tracker.ceph.com/issues/24129 Signed-off-by: Patrick Donnelly <pdonnell@redhat.com> 2018-05-14 22:19:51 +00:00			`lambda: get_omap_wrs() - initial_omap_wrs == 2*2,`
			`timeout=30 # Long enough for an export to get acked`
tasks/cephfs: fix race in test_sessionmap Fixes: #13698 Signed-off-by: John Spray <john.spray@redhat.com> 2015-11-05 01:15:57 +00:00			`)`
tasks/cephfs: add test_sessionmap Tests for the persistence behaviour of SessionMap. Signed-off-by: John Spray <john.spray@redhat.com> 2015-03-26 17:50:23 +00:00
			`# Now end our sessions and check the backing sessionmap is updated correctly`
			`self.mount_a.umount_wait()`
			`self.mount_b.umount_wait()`

			`# In-memory sessionmap check`
			`self.assert_session_count(0, mds_id=rank_0_id)`

			`# On-disk sessionmap check`
			`self.fs.mds_asok(["flush", "journal"], rank_0_id)`
			`table_json = json.loads(self.fs.table_tool(["0", "show", "session"]))`
			`log.info("SessionMap: {0}".format(json.dumps(table_json, indent=2)))`
			`self.assertEqual(table_json['0']['result'], 0)`
			`self.assertEqual(len(table_json['0']['data']['Sessions']), 0)`
tasks/cephfs: add TestSessionMap.test_session_reject Signed-off-by: John Spray <john.spray@redhat.com> 2015-11-27 15:52:27 +00:00
			`def _sudo_write_file(self, remote, path, data):`
			`"""`
			`Write data to a remote file as super user`

			`:param remote: Remote site.`
			`:param path: Path on the remote being written to.`
			`:param data: Data to be written.`

			`Both perms and owner are passed directly to chmod.`
			`"""`
			`remote.run(`
			`args=[`
			`'sudo',`
			`'python',`
			`'-c',`
			`'import shutil, sys; shutil.copyfileobj(sys.stdin, file(sys.argv[1], "wb"))',`
			`path,`
			`],`
			`stdin=data,`
			`)`

			`def _configure_auth(self, mount, id_name, mds_caps, osd_caps=None, mon_caps=None):`
			`"""`
			`Set up auth credentials for a client mount, and write out the keyring`
			`for the client to use.`
			`"""`

			`if osd_caps is None:`
			`osd_caps = "allow rw"`

			`if mon_caps is None:`
			`mon_caps = "allow r"`

			`out = self.fs.mon_manager.raw_cluster_cmd(`
			`"auth", "get-or-create", "client.{name}".format(name=id_name),`
			`"mds", mds_caps,`
			`"osd", osd_caps,`
			`"mon", mon_caps`
			`)`
			`mount.client_id = id_name`
			`self._sudo_write_file(mount.client_remote, mount.get_keyring_path(), out)`
			`self.set_conf("client.{name}".format(name=id_name), "keyring", mount.get_keyring_path())`

			`def test_session_reject(self):`
tasks/cephfs: skip test_session_reject cleanly Instead of asserting in configure_auth (which in fact works fine with KernelMount.write_secret_file), raise a SkipTest in test_session_reject (because the kernel client cannot handle the client_metadata setting to inject bogus data) Signed-off-by: John Spray <john.spray@redhat.com> 2016-09-01 17:33:50 +00:00			`if not isinstance(self.mount_a, FuseMount):`
			`raise SkipTest("Requires FUSE client to inject client metadata")`

tasks/cephfs: add TestSessionMap.test_session_reject Signed-off-by: John Spray <john.spray@redhat.com> 2015-11-27 15:52:27 +00:00			`self.mount_a.run_shell(["mkdir", "foo"])`
			`self.mount_a.run_shell(["mkdir", "foo/bar"])`
			`self.mount_a.umount_wait()`

			`# Mount B will be my rejected client`
			`self.mount_b.umount_wait()`

			`# Configure a client that is limited to /foo/bar`
			`self._configure_auth(self.mount_b, "badguy", "allow rw path=/foo/bar")`
			`# Check he can mount that dir and do IO`
			`self.mount_b.mount(mount_path="/foo/bar")`
			`self.mount_b.wait_until_mounted()`
			`self.mount_b.create_destroy()`
			`self.mount_b.umount_wait()`

			`# Configure the client to claim that its mount point metadata is /baz`
			`self.set_conf("client.badguy", "client_metadata", "root=/baz")`
			`# Try to mount the client, see that it fails`
qa: update cluster log health warning message Signed-off-by: Patrick Donnelly <pdonnell@redhat.com> 2018-07-13 17:57:24 +00:00			`with self.assert_cluster_log("client session with non-allowable root '/baz' denied"):`
tasks/cephfs: add TestSessionMap.test_session_reject Signed-off-by: John Spray <john.spray@redhat.com> 2015-11-27 15:52:27 +00:00			`with self.assertRaises(CommandFailedError):`
			`self.mount_b.mount(mount_path="/foo/bar")`