Merge PR #28825 into master

* refs/pull/28825/head:
    qa: wait for kernel client death
    qa: use hard_reset to reboot kclient

Reviewed-by: David Galloway <dgallowa@redhat.com>
2025-02-21 18:17:42 +00:00 · 2019-07-29 13:08:29 -07:00 · 2019-07-29 13:08:29 -07:00 · 2a82081f77
commit 2a82081f77
parent 65ee02da75 6b83f43ba0
2 changed files with 22 additions and 8 deletions
--- a/qa/tasks/cephfs/kernel_mount.py
+++ b/qa/tasks/cephfs/kernel_mount.py
@@ -1,6 +1,7 @@
 from StringIO import StringIO
 import json
 import logging
 import time
 from textwrap import dedent
 from teuthology.orchestra.run import CommandFailedError
 from teuthology import misc
@@ -176,21 +177,31 @@ class KernelMount(CephFSMount):
                                                self.ipmi_user,
                                                self.ipmi_password,
                                                self.ipmi_domain)
-        con.power_off()
+        con.hard_reset(wait_for_login=False)
        self.mounted = False
    def kill_cleanup(self):
        assert not self.mounted
-        con = orchestra_remote.getRemoteConsole(self.client_remote.hostname,
+        # We need to do a sleep here because we don't know how long it will
-                                                self.ipmi_user,
+        # take for a hard_reset to be effected.
-                                                self.ipmi_password,
+        time.sleep(30)
                                                self.ipmi_domain)
        con.power_on()
-        # Wait for node to come back up after reboot
+        try:
-        misc.reconnect(None, 300, [self.client_remote])
+            # Wait for node to come back up after reboot
            misc.reconnect(None, 300, [self.client_remote])
        except:
            # attempt to get some useful debug output:
            con = orchestra_remote.getRemoteConsole(self.client_remote.hostname,
                                                    self.ipmi_user,
                                                    self.ipmi_password,
                                                    self.ipmi_domain)
            con.check_status(timeout=60)
            raise
        # Remove mount directory
        self.client_remote.run(args=['uptime'], timeout=10)
        # Remove mount directory
        self.client_remote.run(
--- a/qa/tasks/cephfs/test_client_recovery.py
+++ b/qa/tasks/cephfs/test_client_recovery.py
@@ -297,6 +297,9 @@ class TestClientRecovery(CephFSTestCase):
        # Simulate client death
        self.mount_a.kill()
        # wait for it to die so it doesn't voluntarily release buffer cap
        time.sleep(5)
        try:
            # The waiter should get stuck waiting for the capability
            # held on the MDS by the now-dead client A