2014-09-15 22:41:34 +00:00
|
|
|
from StringIO import StringIO
|
2014-10-28 17:12:02 +00:00
|
|
|
import json
|
2014-07-02 15:43:16 +00:00
|
|
|
import logging
|
2019-07-01 18:21:13 +00:00
|
|
|
import time
|
2014-10-28 17:12:02 +00:00
|
|
|
from textwrap import dedent
|
2014-09-15 22:41:34 +00:00
|
|
|
from teuthology.orchestra.run import CommandFailedError
|
|
|
|
from teuthology import misc
|
2014-07-02 15:43:16 +00:00
|
|
|
|
2014-09-15 22:41:34 +00:00
|
|
|
from teuthology.orchestra import remote as orchestra_remote
|
2014-07-02 15:43:16 +00:00
|
|
|
from teuthology.orchestra import run
|
2017-02-01 00:25:44 +00:00
|
|
|
from teuthology.contextutil import MaxWhileTries
|
2014-08-07 14:24:59 +00:00
|
|
|
from .mount import CephFSMount
|
2014-07-02 15:43:16 +00:00
|
|
|
|
|
|
|
# Module-level logger, named after this module.
log = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
2017-02-01 00:25:44 +00:00
|
|
|
# Timeout handed to run.wait() for the mountpoint `rmdir` issued after a
# successful umount (presumably seconds -- confirm against
# teuthology.orchestra.run.wait).
UMOUNT_TIMEOUT = 300
|
|
|
|
|
|
|
|
|
2014-07-02 15:43:16 +00:00
|
|
|
class KernelMount(CephFSMount):
    """
    CephFS mount that uses the kernel client.

    The mount is driven by running ``mount.ceph`` / ``umount`` on the client
    remote.  Because the kernel client cannot be killed like a process,
    :meth:`kill` hard-resets the whole node through its remote console.
    """

    def __init__(self, ctx, mons, test_dir, client_id, client_remote,
                 ipmi_user, ipmi_password, ipmi_domain):
        """
        :param ctx: passed through to the CephFSMount constructor
        :param mons: iterable of monitor address strings; joined with ','
                     to form the mount source
        :param test_dir: passed through to the CephFSMount constructor; also
                         used here to build coverage and secret-file paths
        :param client_id: passed through to the CephFSMount constructor; used
                          here as the ``name=`` mount option
        :param client_remote: remote on which all commands are run
        :param ipmi_user: credential handed to getRemoteConsole()
        :param ipmi_password: credential handed to getRemoteConsole()
        :param ipmi_domain: domain handed to getRemoteConsole()
        """
        super(KernelMount, self).__init__(ctx, test_dir, client_id, client_remote)
        self.mons = mons

        # Tracked locally: set by mount(), cleared by umount()/kill().
        self.mounted = False
        self.ipmi_user = ipmi_user
        self.ipmi_password = ipmi_password
        self.ipmi_domain = ipmi_domain

    def _get_console(self):
        """
        Build the remote console object for the client node, using the IPMI
        settings given at construction time.
        """
        return orchestra_remote.getRemoteConsole(self.client_remote.hostname,
                                                 self.ipmi_user,
                                                 self.ipmi_password,
                                                 self.ipmi_domain)

    def write_secret_file(self, remote, role, keyring, filename):
        """
        Stash the keyring in the filename specified.

        Runs ``ceph-authtool --print-key`` for ``role`` against ``keyring``
        on ``remote`` and redirects its output into ``filename``.
        """
        remote.run(
            args=[
                'adjust-ulimits',
                'ceph-coverage',
                '{tdir}/archive/coverage'.format(tdir=self.test_dir),
                'ceph-authtool',
                '--name={role}'.format(role=role),
                '--print-key',
                keyring,
                # Shell redirection, so it must not be quoted as an argument.
                run.Raw('>'),
                filename,
            ],
            timeout=(5*60),
        )

    def mount(self, mount_path=None, mount_fs_name=None):
        """
        Mount the filesystem on the client remote with ``/sbin/mount.ceph``.

        :param mount_path: path within the filesystem to mount; defaults
                           to "/" when None
        :param mount_fs_name: if not None, passed to setupfs() and added to
                              the mount options as ``mds_namespace=``
        """
        self.setupfs(name=mount_fs_name)

        log.info('Mounting kclient client.%s at %s %s...',
                 self.client_id, self.client_remote, self.mountpoint)

        # Extract the client's key into a secret file for mount.ceph.
        keyring = self.get_keyring_path()
        secret = '{tdir}/ceph.data/client.{id}.secret'.format(
            tdir=self.test_dir, id=self.client_id)
        self.write_secret_file(self.client_remote,
                               'client.{id}'.format(id=self.client_id),
                               keyring, secret)

        self.client_remote.run(
            args=[
                'mkdir',
                '--',
                self.mountpoint,
            ],
            timeout=(5*60),
        )

        if mount_path is None:
            mount_path = "/"

        opts = 'name={id},secretfile={secret},norequire_active_mds'.format(
            id=self.client_id, secret=secret)

        if mount_fs_name is not None:
            opts += ",mds_namespace={0}".format(mount_fs_name)

        self.client_remote.run(
            args=[
                'sudo',
                'adjust-ulimits',
                'ceph-coverage',
                '{tdir}/archive/coverage'.format(tdir=self.test_dir),
                '/sbin/mount.ceph',
                '{mons}:{mount_path}'.format(mons=','.join(self.mons),
                                             mount_path=mount_path),
                self.mountpoint,
                '-v',
                '-o',
                opts,
            ],
            timeout=(30*60),
        )

        self.client_remote.run(
            args=['sudo', 'chmod', '1777', self.mountpoint], timeout=(5*60))

        self.mounted = True

    def _log_umount_diagnostics(self):
        """
        Best-effort dump of open files and the process tree on the client
        after a failed umount.

        Any failure of the diagnostic command itself is logged and
        swallowed so that it cannot replace the umount error the caller is
        about to re-raise.
        """
        try:
            self.client_remote.run(args=[
                'sudo',
                run.Raw('PATH=/usr/sbin:$PATH'),
                'lsof',
                run.Raw(';'),
                'ps', 'auxf',
            ], timeout=(15*60))
        except Exception:
            log.exception('Failed to collect diagnostics after umount failure')

    def umount(self, force=False):
        """
        Unmount the filesystem and remove the mountpoint directory.

        :param force: if True, pass ``-f`` to ``umount``
        :raises: whatever the ``umount`` command run raises; diagnostics
                 are collected first and the original exception is then
                 re-raised unchanged
        """
        log.debug('Unmounting client client.%s...', self.client_id)

        cmd = ['sudo', 'umount', self.mountpoint]
        if force:
            cmd.append('-f')

        try:
            self.client_remote.run(args=cmd, timeout=(15*60))
        except Exception:
            # The diagnostics run in their own helper (own frame, own error
            # handling), so the bare `raise` re-raises the umount failure
            # with its original traceback.
            self._log_umount_diagnostics()
            raise

        rproc = self.client_remote.run(
            args=[
                'rmdir',
                '--',
                self.mountpoint,
            ],
            wait=False
        )
        run.wait([rproc], UMOUNT_TIMEOUT)
        self.mounted = False

    def cleanup(self):
        """No-op for the kernel client."""
        pass

    def umount_wait(self, force=False, require_clean=False, timeout=900):
        """
        Unlike the fuse client, the kernel client's umount is immediate

        Does nothing if not mounted.  If the umount fails with
        CommandFailedError or MaxWhileTries and ``force`` is set, the node
        is hard-reset via kill() and cleaned up via kill_cleanup();
        otherwise the error propagates.

        :param force: forwarded to umount(); also enables the kill fallback
        :param require_clean: not used by this implementation
        :param timeout: not used by this implementation
        """
        if not self.is_mounted():
            return

        try:
            self.umount(force)
        except (CommandFailedError, MaxWhileTries):
            if not force:
                raise

            self.kill()
            self.kill_cleanup()

        self.mounted = False

    def is_mounted(self):
        """Return the locally tracked mounted flag."""
        return self.mounted

    def wait_until_mounted(self):
        """
        Unlike the fuse client, the kernel client is up and running as soon
        as the initial mount() function returns.
        """
        assert self.mounted

    def teardown(self):
        """Run the base-class teardown, then unmount if still mounted."""
        super(KernelMount, self).teardown()
        if self.mounted:
            self.umount()

    def kill(self):
        """
        The Ceph kernel client doesn't have a mechanism to kill itself (doing
        that inside the kernel would be weird anyway), so we reboot the whole
        node to get the same effect.

        We use IPMI to reboot, because we don't want the client to send any
        releases of capabilities.
        """

        con = self._get_console()
        con.hard_reset(wait_for_login=False)

        self.mounted = False

    def _log_console_status(self):
        """
        Best-effort console status check, used for debug output when the
        node does not come back after a reset.

        Errors are logged and swallowed so they cannot mask the reconnect
        failure the caller is about to re-raise.
        """
        try:
            self._get_console().check_status(timeout=60)
        except Exception:
            log.exception('Failed to check console status after reconnect failure')

    def kill_cleanup(self):
        """
        Wait for the node to come back after kill() and remove the
        mountpoint directory.

        Must only be called while not mounted (asserted).
        """
        assert not self.mounted

        # We need to do a sleep here because we don't know how long it will
        # take for a hard_reset to be effected.
        time.sleep(30)

        try:
            # Wait for node to come back up after reboot
            misc.reconnect(None, 300, [self.client_remote])
        except BaseException:
            # Catch everything on purpose: we always re-raise, and only
            # attempt to get some useful debug output first.
            self._log_console_status()
            raise

        # Check that the node actually responds to commands again
        self.client_remote.run(args=['uptime'], timeout=10)

        # Remove mount directory
        self.client_remote.run(
            args=[
                'rmdir',
                '--',
                self.mountpoint,
            ],
            timeout=(5*60),
        )

    def _find_debug_dir(self):
        """
        Find the debugfs folder for this mount

        Runs a script on the client that maps each directory under
        /sys/kernel/debug/ceph/ to the client name found on the second line
        of its ``mds_sessions`` file, then looks up ``self.client_id``.

        :raises KeyError: if no directory matches this client id
        """
        # print(...) with a single argument behaves the same on Python 2 and
        # Python 3, so the script works with either remote interpreter.
        pyscript = dedent("""
            import glob
            import os
            import json

            def get_id_to_dir():
                result = {}
                for dir in glob.glob("/sys/kernel/debug/ceph/*"):
                    with open(os.path.join(dir, "mds_sessions")) as f:
                        mds_sessions_lines = f.readlines()
                    client_id = mds_sessions_lines[1].split()[1].strip('"')

                    result[client_id] = dir
                return result

            print(json.dumps(get_id_to_dir()))
            """)

        p = self.client_remote.run(args=[
            'sudo', 'python', '-c', pyscript
        ], stdout=StringIO(), timeout=(5*60))
        client_id_to_dir = json.loads(p.stdout.getvalue())

        try:
            return client_id_to_dir[self.client_id]
        except KeyError:
            log.error("Client id '%s' debug dir not found (clients seen were: %s)",
                      self.client_id, ",".join(client_id_to_dir))
            raise

    def _read_debug_file(self, filename):
        """
        Return the contents of ``filename`` from this mount's debugfs
        directory, as printed by a script run on the client.
        """
        debug_dir = self._find_debug_dir()

        # print(...) with a single argument behaves the same on Python 2 and
        # Python 3, so the script works with either remote interpreter.
        pyscript = dedent("""
            import os

            print(open(os.path.join("{debug_dir}", "{filename}")).read())
            """).format(debug_dir=debug_dir, filename=filename)

        p = self.client_remote.run(args=[
            'sudo', 'python', '-c', pyscript
        ], stdout=StringIO(), timeout=(5*60))
        return p.stdout.getvalue()

    def get_global_id(self):
        """
        Look up the CephFS client ID for this mount, using debugfs.

        Returns the second whitespace-separated token of the first line of
        ``mds_sessions``, as an int.
        """

        assert self.mounted

        mds_sessions = self._read_debug_file("mds_sessions")
        lines = mds_sessions.split("\n")
        return int(lines[0].split()[1])

    def get_osd_epoch(self):
        """
        Return 2-tuple of osd_epoch, osd_epoch_barrier

        Both are parsed from the first line of the debugfs ``osdmap`` file
        (tokens 1 and 3 respectively).
        """
        osd_map = self._read_debug_file("osdmap")
        lines = osd_map.split("\n")
        first_line_tokens = lines[0].split()
        epoch, barrier = int(first_line_tokens[1]), int(first_line_tokens[3])

        return epoch, barrier
|