ceph/teuthology/misc.py

from cStringIO import StringIO

import os
import logging
import configobj
import getpass
import socket
import time
import urllib2
import urlparse
import yaml

from .orchestra import run

log = logging.getLogger(__name__)

def get_ceph_binary_url(branch=None, tag=None, sha1=None, flavor=None):
    if flavor is None:
        flavor = ''
    else:
        # TODO hardcoding amd64 here for simplicity; clients will try
        # to fetch the tarball matching their arch, non-x86_64 just
        # won't find anything and the test will fail. trying to
        # support cross-arch clusters is messy because nothing
        # guarantees the same sha1 of "master" has been built for all
        # of them. hoping for yagni.
        flavor = '-{flavor}-amd64'.format(flavor=flavor)
    BASE = 'http://ceph.newdream.net/gitbuilder{flavor}/output/'.format(flavor=flavor)

    if sha1 is not None:
        assert branch is None, "cannot set both sha1 and branch"
        assert tag is None, "cannot set both sha1 and tag"
    else:
        # gitbuilder uses remote-style ref names for branches, mangled to
        # have underscores instead of slashes; e.g. origin_master
        if tag is not None:
            ref = tag
            assert branch is None, "cannot set both branch and tag"
        else:
            if branch is None:
                branch = 'master'
            ref = branch

        sha1_url = urlparse.urljoin(BASE, 'ref/{ref}/sha1'.format(ref=ref))
        log.debug('Translating ref to sha1 using url %s', sha1_url)
        sha1_fp = urllib2.urlopen(sha1_url)
        sha1 = sha1_fp.read().rstrip('\n')
        sha1_fp.close()

    log.debug('Using ceph sha1 %s', sha1)
    bindir_url = urlparse.urljoin(BASE, 'sha1/{sha1}/'.format(sha1=sha1))
    return (sha1, bindir_url)

def feed_many_stdins(fp, processes):
    while True:
        data = fp.read(8192)
        if not data:
            break
        for proc in processes:
            proc.stdin.write(data)

def feed_many_stdins_and_close(fp, processes):
    feed_many_stdins(fp, processes)
    for proc in processes:
        proc.stdin.close()

def get_mons(roles, ips):
    mons = {}
    mon_id = 0
    for idx, roles in enumerate(roles):
        for role in roles:
            if not role.startswith('mon.'):
                continue
            addr = '{ip}:{port}'.format(
                ip=ips[idx],
                port=6789+mon_id,
                )
            mon_id += 1
            mons[role] = addr
    assert mons
    return mons

def generate_caps(type_):
    defaults = dict(
        osd=dict(
            mon='allow *',
            osd='allow *',
            ),
        mds=dict(
            mon='allow *',
            osd='allow *',
            mds='allow',
            ),
        client=dict(
            mon='allow rw',
            osd='allow rwx pool=data,rbd',
            mds='allow',
            ),
        )
    for subsystem, capability in defaults[type_].items():
        yield '--cap'
        yield subsystem
        yield capability

def skeleton_config(roles, ips):
    """
    Returns a ConfigObj that's prefilled with a skeleton config.

    Use conf[section][key]=value or conf.merge to change it.

    Use conf.write to write it out, override .filename first if you want.
    """
    path = os.path.join(os.path.dirname(__file__), 'ceph.conf')
    conf = configobj.ConfigObj(path, file_error=True)
    mons = get_mons(roles=roles, ips=ips)
    for role, addr in mons.iteritems():
        conf.setdefault(role, {})
        conf[role]['mon addr'] = addr
    # set up standby mds's
    for roles in roles:
        for role in roles:
            if role.startswith('mds.') and role.endswith('-s'):
                conf.setdefault(role, {})
                conf[role]['mds standby for name'] = role[:-2]
    return conf

def roles_of_type(roles_for_host, type_):
    prefix = '{type}.'.format(type=type_)
    for name in roles_for_host:
        if not name.startswith(prefix):
            continue
        id_ = name[len(prefix):]
        yield id_

def all_roles_of_type(cluster, type_):
    prefix = '{type}.'.format(type=type_)
    for _, roles_for_host in cluster.remotes.iteritems():
        for name in roles_for_host:
            if not name.startswith(prefix):
                continue
            id_ = name[len(prefix):]
            yield id_

def is_type(type_):
    """
    Returns a matcher function for whether role is of type given.
    """
    prefix = '{type}.'.format(type=type_)
    def _is_type(role):
        return role.startswith(prefix)
    return _is_type

def num_instances_of_type(cluster, type_):
    remotes_and_roles = cluster.remotes.items()
    roles = [roles for (remote, roles) in remotes_and_roles]
    prefix = '{type}.'.format(type=type_)
    num = sum(sum(1 for role in hostroles if role.startswith(prefix)) for hostroles in roles)
    return num

def create_simple_monmap(remote, conf):
    """
    Writes a simple monmap based on current ceph.conf into <tmpdir>/monmap.

    Assumes ceph_conf is up to date.

    Assumes mon sections are named "mon.*", with the dot.
    """
    def gen_addresses():
        for section, data in conf.iteritems():
            PREFIX = 'mon.'
            if not section.startswith(PREFIX):
                continue
            name = section[len(PREFIX):]
            addr = data['mon addr']
            yield (name, addr)

    addresses = list(gen_addresses())
    assert addresses, "There are no monitors in config!"
    log.debug('Ceph mon addresses: %s', addresses)

    args = [
        '/tmp/cephtest/enable-coredump',
        '/tmp/cephtest/binary/usr/local/bin/ceph-coverage',
        '/tmp/cephtest/archive/coverage',
        '/tmp/cephtest/binary/usr/local/bin/monmaptool',
        '--create',
        '--clobber',
        ]
    for (name, addr) in addresses:
        args.extend(('--add', name, addr))
    args.extend([
            '--print',
            '/tmp/cephtest/monmap',
            ])
    remote.run(
        args=args,
        )

def write_file(remote, path, data):
    remote.run(
        args=[
            'python',
            '-c',
            'import shutil, sys; shutil.copyfileobj(sys.stdin, file(sys.argv[1], "wb"))',
            path,
            ],
        stdin=data,
        )

def sudo_write_file(remote, path, data):
    remote.run(
        args=[
            'sudo',
            'python',
            '-c',
            'import shutil, sys; shutil.copyfileobj(sys.stdin, file(sys.argv[1], "wb"))',
            path,
            ],
        stdin=data,
        )

def get_file(remote, path):
    """
    Read a file from remote host into memory.
    """
    proc = remote.run(
        args=[
            'cat',
            '--',
            path,
            ],
        stdout=StringIO(),
        )
    data = proc.stdout.getvalue()
    return data

def get_scratch_devices(remote):
    """
    Read the scratch disk list from remote host
    """
    devs = []
    try:
        file_data = get_file(remote, "/scratch_devs")
        devs = file_data.split()
    except:
        devs = ['/dev/sdb']

    retval = []
    for dev in devs:
        try:
            remote.run(
                args=[
                    'stat',
                    dev
                    ]
                )
            retval.append(dev)
        except:
            pass
    return retval

def wait_until_healthy(remote):
    """Wait until a Ceph cluster is healthy."""
    while True:
        r = remote.run(
            args=[
                '/tmp/cephtest/enable-coredump',
                '/tmp/cephtest/binary/usr/local/bin/ceph-coverage',
                '/tmp/cephtest/archive/coverage',
                '/tmp/cephtest/binary/usr/local/bin/ceph',
                '-c', '/tmp/cephtest/ceph.conf',
                'health',
                '--concise',
                ],
            stdout=StringIO(),
            logger=log.getChild('health'),
            )
        out = r.stdout.getvalue()
        log.debug('Ceph health: %s', out.rstrip('\n'))
        if out.split(None, 1)[0] == 'HEALTH_OK':
            break
        time.sleep(1)

def wait_until_fuse_mounted(remote, fuse, mountpoint):
    while True:
        proc = remote.run(
            args=[
                'stat',
                '--file-system',
                '--printf=%T\n',
                '--',
                mountpoint,
                ],
            stdout=StringIO(),
            )
        fstype = proc.stdout.getvalue().rstrip('\n')
        if fstype == 'fuseblk':
            break
        log.debug('cfuse not yet mounted, got fs type {fstype!r}'.format(fstype=fstype))

        # it shouldn't have exited yet; exposes some trivial problems
        assert not fuse.exitstatus.ready()

        time.sleep(5)
    log.info('cfuse is mounted on %s', mountpoint)

def reconnect(ctx, timeout):
    """
    Connect to all the machines in ctx.cluster.

    Presumably, some of them won't be up. Handle this
    by waiting for them, unless the wait time exceeds
    the specified timeout.

    ctx needs to contain the cluster of machines you
    wish it to try and connect to, as well as a config
    holding the ssh keys for each of them. As long as it
    contains this data, you can construct a context
    that is a subset of your full cluster.
    """
    import errno
    log.info('Re-opening connections...')
    starttime = time.time()
    need_reconnect = ctx.cluster.remotes.keys()
    while True:
        for remote in list(need_reconnect):
            try:
                from .orchestra import connection
                remote.ssh = connection.connect(
                    user_at_host=remote.name,
                    host_key=ctx.config['targets'][remote.name],
                    )
            except socket.timeout:
                pass
            except socket.error as e:
                if hasattr(e, '__getitem__'):
                    if e[0] not in [errno.ECONNREFUSED, errno.ETIMEDOUT,
                                errno.EHOSTUNREACH, errno.EHOSTDOWN]:
                        log.exception('unknown socket error: %s', repr(e))
                        raise
                    else:
                        if time.time() - starttime > timeout:
                            log.exception('timed out waiting for %s', remote.name)
                            raise
                else:
                    log.exception('weird socket error without error code')
                    raise
            else:
                need_reconnect.remove(remote)

        if not need_reconnect:
            break
        log.debug('waited {elapsed}'.format(elapsed=str(time.time() - starttime)))
        time.sleep(1)

def write_secret_file(remote, role, filename):
    remote.run(
        args=[
            '/tmp/cephtest/enable-coredump',
            '/tmp/cephtest/binary/usr/local/bin/ceph-coverage',
            '/tmp/cephtest/archive/coverage',
            '/tmp/cephtest/binary/usr/local/bin/ceph-authtool',
            '--name={role}'.format(role=role),
            '--print-key',
            '/tmp/cephtest/data/{role}.keyring'.format(role=role),
            run.Raw('>'),
            filename,
            ],
        )

def get_clients(ctx, roles):
    for role in roles:
        assert isinstance(role, basestring)
        PREFIX = 'client.'
        assert role.startswith(PREFIX)
        id_ = role[len(PREFIX):]
        (remote,) = ctx.cluster.only(role).remotes.iterkeys()
        yield (id_, remote)

def get_user():
    return getpass.getuser() + '@' + socket.gethostname()

def read_config(ctx):
    filename = os.path.join(os.environ['HOME'], '.teuthology.yaml')
    ctx.teuthology_config = {}
    with file(filename) as f:
        g = yaml.safe_load_all(f)
        for new in g:
            ctx.teuthology_config.update(new)

# return the "first" mon (alphanumerically, for lack of anything better)
def get_first_mon(ctx, config):
    mons = []
    for remote, roles in ctx.cluster.remotes.items():
        for role in roles:
            if not role.startswith('mon.'):
                continue
            mons.append(role)
            break
    firstmon = sorted(mons)[0]
    assert firstmon
    return firstmon

def replace_all_with_clients(cluster, config):
    """
    Converts a dict containing a key all to one
    mapping all clients to the value of config['all']
    """
    assert isinstance(config, dict), 'config must be a dict'
    if 'all' not in config:
        return config
    norm_config = {}
    assert len(config) == 1, \
        "config cannot have 'all' and specific clients listed"
    for client in all_roles_of_type(cluster, 'client'):
        norm_config['client.{id}'.format(id=client)] = config['all']
    return norm_config
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`from cStringIO import StringIO`

			`import os`
			`import logging`
			`import configobj`
Move username to a utility method. 2011-07-02 01:15:52 +00:00			`import getpass`
			`import socket`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`import time`
Fetch ceph binary tarball independently on every node. Avoids shuffling the bytes through the controlling node. Use sha1 file to make sure everyone gets the same version. 2011-06-02 16:09:08 +00:00			`import urllib2`
			`import urlparse`
Read lock server from ~/teuthology.yaml. 2011-07-07 18:43:35 +00:00			`import yaml`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00
Move orchestra to teuthology.orchestra so there's just one top-level package. 2011-09-13 21:53:02 +00:00			`from .orchestra import run`
Add function to output a secret key to a file. 2011-06-16 01:06:57 +00:00
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`log = logging.getLogger(__name__)`

Can now run specific ceph version based on sha1. 2011-06-10 00:05:55 +00:00			`def get_ceph_binary_url(branch=None, tag=None, sha1=None, flavor=None):`
Initialize BASE before using it. 2011-06-10 18:12:34 +00:00			`if flavor is None:`
			`flavor = ''`
			`else:`
			`# TODO hardcoding amd64 here for simplicity; clients will try`
			`# to fetch the tarball matching their arch, non-x86_64 just`
			`# won't find anything and the test will fail. trying to`
			`# support cross-arch clusters is messy because nothing`
			`# guarantees the same sha1 of "master" has been built for all`
			`# of them. hoping for yagni.`
			`flavor = '-{flavor}-amd64'.format(flavor=flavor)`
			`BASE = 'http://ceph.newdream.net/gitbuilder{flavor}/output/'.format(flavor=flavor)`

Can now run specific ceph version based on sha1. 2011-06-10 00:05:55 +00:00			`if sha1 is not None:`
			`assert branch is None, "cannot set both sha1 and branch"`
			`assert tag is None, "cannot set both sha1 and tag"`
Let ceph task config specify branch or tag to run. 2011-06-09 21:08:45 +00:00			`else:`
Can now run specific ceph version based on sha1. 2011-06-10 00:05:55 +00:00			`# gitbuilder uses remote-style ref names for branches, mangled to`
			`# have underscores instead of slashes; e.g. origin_master`
			`if tag is not None:`
			`ref = tag`
			`assert branch is None, "cannot set both branch and tag"`
			`else:`
			`if branch is None:`
			`branch = 'master'`
new gitbuilder ref/branch naming no origin_ prefix 2011-08-05 21:35:22 +00:00			`ref = branch`
Can now run specific ceph version based on sha1. 2011-06-10 00:05:55 +00:00
			`sha1_url = urlparse.urljoin(BASE, 'ref/{ref}/sha1'.format(ref=ref))`
			`log.debug('Translating ref to sha1 using url %s', sha1_url)`
			`sha1_fp = urllib2.urlopen(sha1_url)`
			`sha1 = sha1_fp.read().rstrip('\n')`
			`sha1_fp.close()`
Support ceph tarball "favors", that is different gitbuilders. Use that for picking the gcov gitbuilder, when told to record code coverage. Actual coverage support comes in the next commit. Assuming all the world is a VA.. I mean amd64, for now. 2011-06-09 22:43:43 +00:00
			`log.debug('Using ceph sha1 %s', sha1)`
Fetch ceph binary tarball independently on every node. Avoids shuffling the bytes through the controlling node. Use sha1 file to make sure everyone gets the same version. 2011-06-02 16:09:08 +00:00			`bindir_url = urlparse.urljoin(BASE, 'sha1/{sha1}/'.format(sha1=sha1))`
Save ceph sha1 in coverage dir. This is needed to postprocess the coverage data. 2011-06-09 21:02:44 +00:00			`return (sha1, bindir_url)`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00
			`def feed_many_stdins(fp, processes):`
			`while True:`
			`data = fp.read(8192)`
			`if not data:`
			`break`
			`for proc in processes:`
			`proc.stdin.write(data)`

			`def feed_many_stdins_and_close(fp, processes):`
			`feed_many_stdins(fp, processes)`
			`for proc in processes:`
			`proc.stdin.close()`

			`def get_mons(roles, ips):`
			`mons = {}`
tolerate named (not numbered) mons 2011-07-27 04:46:47 +00:00			`mon_id = 0`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`for idx, roles in enumerate(roles):`
			`for role in roles:`
			`if not role.startswith('mon.'):`
			`continue`
			`addr = '{ip}:{port}'.format(`
			`ip=ips[idx],`
			`port=6789+mon_id,`
			`)`
no ++ in python 2011-07-27 18:45:20 +00:00			`mon_id += 1`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`mons[role] = addr`
			`assert mons`
			`return mons`

			`def generate_caps(type_):`
			`defaults = dict(`
			`osd=dict(`
			`mon='allow *',`
			`osd='allow *',`
			`),`
			`mds=dict(`
			`mon='allow *',`
			`osd='allow *',`
			`mds='allow',`
			`),`
			`client=dict(`
			`mon='allow rw',`
			`osd='allow rwx pool=data,rbd',`
			`mds='allow',`
			`),`
			`)`
			`for subsystem, capability in defaults[type_].items():`
			`yield '--cap'`
			`yield subsystem`
			`yield capability`

			`def skeleton_config(roles, ips):`
			`"""`
			`Returns a ConfigObj that's prefilled with a skeleton config.`

			`Use conf[section][key]=value or conf.merge to change it.`

			`Use conf.write to write it out, override .filename first if you want.`
			`"""`
			`path = os.path.join(os.path.dirname(__file__), 'ceph.conf')`
			`conf = configobj.ConfigObj(path, file_error=True)`
			`mons = get_mons(roles=roles, ips=ips)`
			`for role, addr in mons.iteritems():`
			`conf.setdefault(role, {})`
			`conf[role]['mon addr'] = addr`
configure mds's with -s suffix as standby 2011-07-27 17:04:37 +00:00			`# set up standby mds's`
			`for roles in roles:`
			`for role in roles:`
			`if role.startswith('mds.') and role.endswith('-s'):`
			`conf.setdefault(role, {})`
			`conf[role]['mds standby for name'] = role[:-2]`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`return conf`

			`def roles_of_type(roles_for_host, type_):`
			`prefix = '{type}.'.format(type=type_)`
			`for name in roles_for_host:`
			`if not name.startswith(prefix):`
			`continue`
			`id_ = name[len(prefix):]`
			`yield id_`

Make cfuse and kclient default to all clients. 2011-06-16 23:07:59 +00:00			`def all_roles_of_type(cluster, type_):`
			`prefix = '{type}.'.format(type=type_)`
			`for _, roles_for_host in cluster.remotes.iteritems():`
			`for name in roles_for_host:`
			`if not name.startswith(prefix):`
			`continue`
			`id_ = name[len(prefix):]`
			`yield id_`

Refactor to use Cluster and Remote, to evaluate the new APIs. 2011-06-01 23:04:52 +00:00			`def is_type(type_):`
			`"""`
			`Returns a matcher function for whether role is of type given.`
			`"""`
			`prefix = '{type}.'.format(type=type_)`
			`def _is_type(role):`
			`return role.startswith(prefix)`
			`return _is_type`

Refactor for modularity. New style: run "./virtualenv/bin/teuthology -v interactive.yaml". 2011-06-03 21:47:44 +00:00			`def num_instances_of_type(cluster, type_):`
			`remotes_and_roles = cluster.remotes.items()`
			`roles = [roles for (remote, roles) in remotes_and_roles]`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`prefix = '{type}.'.format(type=type_)`
			`num = sum(sum(1 for role in hostroles if role.startswith(prefix)) for hostroles in roles)`
			`return num`

Refactor to use Cluster and Remote, to evaluate the new APIs. 2011-06-01 23:04:52 +00:00			`def create_simple_monmap(remote, conf):`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`"""`
			`Writes a simple monmap based on current ceph.conf into <tmpdir>/monmap.`

			`Assumes ceph_conf is up to date.`

			`Assumes mon sections are named "mon.*", with the dot.`
			`"""`
			`def gen_addresses():`
			`for section, data in conf.iteritems():`
			`PREFIX = 'mon.'`
			`if not section.startswith(PREFIX):`
			`continue`
			`name = section[len(PREFIX):]`
			`addr = data['mon addr']`
			`yield (name, addr)`

			`addresses = list(gen_addresses())`
			`assert addresses, "There are no monitors in config!"`
			`log.debug('Ceph mon addresses: %s', addresses)`

			`args = [`
Archive cores dumped during test, record test as failed if any seen. 2011-06-17 23:00:39 +00:00			`'/tmp/cephtest/enable-coredump',`
Add coverage support. 2011-06-07 18:45:29 +00:00			`'/tmp/cephtest/binary/usr/local/bin/ceph-coverage',`
Put all coverage data in the archive dir. 2011-06-10 18:17:11 +00:00			`'/tmp/cephtest/archive/coverage',`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`'/tmp/cephtest/binary/usr/local/bin/monmaptool',`
			`'--create',`
			`'--clobber',`
			`]`
			`for (name, addr) in addresses:`
			`args.extend(('--add', name, addr))`
			`args.extend([`
			`'--print',`
			`'/tmp/cephtest/monmap',`
			`])`
Refactor to use Cluster and Remote, to evaluate the new APIs. 2011-06-01 23:04:52 +00:00			`remote.run(`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`args=args,`
			`)`

Refactor to use Cluster and Remote, to evaluate the new APIs. 2011-06-01 23:04:52 +00:00			`def write_file(remote, path, data):`
			`remote.run(`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`args=[`
			`'python',`
			`'-c',`
			`'import shutil, sys; shutil.copyfileobj(sys.stdin, file(sys.argv[1], "wb"))',`
			`path,`
			`],`
			`stdin=data,`
			`)`

Archive syslog messages while the test was in progress. 2011-06-20 20:19:08 +00:00			`def sudo_write_file(remote, path, data):`
			`remote.run(`
			`args=[`
			`'sudo',`
			`'python',`
			`'-c',`
			`'import shutil, sys; shutil.copyfileobj(sys.stdin, file(sys.argv[1], "wb"))',`
			`path,`
			`],`
			`stdin=data,`
			`)`

Refactor to use Cluster and Remote, to evaluate the new APIs. 2011-06-01 23:04:52 +00:00			`def get_file(remote, path):`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`"""`
			`Read a file from remote host into memory.`
			`"""`
Refactor to use Cluster and Remote, to evaluate the new APIs. 2011-06-01 23:04:52 +00:00			`proc = remote.run(`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`args=[`
			`'cat',`
			`'--',`
			`path,`
			`],`
			`stdout=StringIO(),`
			`)`
			`data = proc.stdout.getvalue()`
			`return data`

ceph.py: add btrfs option Signed-off-by: Samuel Just <samuel.just@dreamhost.com> 2011-10-03 21:03:36 +00:00			`def get_scratch_devices(remote):`
			`"""`
			`Read the scratch disk list from remote host`
			`"""`
			`devs = []`
			`try:`
			`file_data = get_file(remote, "/scratch_devs")`
			`devs = file_data.split()`
			`except:`
			`devs = ['/dev/sdb']`

			`retval = []`
			`for dev in devs:`
			`try:`
			`remote.run(`
			`args=[`
			`'stat',`
			`dev`
			`]`
			`)`
			`retval.append(dev)`
			`except:`
			`pass`
			`return retval`

Refactor to use Cluster and Remote, to evaluate the new APIs. 2011-06-01 23:04:52 +00:00			`def wait_until_healthy(remote):`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`"""Wait until a Ceph cluster is healthy."""`
			`while True:`
Refactor to use Cluster and Remote, to evaluate the new APIs. 2011-06-01 23:04:52 +00:00			`r = remote.run(`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`args=[`
Archive cores dumped during test, record test as failed if any seen. 2011-06-17 23:00:39 +00:00			`'/tmp/cephtest/enable-coredump',`
Add coverage support. 2011-06-07 18:45:29 +00:00			`'/tmp/cephtest/binary/usr/local/bin/ceph-coverage',`
Put all coverage data in the archive dir. 2011-06-10 18:17:11 +00:00			`'/tmp/cephtest/archive/coverage',`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`'/tmp/cephtest/binary/usr/local/bin/ceph',`
			`'-c', '/tmp/cephtest/ceph.conf',`
			`'health',`
			`'--concise',`
			`],`
			`stdout=StringIO(),`
			`logger=log.getChild('health'),`
			`)`
			`out = r.stdout.getvalue()`
			`log.debug('Ceph health: %s', out.rstrip('\n'))`
			`if out.split(None, 1)[0] == 'HEALTH_OK':`
			`break`
			`time.sleep(1)`

Refactor to use Cluster and Remote, to evaluate the new APIs. 2011-06-01 23:04:52 +00:00			`def wait_until_fuse_mounted(remote, fuse, mountpoint):`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`while True:`
Refactor to use Cluster and Remote, to evaluate the new APIs. 2011-06-01 23:04:52 +00:00			`proc = remote.run(`
Initial import. Currently hardcoded to run dbench, not modular, and the remote execution API is clumsy. 2011-05-31 20:51:48 +00:00			`args=[`
			`'stat',`
			`'--file-system',`
			`'--printf=%T\n',`
			`'--',`
			`mountpoint,`
			`],`
			`stdout=StringIO(),`
			`)`
			`fstype = proc.stdout.getvalue().rstrip('\n')`
			`if fstype == 'fuseblk':`
			`break`
			`log.debug('cfuse not yet mounted, got fs type {fstype!r}'.format(fstype=fstype))`

			`# it shouldn't have exited yet; exposes some trivial problems`
			`assert not fuse.exitstatus.ready()`

			`time.sleep(5)`
			`log.info('cfuse is mounted on %s', mountpoint)`
Add function to output a secret key to a file. 2011-06-16 01:06:57 +00:00
Move reconnect function from kernel task to misc.py Signed-off-by: Greg Farnum <gregory.farnum@dreamhost.com> 2011-08-10 17:37:04 +00:00			`def reconnect(ctx, timeout):`
			`"""`
			`Connect to all the machines in ctx.cluster.`

			`Presumably, some of them won't be up. Handle this`
			`by waiting for them, unless the wait time exceeds`
			`the specified timeout.`

			`ctx needs to contain the cluster of machines you`
			`wish it to try and connect to, as well as a config`
			`holding the ssh keys for each of them. As long as it`
			`contains this data, you can construct a context`
			`that is a subset of your full cluster.`
			`"""`
			`import errno`
			`log.info('Re-opening connections...')`
			`starttime = time.time()`
			`need_reconnect = ctx.cluster.remotes.keys()`
			`while True:`
			`for remote in list(need_reconnect):`
			`try:`
Move orchestra to teuthology.orchestra so there's just one top-level package. 2011-09-13 21:53:02 +00:00			`from .orchestra import connection`
Move reconnect function from kernel task to misc.py Signed-off-by: Greg Farnum <gregory.farnum@dreamhost.com> 2011-08-10 17:37:04 +00:00			`remote.ssh = connection.connect(`
			`user_at_host=remote.name,`
			`host_key=ctx.config['targets'][remote.name],`
			`)`
Merge branch 'wip-nuke' Conflicts: teuthology/task/kernel.py 2011-08-10 23:16:11 +00:00			`except socket.timeout:`
			`pass`
Move reconnect function from kernel task to misc.py Signed-off-by: Greg Farnum <gregory.farnum@dreamhost.com> 2011-08-10 17:37:04 +00:00			`except socket.error as e:`
			`if hasattr(e, '__getitem__'):`
			`if e[0] not in [errno.ECONNREFUSED, errno.ETIMEDOUT,`
			`errno.EHOSTUNREACH, errno.EHOSTDOWN]:`
			`log.exception('unknown socket error: %s', repr(e))`
			`raise`
			`else:`
			`if time.time() - starttime > timeout:`
			`log.exception('timed out waiting for %s', remote.name)`
			`raise`
			`else:`
			`log.exception('weird socket error without error code')`
			`raise`
			`else:`
			`need_reconnect.remove(remote)`

			`if not need_reconnect:`
			`break`
			`log.debug('waited {elapsed}'.format(elapsed=str(time.time() - starttime)))`
			`time.sleep(1)`

Add function to output a secret key to a file. 2011-06-16 01:06:57 +00:00			`def write_secret_file(remote, role, filename):`
			`remote.run(`
			`args=[`
Archive cores dumped during test, record test as failed if any seen. 2011-06-17 23:00:39 +00:00			`'/tmp/cephtest/enable-coredump',`
Add function to output a secret key to a file. 2011-06-16 01:06:57 +00:00			`'/tmp/cephtest/binary/usr/local/bin/ceph-coverage',`
			`'/tmp/cephtest/archive/coverage',`
rename c* -> ceph-* Leave cfuse task name unchanged for now... 2011-09-23 15:57:18 +00:00			`'/tmp/cephtest/binary/usr/local/bin/ceph-authtool',`
Add function to output a secret key to a file. 2011-06-16 01:06:57 +00:00			`'--name={role}'.format(role=role),`
			`'--print-key',`
			`'/tmp/cephtest/data/{role}.keyring'.format(role=role),`
			`run.Raw('>'),`
			`filename,`
			`],`
			`)`
Move get_clients method into misc to avoid duplication. 2011-06-20 19:12:11 +00:00
Revert "fix get_clients" This reverts commit 83b6678e79904793bf31e82bbecad7bf16c1b2b5. The bug I was hitting was actually fxied by 06e3e69c293b20c0ce5df526fa923a979c1d8cfc. 2011-08-09 20:23:58 +00:00			`def get_clients(ctx, roles):`
			`for role in roles:`
			`assert isinstance(role, basestring)`
			`PREFIX = 'client.'`
			`assert role.startswith(PREFIX)`
			`id_ = role[len(PREFIX):]`
			`(remote,) = ctx.cluster.only(role).remotes.iterkeys()`
			`yield (id_, remote)`
Move username to a utility method. 2011-07-02 01:15:52 +00:00
			`def get_user():`
			`return getpass.getuser() + '@' + socket.gethostname()`
Read lock server from ~/teuthology.yaml. 2011-07-07 18:43:35 +00:00
			`def read_config(ctx):`
			`filename = os.path.join(os.environ['HOME'], '.teuthology.yaml')`
			`ctx.teuthology_config = {}`
			`with file(filename) as f:`
			`g = yaml.safe_load_all(f)`
			`for new in g:`
			`ctx.teuthology_config.update(new)`
thrashosds: make it work when first mon isn't mon.0 2011-08-31 20:56:42 +00:00
			`# return the "first" mon (alphanumerically, for lack of anything better)`
			`def get_first_mon(ctx, config):`
			`mons = []`
			`for remote, roles in ctx.cluster.remotes.items():`
			`for role in roles:`
			`if not role.startswith('mon.'):`
			`continue`
			`mons.append(role)`
			`break`
			`firstmon = sorted(mons)[0]`
			`assert firstmon`
			`return firstmon`
autotest: allow tests to be run on all clients 2011-09-08 00:50:12 +00:00
			`def replace_all_with_clients(cluster, config):`
			`"""`
			`Converts a dict containing a key all to one`
			`mapping all clients to the value of config['all']`
			`"""`
			`assert isinstance(config, dict), 'config must be a dict'`
			`if 'all' not in config:`
			`return config`
			`norm_config = {}`
			`assert len(config) == 1, \`
			`"config cannot have 'all' and specific clients listed"`
			`for client in all_roles_of_type(cluster, 'client'):`
			`norm_config['client.{id}'.format(id=client)] = config['all']`
			`return norm_config`