ceph/qa/tasks/peering_speed_test.py

88 lines
2.2 KiB
Python

"""
Remotely run peering tests.
"""
import logging
import time
log = logging.getLogger(__name__)
from teuthology.task.args import argify
# Name of the pool that the test creates, populates and writes to.
POOLNAME = "POOLNAME"

# Argument table handed to argify() on the task entry point.
# NOTE(review): each entry looks like (name, description, default, type);
# confirm against teuthology.task.args.argify.
ARGS = [
    ('num_pgs', 'number of pgs to create', 256, int),
    # A default of 0 disables the peering time check in do_run().
    ('max_time', 'seconds to complete peering', 0, int),
    ('runs', 'trials to run', 10, int),
    ('num_objects', 'objects to create', 256 * 1024, int),
    ('object_size', 'size in bytes for objects', 64, int),
    ('creation_time_limit', 'time limit for pool population', 60 * 60, int),
    ('create_threads', 'concurrent writes for create', 256, int),
]
def setup(ctx, config):
    """
    Prepare the cluster for the peering test.

    Calls ``clear_pools()`` on the ceph manager, creates the pool named
    by POOLNAME with ``config.num_pgs`` pgs and then populates it through
    ``rados_write_objects``.

    :param ctx: task context; ``ctx.managers['ceph']`` is the manager used
    :param config: parsed task arguments; reads ``num_pgs``,
                   ``num_objects``, ``object_size``,
                   ``creation_time_limit`` and ``create_threads``
    """
    ceph_manager = ctx.managers['ceph']

    # Reset the pools first, then create the single pool the test uses.
    ceph_manager.clear_pools()
    ceph_manager.create_pool(POOLNAME, config.num_pgs)

    log.info("populating pool")
    populate_args = (
        POOLNAME,
        config.num_objects,
        config.object_size,
        config.creation_time_limit,
        config.create_threads,
    )
    ceph_manager.rados_write_objects(*populate_args)
    log.info("done populating pool")
def do_run(ctx, config):
    """
    Perform one timed trial of the test.

    Marks osd 0 in, issues ``config.num_pgs`` small writes against the
    test pool, waits for the cluster to become clean, then marks osd 0
    out again and waits for clean so the next trial starts from the same
    state.

    :param ctx: task context; ``ctx.managers['ceph']`` is the manager used
    :param config: parsed task arguments; reads ``num_pgs``,
                   ``creation_time_limit`` and ``max_time``
    :returns: dict with ``time_to_active`` (seconds from start until the
              writes returned) and ``time_to_clean`` (seconds from start
              until ``wait_for_clean`` returned)
    :raises AssertionError: if ``config.max_time`` is non-zero and
                            ``time_to_active`` is not below it
    """
    start = time.time()
    # mark in osd
    manager = ctx.managers['ceph']
    manager.mark_in_osd(0)

    log.info("writing out objects")
    # The return of this write batch is what the test treats as the end
    # of peering (see the log message that follows it).
    manager.rados_write_objects(
        POOLNAME,
        config.num_pgs,  # write 1 object per pg or so
        1,
        config.creation_time_limit,
        config.num_pgs,  # lots of concurrency
        cleanup=True)
    peering_end = time.time()

    log.info("peering done, waiting on recovery")
    manager.wait_for_clean()
    log.info("recovery done")
    recovery_end = time.time()

    time_to_active = peering_end - start
    time_to_clean = recovery_end - start

    # Raise explicitly rather than using an assert statement: assert is
    # removed when Python runs with -O, which would silently disable the
    # check. AssertionError is kept so callers see the same exception.
    if config.max_time and not (time_to_active < config.max_time):
        raise AssertionError(
            "peering took {elapsed:.3f}s, limit is {limit}s".format(
                elapsed=time_to_active, limit=config.max_time))

    # Take the osd back out so the following trial starts from the same
    # state as this one did.
    manager.mark_out_osd(0)
    manager.wait_for_clean()

    return {
        'time_to_active': time_to_active,
        'time_to_clean': time_to_clean,
    }
@argify("peering_speed_test", ARGS)
def task(ctx, config):
    """
    Peering speed test

    Runs setup(), marks osd 0 out and waits for clean, then calls
    do_run() ``config.runs`` times. Afterwards osd 0 is marked in again
    and the per-run timings are stored in
    ``ctx.summary['recovery_times']['runs']``.

    :param ctx: task context; uses ``ctx.managers['ceph']`` and
                ``ctx.summary``
    :param config: task arguments described by ARGS
    """
    setup(ctx, config)

    ceph_manager = ctx.managers['ceph']
    # Each trial begins by marking osd 0 in, so it has to start out.
    ceph_manager.mark_out_osd(0)
    ceph_manager.wait_for_clean()

    timings = []
    for run_index in range(config.runs):
        log.info("Run {i}".format(i=run_index))
        trial_result = do_run(ctx, config)
        timings.append(trial_result)

    # do_run() leaves osd 0 out; bring it back in once all trials are done.
    ceph_manager.mark_in_osd(0)

    summary_entry = {'runs': timings}
    ctx.summary['recovery_times'] = summary_entry