mirror of
https://github.com/ceph/ceph
synced 2025-01-14 06:53:11 +00:00
fb915c4805
If the source or target PG version is 0'0, we may silently take the max of the source and target and still leave the PG complete. This specifically can happen with an empty PG, as seen with bug 38655. In theory we could encounter one of the PGs with some other last_update that doesn't match what we expect. If that ever happens, make sure the result is incomplete so that backfill can clean up. Additionally check that the pool metadata for the last merge matches the PGs at all. This could mismatch if we have an osdmap gap and are forced to do some merge without merge info at all... in which case we should definitely invalidate: there should be newer copies of the PG(s), and we have no idea whether the PGs we are merging are what we want. If this is some disaster recovery situation, an operator is always free to use ceph-objectstore-tool to re-mark a PG complete (at their own peril!). Fixes: http://tracker.ceph.com/issues/38655 Signed-off-by: Sage Weil <sage@redhat.com>
205 lines
6.7 KiB
Bash
Executable File
205 lines
6.7 KiB
Bash
Executable File
#!/usr/bin/env bash
|
|
source $CEPH_ROOT/qa/standalone/ceph-helpers.sh
|
|
|
|
function run() {
|
|
local dir=$1
|
|
shift
|
|
|
|
export CEPH_MON="127.0.0.1:7147" # git grep '\<7147\>' : there must be only one
|
|
export CEPH_ARGS
|
|
CEPH_ARGS+="--fsid=$(uuidgen) --auth-supported=none "
|
|
CEPH_ARGS+="--mon-host=$CEPH_MON --mon_min_osdmap_epochs=50 --paxos_service_trim_min=10"
|
|
|
|
local funcs=${@:-$(set | sed -n -e 's/^\(TEST_[0-9a-z_]*\) .*/\1/p')}
|
|
for func in $funcs ; do
|
|
$func $dir || return 1
|
|
done
|
|
}
|
|
|
|
function TEST_a_merge_empty() {
|
|
local dir=$1
|
|
|
|
setup $dir || return 1
|
|
run_mon $dir a --osd_pool_default_size=3 || return 1
|
|
run_mgr $dir x || return 1
|
|
run_osd $dir 0 || return 1
|
|
run_osd $dir 1 || return 1
|
|
run_osd $dir 2 || return 1
|
|
|
|
ceph osd pool create foo 2 || return 1
|
|
ceph osd pool set foo pgp_num 1 || return 1
|
|
|
|
wait_for_clean || return 1
|
|
|
|
# note: we need 1.0 to have the same or more objects than 1.1
|
|
# 1.1
|
|
rados -p foo put foo1 /etc/passwd
|
|
rados -p foo put foo2 /etc/passwd
|
|
rados -p foo put foo3 /etc/passwd
|
|
rados -p foo put foo4 /etc/passwd
|
|
# 1.0
|
|
rados -p foo put foo5 /etc/passwd
|
|
rados -p foo put foo6 /etc/passwd
|
|
rados -p foo put foo8 /etc/passwd
|
|
rados -p foo put foo10 /etc/passwd
|
|
rados -p foo put foo11 /etc/passwd
|
|
rados -p foo put foo12 /etc/passwd
|
|
rados -p foo put foo16 /etc/passwd
|
|
|
|
wait_for_clean || return 1
|
|
|
|
ceph tell osd.1 config set osd_debug_no_purge_strays true
|
|
ceph osd pool set foo size 2 || return 1
|
|
wait_for_clean || return 1
|
|
|
|
kill_daemons $dir TERM osd.2 || return 1
|
|
ceph-objectstore-tool --data-path $dir/2 --op remove --pgid 1.1 --force || return 1
|
|
activate_osd $dir 2 || return 1
|
|
|
|
wait_for_clean || return 1
|
|
|
|
# osd.2: now 1.0 is there but 1.1 is not
|
|
|
|
# instantiate 1.1 on osd.2 with last_update=0'0 ('empty'), which is
|
|
# the problematic state... then let it merge with 1.0
|
|
ceph tell osd.2 config set osd_debug_no_acting_change true
|
|
ceph osd out 0 1
|
|
ceph osd pool set foo pg_num 1
|
|
sleep 5
|
|
ceph tell osd.2 config set osd_debug_no_acting_change false
|
|
|
|
# go back to osd.1 being primary, and 3x so the osd.2 copy doesn't get
|
|
# removed
|
|
ceph osd in 0 1
|
|
ceph osd pool set foo size 3
|
|
|
|
wait_for_clean || return 1
|
|
|
|
# scrub to ensure the osd.3 copy of 1.0 was incomplete (vs missing
|
|
# half of its objects).
|
|
ceph pg scrub 1.0
|
|
sleep 10
|
|
ceph log last debug
|
|
ceph pg ls
|
|
ceph pg ls | grep ' active.clean ' || return 1
|
|
}
|
|
|
|
function TEST_import_after_merge_and_gap() {
|
|
local dir=$1
|
|
|
|
setup $dir || return 1
|
|
run_mon $dir a --osd_pool_default_size=1 || return 1
|
|
run_mgr $dir x || return 1
|
|
run_osd $dir 0 || return 1
|
|
|
|
ceph osd pool create foo 2 || return 1
|
|
wait_for_clean || return 1
|
|
rados -p foo bench 3 write -b 1024 --no-cleanup || return 1
|
|
|
|
kill_daemons $dir TERM osd.0 || return 1
|
|
ceph-objectstore-tool --data-path $dir/0 --op export --pgid 1.1 --file $dir/1.1 --force || return 1
|
|
ceph-objectstore-tool --data-path $dir/0 --op export --pgid 1.0 --file $dir/1.0 --force || return 1
|
|
activate_osd $dir 0 || return 1
|
|
|
|
ceph osd pool set foo pg_num 1
|
|
sleep 5
|
|
while ceph daemon osd.0 perf dump | jq '.osd.numpg' | grep 2 ; do sleep 1 ; done
|
|
wait_for_clean || return 1
|
|
|
|
#
|
|
kill_daemons $dir TERM osd.0 || return 1
|
|
ceph-objectstore-tool --data-path $dir/0 --op remove --pgid 1.0 --force || return 1
|
|
# this will import both halves the original pg
|
|
ceph-objectstore-tool --data-path $dir/0 --op import --pgid 1.1 --file $dir/1.1 || return 1
|
|
ceph-objectstore-tool --data-path $dir/0 --op import --pgid 1.0 --file $dir/1.0 || return 1
|
|
activate_osd $dir 0 || return 1
|
|
|
|
wait_for_clean || return 1
|
|
|
|
# make a map gap
|
|
for f in `seq 1 50` ; do
|
|
ceph osd set nodown
|
|
ceph osd unset nodown
|
|
done
|
|
|
|
# poke and prod to ensure last_epech_clean is big, reported to mon, and
|
|
# the osd is able to trim old maps
|
|
rados -p foo bench 1 write -b 1024 --no-cleanup || return 1
|
|
wait_for_clean || return 1
|
|
ceph tell osd.0 send_beacon
|
|
sleep 5
|
|
ceph osd set nodown
|
|
ceph osd unset nodown
|
|
sleep 5
|
|
|
|
kill_daemons $dir TERM osd.0 || return 1
|
|
|
|
# this should fail.. 1.1 still doesn't exist
|
|
! ceph-objectstore-tool --data-path $dir/0 --op import --pgid 1.1 --file $dir/1.1 || return 1
|
|
|
|
ceph-objectstore-tool --data-path $dir/0 --op export-remove --pgid 1.0 --force --file $dir/1.0.later || return 1
|
|
|
|
# this should fail too because of the gap
|
|
! ceph-objectstore-tool --data-path $dir/0 --op import --pgid 1.1 --file $dir/1.1 || return 1
|
|
! ceph-objectstore-tool --data-path $dir/0 --op import --pgid 1.0 --file $dir/1.0 || return 1
|
|
|
|
# we can force it...
|
|
ceph-objectstore-tool --data-path $dir/0 --op import --pgid 1.1 --file $dir/1.1 --force || return 1
|
|
ceph-objectstore-tool --data-path $dir/0 --op import --pgid 1.0 --file $dir/1.0 --force || return 1
|
|
|
|
# ...but the osd won't start, so remove it again.
|
|
ceph-objectstore-tool --data-path $dir/0 --op remove --pgid 1.0 --force || return 1
|
|
ceph-objectstore-tool --data-path $dir/0 --op remove --pgid 1.1 --force || return 1
|
|
|
|
ceph-objectstore-tool --data-path $dir/0 --op import --pgid 1.0 --file $dir/1.0.later --force || return 1
|
|
|
|
|
|
activate_osd $dir 0 || return 1
|
|
|
|
wait_for_clean || return 1
|
|
}
|
|
|
|
function TEST_import_after_split() {
|
|
local dir=$1
|
|
|
|
setup $dir || return 1
|
|
run_mon $dir a --osd_pool_default_size=1 || return 1
|
|
run_mgr $dir x || return 1
|
|
run_osd $dir 0 || return 1
|
|
|
|
ceph osd pool create foo 1 || return 1
|
|
wait_for_clean || return 1
|
|
rados -p foo bench 3 write -b 1024 --no-cleanup || return 1
|
|
|
|
kill_daemons $dir TERM osd.0 || return 1
|
|
ceph-objectstore-tool --data-path $dir/0 --op export --pgid 1.0 --file $dir/1.0 --force || return 1
|
|
activate_osd $dir 0 || return 1
|
|
|
|
ceph osd pool set foo pg_num 2
|
|
sleep 5
|
|
while ceph daemon osd.0 perf dump | jq '.osd.numpg' | grep 1 ; do sleep 1 ; done
|
|
wait_for_clean || return 1
|
|
|
|
kill_daemons $dir TERM osd.0 || return 1
|
|
|
|
ceph-objectstore-tool --data-path $dir/0 --op remove --pgid 1.0 --force || return 1
|
|
|
|
# this should fail because 1.1 (split child) is there
|
|
! ceph-objectstore-tool --data-path $dir/0 --op import --pgid 1.0 --file $dir/1.0 || return 1
|
|
|
|
ceph-objectstore-tool --data-path $dir/0 --op remove --pgid 1.1 --force || return 1
|
|
# now it will work (1.1. is gone)
|
|
ceph-objectstore-tool --data-path $dir/0 --op import --pgid 1.0 --file $dir/1.0 || return 1
|
|
|
|
activate_osd $dir 0 || return 1
|
|
|
|
wait_for_clean || return 1
|
|
}
|
|
|
|
|
|
main pg-split-merge "$@"
|
|
|
|
# Local Variables:
|
|
# compile-command: "cd ../.. ; make -j4 && test/osd/pg-split-merge.sh"
|
|
# End:
|