futriix/tests/unit/cluster/diskless-load-swapdb.tcl
Binbin 9827eef4d0
Avoid timing issue in diskless-load-swapdb test (#1077)
Since we paused the primary node earlier, the replica may enter the
cluster-down state because the primary is flagged as pfail. Set
cluster-allow-reads-when-down here to prevent subsequent read errors.

Signed-off-by: Binbin <binloveplay1314@qq.com>
2024-10-01 13:14:30 -07:00

94 lines
2.8 KiB
Tcl

# Check that the replica's keys and its keys-to-slots map are still correct
# after a diskless load using SWAPDB fails part-way through.
#
# Scenario, on a 1 primary + 1 replica cluster:
#   1. Replicate a single key that hashes to slot 0 and persist it on the replica.
#   2. Pause the replica, delete the key on the primary and write enough data
#      to overflow the tiny replication backlog, so a full sync is required.
#   3. Restart the replica and wait until it reports async_loading.
#   4. Pause the primary so the in-flight full sync is aborted.
#   5. Verify the replica still serves the original key and slot mapping.
start_cluster 1 1 {tags {external:skip cluster}} {

test "Cluster should start ok" {
    wait_for_cluster_state ok
}

test "Cluster is writable" {
    cluster_write_test [srv 0 port]
}

test "Main db not affected when fail to diskless load" {
    set master [srv 0 "client"]
    set replica [srv -1 "client"]
    set master_id 0
    set replica_id -1

    # Replica: allow reads on this connection, load full syncs via swapdb,
    # and disable AOF/periodic saves. The settings are written to the config
    # file before the replica is restarted further down.
    $replica READONLY
    $replica config set repl-diskless-load swapdb
    $replica config set appendonly no
    $replica config set save ""
    $replica config rewrite

    # Primary: tiny backlog (1024) so the bulk writes below overflow it,
    # diskless sync with no start delay, and a per-key save delay so the
    # RDB transfer is slow enough to be interrupted mid-way.
    $master config set repl-backlog-size 1024
    $master config set repl-diskless-sync yes
    $master config set repl-diskless-sync-delay 0
    $master config set rdb-key-save-delay 10000
    $master config set rdbcompression no
    $master config set appendonly no
    $master config set save ""

    # Write a key that belongs to slot 0
    set slot0_key "06S"
    $master set $slot0_key 1
    wait_for_ofs_sync $master $replica
    assert_equal {1} [$replica get $slot0_key]
    assert_equal $slot0_key [$replica CLUSTER GETKEYSINSLOT 0 1]

    # Save an RDB on the replica, then pause the replica process so it
    # misses everything the primary does next.
    $replica save
    pause_process [srv $replica_id pid]

    # Delete the key from master
    $master del $slot0_key

    # The replica must do a full sync with the master when it comes back:
    # the writes below (10000 values of 1024 bytes) are far larger than the
    # replication backlog, and dumping the RDB will take several seconds.
    set num 10000
    set value [string repeat A 1024]
    set rd [valkey_deferring_client valkey $master_id]
    for {set j 0} {$j < $num} {incr j} {
        $rd set $j $value
    }
    # Drain one reply per pipelined SET so all writes are known to be applied.
    for {set j 0} {$j < $num} {incr j} {
        $rd read
    }
    # Release the deferring client; it is not used again in this test.
    $rd close

    # Start the replica again
    resume_process [srv $replica_id pid]
    restart_server $replica_id true false
    # Fetch the client handle again after the restart and re-issue READONLY
    # on it.
    set replica [srv -1 "client"]
    $replica READONLY

    # Full sync starts; wait until the replica reports that it is loading
    # the new dataset in the background.
    wait_for_condition 500 10 {
        [s $replica_id async_loading] eq 1
    } else {
        fail "Fail to full sync"
    }

    # Pause the master process to abort the in-flight full sync
    pause_process [srv $master_id pid]

    # Wait until the replica detects the disconnection and is no longer
    # in the async loading state.
    wait_for_condition 500 10 {
        [s $replica_id async_loading] eq 0
    } else {
        fail "Fail to stop the full sync"
    }

    # Since we paused the primary node earlier, the replica may enter the
    # cluster-down state because the primary is flagged as pfail. Allow
    # reads while down to prevent errors in the reads below.
    $replica config set cluster-allow-reads-when-down yes

    # Replica keys and keys-to-slots map are both still right: the failed
    # load must not have replaced the main db.
    assert_equal {1} [$replica get $slot0_key]
    assert_equal $slot0_key [$replica CLUSTER GETKEYSINSLOT 0 1]

    # Let the paused master process run again.
    resume_process [srv $master_id pid]
}

} ;# start_cluster