libdb/test/tcl/repmgr010.tcl

167 lines
5.6 KiB
Tcl

# See the file LICENSE for redistribution information.
#
# Copyright (c) 2007, 2011 Oracle and/or its affiliates. All rights reserved.
#
# $Id$
#
# TEST repmgr010
# TEST Acknowledgement policy and timeout test.
# TEST
# TEST Verify that "quorum" acknowledgement policy succeeds with fewer than
# TEST nsites running. Verify that "all" acknowledgement policy results in
# TEST ack failures with fewer than nsites running.
# TEST
# TEST Run for btree only because access method shouldn't matter.
# TEST
proc repmgr010 { { niter 100 } { tnum "010" } args } {
	# Driver for the repmgr ack policy and timeout test.
	#
	#	niter	number of transactions handed to repmgr010_sub
	#	tnum	test number used in progress messages
	#	args	extra arguments, run through convert_args and
	#		forwarded to repmgr010_sub
	#
	# include.tcl is sourced here; it is what supplies
	# is_freebsd_test to this scope.
	source ./include.tcl

	# Replication manager tests are skipped outright on FreeBSD.
	if { $is_freebsd_test == 1 } {
		puts "Skipping replication manager test on FreeBSD platform."
		return
	}

	# Only btree is exercised by this test.
	set am "btree"
	set largs [convert_args $am $args]

	puts "Repmgr$tnum ($am): repmgr ack policy and timeout test."
	repmgr010_sub $am $niter $tnum $largs
}
# repmgr010_sub --
#	Body of the repmgr010 test.  Starts a master and two clients with
#	the "quorum" ack policy, checks that no ack failures are recorded
#	with all sites up and with one client down, then switches the
#	sites to the "all" ack policy and checks that ack failures are
#	recorded once a client is down.
#
# Arguments:
#	method	access method passed through to rep_test
#	niter	number of transactions in the first set; the later sets
#		run niter/10 transactions (but never fewer than 1)
#	tnum	test number used in progress messages
#	largs	extra arguments appended to every rep_test call
proc repmgr010_sub { method niter tnum largs } {
	global testdir
	global rep_verbose
	global verbose_type

	set nsites 3

	# Integer division yields 0 when niter < 10; clamp so the second
	# and third sets always run at least one transaction.  Without
	# this, the final "some ack failures" check would be run after a
	# set that asked for zero transactions.
	set small_iter [expr {$niter / 10}]
	if { $small_iter < 1 } {
		set small_iter 1
	}

	set verbargs ""
	if { $rep_verbose == 1 } {
		set verbargs " -verbose {$verbose_type on} "
	}

	env_cleanup $testdir
	set ports [available_ports $nsites]

	set masterdir $testdir/MASTERDIR
	set clientdir $testdir/CLIENTDIR
	set clientdir2 $testdir/CLIENTDIR2

	file mkdir $masterdir
	file mkdir $clientdir
	file mkdir $clientdir2

	# Use different connection retry timeout values to handle any
	# collisions from starting sites at the same time by retrying
	# at different times.

	puts "\tRepmgr$tnum.a: Start master, two clients, ack policy quorum."
	# Open a master.  The ack timeout is set explicitly to 5 seconds.
	set ma_envcmd "berkdb_env_noerr -create $verbargs \
	    -errpfx MASTER -home $masterdir -txn -rep -thread"
	set masterenv [eval $ma_envcmd]
	$masterenv repmgr -ack quorum \
	    -timeout {connection_retry 20000000} \
	    -timeout {ack 5000000} \
	    -local [list localhost [lindex $ports 0]] \
	    -start master

	# Open first client
	set cl_envcmd "berkdb_env_noerr -create $verbargs \
	    -errpfx CLIENT -home $clientdir -txn -rep -thread"
	set clientenv [eval $cl_envcmd]
	$clientenv repmgr -ack quorum \
	    -timeout {connection_retry 10000000} \
	    -local [list localhost [lindex $ports 1]] \
	    -remote [list localhost [lindex $ports 0]] \
	    -remote [list localhost [lindex $ports 2]] \
	    -start client
	await_startup_done $clientenv

	# Open second client
	set cl2_envcmd "berkdb_env_noerr -create $verbargs \
	    -errpfx CLIENT2 -home $clientdir2 -txn -rep -thread"
	set clientenv2 [eval $cl2_envcmd]
	$clientenv2 repmgr -ack quorum \
	    -timeout {connection_retry 5000000} \
	    -local [list localhost [lindex $ports 2]] \
	    -remote [list localhost [lindex $ports 0]] \
	    -remote [list localhost [lindex $ports 1]] \
	    -start client
	await_startup_done $clientenv2

	puts "\tRepmgr$tnum.b: Run first set of transactions at master."
	set start 0
	eval rep_test $method $masterenv NULL $niter $start 0 0 $largs
	incr start $niter

	#
	# Special verification needed for quorum ack policy.  Check the
	# master's count of ack failures (perm_failed events); the
	# master's ack timeout was set to 5 seconds above.  Quorum only
	# guarantees that transactions replicated to one site or the
	# other, so test for this condition instead of both sites.
	#
	# NOTE(review): no explicit wait is performed before reading the
	# statistic; confirm that none is needed once rep_test returns.
	#
	puts "\tRepmgr$tnum.c: Verify both client databases, no ack failures."
	error_check_good quorum_perm_failed1 \
	    [stat_field $masterenv repmgr_stat "Acknowledgement failures"] 0
	# Each verification is allowed to fail individually; catch leaves
	# the result (or error message) in ver1/ver2, and an empty string
	# is treated as success for that client.
	catch {rep_verify \
	    $masterdir $masterenv $clientdir $clientenv 1 1 1} ver1
	catch {rep_verify \
	    $masterdir $masterenv $clientdir2 $clientenv2 1 1 1} ver2
	error_check_good onesite [expr {[string length $ver1] == 0 || \
	    [string length $ver2] == 0}] 1

	puts "\tRepmgr$tnum.d: Shut down first client."
	error_check_good client_close [$clientenv close] 0

	puts "\tRepmgr$tnum.e: Run second set of transactions at master."
	eval rep_test $method $masterenv NULL $small_iter $start 0 0 $largs
	# NOTE(review): start is advanced by niter although only
	# small_iter transactions were just run; presumably harmless
	# since it only skips further ahead -- confirm before changing.
	incr start $niter

	puts "\tRepmgr$tnum.f: Verify client database, no ack failures."
	error_check_good quorum_perm_failed2 \
	    [stat_field $masterenv repmgr_stat "Acknowledgement failures"] 0
	rep_verify $masterdir $masterenv $clientdir2 $clientenv2 1 1 1

	puts "\tRepmgr$tnum.g: Adjust all sites to ack policy all."
	# Reopen first client with ack policy all
	set cl_envcmd "berkdb_env_noerr -create $verbargs \
	    -errpfx CLIENT -home $clientdir -txn -rep -thread"
	# Open -recover to clear env region, including startup_done value.
	set clientenv [eval $cl_envcmd -recover]
	$clientenv repmgr -ack all \
	    -timeout {connection_retry 10000000} \
	    -local [list localhost [lindex $ports 1]] \
	    -remote [list localhost [lindex $ports 0]] \
	    -remote [list localhost [lindex $ports 2]] \
	    -start client
	await_startup_done $clientenv

	# Adjust other sites to ack policy all
	$masterenv repmgr -ack all
	$clientenv2 repmgr -ack all

	puts "\tRepmgr$tnum.h: Shut down first client."
	error_check_good client_close [$clientenv close] 0
	# Baseline count, so the later check only looks at failures
	# recorded during the third set of transactions.
	set init_perm_failed \
	    [stat_field $masterenv repmgr_stat "Acknowledgement failures"]

	#
	# Use of -ack all guarantees replication complete before repmgr send
	# function returns and rep_test finishes.
	#
	puts "\tRepmgr$tnum.i: Run third set of transactions at master."
	eval rep_test $method $masterenv NULL $small_iter $start 0 0 $largs

	puts "\tRepmgr$tnum.j: Verify client database, some ack failures."
	rep_verify $masterdir $masterenv $clientdir2 $clientenv2 1 1 1
	error_check_good all_perm_failed [expr {\
	    [stat_field $masterenv repmgr_stat "Acknowledgement failures"] \
	    > $init_perm_failed}] 1

	error_check_good client2_close [$clientenv2 close] 0
	error_check_good masterenv_close [$masterenv close] 0
}