# See the file LICENSE for redistribution information.
#
# Copyright (c) 2007, 2013 Oracle and/or its affiliates. All rights reserved.
#
# $Id$
#
# TEST rep074
# TEST Verify replication withstands send errors processing requests.
# TEST
# TEST Run for btree only because access method shouldn't matter.
# TEST
# rep074 --
#	Entry point for test rep074.  Restricts the run to the btree access
#	method, reports the configuration in effect, and then invokes
#	rep074_sub once per log-type pairing returned by create_logsets.
#
# Arguments:
#	method	access method under test
#	niter	iteration count handed to rep074_sub (default 20)
#	tnum	test number used in progress messages (default "074")
#	args	extra arguments, run through convert_args before use
#
# Results:
#	Returns "btree" when $checking_valid_methods is true; otherwise
#	returns an empty result.
proc rep074 { method { niter 20 } { tnum "074" } args } {
	source ./include.tcl
	global databases_in_memory
	global repfiles_in_memory
	global env_private

	# When only the list of valid methods is wanted, report btree and stop.
	if { $checking_valid_methods } {
		return btree
	}
	# Every method other than btree is skipped.
	if { [is_btree $method] == 0 } {
		puts "Rep$tnum: skipping for non-btree method $method."
		return
	}

	set args [convert_args $method $args]
	set logsets [create_logsets 2]

	# Describe where the databases live: on disk or named in-memory.
	if { $databases_in_memory } {
		# NOTE(review): non-btree methods have already returned above,
		# so this guard presumably never fires -- confirm against
		# is_queueext before removing it.
		if { [is_queueext $method] } {
			puts -nonewline "Skipping rep$tnum for method "
			puts "$method with named in-memory databases."
			return
		}
		set db_desc "using named in-memory databases"
	} else {
		set db_desc "using on-disk databases"
	}

	# Describe where the replication files live.
	if { $repfiles_in_memory } {
		set rep_desc "and in-memory replication files"
	} else {
		set rep_desc "and on-disk replication files"
	}

	# Mention a private environment only when one is in use.
	if { $env_private } {
		set priv_desc "with private env"
	} else {
		set priv_desc ""
	}

	# One sub-test run per (master log type, client log type) pair.
	foreach logpair $logsets {
		puts "Rep$tnum ($method): Test of send errors processing\
		    requests $db_desc $rep_desc $priv_desc."
		puts "Rep$tnum: Master logs are [lindex $logpair 0]"
		puts "Rep$tnum: Client logs are [lindex $logpair 1]"
		rep074_sub $method $niter $tnum $logpair $args
	}
}
# rep074_sub --
#	Run rep074 once for a single master/client log configuration: bring
#	a client up against a master whose transport callback is
#	rep074_replsend, make that callback fail part-way through the reply
#	to the client's LOG_REQ, check that message processing still reports
#	success, then check that the client completes startup once further
#	master activity lets it re-request what it is missing.
#
# Arguments:
#	method	access method, passed through to rep_test
#	niter	iteration count for each rep_test call; niter / 2 is the
#		number of master sends allowed before the simulated failure
#	tnum	test number used in progress messages
#	logset	two-element list: master log type, then client log type
#	largs	extra arguments appended to each rep_test call
proc rep074_sub { method niter tnum logset largs } {
	global testdir
	global rep074_failure_count
	global repfiles_in_memory
	global env_private
	global rep_verbose
	global verbose_type

	# A negative count makes rep074_replsend forward every message.
	set rep074_failure_count -1

	set verbargs ""
	if { $rep_verbose == 1 } {
		set verbargs " -verbose {$verbose_type on} "
	}

	set repmemargs ""
	if { $repfiles_in_memory } {
		set repmemargs "-rep_inmem_files "
	}

	set privargs ""
	if { $env_private == 1 } {
		set privargs " -private "
	}

	env_cleanup $testdir

	replsetup $testdir/MSGQUEUEDIR

	set masterdir $testdir/MASTERDIR
	set clientdir $testdir/CLIENTDIR

	file mkdir $masterdir
	file mkdir $clientdir

	set m_logtype [lindex $logset 0]
	set c_logtype [lindex $logset 1]

	# In-memory logs require a large log buffer, and cannot
	# be used with -txn nosync.  Adjust the args for master
	# and client.
	set m_logargs [adjust_logargs $m_logtype]
	set c_logargs [adjust_logargs $c_logtype]
	set m_txnargs [adjust_txnargs $m_logtype]
	set c_txnargs [adjust_txnargs $c_logtype]

	# Open a master.  Its transport callback is rep074_replsend so that
	# sends from the master can be made to fail on demand.
	repladd 1
	set ma_envcmd "berkdb_env_noerr -create $verbargs -errpfx MASTER \
	    -home $masterdir $m_logargs $m_txnargs $repmemargs $privargs \
	    -rep_transport \[list 1 rep074_replsend\]"
	set masterenv [eval $ma_envcmd -rep_master]

	# Create some new records, so that the master will have something
	# substantial to say when asked for LOG_REQ.
	#
	puts "\tRep$tnum.a: Running rep_test in replicated env."
	eval rep_test $method $masterenv NULL $niter 0 0 0 $largs

	# Open a client.  It uses the plain replsend transport.
	repladd 2
	set cl_envcmd "berkdb_env_noerr -create $verbargs -errpfx CLIENT \
	    -home $clientdir $c_logargs $c_txnargs $repmemargs $privargs \
	    -rep_transport \[list 2 replsend\]"
	set clientenv [eval $cl_envcmd -rep_client]
	set envlist "{$masterenv 1} {$clientenv 2}"

	# Bring the client online by processing the startup messages.  This
	# will cause the client to send a request to the master.
	#
	# In the first cycle, the client gets NEWMASTER and sends an
	# UPDATE_REQ.  In the second cycle, the master answers the UPDATE_REQ
	# with an UPDATE, and the client sends a PAGE_REQ.  Third, once we've
	# gotten pages, we send a LOG_REQ.
	#
	# 1. NEWCLIENT -> NEWMASTER -> UPDATE_REQ
	# 2. UPDATE -> PAGE_REQ
	# 3. PAGE -> LOG_REQ
	#
	puts "\tRep$tnum.b: NEWMASTER -> UPDATE_REQ"
	proc_msgs_once $envlist
	puts "\tRep$tnum.c: UPDATE -> PAGE_REQ"
	proc_msgs_once $envlist
	puts "\tRep$tnum.d: PAGE -> LOG_REQ"
	proc_msgs_once $envlist

	# Force a sending error at the master while processing the LOG_REQ.
	# We should ignore it, and return success to rep_process_message.
	#
	puts "\tRep$tnum.e: Simulate a send error."
	# The expression is braced so that $niter is substituted exactly once
	# (by expr itself) and the expression can be byte-compiled.
	set rep074_failure_count [expr {$niter / 2}]
	proc_msgs_once $envlist NONE errorp

	puts "\tRep$tnum.f: Check for good return from rep_process_msg."
	error_check_good rep_resilient $errorp 0

	# Since we interrupted the flow with the simulated error, we don't
	# have the log records we need yet.
	#
	error_check_bad startupdone \
	    [stat_field $clientenv rep_stat "Startup complete"] 1

	#
	# Run some more new txns at the master, so that the client eventually
	# decides to request the remainder of the LOG_REQ response that it's
	# missing.  Pause for a second to make sure we reach the lower
	# threshold for re-request on fast machines.  We need to force a
	# checkpoint because we need to create a gap, and then pause to
	# reach the rerequest threshold.
	#
	# Turn failure simulation back off before generating more traffic.
	set rep074_failure_count -1
	$masterenv txn_checkpoint -force
	process_msgs $envlist
	tclsleep 1
	eval rep_test $method $masterenv NULL $niter 0 0 0 $largs
	process_msgs $envlist
	error_check_good startupdone \
	    [stat_field $clientenv rep_stat "Startup complete"] 1

	$masterenv close
	$clientenv close
	replclose $testdir/MSGQUEUEDIR
}
# rep074_replsend --
#	Transport callback that wraps replsend and can simulate a send
#	failure, driven by the global rep074_failure_count:
#
#	  count < 0	failure simulation is off; every message is forwarded.
#	  count > 0	that many more messages are forwarded normally, the
#			count dropping by one for each.
#	  count == 0	nothing is sent and an error value is returned; the
#			count is left at 0, so this continues until the
#			count is changed elsewhere.
#
# Arguments:
#	control rec fromid toid flags lsn
#		passed unchanged to replsend
#
# Results:
#	Whatever replsend returns, or 1 for a simulated failure.
proc rep074_replsend { control rec fromid toid flags lsn } {
	global rep074_failure_count

	# Budget exhausted: report an arbitrary non-zero value as the error.
	if { $rep074_failure_count == 0 } {
		return 1
	}

	# Still counting down towards the failure: use up one send.
	if { $rep074_failure_count > 0 } {
		incr rep074_failure_count -1
	}

	return [replsend $control $rec $fromid $toid $flags $lsn]
}
|