2014-02-19 10:26:23 +01:00
|
|
|
# Check the basic monitoring and failover capabilities.
|
|
|
|
|
2014-02-20 16:57:51 +01:00
|
|
|
source "../sentinel-tests/includes/init-tests.tcl"
|
2014-02-18 11:53:54 +01:00
|
|
|
|
|
|
|
test "Sentinels are able to auto-discover other sentinels" {
    # Number of Sentinel instances known to the harness. Later tests in
    # this file read $sentinels too, so the variable name must not change.
    set sentinels [llength $::sentinel_instances]

    # Poll every Sentinel until the number of peers it reports for
    # "mymaster" equals all the Sentinels minus itself.
    foreach_sentinel_id id {
        wait_for_condition 100 50 {
            [dict get [S $id SENTINEL MASTER mymaster] num-other-sentinels] == $sentinels - 1
        } else {
            fail "At least some sentinel can't detect some other sentinel"
        }
    }
}
|
2014-02-18 16:31:52 +01:00
|
|
|
|
|
|
|
test "Sentinels are able to auto-discover slaves" {
    # Poll every Sentinel until the slave count it reports for "mymaster"
    # matches $redis_slaves.
    # NOTE(review): $redis_slaves is not set in this file; presumably it
    # comes from the sourced init script -- confirm.
    foreach_sentinel_id id {
        wait_for_condition 100 50 {
            [dict get [S $id SENTINEL MASTER mymaster] num-slaves] == $redis_slaves
        } else {
            fail "At least some sentinel can't detect some slave"
        }
    }
}
|
|
|
|
|
|
|
|
test "Basic failover works if the master is down" {
    # Sanity check: the port Sentinel 0 advertises for "mymaster" must be
    # the port of the instance we currently consider the master.
    set old_port [RI $master_id tcp_port]
    set addr [S 0 SENTINEL GET-MASTER-ADDR-BY-NAME mymaster]
    assert {[lindex $addr 1] == $old_port}

    # Stall the master with DEBUG SLEEP so that it looks down.
    R $master_id debug sleep 10

    # Every Sentinel has to start advertising a different port for the
    # master, i.e. it has learned about the failover.
    foreach_sentinel_id id {
        wait_for_condition 100 50 {
            [lindex [S $id SENTINEL GET-MASTER-ADDR-BY-NAME mymaster] 1] != $old_port
        } else {
            fail "At least one Sentinel did not received failover info"
        }
    }

    # Record the new master address and instance id; the tests that follow
    # read both $addr and $master_id.
    set addr [S 0 SENTINEL GET-MASTER-ADDR-BY-NAME mymaster]
    set master_id [get_instance_id_by_port redis [lindex $addr 1]]
}
|
|
|
|
|
|
|
|
# The test title embeds the address stored in $addr by the previous test.
test "New master [join $addr {:}] role matches" {
    # The instance selected as the new master must report the master role.
    assert {[RI $master_id role] eq "master"}
}
|
2014-02-18 17:03:56 +01:00
|
|
|
|
|
|
|
test "All the other slaves now point to the new master" {
    foreach_redis_id id {
        # Skip instance 0 (the next test checks it separately as the old
        # master) and the new master itself; every other instance must end
        # up replicating from the port stored in $addr.
        if {$id != 0 && $id != $master_id} {
            wait_for_condition 1000 50 {
                [RI $id master_port] == [lindex $addr 1]
            } else {
                fail "Redis ID $id not configured to replicate with new master"
            }
        }
    }
}
|
|
|
|
|
|
|
|
test "The old master eventually gets reconfigured as a slave" {
    # Instance 0 is addressed here as the old master: wait until it
    # reports the new master's port as its own replication target.
    wait_for_condition 1000 50 {
        [RI 0 master_port] == [lindex $addr 1]
    } else {
        fail "Old master not reconfigured as slave of new master"
    }
}
|
2014-02-19 09:44:38 +01:00
|
|
|
|
|
|
|
test "ODOWN is not possible without enough Sentinels reports" {
    # Ask for one more agreeing Sentinel than actually exists, so the
    # quorum can never be reached. The expression is braced so that it is
    # substituted only once and can be byte-compiled.
    foreach_sentinel_id id {
        S $id SENTINEL SET mymaster quorum [expr {$sentinels + 1}]
    }

    # Sanity check: Sentinel 0 advertises the current master's port.
    # $old_port is also read by the tests that follow.
    set old_port [RI $master_id tcp_port]
    set addr [S 0 SENTINEL GET-MASTER-ADDR-BY-NAME mymaster]
    assert {[lindex $addr 1] == $old_port}

    # Stall the master with DEBUG SLEEP so that it looks down.
    R $master_id debug sleep 10

    # Make sure failover did not happen.
    set addr [S 0 SENTINEL GET-MASTER-ADDR-BY-NAME mymaster]
    assert {[lindex $addr 1] == $old_port}
}
|
|
|
|
|
|
|
|
test "Failover is not possible without majority agreement" {
    # Put the quorum back to $quorum on every Sentinel.
    foreach_sentinel_id id {
        S $id SENTINEL SET mymaster quorum $quorum
    }

    # Make a majority of Sentinels (ids 0 .. $quorum-1) stop monitoring
    # the master.
    for {set id 0} {$id < $quorum} {incr id} {
        S $id SENTINEL REMOVE mymaster
    }

    # Stall the master with DEBUG SLEEP so that it looks down.
    R $master_id debug sleep 10

    # Make sure failover did not happen. Sentinel $quorum is the first one
    # that still monitors the master; $old_port was set by the previous test.
    set addr [S $quorum SENTINEL GET-MASTER-ADDR-BY-NAME mymaster]
    assert {[lindex $addr 1] == $old_port}

    # Cleanup: make the removed Sentinels monitor the master again, then
    # set down-after-milliseconds on the re-created entry.
    for {set id 0} {$id < $quorum} {incr id} {
        S $id SENTINEL MONITOR mymaster \
            [get_instance_attrib redis $master_id host] \
            [get_instance_attrib redis $master_id port] \
            $quorum
        S $id SENTINEL SET mymaster down-after-milliseconds 2000
    }
}
|
|
|
|
|
|
|
|
test "Failover works if we configure for absolute agreement" {
    # Require every single Sentinel to agree before the master is
    # considered objectively down.
    foreach_sentinel_id id {
        S $id SENTINEL SET mymaster quorum $sentinels
    }

    # Wait for Sentinels to monitor the master again.
    # NOTE(review): a small info-refresh value is presumably taken as proof
    # that the Sentinel is polling the master again -- confirm.
    foreach_sentinel_id id {
        wait_for_condition 1000 50 {
            [dict get [S $id SENTINEL MASTER mymaster] info-refresh] < 100000
        } else {
            fail "At least one Sentinel is not monitoring the master"
        }
    }

    # Stall the master with DEBUG SLEEP so that it looks down.
    R $master_id debug sleep 10

    # Every Sentinel must eventually advertise a port other than
    # $old_port, which still holds the value set by an earlier test.
    foreach_sentinel_id id {
        wait_for_condition 1000 50 {
            [lindex [S $id SENTINEL GET-MASTER-ADDR-BY-NAME mymaster] 1] != $old_port
        } else {
            fail "At least one Sentinel did not received failover info"
        }
    }

    # Record the new master address and instance id for the next test.
    set addr [S 0 SENTINEL GET-MASTER-ADDR-BY-NAME mymaster]
    set master_id [get_instance_id_by_port redis [lindex $addr 1]]

    # Set the min ODOWN agreement back to strict majority.
    foreach_sentinel_id id {
        S $id SENTINEL SET mymaster quorum $quorum
    }
}
|
|
|
|
|
2014-02-19 10:08:49 +01:00
|
|
|
# The test title embeds the address stored in $addr by the previous test.
test "New master [join $addr {:}] role matches" {
    # The instance selected by the second failover must report the master
    # role.
    assert {[RI $master_id role] eq "master"}
}
|