blob: 746da1d85af6159313ebcf5f35ebd7fdae4c5f91 [file] [log] [blame]
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.zookeeper.server.quorum;
import static org.apache.zookeeper.test.ClientBase.CONNECTION_TIMEOUT;
import static org.junit.jupiter.api.Assertions.assertEquals;
import static org.junit.jupiter.api.Assertions.assertFalse;
import static org.junit.jupiter.api.Assertions.assertTrue;
import java.util.ArrayList;
import java.util.HashSet;
import java.util.Set;
import org.apache.zookeeper.PortAssignment;
import org.apache.zookeeper.ZooKeeper;
import org.apache.zookeeper.test.ClientBase;
import org.apache.zookeeper.test.ReconfigTest;
import org.junit.jupiter.api.BeforeEach;
import org.junit.jupiter.api.Test;
// Reconfiguration-recovery tests; the class builds on QuorumPeerTestBase.
public class ReconfigRecoveryTest extends QuorumPeerTestBase {
// NOTE(review): BeforeEach is imported by this file, so this is presumably the per-test setup
// hook, but neither its annotation nor its body is visible in this view - confirm against the
// full file before relying on it.
public void setup() {
/**
 * Reconfiguration recovery - test that a reconfiguration is completed if
 * the leader has a .next file during startup and the new config is not
 * running yet.
 */
public void testNextConfigCompletion() throws Exception {
// Flow: build server lines for three servers, create servers 0 and 1 with the "current" config
// plus a temp dynamic config file, then create server 2 with a config made of the leader's line
// and its own line, and finally check every server's config against allServers.
// 2 servers in current config, 3 in next config
final int SERVER_COUNT = 3;
final int[] clientPorts = new int[SERVER_COUNT];
StringBuilder sb = new StringBuilder();
String server;
// NOTE(review): allServers is read further down (allServers.get(...), testServerHasConfig) but no
// statement that fills it is visible in this view - confirm against the full file.
ArrayList<String> allServers = new ArrayList<String>();
String currentQuorumCfgSection = null, nextQuorumCfgSection;
for (int i = 0; i < SERVER_COUNT; i++) {
clientPorts[i] = PortAssignment.unique();
// each server line takes two further fresh ports in addition to its client port
server = "server." + i + "=localhost:" + PortAssignment.unique() + ":" + PortAssignment.unique()
+ ":participant;localhost:" + clientPorts[i];
sb.append(server + "\n");
// snapshot taken once the lines for servers 0 and 1 have been appended
if (i == 1) {
currentQuorumCfgSection = sb.toString();
nextQuorumCfgSection = sb.toString();
// Both servers 0 and 1 will have the .next config file, which means
// for them that a reconfiguration was in progress when they failed
// and the leader will complete it
MainThread[] mt = new MainThread[SERVER_COUNT];
ZooKeeper[] zk = new ZooKeeper[SERVER_COUNT];
// only servers 0..SERVER_COUNT-2 are created here; the last server is created later
// NOTE(review): no statement that starts mt[i] is visible in this view - confirm.
for (int i = 0; i < SERVER_COUNT - 1; i++) {
mt[i] = new MainThread(i, clientPorts[i], currentQuorumCfgSection, true, "100000000");
// note that we should run the server, shut it down and only then
// simulate a reconfig in progress by writing the temp file, but here no
// other server is competing with them in FLE, so we can skip this step
// (server 2 is booted after FLE ends)
mt[i].writeTempDynamicConfigFile(nextQuorumCfgSection, "200000000");
zk[i] = new ZooKeeper("" + clientPorts[i], ClientBase.CONNECTION_TIMEOUT, this);
assertTrue(ClientBase.waitForServerUp("" + clientPorts[0], CONNECTION_TIMEOUT),
"waiting for server 0 being up");
assertTrue(ClientBase.waitForServerUp("" + clientPorts[1], CONNECTION_TIMEOUT),
"waiting for server 1 being up");
// server 0 is treated as the leader when its quorumPeer.leader field is non-null, else server 1
int leader = mt[0].main.quorumPeer.leader == null ? 1 : 0;
// the new server's config is going to include itself and the current leader
sb = new StringBuilder();
sb.append(allServers.get(leader) + "\n");
sb.append(allServers.get(2) + "\n");
// suppose that this new server never heard about the reconfig proposal
String newServerInitialConfig = sb.toString();
mt[2] = new MainThread(2, clientPorts[2], newServerInitialConfig);
zk[2] = new ZooKeeper("" + clientPorts[2], ClientBase.CONNECTION_TIMEOUT, this);
assertTrue(ClientBase.waitForServerUp("" + clientPorts[2], CONNECTION_TIMEOUT),
"waiting for server 2 being up");
// every server, including the late joiner, is checked against the same allServers list
ReconfigTest.testServerHasConfig(zk[0], allServers, null);
ReconfigTest.testServerHasConfig(zk[1], allServers, null);
ReconfigTest.testServerHasConfig(zk[2], allServers, null);
ReconfigTest.testNormalOperation(zk[0], zk[2]);
ReconfigTest.testNormalOperation(zk[2], zk[1]);
// NOTE(review): the body of this loop is not visible in this view (presumably per-server
// teardown) - confirm against the full file.
for (int i = 0; i < SERVER_COUNT; i++) {
/**
 * Reconfiguration recovery - current config servers discover a .next file,
 * but they're both observers and their ports change in the next config. Suppose
 * that the next config wasn't activated yet. Should complete the reconfiguration.
 */
public void testCurrentServersAreObserversInNextConfig() throws Exception {
// Flow: build a two-participant current config and a five-server next config in which servers
// 0 and 1 are observers on newly allocated ports; run 0 and 1 on the current config, then write
// the next config as their temp dynamic config and bring in servers 2..4 as joiners.
// 2 servers in current config, 5 in next config
final int SERVER_COUNT = 5;
final int[] clientPorts = new int[SERVER_COUNT];
final int[] oldClientPorts = new int[2];
StringBuilder sb = new StringBuilder();
String server;
String currentQuorumCfg, nextQuorumCfgSection;
// NOTE(review): allServersNext is read below (get(i), testServerHasConfig) but no statement
// that fills it is visible in this view - confirm against the full file.
ArrayList<String> allServersNext = new ArrayList<String>();
// current config: servers 0 and 1 as participants, reachable on oldClientPorts
for (int i = 0; i < 2; i++) {
oldClientPorts[i] = PortAssignment.unique();
server = "server." + i + "=localhost:" + PortAssignment.unique() + ":" + PortAssignment.unique()
+ ":participant;localhost:" + oldClientPorts[i];
sb.append(server + "\n");
currentQuorumCfg = sb.toString();
// next config: ports are allocated again, so servers 0 and 1 do not reuse their old ports
sb = new StringBuilder();
String role;
for (int i = 0; i < SERVER_COUNT; i++) {
clientPorts[i] = PortAssignment.unique();
// servers 0 and 1 become observers; servers 2..4 are participants
if (i < 2) {
role = "observer";
} else {
role = "participant";
server = "server." + i + "=localhost:" + PortAssignment.unique() + ":" + PortAssignment.unique() + ":"
+ role + ";localhost:" + clientPorts[i];
sb.append(server + "\n");
nextQuorumCfgSection = sb.toString();
MainThread[] mt = new MainThread[SERVER_COUNT];
ZooKeeper[] zk = new ZooKeeper[SERVER_COUNT];
// run servers 0 and 1 normally
// NOTE(review): no statement that starts mt[i] is visible in this view - confirm.
for (int i = 0; i < 2; i++) {
mt[i] = new MainThread(i, oldClientPorts[i], currentQuorumCfg, true, "100000000");
zk[i] = new ZooKeeper("" + oldClientPorts[i], ClientBase.CONNECTION_TIMEOUT, this);
for (int i = 0; i < 2; i++) {
assertTrue(ClientBase.waitForServerUp("" + oldClientPorts[i], CONNECTION_TIMEOUT * 2),
"waiting for server " + i + " being up");
ReconfigTest.testNormalOperation(zk[0], zk[1]);
// shut them down and then simulate a reboot with a reconfig in progress
// NOTE(review): the body of the following loop (the shutdown itself) is not visible in this view.
for (int i = 0; i < 2; i++) {
// NOTE(review): the assertion below waits for the server to go DOWN, yet its failure message
// says "being up"; the message looks copy-pasted and should probably read "being down".
for (int i = 0; i < 2; i++) {
assertTrue(ClientBase.waitForServerDown("" + oldClientPorts[i], CONNECTION_TIMEOUT * 2),
"waiting for server " + i + " being up");
// the temp dynamic config carries the next config; clients now connect on the new client ports
for (int i = 0; i < 2; i++) {
mt[i].writeTempDynamicConfigFile(nextQuorumCfgSection, "200000000");
zk[i] = new ZooKeeper("" + clientPorts[i], ClientBase.CONNECTION_TIMEOUT, this);
// new members are initialized with current config + the new server
for (int i = 2; i < SERVER_COUNT; i++) {
mt[i] = new MainThread(i, clientPorts[i], currentQuorumCfg + allServersNext.get(i));
zk[i] = new ZooKeeper("" + clientPorts[i], ClientBase.CONNECTION_TIMEOUT, this);
// all five servers must come up on their next-config client ports and report allServersNext
for (int i = 0; i < SERVER_COUNT; i++) {
assertTrue(ClientBase.waitForServerUp("" + clientPorts[i], CONNECTION_TIMEOUT * 2),
"waiting for server " + i + " being up");
ReconfigTest.testServerHasConfig(zk[i], allServersNext, null);
ReconfigTest.testNormalOperation(zk[0], zk[2]);
ReconfigTest.testNormalOperation(zk[4], zk[1]);
// NOTE(review): the body of this loop is not visible in this view (presumably per-server
// teardown) - confirm against the full file.
for (int i = 0; i < SERVER_COUNT; i++) {
/**
 * Reconfiguration recovery - test that if servers in the old config have a
 * .next file but no quorum of the new config is up, then no progress is
 * possible (progress is blocked to ensure safety, as the new config
 * might actually be up but partitioned from the old config).
 */
public void testNextConfigUnreachable() throws Exception {
// Flow: only servers 0 and 1 are created, each with the current config and a temp dynamic config
// naming five servers; after a pause the test asserts that neither of them reports as up.
// 2 servers in current config, 5 in next config
final int SERVER_COUNT = 5;
final int[] clientPorts = new int[SERVER_COUNT];
StringBuilder sb = new StringBuilder();
String server;
String currentQuorumCfgSection = null, nextQuorumCfgSection;
for (int i = 0; i < SERVER_COUNT; i++) {
clientPorts[i] = PortAssignment.unique();
server = "server." + i + "=localhost:" + PortAssignment.unique() + ":" + PortAssignment.unique()
+ ":participant;localhost:" + clientPorts[i];
sb.append(server + "\n");
// snapshot taken once the lines for servers 0 and 1 have been appended
if (i == 1) {
currentQuorumCfgSection = sb.toString();
nextQuorumCfgSection = sb.toString();
MainThread[] mt = new MainThread[SERVER_COUNT];
ZooKeeper[] zk = new ZooKeeper[SERVER_COUNT];
// Both servers 0 and 1 will have the .next config file, which means
// for them that a reconfiguration was in progress when they failed
// NOTE(review): no statement that starts mt[i] is visible in this view - confirm.
for (int i = 0; i < 2; i++) {
mt[i] = new MainThread(i, clientPorts[i], currentQuorumCfgSection, true, "100000000");
// note that we should run the server, shut it down and only then
// simulate a reconfig in progress by writing the temp file, but here no
// other server is competing with them in FLE, so we can skip this step
mt[i].writeTempDynamicConfigFile(nextQuorumCfgSection, "200000000");
zk[i] = new ZooKeeper("" + clientPorts[i], ClientBase.CONNECTION_TIMEOUT, this);
// wait twice the connection timeout before probing, so a server that could start would have
Thread.sleep(CONNECTION_TIMEOUT * 2);
// make sure servers 0, 1 don't come online - this should be the case
// since they can't complete the reconfig
// the probe itself is short (a tenth of the connection timeout) because the long wait is above
for (int i = 0; i < 2; i++) {
assertFalse(ClientBase.waitForServerUp("" + clientPorts[i], CONNECTION_TIMEOUT / 10),
"server " + i + " is up but shouldn't be");
// NOTE(review): the body of this loop is not visible in this view (presumably teardown of the
// two servers that were created) - confirm against the full file.
for (int i = 0; i < 2; i++) {
/**
 * Reconfiguration recovery - test that old config members will join the new
 * config if it's already active, and not try to complete the reconfiguration.
 */
public void testNextConfigAlreadyActive() throws Exception {
// Flow: servers 2..4 are created directly on the next config and exercised; their accepted epoch
// is recorded; servers 0 and 1 are then created with the current config plus a temp dynamic
// config, and the test asserts that the accepted epoch is unchanged on servers 0, 1 and 2.
// 2 servers in current config, 5 in next config
final int SERVER_COUNT = 5;
final int[] clientPorts = new int[SERVER_COUNT];
StringBuilder sb = new StringBuilder();
String server;
String currentQuorumCfgSection = null, nextQuorumCfgSection;
// NOTE(review): allServers is passed to testServerHasConfig below but no statement that fills
// it is visible in this view - confirm against the full file.
ArrayList<String> allServers = new ArrayList<String>();
for (int i = 0; i < SERVER_COUNT; i++) {
clientPorts[i] = PortAssignment.unique();
server = "server." + i + "=localhost:" + PortAssignment.unique() + ":" + PortAssignment.unique()
+ ":participant;localhost:" + clientPorts[i];
sb.append(server + "\n");
// snapshot taken once the lines for servers 0 and 1 have been appended
if (i == 1) {
currentQuorumCfgSection = sb.toString();
nextQuorumCfgSection = sb.toString();
// lets start servers 2, 3, 4 with the new config
MainThread[] mt = new MainThread[SERVER_COUNT];
ZooKeeper[] zk = new ZooKeeper[SERVER_COUNT];
// NOTE(review): no statement that starts mt[i] is visible in this view - confirm.
for (int i = 2; i < SERVER_COUNT; i++) {
mt[i] = new MainThread(i, clientPorts[i], nextQuorumCfgSection, true, "200000000");
zk[i] = new ZooKeeper("" + clientPorts[i], ClientBase.CONNECTION_TIMEOUT, this);
for (int i = 2; i < SERVER_COUNT; i++) {
assertTrue(ClientBase.waitForServerUp("" + clientPorts[i], CONNECTION_TIMEOUT),
"waiting for server " + i + " being up");
ReconfigTest.testNormalOperation(zk[2], zk[3]);
// baseline: server 2's accepted epoch before servers 0 and 1 are brought in
long epoch = mt[2].main.quorumPeer.getAcceptedEpoch();
// Both servers 0 and 1 will have the .next config file, which means
// for them that a reconfiguration was in progress when they failed
// and the leader will complete it.
for (int i = 0; i < 2; i++) {
mt[i] = new MainThread(i, clientPorts[i], currentQuorumCfgSection, true, "100000000");
mt[i].writeTempDynamicConfigFile(nextQuorumCfgSection, "200000000");
zk[i] = new ZooKeeper("" + clientPorts[i], ClientBase.CONNECTION_TIMEOUT, this);
// servers 0 and 1 should connect to all servers, including the one in
// their .next file during startup, and will find the next config and join it
for (int i = 0; i < 2; i++) {
assertTrue(ClientBase.waitForServerUp("" + clientPorts[i], CONNECTION_TIMEOUT * 2),
"waiting for server " + i + " being up");
// make sure they joined the new config without any change to it
// (all three accepted epochs are compared with the baseline captured above)
assertEquals(epoch, mt[0].main.quorumPeer.getAcceptedEpoch());
assertEquals(epoch, mt[1].main.quorumPeer.getAcceptedEpoch());
assertEquals(epoch, mt[2].main.quorumPeer.getAcceptedEpoch());
ReconfigTest.testServerHasConfig(zk[0], allServers, null);
ReconfigTest.testServerHasConfig(zk[1], allServers, null);
ReconfigTest.testNormalOperation(zk[0], zk[2]);
ReconfigTest.testNormalOperation(zk[4], zk[1]);
// NOTE(review): the body of this loop is not visible in this view (presumably per-server
// teardown) - confirm against the full file.
for (int i = 0; i < SERVER_COUNT; i++) {
/**
 * Tests conversion of observer to participant AFTER the new config was already
 * committed. Old config: servers 0 (participant), 1 (participant), 2
 * (observer). New config: servers 2 (participant), 3 (participant). We start
 * server 2 with the old config and start server 3 with the new config. All other
 * servers are down. In order to terminate FLE, server 3 must 'convince'
 * server 2 to adopt the new config and turn into a participant.
 */
public void testObserverConvertedToParticipantDuringFLE() throws Exception {
// Flow: the old config covers servers 0..2 (built by generateConfig), the new config covers
// servers 2 and 3 as participants; only servers 2 (old config) and 3 (new config) are created,
// and both are then checked against the new config.
final int SERVER_COUNT = 4;
// three ports per server: [0] and [1] go into the server address, [2] is the client port
int[][] ports = generatePorts(SERVER_COUNT);
String currentQuorumCfgSection, nextQuorumCfgSection;
// generate old config string
// NOTE(review): the description preceding this method says server 2 is an observer in the old
// config, but no statement adding an id to `observers` is visible in this view - confirm.
Set<Integer> observers = new HashSet<Integer>();
StringBuilder sb = generateConfig(3, ports, observers);
currentQuorumCfgSection = sb.toString();
// generate new config string
// NOTE(review): allServersNext is passed to testServerHasConfig below but no statement that
// fills it is visible in this view - confirm against the full file.
ArrayList<String> allServersNext = new ArrayList<String>();
sb = new StringBuilder();
for (int i = 2; i < SERVER_COUNT; i++) {
String server = "server." + i + "=localhost:" + ports[i][0] + ":" + ports[i][1]
+ ":participant;localhost:" + ports[i][2];
sb.append(server + "\n");
nextQuorumCfgSection = sb.toString();
MainThread[] mt = new MainThread[SERVER_COUNT];
ZooKeeper[] zk = new ZooKeeper[SERVER_COUNT];
// NOTE(review): no statement that starts mt[2] or mt[3] is visible in this view - confirm.
// start server 2 with old config, where it is an observer
mt[2] = new MainThread(2, ports[2][2], currentQuorumCfgSection, true, "100000000");
zk[2] = new ZooKeeper("" + ports[2][2], ClientBase.CONNECTION_TIMEOUT, this);
// start server 3 with new config
mt[3] = new MainThread(3, ports[3][2], nextQuorumCfgSection, true, "200000000");
zk[3] = new ZooKeeper("" + ports[3][2], ClientBase.CONNECTION_TIMEOUT, this);
for (int i = 2; i < SERVER_COUNT; i++) {
assertTrue(ClientBase.waitForServerUp("" + ports[i][2], CONNECTION_TIMEOUT * 2),
"waiting for server " + i + " being up");
ReconfigTest.testServerHasConfig(zk[i], allServersNext, null);
// NOTE(review): the next four lines are the argument tails of two calls whose opening is not
// visible in this view; assertEquals is imported, so they are presumably assertEquals(expected,
// actual) comparing the new config text plus "version=200000000" with what each server reports.
nextQuorumCfgSection + "version=200000000",
ReconfigTest.testServerHasConfig(zk[2], null, null));
nextQuorumCfgSection + "version=200000000",
ReconfigTest.testServerHasConfig(zk[3], null, null));
// NOTE(review): both arguments of the first call are zk[2]; confirm this is intentional.
ReconfigTest.testNormalOperation(zk[2], zk[2]);
ReconfigTest.testNormalOperation(zk[3], zk[2]);
// NOTE(review): the body of this loop is not visible in this view (presumably teardown of
// servers 2 and 3) - confirm against the full file.
for (int i = 2; i < SERVER_COUNT; i++) {
/**
 * Tests conversion of observer to participant during reconfig recovery, when the
 * new config was not committed yet. Old config: servers 0 (participant), 1
 * (participant), 2 (observer). New config: servers 2 (participant), 3
 * (participant). We start servers 0, 1, 2 with the old config and a .next
 * file indicating a reconfig in progress. We start server 3 with the old config
 * + itself in its config file. In this scenario server 2 can't be converted to
 * participant during reconfig since we don't gossip about proposed
 * configurations, only about committed ones. This tests that the new config can
 * be completed, which requires server 2's ack for the newleader message,
 * even though it's an observer.
 */
public void testCurrentObserverIsParticipantInNewConfig() throws Exception {
// Flow: servers 0..2 are created on the old config and exercised, then a new config covering
// servers 2 and 3 is written as their temp dynamic config; server 3 is created with the old
// config plus one extra server line, and servers 2 and 3 are checked against the new config.
final int SERVER_COUNT = 4;
// three ports per server: [0] and [1] go into the server address, [2] is the client port
int[][] ports = generatePorts(SERVER_COUNT);
String currentQuorumCfg, nextQuorumCfgSection;
// generate old config string
// NOTE(review): the description preceding this method says server 2 is an observer in the old
// config, but no statement adding an id to `observers` is visible in this view - confirm.
Set<Integer> observers = new HashSet<Integer>();
StringBuilder sb = generateConfig(3, ports, observers);
currentQuorumCfg = sb.toString();
// Run servers 0..2 for a while
MainThread[] mt = new MainThread[SERVER_COUNT];
ZooKeeper[] zk = new ZooKeeper[SERVER_COUNT];
// NOTE(review): no statement that starts mt[i] is visible in this view - confirm.
for (int i = 0; i <= 2; i++) {
mt[i] = new MainThread(i, ports[i][2], currentQuorumCfg, true, "100000000");
zk[i] = new ZooKeeper("" + ports[i][2], ClientBase.CONNECTION_TIMEOUT, this);
// note: the write/read check runs before the explicit waitForServerUp assertions below
ReconfigTest.testNormalOperation(zk[0], zk[2]);
for (int i = 0; i <= 2; i++) {
assertTrue(ClientBase.waitForServerUp("" + ports[i][2], CONNECTION_TIMEOUT * 2),
"waiting for server " + i + " being up");
// shut servers 0..2 down
// NOTE(review): the body of the following loop (the shutdown itself) is not visible in this view.
for (int i = 0; i <= 2; i++) {
// generate new config string
// NOTE(review): allServersNext is read below (get(1), testServerHasConfig) but no statement
// that fills it is visible in this view - confirm against the full file.
ArrayList<String> allServersNext = new ArrayList<String>();
sb = new StringBuilder();
for (int i = 2; i < SERVER_COUNT; i++) {
String server = "server." + i + "=localhost:" + ports[i][0] + ":" + ports[i][1]
+ ":participant;localhost:" + ports[i][2];
sb.append(server + "\n");
nextQuorumCfgSection = sb.toString();
// simulate reconfig in progress - servers 0..2 have a temp reconfig
// file when they boot
for (int i = 0; i <= 2; i++) {
mt[i].writeTempDynamicConfigFile(nextQuorumCfgSection, "200000000");
zk[i] = new ZooKeeper("" + ports[i][2], ClientBase.CONNECTION_TIMEOUT, this);
// new server 3 has still its invalid joiner config - everyone in old
// config + itself
// (index 1 of allServersNext is used as server 3's own line, since the new-config loop above
// iterates over servers 2 and 3 in that order - assuming the list is filled in that loop)
mt[3] = new MainThread(3, ports[3][2], currentQuorumCfg + allServersNext.get(1));
zk[3] = new ZooKeeper("" + ports[3][2], ClientBase.CONNECTION_TIMEOUT, this);
// only the new-config members (servers 2 and 3) are waited for and checked here
for (int i = 2; i < SERVER_COUNT; i++) {
assertTrue(ClientBase.waitForServerUp("" + ports[i][2], CONNECTION_TIMEOUT * 3),
"waiting for server " + i + " being up");
ReconfigTest.testServerHasConfig(zk[i], allServersNext, null);
ReconfigTest.testNormalOperation(zk[0], zk[2]);
ReconfigTest.testNormalOperation(zk[3], zk[1]);
// NOTE(review): the next four lines are the argument tails of two calls whose opening is not
// visible in this view; assertEquals is imported, so they are presumably assertEquals(expected,
// actual) comparing the new config text plus "version=200000000" with what each server reports.
nextQuorumCfgSection + "version=200000000",
ReconfigTest.testServerHasConfig(zk[2], null, null));
nextQuorumCfgSection + "version=200000000",
ReconfigTest.testServerHasConfig(zk[3], null, null));
// NOTE(review): the body of this loop is not visible in this view (presumably per-server
// teardown) - confirm against the full file.
for (int i = 0; i < SERVER_COUNT; i++) {
* Generates 3 ports per server
public static int[][] generatePorts(int numServers) {
int[][] ports = new int[numServers][];
for (int i = 0; i < numServers; i++) {
ports[i] = new int[3];
for (int j = 0; j < 3; j++) {
ports[i][j] = PortAssignment.unique();
return ports;
* Creates a configuration string for servers 0..numServers-1 Ids in
* observerIds correspond to observers, other ids are for participants.
public static StringBuilder generateConfig(int numServers, int[][] ports, Set<Integer> observerIds) {
StringBuilder sb = new StringBuilder();
for (int i = 0; i < numServers; i++) {
String server = "server." + i + "=localhost:" + ports[i][0] + ":" + ports[i][1] + ":"
+ (observerIds.contains(i) ? "observer" : "participant")
+ ";localhost:" + ports[i][2];
sb.append(server + "\n");
return sb;