mongo/jstests/replsets/catchup_takeover_one_high_p...

117 lines
4.3 KiB
JavaScript

// Test to ensure that a catchup takeover runs even if the node performing it
// isn't the highest priority node, and that once the high priority node is
// caught up, it becomes primary again.
// 3-node replica set with one high priority node (node 2).
// Start replica set. Make node 0 primary and stop the replication
// for the high priority node as well as isolate it. Have the
// primary write something so node 2 is more than 2 seconds behind.
// Write something else to ensure the remaining node (node 1) is also lagged.
// Reconnect the high priority node to the other nodes and make
// the lagged node (node 1) the next primary.
// Confirm that the most up-to-date node (node 0) becomes primary.
// Let the highest priority node catch up and then confirm
// that it becomes primary.
import {ReplSetTest} from "jstests/libs/replsettest.js";
import {restartServerReplication, stopServerReplication} from "jstests/libs/write_concern_util.js";
// Phase 1: bring up a 3-node replica set in which only node 2 carries a
// raised priority, and wait for that node to be elected primary.
const name = "catchup_takeover_one_high_priority";
const replSet = new ReplSetTest({name, nodes: 3, useBridge: true});
const nodenames = replSet.nodeList();
const nodes = replSet.startSet();

// Nodes 0 and 1 keep the default priority; node 2 is given priority 2.
const initialConfig = {
    _id: name,
    members: [
        {_id: 0, host: nodenames[0]},
        {_id: 1, host: nodenames[1]},
        {_id: 2, host: nodenames[2], priority: 2},
    ],
};
replSet.initiate(initialConfig, null, {initiateWithDefaultElectionTimeout: true});

// Block until node 2 reports PRIMARY.
replSet.waitForState(2, ReplSetTest.State.PRIMARY, replSet.timeoutMS);
jsTestLog("node 2 is now primary");

// The default write concern is majority, and catchup cannot be tested properly
// with majority writes, so lower the cluster-wide default to w: 1. The
// command itself is still issued with a majority write concern.
const initialPrimary = replSet.getPrimary();
const lowerDefaultWriteConcernCmd = {
    setDefaultRWConcern: 1,
    defaultWriteConcern: {w: 1},
    writeConcern: {w: "majority"},
};
assert.commandWorked(initialPrimary.adminCommand(lowerDefaultWriteConcernCmd));

// Let data and config settle before the topology is disturbed.
replSet.awaitReplication();
replSet.waitForConfigReplication(nodes[2]);
// Phase 2: freeze replication on node 2 and cut it off from both other
// members so that it cannot do a priority takeover.
const isolatedNode = nodes[2];
stopServerReplication(isolatedNode);
for (const peer of [nodes[1], nodes[0]]) {
    isolatedNode.disconnect(peer);
}

// Force node 0 to step up, then verify that the two still-connected members
// (nodes 0 and 1) agree on the primary and that node 0 reports PRIMARY.
const firstStepUpNode = nodes[0];
assert.commandWorked(firstStepUpNode.adminCommand({replSetStepUp: 1}));
replSet.awaitNodesAgreeOnPrimary(replSet.timeoutMS, nodes.slice(0, 2));

const firstStepUpStatus = assert.commandWorked(firstStepUpNode.adminCommand("replSetGetStatus"));
assert.eq(
    ReplSetTest.State.PRIMARY,
    firstStepUpStatus.myState,
    firstStepUpNode.host + " was not primary after step-up",
);
jsTestLog("node 0 is now primary");
// Phase 3: make both non-primary nodes lag behind node 0.
// Waiting three seconds before writing ensures node 2's optime is more than
// 2 seconds behind, so it can't do a priority takeover until it catches up.
sleep(3000);

const currentPrimary = replSet.getPrimary();
const testColl = currentPrimary.getDB(name).bar;

// First write must be acknowledged by two members.
const twoMemberAck = {writeConcern: {w: 2, wtimeout: replSet.timeoutMS}};
assert.commandWorked(testColl.insert({y: 100}, twoMemberAck));

// Stop replication on node 1 and write again with w: 1, so that node 0 ends
// up ahead of node 1 as well.
stopServerReplication(nodes[1]);
const primaryOnlyAck = {writeConcern: {w: 1, wtimeout: replSet.timeoutMS}};
assert.commandWorked(testColl.insert({x: 100}, primaryOnlyAck));
// Phase 4: bring node 2 back into the network and force the lagged node 1
// to become primary.
const rejoiningNode = nodes[2];
for (const peer of [nodes[0], nodes[1]]) {
    rejoiningNode.reconnect(peer);
}

// Wait until nodes have learned the latest config.
// NOTE(review): node 1 is passed as the first argument although node 0 is
// the primary at this point — confirm node 1 is the intended reference node.
const laggedNode = nodes[1];
replSet.waitForConfigReplication(laggedNode, [laggedNode, rejoiningNode]);

// Step up the lagged node and verify that all three members agree on the
// primary and that node 1 reports PRIMARY.
assert.commandWorked(laggedNode.adminCommand({replSetStepUp: 1}));
replSet.awaitNodesAgreeOnPrimary(replSet.timeoutMS, nodes);

const laggedNodeStatus = assert.commandWorked(laggedNode.adminCommand("replSetGetStatus"));
assert.eq(
    ReplSetTest.State.PRIMARY,
    laggedNodeStatus.myState,
    laggedNode.host + " was not primary after step-up",
);
jsTestLog("node 1 is now primary, but cannot accept writes");
// Phase 5: observe the catchup takeover, then the priority takeover, then
// shut the set down.
const {PRIMARY: kPrimaryState} = ReplSetTest.State;
const kWaitMS = replSet.timeoutMS;

// The most up-to-date node (node 0) should become primary after the default
// catchup takeover delay.
replSet.waitForState(0, kPrimaryState, kWaitMS);
jsTestLog("node 0 performed catchup takeover and is now primary");

// Wait until the old primary steps down.
replSet.awaitNodesAgreeOnPrimary();

// Resume replication on nodes 1 and 2 so they can catch up.
[nodes[1], nodes[2]].forEach((laggedMember) => restartServerReplication(laggedMember));
replSet.awaitReplication();

// Once caught up, the highest priority node (node 2) should become primary.
replSet.waitForState(2, kPrimaryState, kWaitMS);
jsTestLog("node 2 performed priority takeover and is now primary");

// Wait until the old primary steps down so the connections won't be closed
// during stopSet().
replSet.awaitSecondaryNodes(kWaitMS, [nodes[0]]);
replSet.stopSet();