Files
mongo/jstests/replsets/write_concern_after_stepdown_and_stepup.js
Steve McClure 1ffbc6c2e9 SERVER-109432: Autofix JS var usage to favor let (#40637)
GitOrigin-RevId: 9674b7db36a0f3f650d39c1e3fb2ad6ff2141cfb
2025-08-28 19:21:01 +00:00

141 lines
4.7 KiB
JavaScript

/*
* Tests that heartbeats containing writes from a different branch of history can't cause a stale
* primary to incorrectly acknowledge a w:majority write that's about to be rolled back, even if the
* stale primary is re-elected primary before waiting for the write concern acknowledgement.
*/
import {configureFailPoint} from "jstests/libs/fail_point_util.js";
import {ReplSetTest} from "jstests/libs/replsettest.js";
import {restartServerReplication, stopServerReplication} from "jstests/libs/write_concern_util.js";
import {waitForState} from "jstests/replsets/rslib.js";
let name = "writeConcernStepDownAndBackUp";
let dbName = "wMajorityCheck";
let collName = "stepdownAndBackUp";
let rst = new ReplSetTest({
name: name,
nodes: [{}, {}, {rsConfig: {priority: 0}}],
useBridge: true,
});
let nodes = rst.startSet();
rst.initiate(null, null, {initiateWithDefaultElectionTimeout: true});
function waitForPrimary(node) {
assert.soon(function () {
return node.adminCommand("hello").isWritablePrimary;
});
}
function stepUp(node) {
let primary = rst.getPrimary();
if (primary != node) {
assert.commandWorked(primary.adminCommand({replSetStepDown: 60 * 5}));
}
waitForPrimary(node);
}
jsTestLog("Make sure node 0 is primary.");
stepUp(nodes[0]);
let primary = rst.getPrimary();
let secondaries = rst.getSecondaries();
assert.eq(nodes[0], primary);
// The default WC is majority and stopServerReplication will prevent satisfying any majority writes.
assert.commandWorked(
primary.adminCommand({setDefaultRWConcern: 1, defaultWriteConcern: {w: 1}, writeConcern: {w: "majority"}}),
);
rst.awaitReplication();
// Wait for all data bearing nodes to get up to date.
assert.commandWorked(
nodes[0]
.getDB(dbName)
.getCollection(collName)
.insert({a: 1}, {writeConcern: {w: 3, wtimeout: rst.timeoutMS}}),
);
// Stop the secondaries from replicating.
stopServerReplication(secondaries);
// Stop the primary from calling into awaitReplication()
const hangBeforeWaitingForWriteConcern = configureFailPoint(nodes[0], "hangBeforeWaitingForWriteConcern");
jsTestLog(
"Do w:majority write that won't enter awaitReplication() until after the primary " + "has stepped down and back up",
);
let doMajorityWrite = function () {
// Run hello command with 'hangUpOnStepDown' set to false to mark this connection as
// one that shouldn't be closed when the node steps down. This simulates the scenario where
// the write was coming from a mongos.
assert.commandWorked(db.adminCommand({hello: 1, hangUpOnStepDown: false}));
let res = db.getSiblingDB("wMajorityCheck").stepdownAndBackUp.insert(
{a: 2},
{
writeConcern: {w: "majority"},
},
);
assert.writeErrorWithCode(res, ErrorCodes.InterruptedDueToReplStateChange);
};
let joinMajorityWriter = startParallelShell(doMajorityWrite, nodes[0].port);
// Ensure the parallel shell hangs on the majority write before stepping the primary down.
hangBeforeWaitingForWriteConcern.wait();
jsTest.log("Disconnect primary from all secondaries");
nodes[0].disconnect(nodes[1]);
nodes[0].disconnect(nodes[2]);
jsTest.log("Wait for a new primary to be elected");
// Allow the secondaries to replicate again.
restartServerReplication(secondaries);
waitForPrimary(nodes[1]);
jsTest.log("Do a write to the new primary");
assert.commandWorked(
nodes[1]
.getDB(dbName)
.getCollection(collName)
.insert({a: 3}, {writeConcern: {w: 2, wtimeout: rst.timeoutMS}}),
);
jsTest.log("Reconnect the old primary to the rest of the nodes");
nodes[0].reconnect(nodes[1]);
nodes[0].reconnect(nodes[2]);
jsTest.log(
"Wait for the old primary to step down, roll back its write, and apply the " + "new writes from the new primary",
);
waitForState(nodes[0], ReplSetTest.State.SECONDARY);
rst.awaitReplication();
// At this point all 3 nodes should have the same data
assert.soonNoExcept(function () {
nodes.forEach(function (node) {
assert.eq(
null,
node.getDB(dbName).getCollection(collName).findOne({a: 2}),
"Node " + node.host + " contained op that should have been rolled back",
);
assert.neq(
null,
node.getDB(dbName).getCollection(collName).findOne({a: 3}),
"Node " + node.host + " was missing op from branch of history that should have persisted",
);
});
return true;
});
jsTest.log("Make the original primary become primary once again");
stepUp(nodes[0]);
jsTest.log(
"Unblock the thread waiting for replication of the now rolled-back write, ensure " +
"that the write concern failed",
);
hangBeforeWaitingForWriteConcern.off();
joinMajorityWriter();
rst.stopSet();