261 lines
14 KiB
JavaScript
261 lines
14 KiB
JavaScript
/*
|
|
* Tests the following scenarios where the featureCompatibilityVersion document is rolled back and
|
|
* verify that the in-memory and on-disk FCV stay consistent.
|
|
* - the FCV document is rolled back from fully upgraded to upgrading
|
|
* - the FCV document is rolled back from upgrading to fully downgraded
|
|
* - the FCV document is rolled back from fully downgraded to downgrading
|
|
* - the FCV document is rolled back from downgrading to fully upgraded
|
|
*
|
|
* @tags: [multiversion_incompatible]
|
|
*/
|
|
|
|
(function() {
|
|
"use strict";
|
|
|
|
load("jstests/replsets/libs/rollback_test.js");
|
|
load('jstests/libs/parallel_shell_helpers.js');
|
|
load("jstests/libs/fail_point_util.js");
|
|
load("jstests/replsets/rslib.js");
|
|
load("jstests/libs/feature_flag_util.js");
|
|
|
|
function setFCV(fcv) {
|
|
assert.commandFailedWithCode(db.adminCommand({setFeatureCompatibilityVersion: fcv}),
|
|
ErrorCodes.InterruptedDueToReplStateChange);
|
|
}
|
|
|
|
// Using getParameter results in waiting for the current FCV to be majority committed. In this
|
|
// test, it never will, so we need to get the FCV directly.
|
|
function getFCVFromDocument(conn) {
|
|
return conn.getDB("admin").system.version.find().readConcern("local").toArray()[0];
|
|
}
|
|
|
|
// fromFCV refers to the FCV we will test rolling back from.
|
|
// toFCV refers to the FCV we will test rolling back to.
|
|
function rollbackFCVFromDowngradingOrUpgrading(fromFCV, toFCV) {
|
|
let primary = rollbackTest.getPrimary();
|
|
let secondary = rollbackTest.getSecondary();
|
|
let primaryAdminDB = primary.getDB('admin');
|
|
let secondaryAdminDB = secondary.getDB('admin');
|
|
|
|
// Ensure the cluster starts at the correct FCV.
|
|
assert.commandWorked(primary.adminCommand({setFeatureCompatibilityVersion: toFCV}));
|
|
// Wait until the config has propagated to the other nodes and the primary has learned of it, so
|
|
// that the config replication check in 'setFeatureCompatibilityVersion' is satisfied. This is
|
|
// only important since 'setFeatureCompatibilityVersion' is known to implicitly call internal
|
|
// reconfigs as part of upgrade/downgrade behavior.
|
|
rollbackTest.getTestFixture().waitForConfigReplication(primary);
|
|
// Wait for the majority commit point to be updated on the secondary, because checkFCV calls
|
|
// getParameter for the featureCompatibilityVersion, which will wait until the FCV change makes
|
|
// it into the node's majority committed snapshot.
|
|
rollbackTest.getTestFixture().awaitLastOpCommitted(undefined /* timeout */, [secondary]);
|
|
|
|
jsTestLog("Testing rolling back FCV from {version: " + lastLTSFCV +
|
|
", targetVersion: " + fromFCV + "} to {version: " + toFCV + "}");
|
|
|
|
rollbackTest.transitionToRollbackOperations();
|
|
let setFCVInParallel = startParallelShell(funWithArgs(setFCV, fromFCV), primary.port);
|
|
// Wait for the FCV update to be reflected on the primary. This should eventually be rolled
|
|
// back.
|
|
assert.soon(function() {
|
|
let featureCompatibilityVersion = getFCVFromDocument(primary);
|
|
return featureCompatibilityVersion.hasOwnProperty('targetVersion');
|
|
}, "Failed waiting for the server to set the targetVersion: " + fromFCV);
|
|
rollbackTest.transitionToSyncSourceOperationsBeforeRollback();
|
|
// Secondaries should never have received the FCV update.
|
|
checkFCV(secondaryAdminDB, toFCV);
|
|
rollbackTest.transitionToSyncSourceOperationsDuringRollback();
|
|
setFCVInParallel();
|
|
rollbackTest.transitionToSteadyStateOperations();
|
|
// The primary should have rolled back their FCV to be consistent with the rest of the replica
|
|
// set.
|
|
checkFCV(primaryAdminDB, toFCV);
|
|
checkFCV(secondaryAdminDB, toFCV);
|
|
|
|
let newPrimary = rollbackTest.getPrimary();
|
|
// As a rule, we forbid downgrading a node while a node is still in the upgrading state and
|
|
// vice versa. Ensure that the in-memory and on-disk FCV are consistent by checking that we are
|
|
// able to set the FCV back to the original version.
|
|
assert.commandWorked(newPrimary.adminCommand({setFeatureCompatibilityVersion: toFCV}));
|
|
}
|
|
|
|
// fromFCV refers to the FCV we will test rolling back from.
|
|
// toFCV refers to the FCV we will test rolling back to.
|
|
function rollbackFCVFromDowngradedOrUpgraded(fromFCV, toFCV, failPoint) {
|
|
let primary = rollbackTest.getPrimary();
|
|
let secondary = rollbackTest.getSecondary();
|
|
let primaryAdminDB = primary.getDB('admin');
|
|
let secondaryAdminDB = secondary.getDB('admin');
|
|
|
|
// Complete the upgrade/downgrade to ensure we are not in the upgrading/downgrading state.
|
|
assert.commandWorked(primary.adminCommand({setFeatureCompatibilityVersion: toFCV}));
|
|
// Wait for the majority commit point to be updated on the secondary, because checkFCV calls
|
|
// getParameter for the featureCompatibilityVersion, which will wait until the FCV change makes
|
|
// it into the node's majority committed snapshot.
|
|
rollbackTest.getTestFixture().awaitLastOpCommitted(undefined /* timeout */, [secondary]);
|
|
|
|
jsTestLog("Testing rolling back FCV from {version: " + fromFCV +
|
|
"} to {version: " + lastLTSFCV + ", targetVersion: " + fromFCV + "}");
|
|
|
|
// A failpoint to hang right before unsetting the targetVersion.
|
|
const hangBeforeUnsettingTargetVersion = configureFailPoint(primary, failPoint);
|
|
let setFCVInParallel = startParallelShell(funWithArgs(setFCV, fromFCV), primary.port);
|
|
hangBeforeUnsettingTargetVersion.wait();
|
|
rollbackTest.transitionToRollbackOperations();
|
|
// Turn off the failpoint so the primary will proceed to unset the targetVersion. This update
|
|
// should never make it to the secondary.
|
|
hangBeforeUnsettingTargetVersion.off();
|
|
assert.soon(function() {
|
|
let featureCompatibilityVersion = getFCVFromDocument(primary);
|
|
return !featureCompatibilityVersion.hasOwnProperty('targetVersion') &&
|
|
featureCompatibilityVersion.version === fromFCV;
|
|
}, "Failed waiting for server to unset the targetVersion or to set the FCV to " + fromFCV);
|
|
rollbackTest.transitionToSyncSourceOperationsBeforeRollback();
|
|
// The secondary should never have received the update to unset the targetVersion.
|
|
checkFCV(secondaryAdminDB, lastLTSFCV, fromFCV);
|
|
rollbackTest.transitionToSyncSourceOperationsDuringRollback();
|
|
setFCVInParallel();
|
|
rollbackTest.transitionToSteadyStateOperations();
|
|
// The primary should have rolled back their FCV to contain the targetVersion.
|
|
checkFCV(primaryAdminDB, lastLTSFCV, fromFCV);
|
|
checkFCV(secondaryAdminDB, lastLTSFCV, fromFCV);
|
|
|
|
let newPrimary = rollbackTest.getPrimary();
|
|
const newPrimaryAdminDB = newPrimary.getDB('admin');
|
|
// As a rule, we forbid downgrading a node while a node is still in the upgrading state and
|
|
// vice versa (except for the added path from downgrading to upgrading).
|
|
// Ensure that the in-memory and on-disk FCV are consistent by checking that this rule is
|
|
// upheld after rollback.
|
|
if (fromFCV === lastLTSFCV && toFCV === latestFCV &&
|
|
FeatureFlagUtil.isEnabled(newPrimaryAdminDB,
|
|
"DowngradingToUpgrading",
|
|
null /* user not specified */,
|
|
true /* ignores FCV */)) {
|
|
assert.commandWorked(newPrimary.adminCommand({setFeatureCompatibilityVersion: toFCV}));
|
|
} else {
|
|
assert.commandFailedWithCode(
|
|
newPrimary.adminCommand({setFeatureCompatibilityVersion: toFCV}), 5147403);
|
|
}
|
|
}
|
|
|
|
// Test rolling back from upgrading to downgrading.
|
|
// Start off with downgrading from latest to lastLTS.
|
|
// Go to upgrading from lastLTS to latest state.
|
|
// Rollback and make sure the FCV doc is back in the downgrading from latest to lastLTS state.
|
|
function rollbackFCVFromUpgradingToDowngrading() {
|
|
let fcvDoc;
|
|
const rollbackNode = rollbackTest.getPrimary();
|
|
const syncSource = rollbackTest.getSecondary();
|
|
const rollbackNodeAdminDB = rollbackNode.getDB('admin');
|
|
const syncSourceAdminDB = syncSource.getDB('admin');
|
|
|
|
// Ensure the cluster starts at the correct FCV.
|
|
assert.commandWorked(rollbackNode.adminCommand({setFeatureCompatibilityVersion: latestFCV}));
|
|
|
|
if (!FeatureFlagUtil.isEnabled(rollbackNodeAdminDB, "DowngradingToUpgrading")) {
|
|
jsTestLog(
|
|
"Skipping rollbackFCVFromUpgradingToDowngrading as featureFlagDowngradingToUpgrading is not enabled");
|
|
return;
|
|
}
|
|
|
|
fcvDoc = rollbackNodeAdminDB.system.version.findOne({_id: 'featureCompatibilityVersion'});
|
|
jsTestLog(`rollbackNode's version at start: ${tojson(fcvDoc)}`);
|
|
checkFCV(rollbackNodeAdminDB, latestFCV);
|
|
|
|
// Set the failpoints so that both upgrading and downgrading would fail.
|
|
assert.commandWorked(
|
|
rollbackNode.adminCommand({configureFailPoint: "failDowngrading", mode: "alwaysOn"}));
|
|
assert.commandWorked(
|
|
rollbackNode.adminCommand({configureFailPoint: "failUpgrading", mode: "alwaysOn"}));
|
|
|
|
// Go to downgrading state (downgrading from latest to lastLTS).
|
|
assert.commandFailed(
|
|
rollbackNodeAdminDB.runCommand({setFeatureCompatibilityVersion: lastLTSFCV}));
|
|
|
|
fcvDoc = rollbackNodeAdminDB.system.version.findOne({_id: 'featureCompatibilityVersion'});
|
|
jsTestLog(`rollbackNode's version after downgrading: ${tojson(fcvDoc)}`);
|
|
checkFCV(rollbackNodeAdminDB, lastLTSFCV, lastLTSFCV);
|
|
|
|
// Wait until the config has propagated to the other nodes and the rollbackNode has learned of
|
|
// it, so that the config replication check in 'setFeatureCompatibilityVersion' is satisfied.
|
|
// This is only important since 'setFeatureCompatibilityVersion' is known to implicitly call
|
|
// internal reconfigs as part of upgrade/downgrade behavior.
|
|
rollbackTest.getTestFixture().waitForConfigReplication(rollbackNode);
|
|
// Wait for the majority commit point to be updated on the sync source, because checkFCV calls
|
|
// getParameter for the featureCompatibilityVersion, which will wait until the FCV change makes
|
|
// it into the node's majority committed snapshot.
|
|
rollbackTest.getTestFixture().awaitLastOpCommitted(undefined /* timeout */, [syncSource]);
|
|
|
|
// test rolling back from upgrading to downgrading
|
|
jsTestLog("Testing rolling back FCV from {version: " + lastLTSFCV + ", targetVersion: " +
|
|
latestFCV + "} to {version: " + lastLTSFCV + ", targetVersion: " + lastLTSFCV + "}");
|
|
|
|
rollbackTest.transitionToRollbackOperations();
|
|
let setFCVInParallel = startParallelShell(funWithArgs(setFCV, latestFCV), rollbackNode.port);
|
|
// Wait for the FCV update to be reflected on the rollbackNode. This should eventually be rolled
|
|
// back.
|
|
assert.soon(
|
|
function() {
|
|
let featureCompatibilityVersion = getFCVFromDocument(rollbackNode);
|
|
jsTestLog(`rollbackNode's version in parallel shell (should eventually be upgrading): ${
|
|
tojson(featureCompatibilityVersion)}`);
|
|
return !featureCompatibilityVersion.hasOwnProperty('previousVersion') &&
|
|
featureCompatibilityVersion.hasOwnProperty('targetVersion') &&
|
|
featureCompatibilityVersion.targetVersion == latestFCV;
|
|
},
|
|
"Failed waiting for the server to unset the previous version and set the target version to " +
|
|
latestFCV);
|
|
checkFCV(rollbackNodeAdminDB, lastLTSFCV, latestFCV);
|
|
|
|
rollbackTest.transitionToSyncSourceOperationsBeforeRollback();
|
|
|
|
setFCVInParallel();
|
|
|
|
fcvDoc = rollbackNodeAdminDB.system.version.findOne({_id: 'featureCompatibilityVersion'});
|
|
jsTestLog(`Rollback node's version after setFCVInParallel: ${tojson(fcvDoc)}`);
|
|
checkFCV(rollbackNodeAdminDB, lastLTSFCV, latestFCV);
|
|
// Secondaries should never have received the FCV update.
|
|
fcvDoc = syncSourceAdminDB.system.version.findOne({_id: 'featureCompatibilityVersion'});
|
|
jsTestLog(`syncSource's version (should still be downgrading): ${tojson(fcvDoc)}`);
|
|
checkFCV(syncSourceAdminDB, lastLTSFCV, lastLTSFCV);
|
|
|
|
rollbackTest.transitionToSyncSourceOperationsDuringRollback();
|
|
rollbackTest.transitionToSteadyStateOperations();
|
|
|
|
// The rollbackNode should have rolled back their FCV to be consistent with the rest of the
|
|
// replica set.
|
|
fcvDoc = rollbackNodeAdminDB.system.version.findOne({_id: 'featureCompatibilityVersion'});
|
|
jsTestLog(`rollbackNode's version after rollback: ${tojson(fcvDoc)}`);
|
|
checkFCV(rollbackNodeAdminDB, lastLTSFCV, lastLTSFCV);
|
|
fcvDoc = syncSourceAdminDB.system.version.findOne({_id: 'featureCompatibilityVersion'});
|
|
jsTestLog(`SyncSource's version after rollback: ${tojson(fcvDoc)}`);
|
|
checkFCV(syncSourceAdminDB, lastLTSFCV, lastLTSFCV);
|
|
|
|
const newPrimary = rollbackTest.getPrimary();
|
|
const newPrimaryAdminDB = newPrimary.getDB('admin');
|
|
// We should now be able to set the FCV from downgrading to upgrading to upgraded.
|
|
assert.commandWorked(newPrimary.adminCommand({setFeatureCompatibilityVersion: latestFCV}));
|
|
checkFCV(newPrimaryAdminDB, latestFCV);
|
|
}
|
|
|
|
const testName = jsTest.name();
|
|
|
|
const rollbackTest = new RollbackTest(testName);
|
|
|
|
// Tests the case where we roll back the FCV state from downgrading to fully upgraded.
|
|
rollbackFCVFromDowngradingOrUpgrading(lastLTSFCV, latestFCV);
|
|
|
|
// Tests the case where we roll back the FCV state from upgrading to fully downgraded.
|
|
rollbackFCVFromDowngradingOrUpgrading(latestFCV, lastLTSFCV);
|
|
|
|
// Tests the case where we roll back the FCV state from fully downgraded to downgrading.
|
|
rollbackFCVFromDowngradedOrUpgraded(lastLTSFCV, latestFCV, "hangWhileDowngrading");
|
|
|
|
// Tests the case where we roll back the FCV state from fully upgraded to upgrading.
|
|
rollbackFCVFromDowngradedOrUpgraded(latestFCV, lastLTSFCV, "hangWhileUpgrading");
|
|
|
|
// Tests the case where we roll back the FCV state from upgrading to downgrading.
|
|
rollbackFCVFromUpgradingToDowngrading();
|
|
|
|
rollbackTest.stop();
|
|
}());
|