388 lines
15 KiB
C++
388 lines
15 KiB
C++
// rs_config.cpp
|
|
|
|
/**
|
|
* Copyright (C) 2008 10gen Inc.
|
|
*
|
|
* This program is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU Affero General Public License, version 3,
|
|
* as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU Affero General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#include "pch.h"
|
|
#include "rs.h"
|
|
#include "../../client/dbclient.h"
|
|
#include "../../client/syncclusterconnection.h"
|
|
#include "../../util/hostandport.h"
|
|
#include "../dbhelpers.h"
|
|
#include "connections.h"
|
|
#include "../oplog.h"
|
|
|
|
using namespace bson;
|
|
|
|
namespace mongo {
|
|
|
|
void logOpInitiate(const bo&);
|
|
|
|
void assertOnlyHas(BSONObj o, const set<string>& fields) {
|
|
BSONObj::iterator i(o);
|
|
while( i.more() ) {
|
|
BSONElement e = i.next();
|
|
if( !fields.count( e.fieldName() ) ) {
|
|
uasserted(13434, str::stream() << "unexpected field '" << e.fieldName() << "'in object");
|
|
}
|
|
}
|
|
}
|
|
|
|
list<HostAndPort> ReplSetConfig::otherMemberHostnames() const {
|
|
list<HostAndPort> L;
|
|
for( vector<MemberCfg>::const_iterator i = members.begin(); i != members.end(); i++ ) {
|
|
if( !i->h.isSelf() )
|
|
L.push_back(i->h);
|
|
}
|
|
return L;
|
|
}
|
|
|
|
/* comment MUST only be set when initiating the set by the initiator */
|
|
void ReplSetConfig::saveConfigLocally(bo comment) {
|
|
checkRsConfig();
|
|
log() << "replSet info saving a newer config version to local.system.replset" << rsLog;
|
|
{
|
|
writelock lk("");
|
|
Client::Context cx( rsConfigNs );
|
|
cx.db()->flushFiles(true);
|
|
|
|
//theReplSet->lastOpTimeWritten = ??;
|
|
//rather than above, do a logOp()? probably
|
|
BSONObj o = asBson();
|
|
Helpers::putSingletonGod(rsConfigNs.c_str(), o, false/*logOp=false; local db so would work regardless...*/);
|
|
if( !comment.isEmpty() )
|
|
logOpInitiate(comment);
|
|
|
|
cx.db()->flushFiles(true);
|
|
}
|
|
DEV log() << "replSet saveConfigLocally done" << rsLog;
|
|
}
|
|
|
|
/*static*/
|
|
/*void ReplSetConfig::receivedNewConfig(BSONObj cfg) {
|
|
if( theReplSet )
|
|
return; // this is for initial setup only, so far. todo
|
|
|
|
ReplSetConfig c(cfg);
|
|
|
|
writelock lk("admin.");
|
|
if( theReplSet )
|
|
return;
|
|
c.saveConfigLocally(bo());
|
|
}*/
|
|
|
|
bo ReplSetConfig::MemberCfg::asBson() const {
|
|
bob b;
|
|
b << "_id" << _id;
|
|
b.append("host", h.toString());
|
|
if( votes != 1 ) b << "votes" << votes;
|
|
if( priority != 1.0 ) b << "priority" << priority;
|
|
if( arbiterOnly ) b << "arbiterOnly" << true;
|
|
if( slaveDelay ) b << "slaveDelay" << slaveDelay;
|
|
if( hidden ) b << "hidden" << hidden;
|
|
if( !buildIndexes ) b << "buildIndexes" << buildIndexes;
|
|
return b.obj();
|
|
}
|
|
|
|
bo ReplSetConfig::asBson() const {
|
|
bob b;
|
|
b.append("_id", _id).append("version", version);
|
|
if( !ho.isDefault() || !getLastErrorDefaults.isEmpty() ) {
|
|
bob settings;
|
|
if( !ho.isDefault() )
|
|
settings << "heartbeatConnRetries " << ho.heartbeatConnRetries <<
|
|
"heartbeatSleep" << ho.heartbeatSleepMillis / 1000 <<
|
|
"heartbeatTimeout" << ho.heartbeatTimeoutMillis / 1000;
|
|
if( !getLastErrorDefaults.isEmpty() )
|
|
settings << "getLastErrorDefaults" << getLastErrorDefaults;
|
|
b << "settings" << settings.obj();
|
|
}
|
|
|
|
BSONArrayBuilder a;
|
|
for( unsigned i = 0; i < members.size(); i++ )
|
|
a.append( members[i].asBson() );
|
|
b.append("members", a.arr());
|
|
|
|
return b.obj();
|
|
}
|
|
|
|
static inline void mchk(bool expr) {
|
|
uassert(13126, "bad Member config", expr);
|
|
}
|
|
|
|
void ReplSetConfig::MemberCfg::check() const{
|
|
mchk(_id >= 0 && _id <= 255);
|
|
mchk(priority >= 0 && priority <= 1000);
|
|
mchk(votes >= 0 && votes <= 100);
|
|
uassert(13419, "this version of mongod only supports priorities 0 and 1", priority == 0 || priority == 1);
|
|
uassert(13437, "slaveDelay requires priority be zero", slaveDelay == 0 || priority == 0);
|
|
uassert(13438, "bad slaveDelay value", slaveDelay >= 0 && slaveDelay <= 3600 * 24 * 366);
|
|
uassert(13439, "priority must be 0 when hidden=true", priority == 0 || !hidden);
|
|
uassert(13477, "priority must be 0 when buildIndexes=false", priority == 0 || !hidden);
|
|
}
|
|
|
|
/** @param o old config
|
|
@param n new config
|
|
*/
|
|
/*static*/ bool ReplSetConfig::legalChange(const ReplSetConfig& o, const ReplSetConfig& n, string& errmsg) {
|
|
assert( theReplSet );
|
|
|
|
if( o._id != n._id ) {
|
|
errmsg = "set name may not change";
|
|
return false;
|
|
}
|
|
/* TODO : wonder if we need to allow o.version < n.version only, which is more lenient.
|
|
if someone had some intermediate config this node doesnt have, that could be
|
|
necessary. but then how did we become primary? so perhaps we are fine as-is.
|
|
*/
|
|
if( o.version + 1 != n.version ) {
|
|
errmsg = "version number wrong";
|
|
return false;
|
|
}
|
|
|
|
map<HostAndPort,const ReplSetConfig::MemberCfg*> old;
|
|
for( vector<ReplSetConfig::MemberCfg>::const_iterator i = o.members.begin(); i != o.members.end(); i++ ) {
|
|
old[i->h] = &(*i);
|
|
}
|
|
int me = 0;
|
|
for( vector<ReplSetConfig::MemberCfg>::const_iterator i = n.members.begin(); i != n.members.end(); i++ ) {
|
|
const ReplSetConfig::MemberCfg& m = *i;
|
|
if( old.count(m.h) ) {
|
|
const ReplSetConfig::MemberCfg& oldCfg = *old[m.h];
|
|
if( oldCfg._id != m._id ) {
|
|
log() << "replSet reconfig error with member: " << m.h.toString() << rsLog;
|
|
uasserted(13432, "_id may not change for members");
|
|
}
|
|
if( oldCfg.buildIndexes != m.buildIndexes ) {
|
|
log() << "replSet reconfig error with member: " << m.h.toString() << rsLog;
|
|
uasserted(13476, "buildIndexes may not change for members");
|
|
}
|
|
}
|
|
if( m.h.isSelf() )
|
|
me++;
|
|
}
|
|
|
|
uassert(13433, "can't find self in new replset config", me == 1);
|
|
|
|
/* TODO : MORE CHECKS HERE */
|
|
|
|
log() << "replSet TODO : don't allow removal of a node until we handle it at the removed node end?" << endl;
|
|
// we could change its votes to zero perhaps instead as a short term...
|
|
|
|
return true;
|
|
}
|
|
|
|
void ReplSetConfig::clear() {
|
|
version = -5;
|
|
_ok = false;
|
|
}
|
|
|
|
void ReplSetConfig::checkRsConfig() const {
|
|
uassert(13132,
|
|
"nonmatching repl set name in _id field; check --replSet command line",
|
|
_id == cmdLine.ourSetName());
|
|
uassert(13308, "replSet bad config version #", version > 0);
|
|
uassert(13133, "replSet bad config no members", members.size() >= 1);
|
|
uassert(13309, "replSet bad config maximum number of members is 7 (for now)", members.size() <= 7);
|
|
}
|
|
|
|
void ReplSetConfig::from(BSONObj o) {
|
|
static const string legal[] = {"_id","version", "members","settings"};
|
|
static const set<string> legals(legal, legal + 4);
|
|
assertOnlyHas(o, legals);
|
|
|
|
md5 = o.md5();
|
|
_id = o["_id"].String();
|
|
if( o["version"].ok() ) {
|
|
version = o["version"].numberInt();
|
|
uassert(13115, "bad " + rsConfigNs + " config: version", version > 0);
|
|
}
|
|
|
|
if( o["settings"].ok() ) {
|
|
BSONObj settings = o["settings"].Obj();
|
|
if( settings["heartbeatConnRetries "].ok() )
|
|
ho.heartbeatConnRetries = settings["heartbeatConnRetries "].numberInt();
|
|
if( settings["heartbeatSleep"].ok() )
|
|
ho.heartbeatSleepMillis = (unsigned) (settings["heartbeatSleep"].Number() * 1000);
|
|
if( settings["heartbeatTimeout"].ok() )
|
|
ho.heartbeatTimeoutMillis = (unsigned) (settings["heartbeatTimeout"].Number() * 1000);
|
|
ho.check();
|
|
try { getLastErrorDefaults = settings["getLastErrorDefaults"].Obj().copy(); } catch(...) { }
|
|
}
|
|
|
|
set<string> hosts;
|
|
set<int> ords;
|
|
vector<BSONElement> members;
|
|
try {
|
|
members = o["members"].Array();
|
|
}
|
|
catch(...) {
|
|
uasserted(13131, "replSet error parsing (or missing) 'members' field in config object");
|
|
}
|
|
|
|
unsigned localhosts = 0;
|
|
for( unsigned i = 0; i < members.size(); i++ ) {
|
|
BSONObj mobj = members[i].Obj();
|
|
MemberCfg m;
|
|
try {
|
|
static const string legal[] = {"_id","votes","priority","host","hidden","slaveDelay","arbiterOnly","buildIndexes"};
|
|
static const set<string> legals(legal, legal + 8);
|
|
assertOnlyHas(mobj, legals);
|
|
|
|
try {
|
|
m._id = (int) mobj["_id"].Number();
|
|
} catch(...) {
|
|
/* TODO: use of string exceptions may be problematic for reconfig case! */
|
|
throw "_id must be numeric";
|
|
}
|
|
string s;
|
|
try {
|
|
s = mobj["host"].String();
|
|
m.h = HostAndPort(s);
|
|
}
|
|
catch(...) {
|
|
throw string("bad or missing host field? ") + mobj.toString();
|
|
}
|
|
if( m.h.isLocalHost() )
|
|
localhosts++;
|
|
m.arbiterOnly = mobj.getBoolField("arbiterOnly");
|
|
m.slaveDelay = mobj["slaveDelay"].numberInt();
|
|
if( mobj.hasElement("hidden") )
|
|
m.hidden = mobj.getBoolField("hidden");
|
|
if( mobj.hasElement("buildIndexes") )
|
|
m.buildIndexes = mobj.getBoolField("buildIndexes");
|
|
if( mobj.hasElement("priority") )
|
|
m.priority = mobj["priority"].Number();
|
|
if( mobj.hasElement("votes") )
|
|
m.votes = (unsigned) mobj["votes"].Number();
|
|
m.check();
|
|
}
|
|
catch( const char * p ) {
|
|
log() << "replSet cfg parsing exception for members[" << i << "] " << p << rsLog;
|
|
stringstream ss;
|
|
ss << "replSet members[" << i << "] " << p;
|
|
uassert(13107, ss.str(), false);
|
|
}
|
|
catch(DBException& e) {
|
|
log() << "replSet cfg parsing exception for members[" << i << "] " << e.what() << rsLog;
|
|
stringstream ss;
|
|
ss << "bad config for member[" << i << "] " << e.what();
|
|
uassert(13135, ss.str(), false);
|
|
}
|
|
if( !(ords.count(m._id) == 0 && hosts.count(m.h.toString()) == 0) ) {
|
|
log() << "replSet " << o.toString() << rsLog;
|
|
uassert(13108, "bad replset config -- duplicate hosts in the config object?", false);
|
|
}
|
|
hosts.insert(m.h.toString());
|
|
ords.insert(m._id);
|
|
this->members.push_back(m);
|
|
}
|
|
uassert(13393, "can't use localhost in repl set member names except when using it for all members", localhosts == 0 || localhosts == members.size());
|
|
uassert(13117, "bad " + rsConfigNs + " config", !_id.empty());
|
|
}
|
|
|
|
static inline void configAssert(bool expr) {
|
|
uassert(13122, "bad repl set config?", expr);
|
|
}
|
|
|
|
ReplSetConfig::ReplSetConfig(BSONObj cfg) {
|
|
clear();
|
|
from(cfg);
|
|
configAssert( version < 0 /*unspecified*/ || (version >= 1 && version <= 5000) );
|
|
if( version < 1 )
|
|
version = 1;
|
|
_ok = true;
|
|
}
|
|
|
|
ReplSetConfig::ReplSetConfig(const HostAndPort& h) {
|
|
clear();
|
|
int level = 2;
|
|
DEV level = 0;
|
|
//log(0) << "replSet load config from: " << h.toString() << rsLog;
|
|
|
|
auto_ptr<DBClientCursor> c;
|
|
int v = -5;
|
|
try {
|
|
if( h.isSelf() ) {
|
|
;
|
|
}
|
|
else {
|
|
/* first, make sure other node is configured to be a replset. just to be safe. */
|
|
string setname = cmdLine.ourSetName();
|
|
BSONObj cmd = BSON( "replSetHeartbeat" << setname );
|
|
int theirVersion;
|
|
BSONObj info;
|
|
bool ok = requestHeartbeat(setname, "", h.toString(), info, -2, theirVersion);
|
|
if( info["rs"].trueValue() ) {
|
|
// yes, it is a replicate set, although perhaps not yet initialized
|
|
}
|
|
else {
|
|
if( !ok ) {
|
|
log() << "replSet TEMP !ok heartbeating " << h.toString() << " on cfg load" << rsLog;
|
|
if( !info.isEmpty() )
|
|
log() << "replSet info " << h.toString() << " : " << info.toString() << rsLog;
|
|
return;
|
|
}
|
|
{
|
|
stringstream ss;
|
|
ss << "replSet error: member " << h.toString() << " is not in --replSet mode";
|
|
msgassertedNoTrace(13260, ss.str().c_str()); // not caught as not a user exception - we want it not caught
|
|
//for python err# checker: uassert(13260, "", false);
|
|
}
|
|
}
|
|
}
|
|
|
|
v = -4;
|
|
try {
|
|
ScopedConn conn(h.toString());
|
|
v = -3;
|
|
c = conn->query( rsConfigNs, Query() );
|
|
}
|
|
catch ( DBException& ) {
|
|
if ( !h.isSelf() ) {
|
|
throw;
|
|
}
|
|
|
|
// on startup, socket is not listening yet
|
|
DBDirectClient cli;
|
|
c = cli.query( rsConfigNs, Query() );
|
|
}
|
|
|
|
if( c.get() == 0 ) {
|
|
version = v; return;
|
|
}
|
|
if( !c->more() ) {
|
|
version = EMPTYCONFIG;
|
|
return;
|
|
}
|
|
version = -1;
|
|
}
|
|
catch( DBException& e) {
|
|
version = v;
|
|
log(level) << "replSet load config couldn't get from " << h.toString() << ' ' << e.what() << rsLog;
|
|
return;
|
|
}
|
|
|
|
BSONObj o = c->nextSafe();
|
|
uassert(13109, "multiple rows in " + rsConfigNs + " not supported", !c->more());
|
|
from(o);
|
|
checkRsConfig();
|
|
_ok = true;
|
|
log(level) << "replSet load config ok from " << (h.isSelf() ? "self" : h.toString()) << rsLog;
|
|
}
|
|
|
|
}
|