mirror of https://github.com/mongodb/mongo
461 lines
18 KiB
C++
461 lines
18 KiB
C++
// rs_config.cpp
|
|
|
|
/**
|
|
* Copyright (C) 2008 10gen Inc.
|
|
*
|
|
* This program is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU Affero General Public License, version 3,
|
|
* as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU Affero General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#include "pch.h"
|
|
#include "rs.h"
|
|
#include "../../client/dbclient.h"
|
|
#include "../../client/syncclusterconnection.h"
|
|
#include "../../util/hostandport.h"
|
|
#include "../dbhelpers.h"
|
|
#include "connections.h"
|
|
#include "../oplog.h"
|
|
|
|
using namespace bson;
|
|
|
|
namespace mongo {
|
|
|
|
void logOpInitiate(const bo&);
|
|
|
|
void assertOnlyHas(BSONObj o, const set<string>& fields) {
|
|
BSONObj::iterator i(o);
|
|
while( i.more() ) {
|
|
BSONElement e = i.next();
|
|
if( !fields.count( e.fieldName() ) ) {
|
|
uasserted(13434, str::stream() << "unexpected field '" << e.fieldName() << "'in object");
|
|
}
|
|
}
|
|
}
|
|
|
|
list<HostAndPort> ReplSetConfig::otherMemberHostnames() const {
|
|
list<HostAndPort> L;
|
|
for( vector<MemberCfg>::const_iterator i = members.begin(); i != members.end(); i++ ) {
|
|
if( !i->h.isSelf() )
|
|
L.push_back(i->h);
|
|
}
|
|
return L;
|
|
}
|
|
|
|
/* comment MUST only be set when initiating the set by the initiator */
|
|
void ReplSetConfig::saveConfigLocally(bo comment) {
|
|
checkRsConfig();
|
|
log() << "replSet info saving a newer config version to local.system.replset" << rsLog;
|
|
{
|
|
writelock lk("");
|
|
Client::Context cx( rsConfigNs );
|
|
cx.db()->flushFiles(true);
|
|
|
|
//theReplSet->lastOpTimeWritten = ??;
|
|
//rather than above, do a logOp()? probably
|
|
BSONObj o = asBson();
|
|
Helpers::putSingletonGod(rsConfigNs.c_str(), o, false/*logOp=false; local db so would work regardless...*/);
|
|
if( !comment.isEmpty() )
|
|
logOpInitiate(comment);
|
|
|
|
cx.db()->flushFiles(true);
|
|
}
|
|
DEV log() << "replSet saveConfigLocally done" << rsLog;
|
|
}
|
|
|
|
/*static*/
|
|
/*void ReplSetConfig::receivedNewConfig(BSONObj cfg) {
|
|
if( theReplSet )
|
|
return; // this is for initial setup only, so far. todo
|
|
|
|
ReplSetConfig c(cfg);
|
|
|
|
writelock lk("admin.");
|
|
if( theReplSet )
|
|
return;
|
|
c.saveConfigLocally(bo());
|
|
}*/
|
|
|
|
bo ReplSetConfig::MemberCfg::asBson() const {
|
|
bob b;
|
|
b << "_id" << _id;
|
|
b.append("host", h.toString());
|
|
if( votes != 1 ) b << "votes" << votes;
|
|
if( priority != 1.0 ) b << "priority" << priority;
|
|
if( arbiterOnly ) b << "arbiterOnly" << true;
|
|
if( slaveDelay ) b << "slaveDelay" << slaveDelay;
|
|
if( hidden ) b << "hidden" << hidden;
|
|
if( !buildIndexes ) b << "buildIndexes" << buildIndexes;
|
|
if( !tags.empty() ) {
|
|
BSONArrayBuilder a;
|
|
for( set<string>::const_iterator i = tags.begin(); i != tags.end(); i++ )
|
|
a.append(*i);
|
|
b.appendArray("tags", a.done());
|
|
}
|
|
if( !initialSync.isEmpty() ) {
|
|
b << "initialSync" << initialSync;
|
|
}
|
|
return b.obj();
|
|
}
|
|
|
|
bo ReplSetConfig::asBson() const {
|
|
bob b;
|
|
b.append("_id", _id).append("version", version);
|
|
if( !ho.isDefault() || !getLastErrorDefaults.isEmpty() ) {
|
|
bob settings;
|
|
if( !ho.isDefault() )
|
|
settings << "heartbeatConnRetries " << ho.heartbeatConnRetries <<
|
|
"heartbeatSleep" << ho.heartbeatSleepMillis / 1000.0 <<
|
|
"heartbeatTimeout" << ho.heartbeatTimeoutMillis / 1000.0;
|
|
if( !getLastErrorDefaults.isEmpty() )
|
|
settings << "getLastErrorDefaults" << getLastErrorDefaults;
|
|
b << "settings" << settings.obj();
|
|
}
|
|
|
|
BSONArrayBuilder a;
|
|
for( unsigned i = 0; i < members.size(); i++ )
|
|
a.append( members[i].asBson() );
|
|
b.append("members", a.arr());
|
|
|
|
return b.obj();
|
|
}
|
|
|
|
static inline void mchk(bool expr) {
|
|
uassert(13126, "bad Member config", expr);
|
|
}
|
|
|
|
void ReplSetConfig::MemberCfg::check() const {
|
|
mchk(_id >= 0 && _id <= 255);
|
|
mchk(priority >= 0 && priority <= 1000);
|
|
mchk(votes <= 100); // votes >= 0 because it is unsigned
|
|
uassert(13419, "this version of mongod only supports priorities 0 and 1", priority == 0 || priority == 1);
|
|
uassert(13437, "slaveDelay requires priority be zero", slaveDelay == 0 || priority == 0);
|
|
uassert(13438, "bad slaveDelay value", slaveDelay >= 0 && slaveDelay <= 3600 * 24 * 366);
|
|
uassert(13439, "priority must be 0 when hidden=true", priority == 0 || !hidden);
|
|
uassert(13477, "priority must be 0 when buildIndexes=false", buildIndexes || priority == 0);
|
|
|
|
if (!initialSync.isEmpty()) {
|
|
static const string legal[] = {"state", "name", "_id","optime"};
|
|
static const set<string> legals(legal, legal + 4);
|
|
assertOnlyHas(initialSync, legals);
|
|
|
|
if (initialSync.hasElement("state")) {
|
|
uassert(13525, "initialSync source state must be 1 or 2",
|
|
initialSync["state"].isNumber() &&
|
|
(initialSync["state"].Number() == 1 ||
|
|
initialSync["state"].Number() == 2));
|
|
}
|
|
if (initialSync.hasElement("name")) {
|
|
uassert(13526, "initialSync source name must be a string",
|
|
initialSync["name"].type() == mongo::String);
|
|
}
|
|
if (initialSync.hasElement("_id")) {
|
|
uassert(13527, "initialSync source _id must be a number",
|
|
initialSync["_id"].isNumber());
|
|
}
|
|
if (initialSync.hasElement("optime")) {
|
|
uassert(13528, "initialSync source optime must be a timestamp",
|
|
initialSync["optime"].type() == mongo::Timestamp ||
|
|
initialSync["optime"].type() == mongo::Date);
|
|
}
|
|
}
|
|
}
|
|
|
|
/** @param o old config
|
|
@param n new config
|
|
*/
|
|
/*static*/
|
|
bool ReplSetConfig::legalChange(const ReplSetConfig& o, const ReplSetConfig& n, string& errmsg) {
|
|
assert( theReplSet );
|
|
|
|
if( o._id != n._id ) {
|
|
errmsg = "set name may not change";
|
|
return false;
|
|
}
|
|
/* TODO : wonder if we need to allow o.version < n.version only, which is more lenient.
|
|
if someone had some intermediate config this node doesnt have, that could be
|
|
necessary. but then how did we become primary? so perhaps we are fine as-is.
|
|
*/
|
|
if( o.version + 1 != n.version ) {
|
|
errmsg = "version number wrong";
|
|
return false;
|
|
}
|
|
|
|
map<HostAndPort,const ReplSetConfig::MemberCfg*> old;
|
|
bool isLocalHost = false;
|
|
for( vector<ReplSetConfig::MemberCfg>::const_iterator i = o.members.begin(); i != o.members.end(); i++ ) {
|
|
if (i->h.isLocalHost()) {
|
|
isLocalHost = true;
|
|
}
|
|
old[i->h] = &(*i);
|
|
}
|
|
int me = 0;
|
|
for( vector<ReplSetConfig::MemberCfg>::const_iterator i = n.members.begin(); i != n.members.end(); i++ ) {
|
|
const ReplSetConfig::MemberCfg& m = *i;
|
|
if ( isLocalHost && !m.h.isLocalHost() ) {
|
|
log() << "reconfig error: " << m.h.toString() << " cannot be used from localhost replset" << rsLog;
|
|
uasserted(13645, "hosts cannot change from localhost to hostname");
|
|
}
|
|
if( old.count(m.h) ) {
|
|
const ReplSetConfig::MemberCfg& oldCfg = *old[m.h];
|
|
if( oldCfg._id != m._id ) {
|
|
log() << "replSet reconfig error with member: " << m.h.toString() << rsLog;
|
|
uasserted(13432, "_id may not change for members");
|
|
}
|
|
if( oldCfg.buildIndexes != m.buildIndexes ) {
|
|
log() << "replSet reconfig error with member: " << m.h.toString() << rsLog;
|
|
uasserted(13476, "buildIndexes may not change for members");
|
|
}
|
|
/* are transitions to and from arbiterOnly guaranteed safe? if not, we should disallow here.
|
|
there is a test at replsets/replsetarb3.js */
|
|
if( oldCfg.arbiterOnly != m.arbiterOnly ) {
|
|
log() << "replSet reconfig error with member: " << m.h.toString() << " arbiterOnly cannot change. remove and readd the member instead " << rsLog;
|
|
uasserted(13510, "arbiterOnly may not change for members");
|
|
}
|
|
}
|
|
if( m.h.isSelf() )
|
|
me++;
|
|
}
|
|
|
|
uassert(13433, "can't find self in new replset config", me == 1);
|
|
|
|
/* TODO : MORE CHECKS HERE */
|
|
|
|
DEV log() << "replSet TODO : don't allow removal of a node until we handle it at the removed node end?" << endl;
|
|
// we could change its votes to zero perhaps instead as a short term...
|
|
|
|
return true;
|
|
}
|
|
|
|
void ReplSetConfig::clear() {
|
|
version = -5;
|
|
_ok = false;
|
|
}
|
|
|
|
void ReplSetConfig::checkRsConfig() const {
|
|
uassert(13132,
|
|
"nonmatching repl set name in _id field; check --replSet command line",
|
|
_id == cmdLine.ourSetName());
|
|
uassert(13308, "replSet bad config version #", version > 0);
|
|
uassert(13133, "replSet bad config no members", members.size() >= 1);
|
|
uassert(13309, "replSet bad config maximum number of members is 12", members.size() <= 12);
|
|
{
|
|
unsigned voters = 0;
|
|
for( vector<MemberCfg>::const_iterator i = members.begin(); i != members.end(); ++i ) {
|
|
if( i->votes )
|
|
voters++;
|
|
}
|
|
uassert(13612, "replSet bad config maximum number of voting members is 7", voters <= 7);
|
|
uassert(13613, "replSet bad config no voting members", voters > 0);
|
|
}
|
|
}
|
|
|
|
void ReplSetConfig::from(BSONObj o) {
|
|
static const string legal[] = {"_id","version", "members","settings"};
|
|
static const set<string> legals(legal, legal + 4);
|
|
assertOnlyHas(o, legals);
|
|
|
|
md5 = o.md5();
|
|
_id = o["_id"].String();
|
|
if( o["version"].ok() ) {
|
|
version = o["version"].numberInt();
|
|
uassert(13115, "bad " + rsConfigNs + " config: version", version > 0);
|
|
}
|
|
|
|
if( o["settings"].ok() ) {
|
|
BSONObj settings = o["settings"].Obj();
|
|
if( settings["heartbeatConnRetries "].ok() )
|
|
ho.heartbeatConnRetries = settings["heartbeatConnRetries "].numberInt();
|
|
if( settings["heartbeatSleep"].ok() )
|
|
ho.heartbeatSleepMillis = (unsigned) (settings["heartbeatSleep"].Number() * 1000);
|
|
if( settings["heartbeatTimeout"].ok() )
|
|
ho.heartbeatTimeoutMillis = (unsigned) (settings["heartbeatTimeout"].Number() * 1000);
|
|
ho.check();
|
|
try { getLastErrorDefaults = settings["getLastErrorDefaults"].Obj().copy(); }
|
|
catch(...) { }
|
|
}
|
|
|
|
set<string> hosts;
|
|
set<int> ords;
|
|
vector<BSONElement> members;
|
|
try {
|
|
members = o["members"].Array();
|
|
}
|
|
catch(...) {
|
|
uasserted(13131, "replSet error parsing (or missing) 'members' field in config object");
|
|
}
|
|
|
|
unsigned localhosts = 0;
|
|
for( unsigned i = 0; i < members.size(); i++ ) {
|
|
BSONObj mobj = members[i].Obj();
|
|
MemberCfg m;
|
|
try {
|
|
static const string legal[] = {
|
|
"_id","votes","priority","host", "hidden","slaveDelay",
|
|
"arbiterOnly","buildIndexes","tags","initialSync"
|
|
};
|
|
static const set<string> legals(legal, legal + 10);
|
|
assertOnlyHas(mobj, legals);
|
|
|
|
try {
|
|
m._id = (int) mobj["_id"].Number();
|
|
}
|
|
catch(...) {
|
|
/* TODO: use of string exceptions may be problematic for reconfig case! */
|
|
throw "_id must be numeric";
|
|
}
|
|
string s;
|
|
try {
|
|
s = mobj["host"].String();
|
|
m.h = HostAndPort(s);
|
|
}
|
|
catch(...) {
|
|
throw string("bad or missing host field? ") + mobj.toString();
|
|
}
|
|
if( m.h.isLocalHost() )
|
|
localhosts++;
|
|
m.arbiterOnly = mobj.getBoolField("arbiterOnly");
|
|
m.slaveDelay = mobj["slaveDelay"].numberInt();
|
|
if( mobj.hasElement("hidden") )
|
|
m.hidden = mobj.getBoolField("hidden");
|
|
if( mobj.hasElement("buildIndexes") )
|
|
m.buildIndexes = mobj.getBoolField("buildIndexes");
|
|
if( mobj.hasElement("priority") )
|
|
m.priority = mobj["priority"].Number();
|
|
if( mobj.hasElement("votes") )
|
|
m.votes = (unsigned) mobj["votes"].Number();
|
|
if( mobj.hasElement("tags") ) {
|
|
vector<BSONElement> v = mobj["tags"].Array();
|
|
for( unsigned i = 0; i < v.size(); i++ )
|
|
m.tags.insert( v[i].String() );
|
|
}
|
|
if( mobj.hasElement("initialSync")) {
|
|
m.initialSync = mobj["initialSync"].Obj().getOwned();
|
|
}
|
|
m.check();
|
|
}
|
|
catch( const char * p ) {
|
|
log() << "replSet cfg parsing exception for members[" << i << "] " << p << rsLog;
|
|
stringstream ss;
|
|
ss << "replSet members[" << i << "] " << p;
|
|
uassert(13107, ss.str(), false);
|
|
}
|
|
catch(DBException& e) {
|
|
log() << "replSet cfg parsing exception for members[" << i << "] " << e.what() << rsLog;
|
|
stringstream ss;
|
|
ss << "bad config for member[" << i << "] " << e.what();
|
|
uassert(13135, ss.str(), false);
|
|
}
|
|
if( !(ords.count(m._id) == 0 && hosts.count(m.h.toString()) == 0) ) {
|
|
log() << "replSet " << o.toString() << rsLog;
|
|
uassert(13108, "bad replset config -- duplicate hosts in the config object?", false);
|
|
}
|
|
hosts.insert(m.h.toString());
|
|
ords.insert(m._id);
|
|
this->members.push_back(m);
|
|
}
|
|
uassert(13393, "can't use localhost in repl set member names except when using it for all members", localhosts == 0 || localhosts == members.size());
|
|
uassert(13117, "bad " + rsConfigNs + " config", !_id.empty());
|
|
}
|
|
|
|
static inline void configAssert(bool expr) {
|
|
uassert(13122, "bad repl set config?", expr);
|
|
}
|
|
|
|
ReplSetConfig::ReplSetConfig(BSONObj cfg) {
|
|
clear();
|
|
from(cfg);
|
|
configAssert( version < 0 /*unspecified*/ || (version >= 1 && version <= 5000) );
|
|
if( version < 1 )
|
|
version = 1;
|
|
_ok = true;
|
|
}
|
|
|
|
ReplSetConfig::ReplSetConfig(const HostAndPort& h) {
|
|
clear();
|
|
int level = 2;
|
|
DEV level = 0;
|
|
|
|
BSONObj cfg;
|
|
int v = -5;
|
|
try {
|
|
if( h.isSelf() ) {
|
|
;
|
|
}
|
|
else {
|
|
/* first, make sure other node is configured to be a replset. just to be safe. */
|
|
string setname = cmdLine.ourSetName();
|
|
BSONObj cmd = BSON( "replSetHeartbeat" << setname );
|
|
int theirVersion;
|
|
BSONObj info;
|
|
log() << "trying to contact " << h.toString() << rsLog;
|
|
bool ok = requestHeartbeat(setname, "", h.toString(), info, -2, theirVersion);
|
|
if( info["rs"].trueValue() ) {
|
|
// yes, it is a replicate set, although perhaps not yet initialized
|
|
}
|
|
else {
|
|
if( !ok ) {
|
|
log() << "replSet TEMP !ok heartbeating " << h.toString() << " on cfg load" << rsLog;
|
|
if( !info.isEmpty() )
|
|
log() << "replSet info " << h.toString() << " : " << info.toString() << rsLog;
|
|
return;
|
|
}
|
|
{
|
|
stringstream ss;
|
|
ss << "replSet error: member " << h.toString() << " is not in --replSet mode";
|
|
msgassertedNoTrace(13260, ss.str().c_str()); // not caught as not a user exception - we want it not caught
|
|
//for python err# checker: uassert(13260, "", false);
|
|
}
|
|
}
|
|
}
|
|
|
|
v = -4;
|
|
unsigned long long count = 0;
|
|
try {
|
|
ScopedConn conn(h.toString());
|
|
v = -3;
|
|
cfg = conn.findOne(rsConfigNs, Query()).getOwned();
|
|
count = conn.count(rsConfigNs);
|
|
}
|
|
catch ( DBException& ) {
|
|
if ( !h.isSelf() ) {
|
|
throw;
|
|
}
|
|
|
|
// on startup, socket is not listening yet
|
|
DBDirectClient cli;
|
|
cfg = cli.findOne( rsConfigNs, Query() ).getOwned();
|
|
count = cli.count(rsConfigNs);
|
|
}
|
|
|
|
if( count > 1 )
|
|
uasserted(13109, str::stream() << "multiple rows in " << rsConfigNs << " not supported host: " << h.toString());
|
|
|
|
if( cfg.isEmpty() ) {
|
|
version = EMPTYCONFIG;
|
|
return;
|
|
}
|
|
version = -1;
|
|
}
|
|
catch( DBException& e) {
|
|
version = v;
|
|
log(level) << "replSet load config couldn't get from " << h.toString() << ' ' << e.what() << rsLog;
|
|
return;
|
|
}
|
|
|
|
from(cfg);
|
|
checkRsConfig();
|
|
_ok = true;
|
|
log(level) << "replSet load config ok from " << (h.isSelf() ? "self" : h.toString()) << rsLog;
|
|
}
|
|
|
|
}
|