summaryrefslogtreecommitdiff
path: root/db/repl/rs_initialsync.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'db/repl/rs_initialsync.cpp')
-rw-r--r--db/repl/rs_initialsync.cpp214
1 files changed, 214 insertions, 0 deletions
diff --git a/db/repl/rs_initialsync.cpp b/db/repl/rs_initialsync.cpp
new file mode 100644
index 0000000..4c6bd4d
--- /dev/null
+++ b/db/repl/rs_initialsync.cpp
@@ -0,0 +1,214 @@
+/**
+* Copyright (C) 2008 10gen Inc.
+*
+* This program is free software: you can redistribute it and/or modify
+* it under the terms of the GNU Affero General Public License, version 3,
+* as published by the Free Software Foundation.
+*
+* This program is distributed in the hope that it will be useful,
+* but WITHOUT ANY WARRANTY; without even the implied warranty of
+* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+* GNU Affero General Public License for more details.
+*
+* You should have received a copy of the GNU Affero General Public License
+* along with this program. If not, see <http://www.gnu.org/licenses/>.
+*/
+
+#include "pch.h"
+#include "../client.h"
+#include "../../client/dbclient.h"
+#include "rs.h"
+#include "../oplogreader.h"
+#include "../../util/mongoutils/str.h"
+#include "../dbhelpers.h"
+#include "rs_optime.h"
+#include "../oplog.h"
+
+namespace mongo {
+
+ using namespace mongoutils;
+ using namespace bson;
+
+ void dropAllDatabasesExceptLocal();
+
+ // add try/catch with sleep
+
+ void isyncassert(const char *msg, bool expr) {
+ if( !expr ) {
+ string m = str::stream() << "initial sync " << msg;
+ theReplSet->sethbmsg(m, 0);
+ uasserted(13404, m);
+ }
+ }
+
+ void ReplSetImpl::syncDoInitialSync() {
+ while( 1 ) {
+ try {
+ _syncDoInitialSync();
+ break;
+ }
+ catch(DBException& e) {
+ sethbmsg("initial sync exception " + e.toString(), 0);
+ sleepsecs(30);
+ }
+ }
+ }
+
+ bool cloneFrom(const char *masterHost, string& errmsg, const string& fromdb, bool logForReplication,
+ bool slaveOk, bool useReplAuth, bool snapshot);
+
+ /* todo : progress metering to sethbmsg. */
+ static bool clone(const char *master, string db) {
+ string err;
+ return cloneFrom(master, err, db, false,
+ /*slaveok later can be true*/ false, true, false);
+ }
+
+ void _logOpObjRS(const BSONObj& op);
+
+ bool copyCollectionFromRemote(const string& host, const string& ns, const BSONObj& query, string errmsg);
+
+ static void emptyOplog() {
+ writelock lk(rsoplog);
+ Client::Context ctx(rsoplog);
+ NamespaceDetails *d = nsdetails(rsoplog);
+
+ // temp
+ if( d && d->nrecords == 0 )
+ return; // already empty, ok.
+
+ log(1) << "replSet empty oplog" << rsLog;
+ d->emptyCappedCollection(rsoplog);
+
+ /*
+ string errmsg;
+ bob res;
+ dropCollection(rsoplog, errmsg, res);
+ log() << "replSet recreated oplog so it is empty. todo optimize this..." << rsLog;
+ createOplog();*/
+
+ // TEMP: restart to recreate empty oplog
+ //log() << "replSet FATAL error during initial sync. mongod restart required." << rsLog;
+ //dbexit( EXIT_CLEAN );
+
+ /*
+ writelock lk(rsoplog);
+ Client::Context c(rsoplog, dbpath, 0, doauth/false);
+ NamespaceDetails *oplogDetails = nsdetails(rsoplog);
+ uassert(13412, str::stream() << "replSet error " << rsoplog << " is missing", oplogDetails != 0);
+ oplogDetails->cappedTruncateAfter(rsoplog, h.commonPointOurDiskloc, false);
+ */
+ }
+
+ void ReplSetImpl::_syncDoInitialSync() {
+ sethbmsg("initial sync pending",0);
+
+ StateBox::SP sp = box.get();
+ assert( !sp.state.primary() ); // wouldn't make sense if we were.
+
+ const Member *cp = sp.primary;
+ if( cp == 0 ) {
+ sethbmsg("initial sync need a member to be primary",0);
+ sleepsecs(15);
+ return;
+ }
+
+ string masterHostname = cp->h().toString();
+ OplogReader r;
+ if( !r.connect(masterHostname) ) {
+ sethbmsg( str::stream() << "initial sync couldn't connect to " << cp->h().toString() , 0);
+ sleepsecs(15);
+ return;
+ }
+
+ BSONObj lastOp = r.getLastOp(rsoplog);
+ if( lastOp.isEmpty() ) {
+ sethbmsg("initial sync couldn't read remote oplog", 0);
+ sleepsecs(15);
+ return;
+ }
+ OpTime startingTS = lastOp["ts"]._opTime();
+
+ {
+ /* make sure things aren't too flappy */
+ sleepsecs(5);
+ isyncassert( "flapping?", box.getPrimary() == cp );
+ BSONObj o = r.getLastOp(rsoplog);
+ isyncassert( "flapping [2]?", !o.isEmpty() );
+ }
+
+ sethbmsg("initial sync drop all databases", 0);
+ dropAllDatabasesExceptLocal();
+
+// sethbmsg("initial sync drop oplog", 0);
+// emptyOplog();
+
+ list<string> dbs = r.conn()->getDatabaseNames();
+ for( list<string>::iterator i = dbs.begin(); i != dbs.end(); i++ ) {
+ string db = *i;
+ if( db != "local" ) {
+ sethbmsg( str::stream() << "initial sync cloning db: " << db , 0);
+ bool ok;
+ {
+ writelock lk(db);
+ Client::Context ctx(db);
+ ok = clone(masterHostname.c_str(), db);
+ }
+ if( !ok ) {
+ sethbmsg( str::stream() << "initial sync error clone of " << db << " failed sleeping 5 minutes" ,0);
+ sleepsecs(300);
+ return;
+ }
+ }
+ }
+
+ sethbmsg("initial sync query minValid",0);
+
+ /* our cloned copy will be strange until we apply oplog events that occurred
+ through the process. we note that time point here. */
+ BSONObj minValid = r.getLastOp(rsoplog);
+ assert( !minValid.isEmpty() );
+ OpTime mvoptime = minValid["ts"]._opTime();
+ assert( !mvoptime.isNull() );
+
+ /* copy the oplog
+ */
+ {
+ sethbmsg("initial sync copy+apply oplog");
+ if( ! initialSyncOplogApplication(masterHostname, cp, startingTS, mvoptime) ) { // note we assume here that this call does not throw
+ log() << "replSet initial sync failed during applyoplog" << rsLog;
+ emptyOplog(); // otherwise we'll be up!
+ lastOpTimeWritten = OpTime();
+ lastH = 0;
+ log() << "replSet cleaning up [1]" << rsLog;
+ {
+ writelock lk("local.");
+ Client::Context cx( "local." );
+ cx.db()->flushFiles(true);
+ }
+ log() << "replSet cleaning up [2]" << rsLog;
+ sleepsecs(2);
+ return;
+ }
+ }
+
+ sethbmsg("initial sync finishing up",0);
+
+ assert( !box.getState().primary() ); // wouldn't make sense if we were.
+
+ {
+ writelock lk("local.");
+ Client::Context cx( "local." );
+ cx.db()->flushFiles(true);
+ try {
+ log() << "replSet set minValid=" << minValid["ts"]._opTime().toString() << rsLog;
+ }
+ catch(...) { }
+ Helpers::putSingleton("local.replset.minvalid", minValid);
+ cx.db()->flushFiles(true);
+ }
+
+ sethbmsg("initial sync done",0);
+ }
+
+}