src/mongo/s/commands_admin.cpp

/**
*    Copyright (C) 2008 10gen Inc.
*
*    This program is free software: you can redistribute it and/or  modify
*    it under the terms of the GNU Affero General Public License, version 3,
*    as published by the Free Software Foundation.
*
*    This program is distributed in the hope that it will be useful,
*    but WITHOUT ANY WARRANTY; without even the implied warranty of
*    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
*    GNU Affero General Public License for more details.
*
*    You should have received a copy of the GNU Affero General Public License
*    along with this program.  If not, see <http://www.gnu.org/licenses/>.
*/

#include "pch.h"

#include <boost/thread/thread.hpp>
#include "mongo/db/commands.h"

#include "mongo/client/connpool.h"
#include "mongo/client/dbclientcursor.h"
#include "mongo/db/auth/action_set.h"
#include "mongo/db/auth/action_type.h"
#include "mongo/db/auth/authorization_manager.h"
#include "mongo/db/auth/privilege.h"
#include "mongo/db/dbmessage.h"
#include "mongo/db/stats/counters.h"
#include "mongo/db/repl/rs_optime.h"
#include "mongo/s/chunk.h"
#include "mongo/s/client_info.h"
#include "mongo/s/config.h"
#include "mongo/s/d_logic.h"
#include "mongo/s/field_parser.h"
#include "mongo/s/grid.h"
#include "mongo/db/oplogreader.h"
#include "mongo/s/strategy.h"
#include "mongo/s/type_chunk.h"
#include "mongo/s/type_database.h"
#include "mongo/s/type_shard.h"
#include "mongo/s/type_settings.h"
#include "mongo/s/writeback_listener.h"
#include "mongo/util/net/listen.h"
#include "mongo/util/net/message.h"
#include "mongo/util/processinfo.h"
#include "mongo/util/ramlog.h"
#include "mongo/util/stringutils.h"
#include "mongo/util/timer.h"
#include "mongo/util/version.h"

namespace mongo {

    namespace dbgrid_cmds {

        class GridAdminCmd : public Command {
        public:
            GridAdminCmd( const char * n ) : Command( n , false, tolowerString(n).c_str() ) {
            }
            virtual bool slaveOk() const {
                return true;
            }
            virtual bool adminOnly() const {
                return true;
            }

            // all grid commands are designed not to lock
            virtual LockType locktype() const { return NONE; }

            bool okForConfigChanges( string& errmsg ) {
                string e;
                if ( ! configServer.allUp(e) ) {
                    errmsg = str::stream() << "not all config servers are up: " << e;
                    return false;
                }
                return true;
            }
        };

        // --------------- misc commands ----------------------

        class NetStatCmd : public GridAdminCmd {
        public:
            NetStatCmd() : GridAdminCmd("netstat") { }
            virtual void help( stringstream& help ) const {
                help << " shows status/reachability of servers in the cluster";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::netstat);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                result.append("configserver", configServer.getPrimary().getConnString() );
                result.append("isdbgrid", 1);
                return true;
            }
        } netstat;

        class FlushRouterConfigCmd : public GridAdminCmd {
        public:
            FlushRouterConfigCmd() : GridAdminCmd("flushRouterConfig") { }
            virtual void help( stringstream& help ) const {
                help << "flush all router config";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::flushRouterConfig);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                grid.flushConfig();
                result.appendBool( "flushed" , true );
                return true;
            }
        } flushRouterConfigCmd;

        class FsyncCommand : public GridAdminCmd {
        public:
            FsyncCommand() : GridAdminCmd( "fsync" ) {}
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::fsync);
                out->push_back(Privilege(AuthorizationManager::SERVER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                if ( cmdObj["lock"].trueValue() ) {
                    errmsg = "can't do lock through mongos";
                    return false;
                }

                BSONObjBuilder sub;

                bool ok = true;
                int numFiles = 0;

                vector<Shard> shards;
                Shard::getAllShards( shards );
                for ( vector<Shard>::iterator i=shards.begin(); i!=shards.end(); i++ ) {
                    Shard s = *i;

                    BSONObj x = s.runCommand( "admin" , "fsync" );
                    sub.append( s.getName() , x );

                    if ( ! x["ok"].trueValue() ) {
                        ok = false;
                        errmsg = x["errmsg"].String();
                    }

                    numFiles += x["numFiles"].numberInt();
                }

                result.append( "numFiles" , numFiles );
                result.append( "all" , sub.obj() );
                return ok;
            }
        } fsyncCmd;

        // ------------ database level commands -------------

        class MoveDatabasePrimaryCommand : public GridAdminCmd {
        public:
            MoveDatabasePrimaryCommand() : GridAdminCmd("movePrimary") { }
            virtual void help( stringstream& help ) const {
                help << " example: { moveprimary : 'foo' , to : 'localhost:9999' }";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::movePrimary);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                string dbname = cmdObj.firstElement().valuestrsafe();

                if ( dbname.size() == 0 ) {
                    errmsg = "no db";
                    return false;
                }

                if ( dbname == "config" ) {
                    errmsg = "can't move config db";
                    return false;
                }

                // Flush the configuration
                // This can't be perfect, but it's better than nothing.
                grid.flushConfig();

                DBConfigPtr config = grid.getDBConfig( dbname , false );
                if ( ! config ) {
                    errmsg = "can't find db!";
                    return false;
                }

                string to = cmdObj["to"].valuestrsafe();
                if ( ! to.size()  ) {
                    errmsg = "you have to specify where you want to move it";
                    return false;
                }
                Shard s = Shard::make( to );

                if ( config->getPrimary() == s.getConnString() ) {
                    errmsg = "it is already the primary";
                    return false;
                }

                if ( ! grid.knowAboutShard( s.getConnString() ) ) {
                    errmsg = "that server isn't known to me";
                    return false;
                }

                log() << "Moving " << dbname << " primary from: " << config->getPrimary().toString()
                      << " to: " << s.toString() << endl;

                // Locking enabled now...
                DistributedLock lockSetup( configServer.getConnectionString(), dbname + "-movePrimary" );
                dist_lock_try dlk;

                // Distributed locking added.
                try{
                    dlk = dist_lock_try( &lockSetup , string("Moving primary shard of ") + dbname );
                }
                catch( LockException& e ){
	                errmsg = str::stream() << "error locking distributed lock to move primary shard of " << dbname << causedBy( e );
	                warning() << errmsg << endl;
	                return false;
                }

                if ( ! dlk.got() ) {
	                errmsg = (string)"metadata lock is already taken for moving " + dbname;
	                return false;
                }

                set<string> shardedColls;
                config->getAllShardedCollections( shardedColls );

                BSONArrayBuilder barr;
                barr.append( shardedColls );

                scoped_ptr<ScopedDbConnection> toconn(
                        ScopedDbConnection::getScopedDbConnection( s.getConnString() ) );

                // TODO ERH - we need a clone command which replays operations from clone start to now
                //            can just use local.oplog.$main
                BSONObj cloneRes;
                bool worked = toconn->get()->runCommand(
                    dbname.c_str(),
                    BSON( "clone" << config->getPrimary().getConnString() <<
                          "collsToIgnore" << barr.arr() ),
                    cloneRes );
                toconn->done();

                if ( ! worked ) {
                    log() << "clone failed" << cloneRes << endl;
                    errmsg = "clone failed";
                    return false;
                }

                string oldPrimary = config->getPrimary().getConnString();

                scoped_ptr<ScopedDbConnection> fromconn(
                        ScopedDbConnection::getScopedDbConnection( config->getPrimary()
                                                                   .getConnString() ) );

                config->setPrimary( s.getConnString() );

                if( shardedColls.empty() ){

                    // TODO: Collections can be created in the meantime, and we should handle in the future.
                    log() << "movePrimary dropping database on " << oldPrimary << ", no sharded collections in " << dbname << endl;

                    try {
                        fromconn->get()->dropDatabase( dbname.c_str() );
                    }
                    catch( DBException& e ){
                        e.addContext( str::stream() << "movePrimary could not drop the database " << dbname << " on " << oldPrimary );
                        throw;
                    }

                }
                else if( cloneRes["clonedColls"].type() != Array ){

                    // Legacy behavior from old mongod with sharded collections, *do not* delete database,
                    // but inform user they can drop manually (or ignore).
                    warning() << "movePrimary legacy mongod behavior detected, user must manually remove unsharded collections in "
                          << "database " << dbname << " on " << oldPrimary << endl;

                }
                else {

                    // We moved some unsharded collections, but not all
                    BSONObjIterator it( cloneRes["clonedColls"].Obj() );

                    while( it.more() ){
                        BSONElement el = it.next();
                        if( el.type() == String ){
                            try {
                                log() << "movePrimary dropping cloned collection " << el.String() << " on " << oldPrimary << endl;
                                fromconn->get()->dropCollection( el.String() );
                            }
                            catch( DBException& e ){
                                e.addContext( str::stream() << "movePrimary could not drop the cloned collection " << el.String() << " on " << oldPrimary );
                                throw;
                            }
                        }
                    }
                }

                fromconn->done();

                result << "primary " << s.toString();

                return true;
            }
        } movePrimary;

        class EnableShardingCmd : public GridAdminCmd {
        public:
            EnableShardingCmd() : GridAdminCmd( "enableSharding" ) {}
            virtual void help( stringstream& help ) const {
                help
                        << "Enable sharding for a db. (Use 'shardcollection' command afterwards.)\n"
                        << "  { enablesharding : \"<dbname>\" }\n";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::enableSharding);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                string dbname = cmdObj.firstElement().valuestrsafe();
                if ( dbname.size() == 0 ) {
                    errmsg = "no db";
                    return false;
                }
                
                if ( dbname == "admin" ) {
                    errmsg = "can't shard the admin db";
                    return false;
                }
                if ( dbname == "local" ) {
                    errmsg = "can't shard the local db";
                    return false;
                }

                DBConfigPtr config = grid.getDBConfig( dbname );
                if ( config->isShardingEnabled() ) {
                    errmsg = "already enabled";
                    return false;
                }
                
                if ( ! okForConfigChanges( errmsg ) )
                    return false;
                
                log() << "enabling sharding on: " << dbname << endl;

                config->enableSharding();

                return true;
            }
        } enableShardingCmd;

        // ------------ collection level commands -------------

        class ShardCollectionCmd : public GridAdminCmd {
        public:
            ShardCollectionCmd() : GridAdminCmd( "shardCollection" ) {}

            virtual void help( stringstream& help ) const {
                help
                        << "Shard a collection.  Requires key.  Optional unique. Sharding must already be enabled for the database.\n"
                        << "  { enablesharding : \"<dbname>\" }\n";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::shardCollection);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                const string ns = cmdObj.firstElement().valuestrsafe();
                if ( ns.size() == 0 ) {
                    errmsg = "no ns";
                    return false;
                }

                const NamespaceString nsStr( ns );
                if ( !nsStr.isValid() ){
                    errmsg = str::stream() << "bad ns[" << ns << "]";
                    return false;
                }

                DBConfigPtr config = grid.getDBConfig( ns );
                if ( ! config->isShardingEnabled() ) {
                    errmsg = "sharding not enabled for db";
                    return false;
                }

                if ( config->isSharded( ns ) ) {
                    errmsg = "already sharded";
                    return false;
                }

                BSONObj proposedKey = cmdObj.getObjectField( "key" );
                if ( proposedKey.isEmpty() ) {
                    errmsg = "no shard key";
                    return false;
                }

                // Currently the allowable shard keys are either
                // i) a hashed single field, e.g. { a : "hashed" }, or
                // ii) a compound list of ascending fields, e.g. { a : 1 , b : 1 }
                if ( proposedKey.firstElementType() == mongo::String ) {
                    // case i)
                    if ( !str::equals( proposedKey.firstElement().valuestrsafe() , "hashed" ) ) {
                        errmsg = "unrecognized string: " + proposedKey.firstElement().str();
                        return false;
                    }
                    if ( proposedKey.nFields() > 1 ) {
                        errmsg = "hashed shard keys currently only support single field keys";
                        return false;
                    }
                    if ( cmdObj["unique"].trueValue() ) {
                        // it's possible to ensure uniqueness on the hashed field by
                        // declaring an additional (non-hashed) unique index on the field,
                        // but the hashed shard key itself should not be declared unique
                        errmsg = "hashed shard keys cannot be declared unique.";
                        return false;
                    }
                } else {
                    // case ii)
                    BSONForEach(e, proposedKey) {
                        if (!e.isNumber() || e.number() != 1.0) {
                            errmsg = str::stream() << "Unsupported shard key pattern.  Pattern must"
                                                   << " either be a single hashed field, or a list"
                                                   << " of ascending fields.";
                            return false;
                        }
                    }
                }

                if ( ns.find( ".system." ) != string::npos ) {
                    errmsg = "can't shard system namespaces";
                    return false;
                }

                if ( ! okForConfigChanges( errmsg ) )
                    return false;

                //the rest of the checks require a connection to the primary db
                scoped_ptr<ScopedDbConnection> conn(
                        ScopedDbConnection::getScopedDbConnection(
                                        config->getPrimary().getConnString() ) );

                //check that collection is not capped
                BSONObj res = conn->get()->findOne( config->getName() + ".system.namespaces",
                                                    BSON( "name" << ns ) );
                if ( res["options"].type() == Object &&
                     res["options"].embeddedObject()["capped"].trueValue() ) {
                    errmsg = "can't shard capped collection";
                    conn->done();
                    return false;
                }

                // The proposed shard key must be validated against the set of existing indexes.
                // In particular, we must ensure the following constraints
                //
                // 1. All existing unique indexes, except those which start with the _id index,
                //    must contain the proposed key as a prefix (uniqueness of the _id index is
                //    ensured by the _id generation process or guaranteed by the user).
                //
                // 2. If the collection is not empty, there must exist at least one index that
                //    is "useful" for the proposed key.  A "useful" index is defined as follows
                //    Useful Index:
                //         i. contains proposedKey as a prefix
                //         ii. is not sparse
                //         iii. contains no null values
                //         iv. is not multikey (maybe lift this restriction later)
                //
                // 3. If the proposed shard key is specified as unique, there must exist a useful,
                //    unique index exactly equal to the proposedKey (not just a prefix).
                //
                // After validating these constraint:
                //
                // 4. If there is no useful index, and the collection is non-empty, we
                //    must fail.
                //
                // 5. If the collection is empty, and it's still possible to create an index
                //    on the proposed key, we go ahead and do so.

                string indexNS = config->getName() + ".system.indexes";

                // 1.  Verify consistency with existing unique indexes
                BSONObj uniqueQuery = BSON( "ns" << ns << "unique" << true );
                auto_ptr<DBClientCursor> uniqueQueryResult =
                                conn->get()->query( indexNS , uniqueQuery );

                ShardKeyPattern proposedShardKey( proposedKey );
                while ( uniqueQueryResult->more() ) {
                    BSONObj idx = uniqueQueryResult->next();
                    BSONObj currentKey = idx["key"].embeddedObject();
                    if( ! proposedShardKey.isUniqueIndexCompatible( currentKey ) ) {
                        errmsg = str::stream() << "can't shard collection '" << ns << "' "
                                               << "with unique index on " << currentKey << " "
                                               << "and proposed shard key " << proposedKey << ". "
                                               << "Uniqueness can't be maintained unless "
                                               << "shard key is a prefix";
                        conn->done();
                        return false;
                    }
                }

                // 2. Check for a useful index
                bool hasUsefulIndexForKey = false;

                BSONObj allQuery = BSON( "ns" << ns );
                auto_ptr<DBClientCursor> allQueryResult =
                                conn->get()->query( indexNS , allQuery );

                BSONArrayBuilder allIndexes;
                while ( allQueryResult->more() ) {
                    BSONObj idx = allQueryResult->next();
                    allIndexes.append( idx );
                    BSONObj currentKey = idx["key"].embeddedObject();
                    // Check 2.i. and 2.ii.
                    if ( ! idx["sparse"].trueValue() && proposedKey.isPrefixOf( currentKey ) ) {
                        hasUsefulIndexForKey = true;
                    }
                }

                // 3. If proposed key is required to be unique, additionally check for exact match.
                bool careAboutUnique = cmdObj["unique"].trueValue();
                if ( hasUsefulIndexForKey && careAboutUnique ) {
                    BSONObj eqQuery = BSON( "ns" << ns << "key" << proposedKey );
                    BSONObj eqQueryResult = conn->get()->findOne( indexNS, eqQuery );
                    if ( eqQueryResult.isEmpty() ) {
                        hasUsefulIndexForKey = false;  // if no exact match, index not useful,
                                                       // but still possible to create one later
                    }
                    else {
                        bool isExplicitlyUnique = eqQueryResult["unique"].trueValue();
                        BSONObj currKey = eqQueryResult["key"].embeddedObject();
                        bool isCurrentID = str::equals( currKey.firstElementFieldName() , "_id" );
                        if ( ! isExplicitlyUnique && ! isCurrentID ) {
                            errmsg = str::stream() << "can't shard collection " << ns << ", "
                                                   << proposedKey << " index not unique, "
                                                   << "and unique index explicitly specified";
                            conn->done();
                            return false;
                        }
                    }
                }

                if ( hasUsefulIndexForKey ) {
                    // Check 2.iii and 2.iv. Make sure no null entries in the sharding index
                    // and that there is a useful, non-multikey index available
                    BSONObjBuilder cmd;
                    cmd.append( "checkShardingIndex" , ns );
                    cmd.append( "keyPattern" , proposedKey );
                    BSONObj cmdObj = cmd.obj();
                    if ( ! conn->get()->runCommand( "admin" , cmdObj , res ) ) {
                        errmsg = res["errmsg"].str();
                        conn->done();
                        return false;
                    }
                }
                // 4. if no useful index, and collection is non-empty, fail
                else if ( conn->get()->count( ns ) != 0 ) {
                    errmsg = str::stream() << "please create an index that starts with the "
                                           << "shard key before sharding.";
                    result.append( "proposedKey" , proposedKey );
                    result.appendArray( "curIndexes" , allIndexes.done() );
                    conn->done();
                    return false;
                }
                // 5. If no useful index exists, and collection empty, create one on proposedKey.
                //    Only need to call ensureIndex on primary shard, since indexes get copied to
                //    receiving shard whenever a migrate occurs.
                else {
                    // call ensureIndex with cache=false, see SERVER-1691
                    bool ensureSuccess = conn->get()->ensureIndex( ns ,
                                                                   proposedKey ,
                                                                   careAboutUnique ,
                                                                   "" ,
                                                                   false );
                    if ( ! ensureSuccess ) {
                        errmsg = "ensureIndex failed to create index on primary shard";
                        conn->done();
                        return false;
                    }
                }

                bool isEmpty = ( conn->get()->count( ns ) == 0 );

                conn->done();

                // Pre-splitting:
                // For new collections which use hashed shard keys, we can can pre-split the
                // range of possible hashes into a large number of chunks, and distribute them
                // evenly at creation time. Until we design a better initialization scheme, the
                // safest way to pre-split is to
                // 1. make one big chunk for each shard
                // 2. move them one at a time
                // 3. split the big chunks to achieve the desired total number of initial chunks

                vector<Shard> shards;
                Shard primary = config->getPrimary();
                primary.getAllShards( shards );
                int numShards = shards.size();

                vector<BSONObj> initSplits;  // there will be at most numShards-1 of these
                vector<BSONObj> allSplits;   // all of the initial desired split points

                bool isHashedShardKey =
                        str::equals(proposedKey.firstElement().valuestrsafe(), "hashed");

                // only pre-split when using a hashed shard key and collection is still empty
                if ( isHashedShardKey && isEmpty ){

                    int numChunks = cmdObj["numInitialChunks"].numberInt();
                    if ( numChunks <= 0 )
                        numChunks = 2*numShards;  // default number of initial chunks

                    // hashes are signed, 64-bit ints. So we divide the range (-MIN long, +MAX long)
                    // into intervals of size (2^64/numChunks) and create split points at the
                    // boundaries.  The logic below ensures that initial chunks are all
                    // symmetric around 0.
                    long long intervalSize = ( std::numeric_limits<long long>::max()/ numChunks )*2;
                    long long current = 0;
                    if( numChunks % 2 == 0 ){
                        allSplits.push_back( BSON(proposedKey.firstElementFieldName() << current) );
                        current += intervalSize;
                    } else {
                        current += intervalSize/2;
                    }
                    for( int i=0; i < (numChunks-1)/2; i++ ){
                        allSplits.push_back( BSON(proposedKey.firstElementFieldName() << current) );
                        allSplits.push_back( BSON(proposedKey.firstElementFieldName() << -current));
                        current += intervalSize;
                    }
                    sort( allSplits.begin() , allSplits.end() );

                    // 1. the initial splits define the "big chunks" that we will subdivide later
                    int lastIndex = -1;
                    for ( int i = 1; i < numShards; i++ ){
                        if ( lastIndex < (i*numChunks)/numShards - 1 ){
                            lastIndex = (i*numChunks)/numShards - 1;
                            initSplits.push_back( allSplits[ lastIndex ] );
                        }
                    }
                }

                tlog() << "CMD: shardcollection: " << cmdObj << endl;

                config->shardCollection( ns , proposedKey , careAboutUnique , &initSplits );

                result << "collectionsharded" << ns;

                // only initially move chunks when using a hashed shard key
                if (isHashedShardKey) {

                    // Reload the new config info.  If we created more than one initial chunk, then
                    // we need to move them around to balance.
                    ChunkManagerPtr chunkManager = config->getChunkManager( ns , true );
                    ChunkMap chunkMap = chunkManager->getChunkMap();
                    // 2. Move and commit each "big chunk" to a different shard.
                    int i = 0;
                    for ( ChunkMap::const_iterator c = chunkMap.begin(); c != chunkMap.end(); ++c,++i ){
                        Shard to = shards[ i % numShards ];
                        ChunkPtr chunk = c->second;

                        // can't move chunk to shard it's already on
                        if ( to == chunk->getShard() )
                            continue;

                        BSONObj moveResult;
                        if (!chunk->moveAndCommit(to, Chunk::MaxChunkSize,
                                false, true, moveResult)) {
                            warning() << "Couldn't move chunk " << chunk << " to shard "  << to
                                      << " while sharding collection " << ns << ". Reason: "
                                      <<  moveResult << endl;
                        }
                    }

                    if (allSplits.empty()) {
                        return true;
                    }

                    // Reload the config info, after all the migrations
                    chunkManager = config->getChunkManager( ns , true );

                    // 3. Subdivide the big chunks by splitting at each of the points in "allSplits"
                    //    that we haven't already split by.
                    ChunkPtr currentChunk = chunkManager->findIntersectingChunk( allSplits[0] );
                    vector<BSONObj> subSplits;
                    for ( unsigned i = 0 ; i <= allSplits.size(); i++){
                        if ( i == allSplits.size() || ! currentChunk->containsPoint( allSplits[i] ) ) {
                            if ( ! subSplits.empty() ){
                                BSONObj splitResult;
                                if ( ! currentChunk->multiSplit( subSplits , splitResult ) ){
                                    warning() << "Couldn't split chunk " << currentChunk
                                              << " while sharding collection " << ns << ". Reason: "
                                              << splitResult << endl;
                                }
                                subSplits.clear();
                            }
                            if ( i < allSplits.size() )
                                currentChunk = chunkManager->findIntersectingChunk( allSplits[i] );
                        } else {
                            subSplits.push_back( allSplits[i] );
                        }
                    }

                    // Proactively refresh the chunk manager. Not really necessary, but this way it's
                    // immediately up-to-date the next time it's used.
                    config->getChunkManager( ns , true );
                }

                return true;
            }
        } shardCollectionCmd;

        class ReShardCollectionCmd : public GridAdminCmd {
        public:
            ReShardCollectionCmd() : GridAdminCmd( "reShardCollection" ) {}

            virtual void help( stringstream& help ) const {
                help
                        << "Shard a collection with a new key.  Requires new key.  Optional unique. Sharding must already be enabled for the database.\n"
                        << "  { enablesharding : \"<dbname>\" }\n";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::reShardCollection);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
				Timer t;
                const string ns = cmdObj.firstElement().valuestrsafe();
                if ( ns.size() == 0 ) {
                    errmsg = "no ns";
                    return false;
                }

                const NamespaceString nsStr( ns );
                if ( !nsStr.isValid() ){
                    errmsg = str::stream() << "bad ns[" << ns << "]";
                    return false;
                }

                DBConfigPtr config = grid.getDBConfig( ns );
                if ( ! config->isShardingEnabled() ) {
                    errmsg = "sharding not enabled for db";
                    return false;
                }

                if ( !config->isSharded( ns ) ) {
                    errmsg = "already not sharded";
                    return false;
                }

                BSONObj proposedKey = cmdObj.getObjectField( "key" );
                if ( proposedKey.isEmpty() ) {
                    errmsg = "no shard key";
                    return false;
                }

                // Currently the allowable shard keys are either
                // i) a hashed single field, e.g. { a : "hashed" }, or
                // ii) a compound list of ascending fields, e.g. { a : 1 , b : 1 }
                if ( proposedKey.firstElementType() == mongo::String ) {
                    // case i)
                    if ( !str::equals( proposedKey.firstElement().valuestrsafe() , "hashed" ) ) {
                        errmsg = "unrecognized string: " + proposedKey.firstElement().str();
                        return false;
                    }
                    if ( proposedKey.nFields() > 1 ) {
                        errmsg = "hashed shard keys currently only support single field keys";
                        return false;
                    }
                    if ( cmdObj["unique"].trueValue() ) {
                        // it's possible to ensure uniqueness on the hashed field by
                        // declaring an additional (non-hashed) unique index on the field,
                        // but the hashed shard key itself should not be declared unique
                        errmsg = "hashed shard keys cannot be declared unique.";
                        return false;
                    }
                } else {
                    // case ii)
                    BSONForEach(e, proposedKey) {
                        if (!e.isNumber() || e.number() != 1.0) {
                            errmsg = str::stream() << "Unsupported shard key pattern.  Pattern must"
                                                   << " either be a single hashed field, or a list"
                                                   << " of ascending fields.";
                            return false;
                        }
                    }
                }

				ChunkManagerPtr manager = grid.getDBConfig(ns)->getChunkManager(ns);
				ShardKeyPattern shardKeyPattern = manager->getShardKey();

				if (shardKeyPattern.hasShardKey(proposedKey))
				{
					errmsg = "shard key already in use";
					return false;
				}
				
                if ( ns.find( ".system." ) != string::npos ) {
                    errmsg = "can't shard system namespaces";
                    return false;
                }

                if ( ! okForConfigChanges( errmsg ) )
                    return false;

                //the rest of the checks require a connection to the primary db
                scoped_ptr<ScopedDbConnection> conn(
                        ScopedDbConnection::getScopedDbConnection(
                                        config->getPrimary().getConnString() ) );

                //check that collection is not capped
                BSONObj res = conn->get()->findOne( config->getName() + ".system.namespaces",
                                                    BSON( "name" << ns ) );
                if ( res["options"].type() == Object &&
                     res["options"].embeddedObject()["capped"].trueValue() ) {
                    errmsg = "can't shard capped collection";
                    conn->done();
                    return false;
                }

                // The proposed shard key must be validated against the set of existing indexes.
                // In particular, we must ensure the following constraints
                //
                // 1. All existing unique indexes, except those which start with the _id index,
                //    must contain the proposed key as a prefix (uniqueness of the _id index is
                //    ensured by the _id generation process or guaranteed by the user).
                //
                // 2. If the collection is not empty, there must exist at least one index that
                //    is "useful" for the proposed key.  A "useful" index is defined as follows
                //    Useful Index:
                //         i. contains proposedKey as a prefix
                //         ii. is not sparse
                //         iii. contains no null values
                //         iv. is not multikey (maybe lift this restriction later)
                //
                // 3. If the proposed shard key is specified as unique, there must exist a useful,
                //    unique index exactly equal to the proposedKey (not just a prefix).
                //
                // After validating these constraint:
                //
                // 4. If there is no useful index, and the collection is non-empty, we
                //    must fail.
                //
                // 5. If the collection is empty, and it's still possible to create an index
                //    on the proposed key, we go ahead and do so.

                string indexNS = config->getName() + ".system.indexes";

                // 1.  Verify consistency with existing unique indexes
                BSONObj uniqueQuery = BSON( "ns" << ns << "unique" << true );
                auto_ptr<DBClientCursor> uniqueQueryResult =
                                conn->get()->query( indexNS , uniqueQuery );

                ShardKeyPattern proposedShardKey( proposedKey );
                while ( uniqueQueryResult->more() ) {
                    BSONObj idx = uniqueQueryResult->next();
                    BSONObj currentKey = idx["key"].embeddedObject();
                    if( ! proposedShardKey.isUniqueIndexCompatible( currentKey ) ) {
                        errmsg = str::stream() << "can't shard collection '" << ns << "' "
                                               << "with unique index on " << currentKey << " "
                                               << "and proposed shard key " << proposedKey << ". "
                                               << "Uniqueness can't be maintained unless "
                                               << "shard key is a prefix";
                        conn->done();
                        return false;
                    }
                }

                // 2. Check for a useful index
                bool hasUsefulIndexForKey = false;

                BSONObj allQuery = BSON( "ns" << ns );
                auto_ptr<DBClientCursor> allQueryResult =
                                conn->get()->query( indexNS , allQuery );

                BSONArrayBuilder allIndexes;
                while ( allQueryResult->more() ) {
                    BSONObj idx = allQueryResult->next();
                    allIndexes.append( idx );
                    BSONObj currentKey = idx["key"].embeddedObject();
                    // Check 2.i. and 2.ii.
                    if ( ! idx["sparse"].trueValue() && proposedKey.isPrefixOf( currentKey ) ) {
                        hasUsefulIndexForKey = true;
                    }
                }

                // 3. If proposed key is required to be unique, additionally check for exact match.
                bool careAboutUnique = cmdObj["unique"].trueValue();
                if ( hasUsefulIndexForKey && careAboutUnique ) {
                    BSONObj eqQuery = BSON( "ns" << ns << "key" << proposedKey );
                    BSONObj eqQueryResult = conn->get()->findOne( indexNS, eqQuery );
                    if ( eqQueryResult.isEmpty() ) {
                        hasUsefulIndexForKey = false;  // if no exact match, index not useful,
                                                       // but still possible to create one later
                    }
                    else {
                        bool isExplicitlyUnique = eqQueryResult["unique"].trueValue();
                        BSONObj currKey = eqQueryResult["key"].embeddedObject();
                        bool isCurrentID = str::equals( currKey.firstElementFieldName() , "_id" );
                        if ( ! isExplicitlyUnique && ! isCurrentID ) {
                            errmsg = str::stream() << "can't shard collection " << ns << ", "
                                                   << proposedKey << " index not unique, "
                                                   << "and unique index explicitly specified";
                            conn->done();
                            return false;
                        }
                    }
                }

                if ( hasUsefulIndexForKey ) {
                    // Check 2.iii and 2.iv. Make sure no null entries in the sharding index
                    // and that there is a useful, non-multikey index available
                    BSONObjBuilder cmd;
                    cmd.append( "checkShardingIndex" , ns );
                    cmd.append( "keyPattern" , proposedKey );
                    BSONObj cmdObj = cmd.obj();
                    if ( ! conn->get()->runCommand( "admin" , cmdObj , res ) ) {
                        errmsg = res["errmsg"].str();
                        conn->done();
                        return false;
                    }
                }
                // 4. if no useful index, and collection is non-empty, fail
                else if ( conn->get()->count( ns ) != 0 ) {
                    errmsg = str::stream() << "please create an index that starts with the "
                                           << "shard key before sharding.";
                    result.append( "proposedKey" , proposedKey );
                    result.appendArray( "curIndexes" , allIndexes.done() );
                    conn->done();
                    return false;
                }
                // 5. If no useful index exists, and collection empty, create one on proposedKey.
                //    Only need to call ensureIndex on primary shard, since indexes get copied to
                //    receiving shard whenever a migrate occurs.
                else {
                    // call ensureIndex with cache=false, see SERVER-1691
                    bool ensureSuccess = conn->get()->ensureIndex( ns ,
                                                                   proposedKey ,
                                                                   careAboutUnique ,
                                                                   "" ,
                                                                  false );
                    if ( ! ensureSuccess ) {
                        errmsg = "ensureIndex failed to create index on primary shard";
                        conn->done();
                        return false;
                    }
                }

		        conn->done();

                // 1. Calculate the splits for the new shard key
                log() << "[MYCODE_TIME] Split Chunks min:" << proposedShardKey.globalMin() << "\tmax:" << proposedShardKey.globalMax() << "\tmillis:" << t.millis() << "\n";
                BSONObjSet splitPoints; 
                int numChunk = manager->numChunks();

                vector<Shard> shards;
                Shard primary = grid.getDBConfig(ns)->getPrimary();
                primary.getAllShards( shards );
                int numShards = shards.size();
                long long rowCount = 0;
				for (int i = 0; i < numShards; i++)
                {
					log() << "[MYCODE] Shard Info: " << shards[i].toString() << endl;
                    scoped_ptr<ScopedDbConnection> shardconn(
                    	ScopedDbConnection::getScopedDbConnection(
                           	shards[i].getConnString() ) );
                    
                    rowCount += shardconn->get()->count(ns);
                    shardconn->done();
                }

                log() << "[MYCODE_TIME] rowCount: " << rowCount << endl;

                long long maxObjectPerChunk = rowCount / numChunk;
                //if (maxObjectPerChunk > Chunk::MaxObjectPerChunk)
                //    maxObjectPerChunk = Chunk::MaxObjectPerChunk;

                pickSplitVector(splitPoints, ns, proposedKey, proposedShardKey.globalMin(), proposedShardKey.globalMax(), Chunk::MaxChunkSize, numChunk - 1, maxObjectPerChunk);

				numChunk = splitPoints.size() + 1;
                for (BSONObjSet::iterator it = splitPoints.begin(); it != splitPoints.end(); it++)
                    log() << "[MYCODE] Split Points:" << it->toString() << endl;

                log() << "[MYCODE_TIME] Split Points Done\tmillis:" << t.millis() << endl;

                // 2. Disable the balancer
                setBalancerState(false);

                log() << "[MYCODE_TIME] Balancer Turned off\tmillis:" << t.millis() << endl;

				// 3. create replica sets and collect replica ids
                scoped_ptr<ScopedDbConnection> shardconn(
                	ScopedDbConnection::getScopedDbConnection(
                       	shards[0].getConnString() ) );

				log() << "[MYCODE_TIME] Before isMaster call" << endl;
				int numHosts = 0;
				BSONObj info;
				shardconn->get()->runCommand("admin", BSON("isMaster" << 1), info);
				log() << "[MYCODE_TIME] After isMaster call" << endl;
				BSONObjIterator iter(info["hosts"].Obj());
				while (iter.more())
				{
					string str = iter.next().String();
					numHosts++;
				}

				log() << "[MYCODE_TIME] NumHosts:" << numHosts << endl;
				shardconn->done();

				string **replicaSets = new string*[numHosts];
				for (int i = 0; i < numHosts; i++)
					replicaSets[i] = new string[numShards];
				collectReplicas(replicaSets, shards, numShards);
				log() << "[MYCODE_TIME] Replicas Collected" << endl;

				map<string, int> hostIDMap;
				collectIDs(shards, numShards, hostIDMap);
				log() << "[MYCODE_TIME] IDs Collected hostIDMap size:" << hostIDMap.size() << endl;

				for (int i = 0; i < numShards; i++)
				{
					cout << "[MYCODE] Shard " << i << ":";
					for (int j = 0; j < numHosts; j++)
					{
						cout << replicaSets[j][i] << "\t";
					}
					cout << "\n";
				}

				string removedReplicas[numShards], primaryReplicas[numShards];
				for (int i = 0; i < numShards; i++)
					removedReplicas[i] = replicaSets[0][i];
				
				for (int i = 0; i < numShards; i++)
					primaryReplicas[i] = replicaSets[numHosts - 1][i];

                // 4. Stopping the first set of replicas
				OpTime currTS[numShards];

				log() << "[MYCODE_TIME] End of PREPARE Phase:\tmillis:" << t.millis() << endl;

				log() << "[MYCODE_TIME] Stopping first set of hosts" << endl;
                cout << "[MYCODE] Namespace:" << ns << endl;
				replicaStop(ns, numShards, removedReplicas, primaryReplicas, currTS, true);

				log() << "[MYCODE_TIME] End of ISOLATION Phase:\tmillis:" << t.millis() << endl;

				// 5. Run the algorithm
				log() << "[MYCODE_TIME] Running the algorithm" << endl;
				int assignment[numChunk];
				runAlgorithm(splitPoints, ns, removedReplicas, numChunk, numShards, proposedKey, assignment);

				log() << "[MYCODE_TIME] End of Algorithm Phase:\tmillis:" << t.millis() << endl;

                // 6. Reconfiguring the first set of replicas
				log() << "[MYCODE_TIME] Reconfiguring first set of hosts" << endl;

				bool success = reconfigureHosts(ns, shards, removedReplicas, primaryReplicas, currTS, proposedKey, hostIDMap, true, errmsg, splitPoints, assignment, t);
				if (!success)
				{
				    delete[] replicaSets;
                    setBalancerState(true);
					return false;
				}

				log() << "[MYCODE_TIME] End of Primary Reconfiguration:\tmillis:" << t.millis() << endl;

				log() << "[MYCODE_TIME] Checking Timestamp before starting secondaries" << endl;

				OpTime newTS[numShards];
				checkTimestamp(removedReplicas, numShards, newTS);

				for (int i = 0; i < numShards; i++)
					primaryReplicas[i] = replicaSets[0][i];

				log() << "[MYCODE_TIME] Stopping secondary set of replicas" << endl;
				for (int j = 1; j < numHosts; j++)
				{
					cout << "[MYCODE] Stopping replicas:";
					for (int i = 0; i < numShards; i++)
					{
						cout << replicaSets[j][i] << "\t";
						removedReplicas[i] = replicaSets[j][i];
					}
					cout << endl;

                    // 7. Stopping the secondary replicas
					replicaStop(ns, numShards, removedReplicas, primaryReplicas, currTS, false);
				}

				log() << "[MYCODE_TIME] End of Secondary ISOLATION\tmillis:" << t.millis() << endl;

				log() << "[MYCODE_TIME] Reconfiguring secondary set of replicas" << endl;
				for (int j = 1; j < numHosts; j++)
				{
					cout << "[MYCODE] Reconfiguring replicas:";
					for (int i = 0; i < numShards; i++)
					{
						cout << replicaSets[j][i] << "\t";
						removedReplicas[i] = replicaSets[j][i];
					}
					cout << endl;

                    // 8. Reconfiguring the secondary replicas
					success = reconfigureHosts(ns, shards, removedReplicas, primaryReplicas, newTS, proposedKey, hostIDMap, false, errmsg, splitPoints, assignment, t);
					if (!success)
					{
				        delete[] replicaSets;
                        setBalancerState(true);
						return false;
					}
				}
				
				delete[] replicaSets;

				log() << "[MYCODE_TIME] End of Secondary Reconfigure\tmillis:" << t.millis() << endl;

                // 9. Enabling the balancer
                setBalancerState(true);

				log() << "[MYCODE_TIME] Resharding Complete\tmillis:" << t.millis() << endl;

				result.append("millis", t.millis());

				return true;
			}

            void setBalancerState(bool state)
            {
		        scoped_ptr<ScopedDbConnection> conn1( ScopedDbConnection::getInternalScopedDbConnection( 
                        configServer.getPrimary().getConnString() ) );

				//2. Disable the balancer
				try { 
					// look for the stop balancer marker
					BSONObj b1 = conn1->get()->findOne( SettingsType::ConfigNS, BSON( "_id" << "balancer" ) );
					log() << "[MYCODE] BEFORE UPDATE:" << b1.toString() << endl;
					conn1->get()->update( SettingsType::ConfigNS, BSON( "_id" << "balancer" ), BSON( "$set" << BSON( "stopped" << !state )), true );
					BSONObj b2 = conn1->get()->findOne( SettingsType::ConfigNS, BSON( "_id" << "balancer" ) );
					log() << "[MYCODE] AFTER UPDATE:" << b2.toString() << endl;
				}
				catch( DBException& e ){
                    log() << "[MYCODE] Exception trying to disable/enable balancer" << endl;
				}

                conn1->done();
            }

            void pickSplitVector( BSONObjSet& splitPoints, const string ns, BSONObj shardKey, BSONObj min, BSONObj max, int chunkSize /* bytes */, int maxPoints, int maxObjs ) const {
                // Ask the mongod holding this chunk to figure out the split points.
                vector<Shard> newShards;
                Shard newprimary = grid.getDBConfig(ns)->getPrimary();
                newprimary.getAllShards( newShards );
                int numShards = 1;

                for (int i = 0; i < numShards; i++)
                {
                    log() << "[MYCODE] Pick split Vector\n";
                    scoped_ptr<ScopedDbConnection> conn(
                            ScopedDbConnection::getInternalScopedDbConnection( newShards[i].getConnString() ) );
                    BSONObj result;
                    BSONObjBuilder cmd;
                    cmd.append( "splitVector" , ns );
                    cmd.append( "keyPattern" , shardKey );
                    cmd.append( "min" , min );
                    cmd.append( "max" , max );
                    cmd.append( "maxChunkSizeBytes" , chunkSize );
                    cmd.append( "maxSplitPoints" , maxPoints );
                    cmd.append( "maxChunkObjects" , maxObjs );
                    cmd.appendBool( "reShard" , true);
                    BSONObj cmdObj = cmd.obj();
        
                    if ( ! conn->get()->runCommand( "admin" , cmdObj , result )) {
                        conn->done();
                        log() << "[MYCODE] Pick split Vector cmd failed\n";
                        return;
                    }
        
                    log() << "[MYCODE] Pick split Vector cmd done\n";
                    BSONObjIterator it( result.getObjectField( "splitKeys" ) );
                    while ( it.more() ) {
                        splitPoints.insert( it.next().Obj().getOwned() );
                    }
                    conn->done();
                }
            }

			bool reconfigureHosts(string ns, vector<Shard> shards, string removedReplicas[], string primary[], OpTime currTS[], BSONObj proposedKey, map<string, int> hostIDMap, bool configUpdate, string &errmsg, BSONObjSet splitPoints, int assignment[], Timer t)
			{
                int numShards = shards.size();
				int numChunk = splitPoints.size() + 1;

				// 1. Chunk Migration
				log() << "[MYCODE_TIME] Migrating Chunk\tmillis:" << t.millis() << endl;
				migrateChunk(ns, proposedKey, splitPoints, numChunk, assignment, shards, removedReplicas);
				log() << "[MYCODE_TIME] End Migrating Chunk\tmillis:" << t.millis() << endl;
				log() << "[MYCODE_TIME] End EXECUTION Phase\tmillis:" << t.millis() << endl;

                //conversion from array to vector
                vector<OpTime> currTSVector(currTS, currTS + numShards);
                
                // 2. Oplog Replay once
                log() << "[MYCODE_TIME] Replaying Oplog once" << endl;
                replayOplog(ns, proposedKey, splitPoints, 
                            numShards, primary, removedReplicas, currTSVector, 
                            numChunk, assignment, 
                            errmsg, false, currTSVector);
				log() << "[MYCODE_TIME] End First Oplog Replay\tmillis:" << t.millis() << endl;

				// 3. Write Throttle
				log() << "[MYCODE_TIME] Throttling Writes" << endl;
				replicaThrottle(ns, numShards, primary, true);

                // 4. Oplog Replay again
                OpTime endTS[numShards]; 
                checkTimestamp(primary, numShards, endTS);

                //conversion from array to vector
                vector<OpTime> endTSVector(endTS, endTS + numShards);
                
                log() << "[MYCODE_TIME] Replaying Oplog again" << endl;
                replayOplog(ns, proposedKey, splitPoints, 
                            numShards, primary, removedReplicas, currTSVector, 
                            numChunk, assignment, 
                            errmsg, true, endTSVector );
				log() << "[MYCODE_TIME] End RECOVERY Phase\tmillis:" << t.millis() << endl;

				if (configUpdate)
				{
					// 5. Update Config DB
					log() << "[MYCODE_TIME] Update Config" << endl;
					updateConfig(ns, proposedKey, splitPoints, numChunk, assignment);
				}

				// 6. Replica return as primary
				log() << "[MYCODE_TIME] Replica Return" << endl;
				replicaReturn(ns, numShards, removedReplicas, primary, hostIDMap, configUpdate);

				// 7. Write UnThrottle
				log() << "[MYCODE_TIME] UnThrottling Writes" << endl;
				replicaThrottle(ns, numShards, primary, false);
				log() << "[MYCODE_TIME] End COMMIT Phase\tmillis:" << t.millis() << endl;

                return true;
            }

            bool replayOplog(const string ns, BSONObj proposedKey, BSONObjSet splitPoints,  
                                int numShards, string primary[], string removedReplicas[], vector<OpTime>& startTS,
                                int numChunks,  int assignments[], 
                                string& errmsg, bool replayAllOps, vector<OpTime>& endTS) {
                //success variable
                bool success = true;

                cout<<"[MYCODE_HOLLA] ==== In replyOplog ==== "<<endl;

                //global min and max (positive and negative infinities)
                BSONObj globalMin = ShardKeyPattern(proposedKey).globalMin();
                BSONObj globalMax = ShardKeyPattern(proposedKey).globalMax();

                //conversion from arrays to vectors for bundling into bson
                vector<string> removedReplicasVector(removedReplicas, removedReplicas + numShards);
                vector<int> assignmentsVector(assignments, assignments + numChunks);

                //conversion from BSONObjSet to BSONObj for bundling into bson
                vector<BSONObj> points;
                for(BSONObjSet::iterator point = splitPoints.begin(); point != splitPoints.end(); point++) {
                    points.push_back(*point);
                }

                //create the thread tracker
                vector<shared_ptr<boost::thread> > replayOplogThreads;

                //iterate over each removed replica and ask mongod to attempt replay of oplog
                for (int i = 0; i < numShards; i++) {
                    //TODO GOPAL: Comment this out!
                    //startTS[i] = OpTime(1,1);

                    //bundle the params
                    BSONObjBuilder params;
                    params.append("ns", ns);                                            //namespace
                    params.append("startTime", startTS[i]);                             //time from which oplog needs to be replayed                         
                    params.append("primary", primary[i]);                               //the primary to connect to (for oplog details)
                    params.append("shardID", i);                                        //the id for this particular shard
                    params.append("numChunks", numChunks);                              //number of chunks
                    params.append("proposedKey", proposedKey);                          //the proposed key
                    params.append("globalMin", globalMin);                              //global min
                    params.append("globalMax", globalMax);                              //global max
                    params.append("splitPoints", points);                               //split points
                    params.append("assignments", assignmentsVector);                    //the new assignments for chunks
                    params.append("removedReplicas", removedReplicasVector);            //the other removed replicas
                    params.append("replayAllOps", replayAllOps);                        //replay all ops or not (if false, caps ops to replay which might or might not cover all ops)

                    if(replayAllOps){
                        params.append("endTime", endTS[i]);                              //if replayAllOps is true then we need a time till when we want to replay
                    }

                    //create an object to encapsulate all the params
                    BSONObj oplogParams = params.obj();                 
                    cout<<"[MYCODE_HOLLA] Oplog params are "<< oplogParams.toString()<<endl;

                    //create threads and push threads into thread tracker
                    replayOplogThreads.push_back(shared_ptr<boost::thread>(
                                    new boost::thread (boost::bind(&ReShardCollectionCmd::delegateReplay, 
                                        this, removedReplicas[i], oplogParams, &startTS[i]))));                    
                }

                for (unsigned i = 0; i < replayOplogThreads.size(); i++) {
                    replayOplogThreads[i]->join();
                    cout << "Oplog for " << removedReplicas[i] << " needs to be replayed from " << startTS[i].toString() << endl;
                    //TODO GOPAL: find a way of returning these errors
                }

                return success;

            }

            void delegateReplay(string replica, BSONObj oplogParams, OpTime *startTS) {
                BSONObj info;

                //make a connection to the required replica
                scoped_ptr<ScopedDbConnection> conn(
                    ScopedDbConnection::getScopedDbConnection(
                        replica ) );

                //attempt to tell mongod to run the command
                bool done = true;
                int trials = 0;
                do {
                    done = true;
                    try {
                        //make the connection and issue the command
                        cout<<"[MYCODE_HOLLA] Making a connection to "<< replica <<endl;
                        
                        if( !conn->get()->runCommand("admin", BSON("replayOplog" << oplogParams), info)) {
                            cout<<"[MYCODE_HOLLA] Replay Command failed at " << replica << endl;
                            string errmsg = conn->get()->getLastError();
                            cout<<"[MYCODE_HOLLA] ErrMsg: "<<errmsg<<endl;
                            //TODO GOPAL: What do you do if this happens? Retry/Fail?
                        } else {
                            //TODO GOPAL: Do we want anything from info?
                            cout<<"[MYCODE_HOLLA] Replay Info from " << replica << " has: "<<info.toString()<<endl;
                            if(!info["lastOpTime"].eoo()) {
                                *startTS = info["lastOpTime"]._opTime();
                            }
                        }
                    }
                    catch(DBException e){
                        //oops something went wrong
                        //TODO GOPAL: What do you do if this happens? Retry/Fail?
                        cout << "[MYCODE_HOLLA] replayOplog connecting to " << replica << " threw exception: " << e.toString() << endl;
                        done = false;
                        trials++;
                    }
                } while (!done && trials < 10);

                if(!done && trials >= 10) {
                    cout << "[MYCODE_HOLLA] Could not replay oplog on " << replica << endl;
                }
                //close the connection
                conn->done();
            }

			void collectReplicas(string** replicaSets, vector<Shard> newShards, int numShards)
			{
				BSONObj info;
				int hostNum;
				for (int i = 0; i < numShards; i++)
				{
					hostNum = 0;
					printf("[MYCODE] MYCUSTOMPRINT: %s\n", newShards[i].getConnString().c_str());
                	scoped_ptr<ScopedDbConnection> conn(
                		ScopedDbConnection::getScopedDbConnection(
                        	newShards[i].getConnString() ) );

					conn->get()->runCommand("admin", BSON("isMaster" << 1), info);
					string primaryStr = info["primary"].String();

					BSONObjIterator iter(info["hosts"].Obj());
					while (iter.more())
					{
						string hostName = iter.next().String();
						if (primaryStr.compare(hostName))
							replicaSets[hostNum++][i] = hostName;
					}
					replicaSets[hostNum][i] = primaryStr;

					conn->done();
				}
			}

			void collectIDs(vector<Shard> newShards, int numShards, map<string, int>& hostIDMap)
			{
				BSONObj info;
				int hostNum;
				for (int i = 0; i < numShards; i++)
				{
					hostNum = 0;
					printf("[MYCODE] MYCUSTOMPRINT: %s\n", newShards[i].getConnString().c_str());
                	scoped_ptr<ScopedDbConnection> conn(
                		ScopedDbConnection::getScopedDbConnection(
                        	newShards[i].getConnString() ) );

					conn->get()->runCommand("admin", BSON("getIdentifier" << 1), info);
					vector<BSONElement> hosts = info["hosts"].Array();
					vector<BSONElement> ids = info["id"].Array();
					vector<BSONElement>::iterator dit = ids.begin();
					for (vector<BSONElement>::iterator hit = hosts.begin(); hit != hosts.end(); hit++,dit++)
					{
						string host = (*hit).String();
						int id = (*dit).Int();
						cout << "[MYCODE] Host:" << host << " ID:" << id << endl;
						hostIDMap.insert(pair<string, int>(host, id));
					}

					conn->done();
				}
				cout << "[MYCODE] hostIDMap size: " << hostIDMap.size() << endl;
			}

			void checkTimestamp(string shards[], int numShards, OpTime startTS[])
			{
				BSONObj info;
				for (int i = 0; i < numShards; i++)
				{
					while(!oplogReader.connect(shards[i]))
                    {
                        cout << "[MYCODE] Oplog Reader Connect Failed" << endl;
                    }

					BSONObj lastOp = oplogReader.getLastOp(rsoplog);
					OpTime lastOpTS = lastOp["ts"]._opTime();

					startTS[i] = lastOpTS;
					oplogReader.resetConnection();
				}
			}

			void runAlgorithm(BSONObjSet splitPoints, string ns, string replicas[], int numChunk, int numShards, BSONObj proposedKey, int assignment[])
			{
				printf("[MYCODE] RUNALGORITHM\n");
				long long **datainkr;
                datainkr = new long long*[numChunk];
				for (int i = 0; i < numChunk; i++)
                    datainkr[i] = new long long[numShards];

				for (int i = 0; i < numChunk; i++)
					for (int j = 0; j < numShards; j++)
						datainkr[i][j] = 0;

                collectData(splitPoints, ns, replicas, numChunk, numShards, proposedKey, datainkr);

				for (int i = 0; i < numChunk; i++)
				{
					int max = 0, shard_num = 0;
					for (int j = 0; j < numShards; j++)
					{
						if (max < datainkr[i][j])
						{
							max = datainkr[i][j];
							shard_num = j;
						}
					}
					assignment[i] = shard_num;
				}

				cout << "[MYCODE] ASSIGNMENT:\n [MYCODE] ";
				for (int i = 0; i < numChunk; i++)
					cout << assignment[i] << "\t";
				cout << "\n";

                delete[] datainkr;
			}

            void collectData(BSONObjSet splitPoints, string ns, string replicas[], int numChunk, int numShards, BSONObj proposedKey, long long **datainkr)
            {
			    const char *key = proposedKey.firstElement().fieldName();
                BSONObj globalMin = ShardKeyPattern(proposedKey).globalMin();
                BSONObj globalMax = ShardKeyPattern(proposedKey).globalMax();
                for (int i = 0; i < numShards; i++)
                {
                	scoped_ptr<ScopedDbConnection> conn(
                		ScopedDbConnection::getScopedDbConnection(
							replicas[i] ) );

                    long long total = conn->get()->count(ns, BSONObj(), QueryOption_SlaveOk);
                    cout << "[MYCODE] Shard " << i << " count:" << total << endl;

                    BSONObjSet::iterator it = splitPoints.begin();
                    BSONObj prev;
                    for (int j = 0; j < numChunk; j++)
                    {
                        BSONObj min = j > 0 ? prev : globalMin;
                        BSONObj max = j == numChunk - 1 ? globalMax : *it;

                        BSONObj range = getRangeAsBSON(key, min, max);
                        //cout << "[MYCODE] Range:" << range.toString() << endl;
						while (true) {
							cout << "[MYCODE] Range:" << range.toString() << endl;
                        	try
                        	{
							    datainkr[j][i] = conn->get()->count(ns, range, QueryOption_SlaveOk);
								break;
                        	    //cout << "[MYCODE] Error:" << conn->get()->getLastError() << endl;
                        	}
                        	catch(DBException e)
                        	{
                        	    cout << "[MYCODE] Exception trying to populate datainkr: " << e.what() << endl;
								continue;
                        	}
						}

						//cout << "[MYCODE] j:" << j << " numChunk:" << numChunk << endl;
						if (j < numChunk - 1)
						{
                        	prev = *it;
                        	it++;
						}
						//cout << "[MYCODE] prev:" << prev.toString() << " *it:" << it->toString() << endl;
                    }

                    conn->done();
                }

				cout << "[MYCODE] DATAINKR:" << endl;
				for (int i = 0; i < numChunk; i++)
				{
					cout << "[MYCODE] ";
					for (int j = 0; j < numShards; j++)
						cout << datainkr[i][j] << "\t";
					cout << endl;
				}
            }

            BSONObj getRangeAsBSON(const char* key, BSONObj min, BSONObj max)
            {
                BSONElement minElem = min[key];
                BSONElement maxElem = max[key];

                BSONObjBuilder b;
                BSONObjBuilder sub(b.subobjStart(key));
                if (minElem.type() == MinKey)
                    sub.appendAs(maxElem, "$lt");
                else if (maxElem.type() == MaxKey)
                    sub.appendAs(minElem, "$gte");
                else
                {
                    sub.appendAs(minElem, "$gte");
                    sub.appendAs(maxElem, "$lt");
                }

                BSONObj subObj = sub.done();
                BSONObj range = b.done().getOwned();
                return range;
            }

			void migrateChunk(const string ns, BSONObj proposedKey, BSONObjSet splitPoints, int numChunk, int assignment[], vector<Shard> shards, string removedReplicas[])
			{
                vector<Shard> newShards;
                Shard primary = grid.getDBConfig(ns)->getPrimary();
                primary.getAllShards( newShards );
                int numShards = newShards.size();
				for (int i = 0; i < numShards; i++)
					cout << "[MYCODE] Shard Info: " << newShards[i].toString() << endl;

				/*string newRemovedReplicas[numShards];
				for (int i = 0; i < numShards; i++)
				{
					for (int j = 0; j < numShards; j++)
					{
						if (!newShards[i].getName().compare(shards[j].getName()))
						{
							newRemovedReplicas[i] = removedReplicas[j];
						}
					}
				}*/

				vector<shared_ptr<boost::thread> > migrateThreads;

				const char *key = proposedKey.firstElement().fieldName();
                BSONObj globalMin = ShardKeyPattern(proposedKey).globalMin();
                BSONObj globalMax = ShardKeyPattern(proposedKey).globalMax();
                BSONObjSet::iterator it = splitPoints.begin();
                BSONObj prev;
				long long sourceCount;

				for (int i = 0; i < numChunk; i++)
				{
                    BSONObj min = i > 0 ? prev : globalMin;
                    BSONObj max = i == numChunk - 1 ? globalMax : *it;
                    BSONObj range = getRangeAsBSON(key, min, max);
                    cout << "[MYCODE] Range:" << range.toString() << endl;

		 			for (int j = 0; j < numShards; j++)
					{
						if (j != assignment[i])
						{
							scoped_ptr<ScopedDbConnection> fromconn(
                				ScopedDbConnection::getScopedDbConnection(
                        			removedReplicas[j] ) );

							while (true)
							{
								try
								{
									sourceCount = fromconn->get()->count(ns, range, QueryOption_SlaveOk);
									break;
								}
								catch (DBException e)
								{
									continue;
								}
							}
							
							fromconn->done();
							
							if (sourceCount > 0)
							{
								migrateThreads.push_back(shared_ptr<boost::thread>(
									new boost::thread (boost::bind(&ReShardCollectionCmd::singleMigrate, this, removedReplicas, range, key, min, i, j, assignment, ns))));
							}
						}
					}

					if (i < numChunk - 1)
					{
                    	prev = *it;
                    	it++;
					}
				}

				for (unsigned i = 0; i < migrateThreads.size(); i++) {
					migrateThreads[i]->join();
				}

				long long **datainkr;
                datainkr = new long long*[numChunk];
				for (int i = 0; i < numChunk; i++)
                    datainkr[i] = new long long[numShards];

				for (int i = 0; i < numChunk; i++)
					for (int j = 0; j < numShards; j++)
						datainkr[i][j] = 0;

                //collectData(splitPoints, ns, removedReplicas, numChunk, numShards, proposedKey, datainkr);

                delete[] datainkr;
			}

			void singleMigrate(string removedreplicas[], BSONObj range, const char *key, BSONObj min, int i, int j, int assignment[], const string ns)
			{
				BSONObj res;

                scoped_ptr<ScopedDbConnection> toconn(
               		ScopedDbConnection::getScopedDbConnection(
                 		removedreplicas[assignment[i]] ) );

				scoped_ptr<ScopedDbConnection> fromconn(
               		ScopedDbConnection::getScopedDbConnection(
                     	removedreplicas[j] ) );

				long long sourceCount = fromconn->get()->count(ns, range, QueryOption_SlaveOk);
				long long dstCount = toconn->get()->count(ns, range, QueryOption_SlaveOk);

				while (true)
				{
					try
					{
						sourceCount = fromconn->get()->count(ns, range, QueryOption_SlaveOk);
						break;
					}
					catch (DBException e)
					{
						continue;
					}
				}

				while (true)
				{
					try
					{
						dstCount = toconn->get()->count(ns, range, QueryOption_SlaveOk);
						break;
					}
					catch (DBException e)
					{
						continue;
					}
				}

				cout << "[MYCODE] Chunk " << i << " moving data from shard " << j << " to " << assignment[i] << endl;
				cout << "[MYCODE] Source Count: " << sourceCount << " Dest Count: " << dstCount << endl;

                BSONObjBuilder b;
                b.appendAs(min[key], "min");
                BSONObj minID = b.done();

				try
				{
					toconn->get()->runCommand( "admin" , 
						BSON( 	"moveData" << ns <<
								"key" << key << 
      							"from" << removedreplicas[j] << 
      							"to" << removedreplicas[assignment[i]] << 
      							/////////////////////////////// 
      							"range" << range << 
      							"maxChunkSizeBytes" << Chunk::MaxChunkSize << 
      							"shardId" << Chunk::genID(ns, minID) << 
      							"configdb" << configServer.modelServer() << 
      							"secondaryThrottle" << true 
      						) ,
							res
					);
				}
				catch (DBException e)
				{
					cout << "[MYCODE] Caught exception while moving data:" << e.what() << endl;
				}

				toconn->done();
				fromconn->done();
			}

			void replicaStop(const string ns, int numShards, string removedReplicas[], string primary[], OpTime startTS[], bool collectTS)
			{
				// Code for bringing down replica
				vector<shared_ptr<boost::thread> > stopThreads;
				for (int i = 0; i < numShards; i++)
				{
					printf("[MYCODE] MYCUSTOMPRINT: %s going to remove %s\n", primary[i].c_str(), removedReplicas[i].c_str());

					if (collectTS)
					{
                        while(!oplogReader.connect(primary[i]))
                        {
                            cout << "[MYCODE] Oplog Reader Connect Failed" << endl;
                        }

						BSONObj lastOp = oplogReader.getLastOp(rsoplog);
						OpTime lastOpTS = lastOp["ts"]._opTime();
						startTS[i] = lastOpTS;
						oplogReader.resetConnection();
					}

                    stopThreads.push_back(shared_ptr<boost::thread>(new boost::thread (boost::bind(&ReShardCollectionCmd::singleStop, this, primary[i], removedReplicas[i], ns))));
                }

				for (unsigned i = 0; i < stopThreads.size(); i++) 
					stopThreads[i]->join();
            }

            /*void singleStop(string primary, string removedReplica)
            {
				BSONObj info;
                scoped_ptr<ScopedDbConnection> conn(
                	ScopedDbConnection::getScopedDbConnection(
                       	primary ) );
                
                try
				{
					conn->get()->runCommand("admin", BSON("replSetRemove" << removedReplica), info);
				}
				catch(DBException e){
					cout << "[MYCODE] stepping down" << " threw exception: " << e.toString() << endl;
				}

				conn->done();
			}*/

            void singleStop(string primary, string removedReplica, string ns)
            {
				BSONObj info;
                scoped_ptr<ScopedDbConnection> conn(
                	ScopedDbConnection::getScopedDbConnection(
                       	removedReplica ) );
                
                try
				{
					conn->get()->runCommand("admin", BSON("replSetWriteThrottle" << "local.oplogthrottle" << "namespace" << ns << "throttle" << true), info);
				}
				catch(DBException e){
					cout << "[MYCODE] stepping down" << " threw exception: " << e.toString() << endl;
				}

				conn->done();
			}

			void replicaReturn(const string ns, int numShards, string removedReplicas[], string primary[], map<string, int> hostIDMap, bool makePrimary)
			{
				// Code for adding back replica
				cout << "[MYCODE] hostIDMap size:" << hostIDMap.size() << endl;

				int hostID = -1;
				vector<shared_ptr<boost::thread> > returnThreads;

				for (int i = 0; i < numShards; i++)
				{
					printf("[MYCODE] MYCUSTOMPRINT: %s going to add %s\n", primary[i].c_str(), removedReplicas[i].c_str());

					hostID = -1;
					for (map<string, int>::iterator it = hostIDMap.begin(); it != hostIDMap.end(); it++)
					{
						if (!removedReplicas[i].compare(it->first))
						{
							hostID = it->second;
							cout << "[MYCODE] Adding host id:" << hostID << endl;
							break;
						}
					}

					verify(hostID != -1);

                    returnThreads.push_back(shared_ptr<boost::thread>(new boost::thread (boost::bind(&ReShardCollectionCmd::singleReturn, this, primary[i], removedReplicas[i], ns, makePrimary, hostID))));
                }

				for (unsigned i = 0; i < returnThreads.size(); i++) 
					returnThreads[i]->join();
            }

            void singleReturn(string primary, string removedReplica, string ns, bool makePrimary, int hostID)
            {
				BSONObj info;
                scoped_ptr<ScopedDbConnection> conn(
                	ScopedDbConnection::getScopedDbConnection(
                       	primary ) );

                scoped_ptr<ScopedDbConnection> hostConn(
                	ScopedDbConnection::getScopedDbConnection(
                       	removedReplica ) );
				try
				{
					conn->get()->runCommand("admin", BSON("replSetAdd" << removedReplica << "primary" << makePrimary << "id" << hostID), info);
					string errmsg = conn->get()->getLastError();
					cout << "[MYCODE] Replica Return:" << errmsg << endl;
				}
				catch(DBException e){
					cout << "[MYCODE] adding replica" << " threw exception: " << e.toString() << endl;
				}

				try
				{
					hostConn->get()->runCommand("admin", BSON("replSetWriteThrottle" << "local.oplogthrottle" << "namespace" << ns << "throttle" << false), info);
					string errmsg = hostConn->get()->getLastError();
					cout << "[MYCODE] Write Throttle:" << errmsg << endl;
				}
				catch(DBException e){
					cout << "[MYCODE] oplog throttle replica" << " threw exception: " << e.toString() << endl;
				}

				conn->done();
                hostConn->done();
			}

			void replicaThrottle(const string ns, int numShards, string primary[], bool throttle)
			{
				vector<shared_ptr<boost::thread> > throttleThreads;

				for (int i = 0; i < numShards; i++)
				{
					printf("[MYCODE] MYCUSTOMPRINT: %s going to send throttle write command\n", primary[i].c_str());

                    throttleThreads.push_back(shared_ptr<boost::thread>(new boost::thread (boost::bind(&ReShardCollectionCmd::singleThrottle, this, primary[i], ns, throttle))));
                }

				for (unsigned i = 0; i < throttleThreads.size(); i++) 
					throttleThreads[i]->join();
            }

            void singleThrottle(string primary, string ns, bool throttle)
            {
				BSONObj info;
                scoped_ptr<ScopedDbConnection> conn(
                	ScopedDbConnection::getScopedDbConnection(
                       	primary ) );

				try
				{
					conn->get()->runCommand("admin", BSON("replSetWriteThrottle" << "local.writethrottle" << "namespace" << ns << "throttle" << throttle), info);
					string errmsg = conn->get()->getLastError();
					cout << "[MYCODE] Replica Return:" << errmsg << endl;
				}
				catch(DBException e){
					cout << "[MYCODE] adding replica" << " threw exception: " << e.toString() << endl;
				}

				conn->done();
			}

			void updateConfig(string ns, BSONObj proposedKey, BSONObjSet splitPoints, int numChunk, int assignment[])
			{
           		DistributedLock lockSetup( ConnectionString( configServer.getPrimary().getConnString() , ConnectionString::SYNC ) , ns ); 
           		dist_lock_try dlk;
				string errmsg;

           		try{ 
               		dlk = dist_lock_try( &lockSetup , "Reshard Collection" ); 
           		}
           		catch( LockException& e ){ 
               		errmsg = str::stream() << "error reshard collection " << causedBy( e ); 
               		return; 
           		} 

           		if ( ! dlk.got() ) { 
               		errmsg = str::stream() << "the collection metadata could not be locked with lock "; 
               		return; 
           		}

				//Remove all the chunk entries for given ns
                scoped_ptr<ScopedDbConnection> conn(
                	ScopedDbConnection::getScopedDbConnection(
                       	configServer.getPrimary().getConnString() ) );

				BSONObj query = BSON(ChunkType::ns() << ns);
				auto_ptr<DBClientCursor> cursor(conn->get()->query(ChunkType::ConfigNS, query));
				cout << "[MYCODE] Current Config Contents" << endl;
                while ( cursor->more() ) {
                    BSONObj o = cursor->next();
                    cout << "[MYCODE] " << o.toString() << endl;
                }

				ChunkVersion maxVersion;
				{
    				BSONObj x;
    				try {
        				x = conn->get()->findOne(ChunkType::ConfigNS,
                			Query(BSON(ChunkType::ns(ns)))
                                .sort(BSON(ChunkType::DEPRECATED_lastmod() << -1)));

    				}
					catch( DBException& e ){
        				string errmsg = str::stream() << "aborted update config" << causedBy( e );
        				warning() << errmsg << endl;
        				return;
    				}
					cout << "[MYCODE] x: " << x.toString() << endl;
					maxVersion = ChunkVersion::fromBSON(x, ChunkType::DEPRECATED_lastmod());
				}

				cout << "[MYCODE] MAXVERSION: " << maxVersion.toString() << endl;

				try
				{
					conn->get()->remove(ChunkType::ConfigNS, query);
				}
				catch (DBException e)
				{
					cout << "[MYCODE] All the chunk metadata could not be removed " << e.what() << endl;
				}

				maxVersion.incMinor();
				cout << "[MYCODE] MAXVERSION: " << maxVersion.toString() << endl;
				ChunkManager* cm = new ChunkManager( ns, proposedKey, true );

                vector<Shard> shards;
                Shard primary = grid.getDBConfig(ns)->getPrimary();
                primary.getAllShards( shards );
				int numShards = shards.size();
				for (int i = 0; i < numShards; i++)
					cout << "[MYCODE] Shard Info: " << shards[i].toString() << endl;

				BSONObj globalMin = ShardKeyPattern(proposedKey).globalMin();
				BSONObj globalMax = ShardKeyPattern(proposedKey).globalMax();
				BSONObjSet::iterator it = splitPoints.begin();
				BSONObj prev;

				//Add the new chunk entries
				for (int i = 0; i < numChunk; i++)
				{
                    BSONObj min = i > 0 ? prev : globalMin;
                    BSONObj max = i == numChunk - 1 ? globalMax : *it;

					Chunk temp(cm, min, max, shards[assignment[i]], maxVersion);
					BSONObjBuilder n;
					temp.serialize(n);
                    BSONObj chunkInfo = n.done();

					cout << "[MYCODE] New Config Members:" << chunkInfo.toString() << endl;

					try
					{
						conn->get()->update(ChunkType::ConfigNS, QUERY(ChunkType::name(temp.genID())), chunkInfo, true, false);
					}
					catch (DBException e)
					{
						cout << "[MYCODE] Insert to chunk metadata failed " << e.what() << endl;
					}
					maxVersion.incMinor();
					cout << "[MYCODE] MAXVERSION: " << maxVersion.toString() << endl;

					if (i < numChunk - 1)
					{
						prev = *it;
						it++;
					}
				}

				auto_ptr<DBClientCursor> cursor1(conn->get()->query(ChunkType::ConfigNS, query));
				cout << "[MYCODE] Current Config Contents" << endl;
                while ( cursor1->more() ) {
                    BSONObj o = cursor1->next();
                    cout << "[MYCODE]" << o.toString() << endl;
                }

				conn->done();

                DBConfigPtr config = grid.getDBConfig( ns );
				config->resetCM(ns, cm);
                config->reload();
                config->getChunkManager( ns , true );
			}

			private:
				OplogReader oplogReader;

        } reShardCollectionCmd;

        class GetShardVersion : public GridAdminCmd {
        public:
            GetShardVersion() : GridAdminCmd( "getShardVersion" ) {}
            virtual void help( stringstream& help ) const {
                help << " example: { getShardVersion : 'alleyinsider.foo'  } ";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::getShardVersion);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                string ns = cmdObj.firstElement().valuestrsafe();
                if ( ns.size() == 0 ) {
                    errmsg = "need to specify fully namespace";
                    return false;
                }

                DBConfigPtr config = grid.getDBConfig( ns );
                if ( ! config->isSharded( ns ) ) {
                    errmsg = "ns not sharded.";
                    return false;
                }

                ChunkManagerPtr cm = config->getChunkManagerIfExists( ns );
                if ( ! cm ) {
                    errmsg = "no chunk manager?";
                    return false;
                }
                cm->_printChunks();
                cm->getVersion().addToBSON( result );

                return 1;
            }
        } getShardVersionCmd;

        class SplitCollectionCmd : public GridAdminCmd {
        public:
            SplitCollectionCmd() : GridAdminCmd( "split" ) {}
            virtual void help( stringstream& help ) const {
                help
                        << " example: - split the shard that contains give key \n"
                        << " { split : 'alleyinsider.blog.posts' , find : { ts : 1 } }\n"
                        << " example: - split the shard that contains the key with this as the middle \n"
                        << " { split : 'alleyinsider.blog.posts' , middle : { ts : 1 } }\n"
                        << " NOTE: this does not move move the chunks, it merely creates a logical separation \n"
                        ;
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::split);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                if ( ! okForConfigChanges( errmsg ) )
                    return false;

                ShardConnection::sync();

                string ns = cmdObj.firstElement().valuestrsafe();
                if ( ns.size() == 0 ) {
                    errmsg = "no ns";
                    return false;
                }

                DBConfigPtr config = grid.getDBConfig( ns );
                if ( ! config->isSharded( ns ) ) {
                    config->reload();
                    if ( ! config->isSharded( ns ) ) {
                        errmsg = "ns not sharded.  have to shard before can split";
                        return false;
                    }
                }

                const BSONField<BSONObj> findField("find", BSONObj());
                const BSONField<BSONArray> boundsField("bounds", BSONArray());
                const BSONField<BSONObj> middleField("middle", BSONObj());

                BSONObj find;
                if (FieldParser::extract(cmdObj, findField, &find, &errmsg) ==
                        FieldParser::FIELD_INVALID) {
                    return false;
                }

                BSONArray bounds;
                if (FieldParser::extract(cmdObj, boundsField, &bounds, &errmsg) ==
                        FieldParser::FIELD_INVALID) {
                    return false;
                }

                if (!bounds.isEmpty()) {
                    if (!bounds.hasField("0")) {
                        errmsg = "lower bound not specified";
                        return false;
                    }

                    if (!bounds.hasField("1")) {
                        errmsg = "upper bound not specified";
                        return false;
                    }
                }

                if (!find.isEmpty() && !bounds.isEmpty()) {
                    errmsg = "cannot specify bounds and find at the same time";
                    return false;
                }

                BSONObj middle;
                if (FieldParser::extract(cmdObj, middleField, &middle, &errmsg) ==
                        FieldParser::FIELD_INVALID) {
                    return false;
                }

                if (find.isEmpty() && bounds.isEmpty() && middle.isEmpty()) {
                    errmsg = "need to specify find/bounds or middle";
                    return false;
                }

                if (!find.isEmpty() && !middle.isEmpty()) {
                    errmsg = "cannot specify find and middle together";
                    return false;
                }

                if (!bounds.isEmpty() && !middle.isEmpty()) {
                    errmsg = "cannot specify bounds and middle together";
                    return false;
                }

                ChunkManagerPtr info = config->getChunkManager( ns );
                ChunkPtr chunk;

                if (!find.isEmpty()) {
                    chunk = info->findChunkForDoc(find);
                }
                else if (!bounds.isEmpty()) {
                    chunk = info->findIntersectingChunk(bounds[0].Obj());
                    verify(chunk.get());

                    if (chunk->getMin() != bounds[0].Obj() ||
                        chunk->getMax() != bounds[1].Obj()) {
                        errmsg = "no chunk found from the given upper and lower bounds";
                        return false;
                    }
                }
                else { // middle
                    chunk = info->findIntersectingChunk(middle);
                }

                verify(chunk.get());
                log() << "splitting: " << ns << "  shard: " << chunk << endl;

                BSONObj res;
                bool worked;
                if ( middle.isEmpty() ) {
                    BSONObj ret = chunk->singleSplit( true /* force a split even if not enough data */ , res );
                    worked = !ret.isEmpty();
                }
                else {
                    // sanity check if the key provided is a valid split point
                    if ( ( middle == chunk->getMin() ) || ( middle == chunk->getMax() ) ) {
                        errmsg = "cannot split on initial or final chunk's key";
                        return false;
                    }

                    if (!fieldsMatch(middle, info->getShardKey().key())){
                        errmsg = "middle has different fields (or different order) than shard key";
                        return false;
                    }

                    vector<BSONObj> splitPoints;
                    splitPoints.push_back( middle );
                    worked = chunk->multiSplit( splitPoints , res );
                }

                if ( !worked ) {
                    errmsg = "split failed";
                    result.append( "cause" , res );
                    return false;
                }
                config->getChunkManager( ns , true );
                return true;
            }
        } splitCollectionCmd;

        class MoveChunkCmd : public GridAdminCmd {
        public:
            MoveChunkCmd() : GridAdminCmd( "moveChunk" ) {}
            virtual void help( stringstream& help ) const {
                help << "Example: move chunk that contains the doc {num : 7} to shard001\n"
                     << "  { movechunk : 'test.foo' , find : { num : 7 } , to : 'shard0001' }\n"
                     << "Example: move chunk with lower bound 0 and upper bound 10 to shard001\n"
                     << "  { movechunk : 'test.foo' , bounds : [ { num : 0 } , { num : 10 } ] "
                     << " , to : 'shard001' }\n";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::moveChunk);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                if ( ! okForConfigChanges( errmsg ) )
                    return false;

                ShardConnection::sync();

                Timer t;
                string ns = cmdObj.firstElement().valuestrsafe();
                if ( ns.size() == 0 ) {
                    errmsg = "no ns";
                    return false;
                }

                DBConfigPtr config = grid.getDBConfig( ns );
                if ( ! config->isSharded( ns ) ) {
                    config->reload();
                    if ( ! config->isSharded( ns ) ) {
                        errmsg = "ns not sharded.  have to shard before we can move a chunk";
                        return false;
                    }
                }

                string toString = cmdObj["to"].valuestrsafe();
                if ( ! toString.size()  ) {
                    errmsg = "you have to specify where you want to move the chunk";
                    return false;
                }

                Shard to = Shard::make( toString );

                // so far, chunk size serves test purposes; it may or may not become a supported parameter
                long long maxChunkSizeBytes = cmdObj["maxChunkSizeBytes"].numberLong();
                if ( maxChunkSizeBytes == 0 ) {
                    maxChunkSizeBytes = Chunk::MaxChunkSize;
                }

                BSONObj find = cmdObj.getObjectField( "find" );
                BSONObj bounds = cmdObj.getObjectField( "bounds" );

                // check that only one of the two chunk specification methods is used
                if ( find.isEmpty() == bounds.isEmpty() ) {
                    errmsg = "need to specify either a find query, or both lower and upper bounds.";
                    return false;
                }

                ChunkManagerPtr info = config->getChunkManager( ns );
                ChunkPtr c = find.isEmpty() ?
                                info->findIntersectingChunk( bounds[0].Obj() ) :
                                info->findChunkForDoc( find );

                if ( ! bounds.isEmpty() && ( c->getMin() != bounds[0].Obj() ||
                                             c->getMax() != bounds[1].Obj() ) ) {
                    errmsg = "no chunk found with those upper and lower bounds";
                    return false;
                }

                const Shard& from = c->getShard();

                if ( from == to ) {
                    errmsg = "that chunk is already on that shard";
                    return false;
                }

                tlog() << "CMD: movechunk: " << cmdObj << endl;

                BSONObj res;
                if (!c->moveAndCommit(to,
                                      maxChunkSizeBytes,
                                      cmdObj["_secondaryThrottle"].trueValue(),
                                      cmdObj["_waitForDelete"].trueValue(),
                                      res)) {
                    errmsg = "move failed";
                    result.append( "cause" , res );
                    return false;
                }
                
                // preemptively reload the config to get new version info
                config->getChunkManager( ns , true );

                result.append( "millis" , t.millis() );
                return true;
            }
        } moveChunkCmd;

        // ------------ server level commands -------------

        class ListShardsCmd : public GridAdminCmd {
        public:
            ListShardsCmd() : GridAdminCmd("listShards") { }
            virtual void help( stringstream& help ) const {
                help << "list all shards of the system";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::listShards);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                scoped_ptr<ScopedDbConnection> conn(
                        ScopedDbConnection::getInternalScopedDbConnection(
                                configServer.getPrimary().getConnString(), 30));

                vector<BSONObj> all;
                auto_ptr<DBClientCursor> cursor = conn->get()->query( ShardType::ConfigNS , BSONObj() );
                while ( cursor->more() ) {
                    BSONObj o = cursor->next();
                    all.push_back( o );
                }

                result.append("shards" , all );
                conn->done();

                return true;
            }
        } listShardsCmd;

        /* a shard is a single mongod server or a replica pair.  add it (them) to the cluster as a storage partition. */
        class AddShard : public GridAdminCmd {
        public:
            AddShard() : GridAdminCmd("addShard") { }
            virtual void help( stringstream& help ) const {
                help << "add a new shard to the system";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::addShard);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                errmsg.clear();

                // get replica set component hosts
                ConnectionString servers = ConnectionString::parse( cmdObj.firstElement().valuestrsafe() , errmsg );
                if ( ! errmsg.empty() ) {
                    log() << "addshard request " << cmdObj << " failed:" << errmsg << endl;
                    return false;
                }

                // using localhost in server names implies every other process must use localhost addresses too
                vector<HostAndPort> serverAddrs = servers.getServers();
                for ( size_t i = 0 ; i < serverAddrs.size() ; i++ ) {
                    if ( serverAddrs[i].isLocalHost() != grid.allowLocalHost() ) {
                        errmsg = str::stream() << 
                            "can't use localhost as a shard since all shards need to communicate. " <<
                            "either use all shards and configdbs in localhost or all in actual IPs " << 
                            " host: " << serverAddrs[i].toString() << " isLocalHost:" << serverAddrs[i].isLocalHost();
                        
                        log() << "addshard request " << cmdObj << " failed: attempt to mix localhosts and IPs" << endl;
                        return false;
                    }

                    // it's fine if mongods of a set all use default port
                    if ( ! serverAddrs[i].hasPort() ) {
                        serverAddrs[i].setPort( CmdLine::ShardServerPort );
                    }
                }

                // name is optional; addShard will provide one if needed
                string name = "";
                if ( cmdObj["name"].type() == String ) {
                    name = cmdObj["name"].valuestrsafe();
                }

                // maxSize is the space usage cap in a shard in MBs
                long long maxSize = 0;
                if ( cmdObj[ ShardType::maxSize() ].isNumber() ) {
                    maxSize = cmdObj[ ShardType::maxSize() ].numberLong();
                }

                if ( ! grid.addShard( &name , servers , maxSize , errmsg ) ) {
                    log() << "addshard request " << cmdObj << " failed: " << errmsg << endl;
                    return false;
                }

                result << "shardAdded" << name;
                return true;
            }

        } addServer;

        /* See usage docs at:
         * http://dochub.mongodb.org/core/configuringsharding#ConfiguringSharding-Removingashard
         */
        class RemoveShardCmd : public GridAdminCmd {
        public:
            RemoveShardCmd() : GridAdminCmd("removeShard") { }
            virtual void help( stringstream& help ) const {
                help << "remove a shard to the system.";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {
                ActionSet actions;
                actions.addAction(ActionType::removeShard);
                out->push_back(Privilege(AuthorizationManager::CLUSTER_RESOURCE_NAME, actions));
            }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                string target = cmdObj.firstElement().valuestrsafe();
                Shard s = Shard::make( target );
                if ( ! grid.knowAboutShard( s.getConnString() ) ) {
                    errmsg = "unknown shard";
                    return false;
                }

                scoped_ptr<ScopedDbConnection> connPtr(
                        ScopedDbConnection::getInternalScopedDbConnection(
                                configServer.getPrimary().getConnString(), 30));
                ScopedDbConnection& conn = *connPtr;

                if (conn->count(ShardType::ConfigNS,
                                BSON(ShardType::name() << NE << s.getName() <<
                                     ShardType::draining(true)))){
                    conn.done();
                    errmsg = "Can't have more than one draining shard at a time";
                    return false;
                }

                if (conn->count(ShardType::ConfigNS, BSON(ShardType::name() << NE << s.getName())) == 0){
                    conn.done();
                    errmsg = "Can't remove last shard";
                    return false;
                }

                BSONObj primaryDoc = BSON(DatabaseType::name.ne("local") <<
                                          DatabaseType::primary(s.getName()));
                BSONObj dbInfo; // appended at end of result on success
                {
                    boost::scoped_ptr<DBClientCursor> cursor (conn->query(DatabaseType::ConfigNS, primaryDoc));
                    if (cursor->more()) { // skip block and allocations if empty
                        BSONObjBuilder dbInfoBuilder;
                        dbInfoBuilder.append("note", "you need to drop or movePrimary these databases");
                        BSONArrayBuilder dbs(dbInfoBuilder.subarrayStart("dbsToMove"));

                        while (cursor->more()){
                            BSONObj db = cursor->nextSafe();
                            dbs.append(db[DatabaseType::name()]);
                        }
                        dbs.doneFast();

                        dbInfo = dbInfoBuilder.obj();
                    }
                }

                // If the server is not yet draining chunks, put it in draining mode.
                BSONObj searchDoc = BSON(ShardType::name() << s.getName());
                BSONObj drainingDoc = BSON(ShardType::name() << s.getName() << ShardType::draining(true));
                BSONObj shardDoc = conn->findOne(ShardType::ConfigNS, drainingDoc);
                if ( shardDoc.isEmpty() ) {

                    // TODO prevent move chunks to this shard.

                    log() << "going to start draining shard: " << s.getName() << endl;
                    BSONObj newStatus = BSON( "$set" << BSON( ShardType::draining(true) ) );
                    conn->update( ShardType::ConfigNS , searchDoc , newStatus, false /* do no upsert */);

                    errmsg = conn->getLastError();
                    if ( errmsg.size() ) {
                        log() << "error starting remove shard: " << s.getName() << " err: " << errmsg << endl;
                        return false;
                    }

                    BSONObj primaryLocalDoc = BSON(DatabaseType::name("local") <<
                                                   DatabaseType::primary(s.getName()));
                    PRINT(primaryLocalDoc);
                    if (conn->count(DatabaseType::ConfigNS, primaryLocalDoc)) {
                        log() << "This shard is listed as primary of local db. Removing entry." << endl;
                        conn->remove(DatabaseType::ConfigNS, BSON(DatabaseType::name("local")));
                        errmsg = conn->getLastError();
                        if ( errmsg.size() ) {
                            log() << "error removing local db: " << errmsg << endl;
                            return false;
                        }
                    }

                    Shard::reloadShardInfo();

                    result.append( "msg"   , "draining started successfully" );
                    result.append( "state" , "started" );
                    result.append( "shard" , s.getName() );
                    result.appendElements(dbInfo);
                    conn.done();
                    return true;
                }

                // If the server has been completely drained, remove it from the ConfigDB.
                // Check not only for chunks but also databases.
                BSONObj shardIDDoc = BSON(ChunkType::shard(shardDoc[ShardType::name()].str()));
                long long chunkCount = conn->count(ChunkType::ConfigNS, shardIDDoc);
                long long dbCount = conn->count( DatabaseType::ConfigNS , primaryDoc );
                if ( ( chunkCount == 0 ) && ( dbCount == 0 ) ) {
                    log() << "going to remove shard: " << s.getName() << endl;
                    conn->remove( ShardType::ConfigNS , searchDoc );

                    errmsg = conn->getLastError();
                    if ( errmsg.size() ) {
                        log() << "error concluding remove shard: " << s.getName() << " err: " << errmsg << endl;
                        return false;
                    }

                    string shardName = shardDoc[ ShardType::name() ].str();
                    Shard::removeShard( shardName );
                    shardConnectionPool.removeHost( shardName );
                    ReplicaSetMonitor::remove( shardName, true );
                    Shard::reloadShardInfo();

                    result.append( "msg"   , "removeshard completed successfully" );
                    result.append( "state" , "completed" );
                    result.append( "shard" , s.getName() );
                    conn.done();
                    return true;
                }

                // If the server is already in draining mode, just report on its progress.
                // Report on databases (not just chunks) that are left too.
                result.append( "msg"  , "draining ongoing" );
                result.append( "state" , "ongoing" );
                BSONObjBuilder inner;
                inner.append( "chunks" , chunkCount );
                inner.append( "dbs" , dbCount );
                result.append( "remaining" , inner.obj() );
                result.appendElements(dbInfo);

                conn.done();
                return true;
            }
        } removeShardCmd;


        // --------------- public commands ----------------

        class IsDbGridCmd : public Command {
        public:
            virtual LockType locktype() const { return NONE; }
            virtual bool requiresAuth() { return false; }
            virtual bool slaveOk() const {
                return true;
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {} // No auth required
            IsDbGridCmd() : Command("isdbgrid") { }
            bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                result.append("isdbgrid", 1);
                result.append("hostname", getHostNameCached());
                return true;
            }
        } isdbgrid;

        class CmdIsMaster : public Command {
        public:
            virtual LockType locktype() const { return NONE; }
            virtual bool requiresAuth() { return false; }
            virtual bool slaveOk() const {
                return true;
            }
            virtual void help( stringstream& help ) const {
                help << "test if this is master half of a replica pair";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {} // No auth required
            CmdIsMaster() : Command("isMaster" , false , "ismaster") { }
            virtual bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                result.appendBool("ismaster", true );
                result.append("msg", "isdbgrid");
                result.appendNumber("maxBsonObjectSize", BSONObjMaxUserSize);
                result.appendNumber("maxMessageSizeBytes", MaxMessageSizeBytes);
                result.appendDate("localTime", jsTime());

                return true;
            }
        } ismaster;

        class CmdWhatsMyUri : public Command {
        public:
            CmdWhatsMyUri() : Command("whatsmyuri") { }
            virtual bool logTheOp() {
                return false; // the modification will be logged directly
            }
            virtual bool slaveOk() const {
                return true;
            }
            virtual LockType locktype() const { return NONE; }
            virtual bool requiresAuth() { return false; }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {} // No auth required
            virtual void help( stringstream &help ) const {
                help << "{whatsmyuri:1}";
            }
            virtual bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                result << "you" << ClientInfo::get()->getRemote();
                return true;
            }
        } cmdWhatsMyUri;


        class CmdShardingGetPrevError : public Command {
        public:
            virtual LockType locktype() const { return NONE; }
            virtual bool requiresAuth() { return false; }

            virtual bool slaveOk() const {
                return true;
            }
            virtual void help( stringstream& help ) const {
                help << "get previous error (since last reseterror command)";
            }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {} // No auth required
            CmdShardingGetPrevError() : Command( "getPrevError" , false , "getpreverror") { }
            virtual bool run(const string& , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                errmsg += "getpreverror not supported for sharded environments";
                return false;
            }
        } cmdGetPrevError;

        class CmdShardingGetLastError : public Command {
        public:
            virtual LockType locktype() const { return NONE; }
            virtual bool slaveOk() const {
                return true;
            }
            virtual void help( stringstream& help ) const {
                help << "check for an error on the last command executed";
            }
            virtual bool requiresAuth() { return false; }
            virtual void addRequiredPrivileges(const std::string& dbname,
                                               const BSONObj& cmdObj,
                                               std::vector<Privilege>* out) {} // No auth required
            CmdShardingGetLastError() : Command("getLastError" , false , "getlasterror") { }

            virtual bool run(const string& dbName, BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool) {
                LastError *le = lastError.disableForCommand();
                verify( le );
                {
                    if ( le->msg.size() && le->nPrev == 1 ) {
                        le->appendSelf( result );
                        return true;
                    }
                }
                ClientInfo * client = ClientInfo::get();
                bool res = client->getLastError( dbName, cmdObj , result, errmsg );
                client->disableForCommand();
                return res;
            }
        } cmdGetLastError;

    }

    class CmdShardingResetError : public Command {
    public:
        CmdShardingResetError() : Command( "resetError" , false , "reseterror" ) {}

        virtual LockType locktype() const { return NONE; }
        virtual bool slaveOk() const {
            return true;
        }
        virtual bool requiresAuth() { return false; }
        virtual void addRequiredPrivileges(const std::string& dbname,
                                           const BSONObj& cmdObj,
                                           std::vector<Privilege>* out) {} // No auth required
        bool run(const string& dbName , BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool /*fromRepl*/) {
            LastError *le = lastError.get();
            if ( le )
                le->reset();

            ClientInfo * client = ClientInfo::get();
            set<string> * shards = client->getPrev();

            for ( set<string>::iterator i = shards->begin(); i != shards->end(); i++ ) {
                string theShard = *i;
                ShardConnection conn( theShard , "" );
                BSONObj res;
                conn->runCommand( dbName , cmdObj , res );
                conn.done();
            }

            return true;
        }
    } cmdShardingResetError;

    class CmdListDatabases : public Command {
    public:
        CmdListDatabases() : Command("listDatabases", true , "listdatabases" ) {}

        virtual bool logTheOp() { return false; }
        virtual bool slaveOk() const { return true; }
        virtual bool slaveOverrideOk() const { return true; }
        virtual bool adminOnly() const { return true; }
        virtual LockType locktype() const { return NONE; }
        virtual void help( stringstream& help ) const { help << "list databases on cluster"; }
        virtual void addRequiredPrivileges(const std::string& dbname,
                                           const BSONObj& cmdObj,
                                           std::vector<Privilege>* out) {
            ActionSet actions;
            actions.addAction(ActionType::listDatabases);
            out->push_back(Privilege(AuthorizationManager::SERVER_RESOURCE_NAME, actions));
        }

        bool run(const string& , BSONObj& jsobj, int, string& errmsg, BSONObjBuilder& result, bool /*fromRepl*/) {
            vector<Shard> shards;
            Shard::getAllShards( shards );

            map<string,long long> sizes;
            map< string,shared_ptr<BSONObjBuilder> > dbShardInfo;

            for ( vector<Shard>::iterator i=shards.begin(); i!=shards.end(); i++ ) {
                Shard s = *i;
                BSONObj x = s.runCommand( "admin" , "listDatabases" );

                BSONObjIterator j( x["databases"].Obj() );
                while ( j.more() ) {
                    BSONObj theDB = j.next().Obj();

                    string name = theDB["name"].String();
                    long long size = theDB["sizeOnDisk"].numberLong();

                    long long& totalSize = sizes[name];
                    if ( size == 1 ) {
                        if ( totalSize <= 1 )
                            totalSize = 1;
                    }
                    else
                        totalSize += size;

                    shared_ptr<BSONObjBuilder>& bb = dbShardInfo[name];
                    if ( ! bb.get() )
                        bb.reset( new BSONObjBuilder() );
                    bb->appendNumber( s.getName() , size );
                }

            }

            long long totalSize = 0;

            BSONArrayBuilder bb( result.subarrayStart( "databases" ) );
            for ( map<string,long long>::iterator i=sizes.begin(); i!=sizes.end(); ++i ) {
                string name = i->first;

                if ( name == "local" ) {
                    // we don't return local
                    // since all shards have their own independent local
                    continue;
                }

                if ( name == "config" || name == "admin" ) {
                    //always get this from the config servers
                    continue;
                }

                long long size = i->second;
                totalSize += size;

                BSONObjBuilder temp;
                temp.append( "name" , name );
                temp.appendNumber( "sizeOnDisk" , size );
                temp.appendBool( "empty" , size == 1 );
                temp.append( "shards" , dbShardInfo[name]->obj() );

                bb.append( temp.obj() );
            }
            
            { // get config db from the config servers (first one)
                scoped_ptr<ScopedDbConnection> conn(
                        ScopedDbConnection::getInternalScopedDbConnection(
                                configServer.getPrimary().getConnString(), 30));
                BSONObj x;
                if ( conn->get()->simpleCommand( "config" , &x , "dbstats" ) ){
                    BSONObjBuilder b;
                    b.append( "name" , "config" );
                    b.appendBool( "empty" , false );
                    if ( x["fileSize"].type() )
                        b.appendAs( x["fileSize"] , "sizeOnDisk" );
                    else
                        b.append( "sizeOnDisk" , 1 );
                    bb.append( b.obj() );
                }
                else {
                    bb.append( BSON( "name" << "config" ) );
                }
                conn->done();
            }

            { // get admin db from the config servers (first one)
                scoped_ptr<ScopedDbConnection> conn(
                        ScopedDbConnection::getInternalScopedDbConnection(
                                configServer.getPrimary().getConnString(), 30));
                BSONObj x;
                if ( conn->get()->simpleCommand( "admin" , &x , "dbstats" ) ){
                    BSONObjBuilder b;
                    b.append( "name" , "admin" );
                    b.appendBool( "empty" , false );
                    if ( x["fileSize"].type() )
                        b.appendAs( x["fileSize"] , "sizeOnDisk" );
                    else
                        b.append( "sizeOnDisk" , 1 );
                    bb.append( b.obj() );
                }
                else {
                    bb.append( BSON( "name" << "admin" ) );
                }
                conn->done();
            }

            bb.done();

            result.appendNumber( "totalSize" , totalSize );
            result.appendNumber( "totalSizeMb" , totalSize / ( 1024 * 1024 ) );

            return 1;
        }

    } cmdListDatabases;

    class CmdCloseAllDatabases : public Command {
    public:
        CmdCloseAllDatabases() : Command("closeAllDatabases", false , "closeAllDatabases" ) {}
        virtual bool logTheOp() { return false; }
        virtual bool slaveOk() const { return true; }
        virtual bool slaveOverrideOk() const { return true; }
        virtual bool adminOnly() const { return true; }
        virtual LockType locktype() const { return NONE; }
        virtual void help( stringstream& help ) const { help << "Not supported sharded"; }
        virtual void addRequiredPrivileges(const std::string& dbname,
                                           const BSONObj& cmdObj,
                                           std::vector<Privilege>* out) {
            ActionSet actions;
            actions.addAction(ActionType::closeAllDatabases);
            out->push_back(Privilege(AuthorizationManager::SERVER_RESOURCE_NAME, actions));
        }

        bool run(const string& , BSONObj& jsobj, int, string& errmsg, BSONObjBuilder& /*result*/, bool /*fromRepl*/) {
            errmsg = "closeAllDatabases isn't supported through mongos";
            return false;
        }
    } cmdCloseAllDatabases;


    class CmdReplSetGetStatus : public Command {
    public:
        CmdReplSetGetStatus() : Command("replSetGetStatus"){}
        virtual bool logTheOp() { return false; }
        virtual bool slaveOk() const { return true; }
        virtual bool adminOnly() const { return true; }
        virtual LockType locktype() const { return NONE; }
        virtual void help( stringstream& help ) const { help << "Not supported through mongos"; }
        virtual void addRequiredPrivileges(const std::string& dbname,
                                           const BSONObj& cmdObj,
                                           std::vector<Privilege>* out) {
            // TODO: Should this require no auth since it's not supported in mongos anyway?
            ActionSet actions;
            actions.addAction(ActionType::replSetGetStatus);
            out->push_back(Privilege(AuthorizationManager::SERVER_RESOURCE_NAME, actions));
        }
        bool run(const string& , BSONObj& jsobj, int, string& errmsg, BSONObjBuilder& result, bool /*fromRepl*/) {
            if ( jsobj["forShell"].trueValue() ) {
                lastError.disableForCommand();
                ClientInfo::get()->disableForCommand();
            }

            errmsg = "replSetGetStatus is not supported through mongos";
            result.append("info", "mongos"); // see sayReplSetMemberState
            return false;
        }
    } cmdReplSetGetStatus;

    CmdShutdown cmdShutdown;

    void CmdShutdown::help( stringstream& help ) const {
        help << "shutdown the database.  must be ran against admin db and "
             << "either (1) ran from localhost or (2) authenticated.";
    }

    bool CmdShutdown::run(const string& dbname, BSONObj& cmdObj, int, string& errmsg, BSONObjBuilder& result, bool fromRepl) {
        return shutdownHelper();
    }

} // namespace mongo