1
0
Fork 0
arangodb/arangod/Cluster/ResignShardLeadership.cpp

143 lines
5.0 KiB
C++

////////////////////////////////////////////////////////////////////////////////
/// DISCLAIMER
///
/// Copyright 2014-2018 ArangoDB GmbH, Cologne, Germany
/// Copyright 2004-2014 triAGENS GmbH, Cologne, Germany
///
/// Licensed under the Apache License, Version 2.0 (the "License");
/// you may not use this file except in compliance with the License.
/// You may obtain a copy of the License at
///
/// http://www.apache.org/licenses/LICENSE-2.0
///
/// Unless required by applicable law or agreed to in writing, software
/// distributed under the License is distributed on an "AS IS" BASIS,
/// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
/// See the License for the specific language governing permissions and
/// limitations under the License.
///
/// Copyright holder is ArangoDB GmbH, Cologne, Germany
///
/// @author Kaveh Vahedipour
/// @author Matthew Von-Maszewski
////////////////////////////////////////////////////////////////////////////////
#include "ResignShardLeadership.h"
#include "MaintenanceFeature.h"
#include "ApplicationFeatures/ApplicationServer.h"
#include "Basics/VelocyPackHelper.h"
#include "Cluster/ClusterFeature.h"
#include "Cluster/FollowerInfo.h"
#include "Logger/LogMacros.h"
#include "Logger/Logger.h"
#include "Logger/LoggerStream.h"
#include "Transaction/ClusterUtils.h"
#include "Transaction/Methods.h"
#include "Transaction/StandaloneContext.h"
#include "Utils/DatabaseGuard.h"
#include "Utils/SingleCollectionTransaction.h"
#include "VocBase/LogicalCollection.h"
#include "VocBase/Methods/Collections.h"
#include "VocBase/Methods/Databases.h"
#include <velocypack/Compare.h>
#include <velocypack/Iterator.h>
#include <velocypack/Slice.h>
#include <velocypack/velocypack-aliases.h>
using namespace arangodb;
using namespace arangodb::application_features;
using namespace arangodb::maintenance;
using namespace arangodb::methods;
/// @brief Builds a "resign shard leadership" maintenance action.
///
/// Tags the action with the FAST_TRACK label and validates that the
/// description carries both a DATABASE and a SHARD entry. If either is
/// missing, the problem is logged, stored in `_result` as TRI_ERROR_INTERNAL
/// and the action state is set to FAILED. Each requirement is additionally
/// guarded by a TRI_ASSERT.
///
/// @param feature  maintenance feature forwarded to ActionBase
/// @param desc     action description, expected to contain DATABASE and SHARD
ResignShardLeadership::ResignShardLeadership(MaintenanceFeature& feature,
                                             ActionDescription const& desc)
    : ActionBase(feature, desc) {
  std::stringstream error;

  _labels.emplace(FAST_TRACK);

  bool const hasDatabase = desc.has(DATABASE);
  if (!hasDatabase) {
    error << "database must be specified";
  }
  TRI_ASSERT(hasDatabase);

  bool const hasShard = desc.has(SHARD);
  if (!hasShard) {
    // Keep the two messages apart when both entries are missing; without the
    // separator they would run together into one unreadable sentence.
    if (!hasDatabase) {
      error << "; ";
    }
    error << "shard must be specified";
  }
  TRI_ASSERT(hasShard);

  if (!error.str().empty()) {
    LOG_TOPIC("2aa84", ERR, Logger::MAINTENANCE) << "ResignLeadership: " << error.str();
    _result.reset(TRI_ERROR_INTERNAL, error.str());
    setState(FAILED);
  }
}
/// @brief Destructor; compiler-generated, no custom cleanup is performed here.
ResignShardLeadership::~ResignShardLeadership() = default;
bool ResignShardLeadership::first() {
std::string const& database = _description.get(DATABASE);
std::string const& collection = _description.get(SHARD);
LOG_TOPIC("14f43", DEBUG, Logger::MAINTENANCE)
<< "trying to withdraw as leader of shard '" << database << "/" << collection;
// This starts a write transaction, just to wait for any ongoing
// write transaction on this shard to terminate. We will then later
// report to Current about this resignation. If a new write operation
// starts in the meantime (which is unlikely, since no coordinator that
// has seen the _ will start a new one), it is doomed, and we ignore the
// problem, since similar problems can arise in failover scenarios anyway.
try {
// Guard database againts deletion for now
DatabaseGuard guard(database);
auto vocbase = &guard.database();
auto col = vocbase->lookupCollection(collection);
if (col == nullptr) {
std::stringstream error;
error << "Failed to lookup local collection " << collection
<< " in database " + database;
LOG_TOPIC("e06ca", ERR, Logger::MAINTENANCE) << "EnsureIndex: " << error.str();
_result.reset(TRI_ERROR_ARANGO_DATA_SOURCE_NOT_FOUND, error.str());
return false;
}
// Get write transaction on collection
auto ctx = std::make_shared<transaction::StandaloneContext>(*vocbase);
SingleCollectionTransaction trx{ctx, *col, AccessMode::Type::EXCLUSIVE};
Result res = trx.begin();
if (!res.ok()) {
THROW_ARANGO_EXCEPTION(res);
}
// Note that it is likely that we will be a follower for this shard
// with another leader in due course. However, we do not know the
// name of the new leader yet. This setting will make us a follower
// for now but we will not accept any replication operation from any
// leader, until we have negotiated a deal with it. Then the actual
// name of the leader will be set.
col->followers()->setTheLeader(LeaderNotYetKnownString); // resign
trx.abort(); // unlock
transaction::cluster::abortLeaderTransactionsOnShard(col->id());
} catch (std::exception const& e) {
std::stringstream error;
error << "exception thrown when resigning:" << e.what();
LOG_TOPIC("173dd", ERR, Logger::MAINTENANCE) << "ResignLeadership: " << error.str();
_result.reset(TRI_ERROR_INTERNAL, error.str());
return false;
}
notify();
return false;
}
/// Placeholder leader name that first() installs on a shard when this server
/// gives up leadership and the new leader's name is not yet known.
std::string const ResignShardLeadership::LeaderNotYetKnownString{
    "LEADER_NOT_YET_KNOWN"};