// Source file: arangodb/arangod/Cluster/TraverserEngine.cpp
// (repository listing metadata: 526 lines, 19 KiB, C++)

////////////////////////////////////////////////////////////////////////////////
/// DISCLAIMER
///
/// Copyright 2014-2018 ArangoDB GmbH, Cologne, Germany
/// Copyright 2004-2014 triAGENS GmbH, Cologne, Germany
///
/// Licensed under the Apache License, Version 2.0 (the "License");
/// you may not use this file except in compliance with the License.
/// You may obtain a copy of the License at
///
/// http://www.apache.org/licenses/LICENSE-2.0
///
/// Unless required by applicable law or agreed to in writing, software
/// distributed under the License is distributed on an "AS IS" BASIS,
/// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
/// See the License for the specific language governing permissions and
/// limitations under the License.
///
/// Copyright holder is ArangoDB GmbH, Cologne, Germany
///
/// @author Michael Hackstein
////////////////////////////////////////////////////////////////////////////////
#include "TraverserEngine.h"
#include "Aql/AqlTransaction.h"
#include "Aql/Ast.h"
#include "Aql/Query.h"
#include "Aql/QueryString.h"
#include "Basics/Exceptions.h"
#include "Basics/Result.h"
#include "Graph/EdgeCursor.h"
#include "Graph/ShortestPathOptions.h"
#include "Graph/TraverserCache.h"
#include "Graph/TraverserOptions.h"
#include "Logger/LogMacros.h"
#include "Logger/Logger.h"
#include "Logger/LoggerStream.h"
#include "Transaction/Context.h"
#include "Utils/CollectionNameResolver.h"
#include "VocBase/ManagedDocumentResult.h"
#include <velocypack/Iterator.h>
#include <velocypack/Slice.h>
#include <velocypack/velocypack-aliases.h>
using namespace arangodb;
using namespace arangodb::graph;
using namespace arangodb::traverser;
// Attribute names looked up in the VelocyPack `info` body that is handed to
// the engine constructors in this file.
// Top-level attribute holding the traversal / shortest-path options object.
static const std::string OPTIONS = "options";
// Attribute inside "shards"; only read when built with USE_ENTERPRISE.
static const std::string INACCESSIBLE = "inaccessible";
// Top-level attribute holding the shard description object.
static const std::string SHARDS = "shards";
// Attribute inside "shards": array of arrays of edge shard names.
static const std::string EDGES = "edges";
// Attribute inside "options" naming the engine type.
static const std::string TYPE = "type";
// Optional top-level attribute: array of variables registered with the query.
static const std::string VARIABLES = "variables";
// Attribute inside "shards": object mapping a collection name to its shards.
static const std::string VERTICES = "vertices";
#ifndef USE_ENTERPRISE
/// @brief Factory: creates the engine matching `info.options.type`.
///
/// @param vocbase     database the engine operates on
/// @param ctx         transaction context handed to the engine constructor
/// @param info        engine description; must contain a string at
///                    `options.type` that is "traversal" or "shortestPath"
/// @param needToLock  forwarded unchanged to the engine constructor
/// @return a TraverserEngine or ShortestPathEngine, owned by the caller
/// @throws TRI_ERROR_BAD_PARAMETER if the type is missing, not a string, or
///         has an unsupported value
/*static*/ std::unique_ptr<BaseEngine> BaseEngine::BuildEngine(
    TRI_vocbase_t& vocbase, std::shared_ptr<transaction::Context> const& ctx,
    VPackSlice info, bool needToLock) {
  std::vector<std::string> const typePath({"options", "type"});
  VPackSlice engineType = info.get(typePath);

  if (!engineType.isString()) {
    THROW_ARANGO_EXCEPTION_MESSAGE(
        TRI_ERROR_BAD_PARAMETER,
        "The body requires an 'options.type' attribute.");
  }

  if (engineType.isEqualString("traversal")) {
    return std::make_unique<TraverserEngine>(vocbase, ctx, info, needToLock);
  }
  if (engineType.isEqualString("shortestPath")) {
    return std::make_unique<ShortestPathEngine>(vocbase, ctx, info, needToLock);
  }

  // Any other string is not a supported engine type.
  THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_BAD_PARAMETER,
                                 "The 'options.type' attribute either has to "
                                 "be traversal or shortestPath");
}
#endif
/// @brief Validates the engine description, registers all edge and vertex
/// shards for reading, creates the transaction and the helper query, and
/// begins the transaction.
///
/// @param vocbase     database the shards live in
/// @param ctx         transaction context used to create the transaction
/// @param info        engine description; requires `shards.edges` (array of
///                    arrays of shard names) and `shards.vertices` (object
///                    mapping collection name -> array of shard names);
///                    `variables` is optional but must be an array if present
/// @param needToLock  if false, the transaction gets the LOCK_NEVER hint
/// @throws TRI_ERROR_BAD_PARAMETER on a malformed `info`; any error reported
///         by `_trx->begin()`
BaseEngine::BaseEngine(TRI_vocbase_t& vocbase,
                       std::shared_ptr<transaction::Context> const& ctx,
                       VPackSlice info, bool needToLock)
    : _query(nullptr), _trx(nullptr), _collections(&vocbase) {
  VPackSlice shardsSlice = info.get(SHARDS);
  if (!shardsSlice.isObject()) {
    THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_BAD_PARAMETER,
                                   "The body requires a " + SHARDS +
                                       " attribute.");
  }

  VPackSlice edgesSlice = shardsSlice.get(EDGES);
  if (!edgesSlice.isArray()) {
    THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_BAD_PARAMETER,
                                   "The " + SHARDS + " object requires an " +
                                       EDGES + " attribute.");
  }

  VPackSlice vertexSlice = shardsSlice.get(VERTICES);
  if (!vertexSlice.isObject()) {
    THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_BAD_PARAMETER,
                                   "The " + SHARDS + " object requires a " +
                                       VERTICES + " attribute.");
  }

  // Add all Edge shards to the transaction
  for (VPackSlice const shardList : VPackArrayIterator(edgesSlice)) {
    TRI_ASSERT(shardList.isArray());
    for (VPackSlice const shard : VPackArrayIterator(shardList)) {
      TRI_ASSERT(shard.isString());
      _collections.add(shard.copyString(), AccessMode::Type::READ);
    }
  }

  // Add all Vertex shards to the transaction and remember, per collection,
  // which shards have to be searched for a vertex of that collection.
  for (auto const& collection : VPackObjectIterator(vertexSlice)) {
    std::vector<std::string> shards;
    for (VPackSlice const shard : VPackArrayIterator(collection.value)) {
      TRI_ASSERT(shard.isString());
      std::string name = shard.copyString();
      _collections.add(name, AccessMode::Type::READ);
      shards.emplace_back(std::move(name));
    }
    _vertexShards.try_emplace(collection.key.copyString(), std::move(shards));
  }

  // FIXME: in the future this needs to be replaced with
  // the new cluster wide transactions
  transaction::Options trxOpts;

  // true as the isMainTransaction argument below is crucial: it leads to the
  // fact that the created transaction is considered a "MAIN" part and will
  // not switch off collection locking completely!
#ifdef USE_ENTERPRISE
  VPackSlice inaccessSlice = shardsSlice.get(INACCESSIBLE);
  if (inaccessSlice.isArray()) {
    trxOpts.skipInaccessibleCollections = true;
    std::unordered_set<ShardID> inaccessible;
    for (VPackSlice const& shard : VPackArrayIterator(inaccessSlice)) {
      TRI_ASSERT(shard.isString());
      inaccessible.insert(shard.copyString());
    }
    _trx = aql::AqlTransaction::create(ctx, _collections.collections(), trxOpts,
                                       true, std::move(inaccessible));
  } else {
    _trx = aql::AqlTransaction::create(ctx, _collections.collections(), trxOpts, /*isMainTransaction*/true);
  }
#else
  _trx = aql::AqlTransaction::create(ctx, _collections.collections(), trxOpts, /*isMainTransaction*/true);
#endif

  if (!needToLock) {
    _trx->addHint(transaction::Hints::Hint::LOCK_NEVER);
  }

  auto params = std::make_shared<VPackBuilder>();
  auto opts = std::make_shared<VPackBuilder>();

  // Hold the query in a local owner until construction has succeeded. If any
  // of the steps below throws, ~BaseEngine() is never invoked (the object was
  // not fully constructed), so a raw pointer stored in _query would leak.
  std::unique_ptr<aql::Query> query(
      new aql::Query(false, vocbase, aql::QueryString(), params, opts, aql::PART_DEPENDENT));
  query->injectTransaction(_trx);

  VPackSlice variablesSlice = info.get(VARIABLES);
  if (!variablesSlice.isNone()) {
    if (!variablesSlice.isArray()) {
      THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_BAD_PARAMETER,
                                     "The optional " + VARIABLES +
                                         " has to be an array.");
    }
    for (auto v : VPackArrayIterator(variablesSlice)) {
      query->ast()->variables()->createVariable(v);
    }
  }

  // We begin the transaction before we lock.
  // We also setup indexes before we lock.
  Result res = _trx->begin();
  if (res.fail()) {
    THROW_ARANGO_EXCEPTION(res);
  }

  // Everything succeeded: from here on the destructor owns the query.
  _query = query.release();
}
/// @brief Commits the transaction if it is still running and frees the query.
///
/// A failing commit is only logged. Exceptions raised while committing are
/// swallowed on purpose, because a destructor must not throw.
BaseEngine::~BaseEngine() {
  try {
    if (_trx && _trx->status() == transaction::Status::RUNNING) {
      Result commitResult = _trx->commit();
      if (commitResult.fail()) {
        LOG_TOPIC("315cf", ERR, Logger::CLUSTER)
            << "BaseEngine could not commit: "
            << commitResult.errorMessage()
            << ", current status: " << transaction::statusString(_trx->status());
      }
    }
  } catch (...) {
    // If we could not commit we are in a bad state, but there is nothing
    // left that we could do about it from inside a destructor.
  }

  delete _query;
}
bool BaseEngine::lockCollection(std::string const& shard) {
auto resolver = _trx->resolver();
TRI_voc_cid_t cid = resolver->getCollectionIdLocal(shard);
if (cid == 0) {
return false;
}
_trx->pinData(cid); // will throw when it fails
Result lockResult = _trx->lockRecursive(cid, AccessMode::Type::READ);
if (!lockResult.ok() && !lockResult.is(TRI_ERROR_LOCKED)) {
LOG_TOPIC("d7485", ERR, arangodb::Logger::CLUSTER)
<< "Locking shard " << shard << " lead to exception '"
<< lockResult.errorNumber() << "' (" << lockResult.errorMessage() << ")";
return false;
}
return true;
}
/// @brief Forwards to `_trx->lockCollections()` and returns its Result.
Result BaseEngine::lockAll() { return _trx->lockCollections(); }
/// @brief Returns the transaction context of the engine's transaction
/// (the result of `_trx->transactionContext()`).
std::shared_ptr<transaction::Context> BaseEngine::context() const {
return _trx->transactionContext();
}
/// @brief Looks up one vertex or a list of vertices and writes them into
/// `builder` as an object `{ <vertex id>: <document>, ... }`.
///
/// @param vertex   a single "collection/key" string or an array of them
/// @param builder  receives the result object; ids for which no shard
///                 contains a document are left out
/// @throws TRI_ERROR_GRAPH_INVALID_EDGE if an id has no '/' or nothing
///         after it
/// @throws TRI_ERROR_QUERY_COLLECTION_LOCK_FAILED if the collection of an id
///         is not among the vertex collections registered in the constructor
/// @throws any lookup error other than "document not found"
void BaseEngine::getVertexData(VPackSlice vertex, VPackBuilder& builder) {
  // We just hope someone has locked the shards properly. We have no clue...
  // Thanks locking
  TRI_ASSERT(ServerState::instance()->isDBServer());
  TRI_ASSERT(vertex.isString() || vertex.isArray());

  ManagedDocumentResult mmdr;
  builder.openObject();

  // Resolves a single id and, if found, appends "<id>: <document>".
  auto appendVertex = [&](VPackSlice idSlice) {
    arangodb::velocypack::StringRef fullId(idSlice);
    size_t const slash = fullId.find('/');
    if (slash == std::string::npos || slash + 1 == fullId.size()) {
      TRI_ASSERT(false);
      THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_GRAPH_INVALID_EDGE,
                                     "edge contains invalid value " + fullId.toString());
    }

    ShardID collectionName = fullId.substr(0, slash).toString();
    auto known = _vertexShards.find(collectionName);
    if (known == _vertexShards.end()) {
      // The collection is not known here!
      // Maybe handle differently
      THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_QUERY_COLLECTION_LOCK_FAILED,
                                     "collection not known to traversal: '" +
                                         collectionName + "'. please add 'WITH " + collectionName +
                                         "' as the first line in your AQL");
    }

    arangodb::velocypack::StringRef documentKey = fullId.substr(slash + 1);
    // Try every shard of the collection until one of them has the document.
    for (std::string const& shard : known->second) {
      Result lookup = _trx->documentFastPathLocal(shard, documentKey, mmdr, false);
      if (lookup.ok()) {
        // FOUND short circuit.
        builder.add(idSlice);
        mmdr.addToBuilder(builder, true);
        break;
      }
      if (lookup.isNot(TRI_ERROR_ARANGO_DOCUMENT_NOT_FOUND)) {
        // We are in a very bad condition here...
        THROW_ARANGO_EXCEPTION(lookup);
      }
    }
  };

  if (!vertex.isArray()) {
    appendVertex(vertex);
  } else {
    for (VPackSlice entry : VPackArrayIterator(vertex)) {
      appendVertex(entry);
    }
  }

  builder.close();  // The outer object
}
/// @brief Forwards all arguments to the BaseEngine constructor and leaves
/// `_opts` as nullptr.
BaseTraverserEngine::BaseTraverserEngine(TRI_vocbase_t& vocbase,
std::shared_ptr<transaction::Context> const& ctx,
VPackSlice info, bool needToLock)
: BaseEngine(vocbase, ctx, info, needToLock), _opts(nullptr) {}
/// @brief Defaulted destructor; no explicit cleanup is performed here.
BaseTraverserEngine::~BaseTraverserEngine() = default;
/// @brief Collects the edges of one vertex or a list of vertices at the
/// given depth and writes
/// `{ "edges": [...], "readIndex": <n>, "filtered": <n> }` into `builder`.
///
/// Only edges accepted by `_opts->evaluateEdgeExpression()` are emitted.
///
/// @param vertex   a single vertex id string or an array of them
/// @param depth    depth passed to the cursor and to the edge expression
/// @param builder  receives the result object
/// @throws TRI_ERROR_BAD_PARAMETER if `vertex` is neither string nor array
void BaseTraverserEngine::getEdges(VPackSlice vertex, size_t depth, VPackBuilder& builder) {
  // We just hope someone has locked the shards properly. We have no clue...
  // Thanks locking
  TRI_ASSERT(vertex.isString() || vertex.isArray());

  builder.openObject();
  builder.add(VPackValue("edges"));
  builder.openArray();

  // Reads all edges of one start vertex and appends the accepted ones.
  auto emitEdgesOf = [&](VPackSlice start) {
    arangodb::velocypack::StringRef startId(start);
    std::unique_ptr<arangodb::graph::EdgeCursor> cursor(
        _opts->nextCursor(startId, depth));
    cursor->readAll([&](EdgeDocumentToken&& token, VPackSlice edge, size_t cursorId) {
      if (edge.isString()) {
        // Only a reference was delivered; resolve it via the cache.
        edge = _opts->cache()->lookupToken(token);
      }
      if (!edge.isNull() &&
          _opts->evaluateEdgeExpression(edge, arangodb::velocypack::StringRef(start), depth, cursorId)) {
        builder.add(edge);
      }
    });
    // Result now contains all valid edges, probably multiples.
  };

  if (vertex.isArray()) {
    for (VPackSlice entry : VPackArrayIterator(vertex)) {
      TRI_ASSERT(entry.isString());
      emitEdgesOf(entry);
    }
  } else if (vertex.isString()) {
    emitEdgesOf(vertex);
  } else {
    THROW_ARANGO_EXCEPTION(TRI_ERROR_BAD_PARAMETER);
  }

  builder.close();  // "edges" array
  builder.add("readIndex", VPackValue(_opts->cache()->getAndResetInsertedDocuments()));
  builder.add("filtered", VPackValue(_opts->cache()->getAndResetFilteredDocuments()));
  builder.close();  // outer object
}
/// @brief Looks up one vertex or a list of vertices and writes them, together
/// with the counters "readIndex" and "filtered", into `builder`.
///
/// For every id that is found, the id slice and then the document are added
/// to the builder. `depth` is not used by this implementation and "filtered"
/// is always reported as 0.
///
/// NOTE(review): for array input the id/document pairs are added inside an
/// array under "vertices"; for a single string they are added directly after
/// the "vertices" key. Please confirm that the single-vertex shape is what
/// the caller expects.
///
/// @param vertex   a single "collection/key" string or an array of them;
///                 null entries are skipped
/// @param depth    unused here
/// @param builder  receives the result object
/// @throws TRI_ERROR_GRAPH_INVALID_EDGE if an id has no '/' or nothing
///         after it
/// @throws TRI_ERROR_QUERY_COLLECTION_LOCK_FAILED if the collection of an id
///         is not among the registered vertex collections
/// @throws any lookup error other than "document not found"
void BaseTraverserEngine::getVertexData(VPackSlice vertex, size_t depth,
                                        VPackBuilder& builder) {
  // We just hope someone has locked the shards properly. We have no clue...
  // Thanks locking
  TRI_ASSERT(ServerState::instance()->isDBServer());
  TRI_ASSERT(vertex.isString() || vertex.isArray());

  size_t read = 0;
  ManagedDocumentResult mmdr;
  builder.openObject();
  builder.add(VPackValue("vertices"));

  // Resolves a single id and appends id + document when it is found.
  auto appendVertex = [&](VPackSlice idSlice) {
    if (idSlice.isNull()) {
      return;
    }

    arangodb::velocypack::StringRef fullId(idSlice);
    size_t const slash = fullId.find('/');
    if (slash == std::string::npos || slash + 1 == fullId.size()) {
      TRI_ASSERT(false);
      THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_GRAPH_INVALID_EDGE,
                                     "edge contains invalid value " + fullId.toString());
    }

    ShardID collectionName = fullId.substr(0, slash).toString();
    auto known = _vertexShards.find(collectionName);
    if (known == _vertexShards.end()) {
      // The collection is not known here!
      // Maybe handle differently
      THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_QUERY_COLLECTION_LOCK_FAILED,
                                     "collection not known to traversal: '" +
                                         collectionName + "'. please add 'WITH " + collectionName +
                                         "' as the first line in your AQL");
    }

    arangodb::velocypack::StringRef documentKey = fullId.substr(slash + 1);
    // Try every shard of the collection until one of them has the document.
    for (std::string const& shard : known->second) {
      Result lookup = _trx->documentFastPathLocal(shard, documentKey, mmdr, false);
      if (lookup.ok()) {
        // FOUND short circuit.
        read++;
        builder.add(idSlice);
        mmdr.addToBuilder(builder, true);
        break;
      }
      if (lookup.isNot(TRI_ERROR_ARANGO_DOCUMENT_NOT_FOUND)) {
        // We are in a very bad condition here...
        THROW_ARANGO_EXCEPTION(lookup);
      }
    }
    // TODO FILTERING!
    // HOWTO Distinguish filtered vs NULL?
  };

  if (!vertex.isArray()) {
    appendVertex(vertex);
  } else {
    builder.openArray();
    for (VPackSlice entry : VPackArrayIterator(vertex)) {
      appendVertex(entry);
    }
    builder.close();
  }

  builder.add("readIndex", VPackValue(read));
  builder.add("filtered", VPackValue(0));
  builder.close();
}
/// @brief Builds a shortest-path engine: runs the BaseEngine setup, then
/// creates ShortestPathOptions from `info.options` and the edge shards and
/// activates their cache.
///
/// @param vocbase     forwarded to BaseEngine
/// @param ctx         forwarded to BaseEngine
/// @param info        engine description; `options` must be an object whose
///                    `type` is a string (asserted to be "shortestPath")
/// @param needToLock  forwarded to BaseEngine
/// @throws TRI_ERROR_BAD_PARAMETER if `options` or `options.type` is invalid
ShortestPathEngine::ShortestPathEngine(TRI_vocbase_t& vocbase,
                                       std::shared_ptr<transaction::Context> const& ctx,
                                       arangodb::velocypack::Slice info, bool needToLock)
    : BaseEngine(vocbase, ctx, info, needToLock) {
  VPackSlice options = info.get(OPTIONS);
  // A missing attribute yields a None slice, which is not an object either.
  if (!options.isObject()) {
    THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_BAD_PARAMETER,
                                   "The body requires an " + OPTIONS +
                                       " attribute.");
  }

  VPackSlice engineType = options.get(TYPE);
  if (!engineType.isString()) {
    THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_BAD_PARAMETER,
                                   "The " + OPTIONS + " require a " + TYPE +
                                       " attribute.");
  }
  TRI_ASSERT(engineType.isEqualString("shortestPath"));

  // The shards attribute was already validated by the BaseEngine constructor.
  VPackSlice edgeShards = info.get(SHARDS).get(EDGES);
  _opts.reset(new ShortestPathOptions(_query, options, edgeShards));
  // We create the cache, but we do not need any engines.
  _opts->activateCache(false, nullptr);
}
/// @brief Defaulted destructor; no explicit cleanup is performed here.
ShortestPathEngine::~ShortestPathEngine() = default;
/// @brief Collects all edges of one vertex or a list of vertices and writes
/// `{ "edges": [...], "readIndex": <n>, "filtered": 0 }` into `builder`.
///
/// @param vertex    a single vertex id string or an array of them; array
///                  entries that are not strings are skipped
/// @param backward  if true the reverse cursor is used, otherwise the
///                  forward cursor
/// @param builder   receives the result object
/// @throws TRI_ERROR_BAD_PARAMETER if `vertex` is neither string nor array
void ShortestPathEngine::getEdges(VPackSlice vertex, bool backward, VPackBuilder& builder) {
  // We just hope someone has locked the shards properly. We have no clue...
  // Thanks locking
  TRI_ASSERT(vertex.isString() || vertex.isArray());

  std::unique_ptr<arangodb::graph::EdgeCursor> edgeCursor;

  // Reads all edges of one start vertex and appends them to the open array.
  auto appendEdgesOf = [&](VPackSlice start) {
    arangodb::velocypack::StringRef vertexId(start);
    if (backward) {
      edgeCursor.reset(_opts->nextReverseCursor(vertexId));
    } else {
      edgeCursor.reset(_opts->nextCursor(vertexId));
    }
    edgeCursor->readAll([&](EdgeDocumentToken&& eid, VPackSlice edge, size_t /*cursorId*/) {
      if (edge.isString()) {
        // Only a reference was delivered; resolve it via the cache.
        edge = _opts->cache()->lookupToken(eid);
      }
      if (edge.isNull()) {
        return;
      }
      builder.add(edge);
    });
    // Result now contains all valid edges, probably multiples.
  };

  builder.openObject();
  builder.add(VPackValue("edges"));
  builder.openArray();

  if (vertex.isArray()) {
    for (VPackSlice v : VPackArrayIterator(vertex)) {
      // Check the element, not the enclosing array: testing `vertex` here is
      // always true in this branch and would skip every entry.
      if (!v.isString()) {
        continue;
      }
      appendEdgesOf(v);
    }
  } else if (vertex.isString()) {
    appendEdgesOf(vertex);
  } else {
    THROW_ARANGO_EXCEPTION(TRI_ERROR_BAD_PARAMETER);
  }

  builder.close();  // "edges" array
  builder.add("readIndex", VPackValue(_opts->cache()->getAndResetInsertedDocuments()));
  builder.add("filtered", VPackValue(0));
  builder.close();  // outer object
}
/// @brief Builds a traversal engine: runs the BaseTraverserEngine setup, then
/// creates TraverserOptions from `info.options` and the edge shards and
/// activates their cache.
///
/// @param vocbase     forwarded to BaseTraverserEngine
/// @param ctx         forwarded to BaseTraverserEngine
/// @param info        engine description; `options` must be an object whose
///                    `type` is a string (asserted to be "traversal")
/// @param needToLock  forwarded to BaseTraverserEngine
/// @throws TRI_ERROR_BAD_PARAMETER if `options` or `options.type` is invalid
TraverserEngine::TraverserEngine(TRI_vocbase_t& vocbase,
                                 std::shared_ptr<transaction::Context> const& ctx,
                                 arangodb::velocypack::Slice info, bool needToLock)
    : BaseTraverserEngine(vocbase, ctx, info, needToLock) {
  VPackSlice options = info.get(OPTIONS);
  if (!options.isObject()) {
    THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_BAD_PARAMETER,
                                   "The body requires an " + OPTIONS +
                                       " attribute.");
  }

  VPackSlice engineType = options.get(TYPE);
  if (!engineType.isString()) {
    THROW_ARANGO_EXCEPTION_MESSAGE(TRI_ERROR_BAD_PARAMETER,
                                   "The " + OPTIONS + " require a " + TYPE +
                                       " attribute.");
  }
  TRI_ASSERT(engineType.isEqualString("traversal"));

  // The shards attribute was already validated by the BaseEngine constructor.
  VPackSlice edgeShards = info.get(SHARDS).get(EDGES);
  _opts.reset(new TraverserOptions(_query, options, edgeShards));
  // We create the cache, but we do not need any engines.
  _opts->activateCache(false, nullptr);
}
/// @brief Defaulted destructor; no explicit cleanup is performed here.
TraverserEngine::~TraverserEngine() = default;
/// @brief Not available in this implementation: ignores both arguments and
/// always throws TRI_ERROR_ONLY_ENTERPRISE.
void TraverserEngine::smartSearch(VPackSlice, VPackBuilder&) {
THROW_ARANGO_EXCEPTION(TRI_ERROR_ONLY_ENTERPRISE);
}
/// @brief Not available in this implementation: ignores both arguments and
/// always throws TRI_ERROR_ONLY_ENTERPRISE.
void TraverserEngine::smartSearchBFS(VPackSlice, VPackBuilder&) {
THROW_ARANGO_EXCEPTION(TRI_ERROR_ONLY_ENTERPRISE);
}