1
0
Fork 0
arangodb/arangod/Cluster/ClusterTraverser.cpp

521 lines
18 KiB
C++

////////////////////////////////////////////////////////////////////////////////
/// DISCLAIMER
///
/// Copyright 2014-2016 ArangoDB GmbH, Cologne, Germany
/// Copyright 2004-2014 triAGENS GmbH, Cologne, Germany
///
/// Licensed under the Apache License, Version 2.0 (the "License");
/// you may not use this file except in compliance with the License.
/// You may obtain a copy of the License at
///
/// http://www.apache.org/licenses/LICENSE-2.0
///
/// Unless required by applicable law or agreed to in writing, software
/// distributed under the License is distributed on an "AS IS" BASIS,
/// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
/// See the License for the specific language governing permissions and
/// limitations under the License.
///
/// Copyright holder is ArangoDB GmbH, Cologne, Germany
///
/// @author Michael Hackstein
////////////////////////////////////////////////////////////////////////////////
#include "ClusterTraverser.h"
#include "Basics/VelocyPackHelper.h"
#include "Cluster/ClusterMethods.h"
#include <velocypack/Iterator.h>
#include <velocypack/velocypack-aliases.h>
using namespace arangodb;
using ClusterTraverser = arangodb::traverser::ClusterTraverser;
/// @brief Appends the vertex on the other side of `edge` to `result`.
///
/// The last element of `result` is treated as the vertex the edge was entered
/// from. If it equals the edge's _from value the _to value is appended,
/// otherwise the _from value is appended.
///
/// @param edge   the edge to follow
/// @param result path of vertices collected so far; its last element is read
///               and one element is appended
/// @return always true in this implementation (no vertex filter is applied)
bool ClusterTraverser::VertexGetter::getVertex(
    VPackSlice edge, std::vector<VPackSlice>& result) {
  VPackSlice const previous = result.back();
  VPackSlice const fromId = edge.get(StaticStrings::FromString);
#warning Here we have to execute VertexFilter
  /// Planned behaviour once the filter exists:
  /// - vertex missing from _traverser->_vertices => count it in _filteredPath
  ///   and return false
  /// - otherwise evaluate the condition and return its outcome
  /// - on a false return, result is to be set to ""
  bool const enteredAtFrom =
      arangodb::basics::VelocyPackHelper::compare(previous, fromId, false) == 0;
  result.emplace_back(enteredAtFrom ? edge.get(StaticStrings::ToString)
                                    : fromId);
  return true;
}
/// @brief Writes the vertex on the other side of `edge`, relative to `cmp`,
///        into `result`.
///
/// If `cmp` equals the edge's _from value, `result` becomes the _to value;
/// otherwise it becomes the _from value.
///
/// @param edge   the edge to follow
/// @param cmp    the vertex the edge is entered from
/// @param depth  not used by this implementation
/// @param result receives the opposite vertex
/// @return always true in this implementation (no vertex filter is applied)
bool ClusterTraverser::VertexGetter::getSingleVertex(VPackSlice edge,
                                                     VPackSlice cmp,
                                                     size_t depth,
                                                     VPackSlice& result) {
  VPackSlice const fromId = edge.get(StaticStrings::FromString);
#warning Here we have to execute VertexFilter
  /// Planned behaviour once the filter exists:
  /// - vertex missing from _traverser->_vertices => count it in _filteredPath
  ///   and return false
  /// - otherwise evaluate the condition and return its outcome
  /// - on a false return, result is to be set to ""
  bool const enteredAtFrom =
      arangodb::basics::VelocyPackHelper::compare(cmp, fromId, false) == 0;
  result = enteredAtFrom ? edge.get(StaticStrings::ToString) : fromId;
  return true;
}
/// @brief Resets the getter before a new traversal is started.
///
/// Intentionally empty: this getter keeps no record of returned vertices.
void ClusterTraverser::VertexGetter::reset() {
// Nothing to do here. Subclass has to clear list of already returned vertices.
}
/// @brief Appends the vertex on the other side of `edge` to `result`, but only
///        if that vertex has not been returned by this getter before.
///
/// The last element of `result` is treated as the vertex the edge was entered
/// from. The opposite end of the edge is the candidate. A candidate already
/// present in _returnedVertices is rejected and counted as a filtered path.
///
/// @param edge   the edge to follow
/// @param result path of vertices collected so far; its last element is read
///               and, on success, the candidate is appended
/// @return true if the candidate was new and has been appended, false if it
///         had been returned before (result is left unchanged in that case)
bool ClusterTraverser::UniqueVertexGetter::getVertex(
    VPackSlice edge, std::vector<VPackSlice>& result) {
  VPackSlice toAdd = edge.get(StaticStrings::FromString);
  VPackSlice cmp = result.back();
  if (arangodb::basics::VelocyPackHelper::compare(toAdd, cmp, false) == 0) {
    // We came in via _from, so the vertex to report is _to.
    toAdd = edge.get(StaticStrings::ToString);
  }
#warning Here we have to execute VertexFilter
  /// If the vertex is not cached in _traverser->_vertices => incr. _filteredPath return false;
  /// Else check condition if ok => return true, else return false.
  /// When returning false set result = ""
  /// When returning true: _returnedVertices.emplace(result)
  if (!_returnedVertices.emplace(toAdd).second) {
    // This vertex is not unique.
    ++_traverser->_filteredPaths;
    return false;
  }
  // The vertex is new: report success. Previously control fell through to a
  // trailing `return false`, so accepted vertices were reported as rejected.
  result.emplace_back(toAdd);
  return true;
}
/// @brief Writes the vertex on the other side of `edge`, relative to `cmp`,
///        into `result` and reports whether it is seen for the first time.
///
/// `result` is assigned in every case. A vertex already contained in
/// _returnedVertices is counted as a filtered path.
///
/// @param edge   the edge to follow
/// @param cmp    the vertex the edge is entered from
/// @param depth  not used by this implementation
/// @param result receives the opposite vertex
/// @return true if the vertex was not returned before, false otherwise
bool ClusterTraverser::UniqueVertexGetter::getSingleVertex(
    VPackSlice edge, VPackSlice cmp, size_t depth, VPackSlice& result) {
  result = edge.get(StaticStrings::FromString);
  bool const enteredAtFrom =
      arangodb::basics::VelocyPackHelper::compare(result, cmp, false) == 0;
  if (enteredAtFrom) {
    result = edge.get(StaticStrings::ToString);
  }
#warning Here we have to execute VertexFilter
  /// Planned behaviour once the filter exists:
  /// - vertex missing from _traverser->_vertices => count it in _filteredPath
  ///   and return false
  /// - otherwise evaluate the condition and return its outcome
  /// - on a false return, result is to be set to ""
  /// - on a true return, remember result in _returnedVertices
  bool const firstVisit = _returnedVertices.emplace(result).second;
  if (!firstVisit) {
    // Seen before, so the uniqueness constraint rejects it.
    ++_traverser->_filteredPaths;
  }
  return firstVisit;
}
/// @brief Forgets all vertices returned so far, so that the uniqueness check
///        starts from an empty set again.
void ClusterTraverser::UniqueVertexGetter::reset() {
_returnedVertices.clear();
}
/// @brief Fetches the next edge for `startVertex` (currently disabled).
///
/// In this revision the function is a no-op: the only active line is the
/// #warning below, and the former implementation is kept inside the block
/// comment as a reference for the rewrite. None of the parameters are read
/// or modified.
///
/// @param startVertex vertex whose edges are requested (unused for now)
/// @param result      edge path built so far (unused for now)
/// @param last        iteration cursor of the caller (unused for now)
/// @param eColIdx     index of the edge collection to read (unused for now)
void ClusterTraverser::ClusterEdgeGetter::getEdge(
std::string const& startVertex, std::vector<std::string>& result,
size_t*& last, size_t& eColIdx) {
#warning This path fetches Edges from DBServer, honoring conditions. Has to be rewritten.
// Disabled former implementation follows; it is not compiled.
/*
std::string collName;
TRI_edge_direction_e dir;
if (!_traverser->_opts.getCollection(eColIdx, collName, dir)) {
// Nothing to do, caller has set a defined state already.
return;
}
if (last == nullptr) {
size_t depth = result.size();
TRI_ASSERT(_traverser->_iteratorCache.size() == result.size());
// We have to request the next level
arangodb::GeneralResponse::ResponseCode responseCode;
std::vector<TraverserExpression*> expEdges;
VPackBuilder resultEdges;
resultEdges.openObject();
auto found = _traverser->_opts.expressions->find(depth);
if (found != _traverser->_opts.expressions->end()) {
expEdges = found->second;
}
int res = getFilteredEdgesOnCoordinator(
_traverser->_dbname, collName, startVertex, dir,
expEdges, responseCode, resultEdges);
if (res != TRI_ERROR_NO_ERROR) {
THROW_ARANGO_EXCEPTION(res);
}
resultEdges.close();
VPackSlice resSlice = resultEdges.slice();
VPackSlice edgesSlice = resSlice.get("edges");
VPackSlice statsSlice = resSlice.get("stats");
size_t read = arangodb::basics::VelocyPackHelper::getNumericValue<size_t>(
statsSlice, "scannedIndex", 0);
size_t filter = arangodb::basics::VelocyPackHelper::getNumericValue<size_t>(
statsSlice, "filtered", 0);
_traverser->_readDocuments += read;
_traverser->_filteredPaths += filter;
if (edgesSlice.isNone() || edgesSlice.length() == 0) {
last = nullptr;
eColIdx++;
getEdge(startVertex, result, last, eColIdx);
return;
}
std::stack<std::string> stack;
std::unordered_set<std::string> verticesToFetch;
for (auto const& edge : VPackArrayIterator(edgesSlice)) {
std::string edgeId = arangodb::basics::VelocyPackHelper::getStringValue(
edge, StaticStrings::IdString.c_str(), "");
if (_traverser->_opts.uniqueEdges == TraverserOptions::UniquenessLevel::GLOBAL) {
// DO not push this edge on the stack.
if (_traverser->_edges.find(edgeId) != _traverser->_edges.end()) {
continue;
}
}
std::string fromId = arangodb::basics::VelocyPackHelper::getStringValue(
edge, StaticStrings::FromString.c_str(), "");
if (_traverser->_vertices.find(fromId) == _traverser->_vertices.end()) {
verticesToFetch.emplace(std::move(fromId));
}
std::string toId = arangodb::basics::VelocyPackHelper::getStringValue(
edge, StaticStrings::ToString.c_str(), "");
if (_traverser->_vertices.find(toId) == _traverser->_vertices.end()) {
verticesToFetch.emplace(std::move(toId));
}
VPackBuilder tmpBuilder;
tmpBuilder.add(edge);
_traverser->_edges.emplace(edgeId, tmpBuilder.steal());
stack.push(std::move(edgeId));
}
if (stack.empty()) {
// We did not find any valid edge here.
// Try next index
last = nullptr;
eColIdx++;
getEdge(startVertex, result, last, eColIdx);
return;
}
_traverser->fetchVertices(verticesToFetch, depth + 1);
std::string next = stack.top();
stack.pop();
last = &_continueConst;
_traverser->_iteratorCache.emplace(stack);
if (_traverser->_opts.uniqueEdges == TraverserOptions::UniquenessLevel::PATH) {
auto search = std::find(result.begin(), result.end(), next);
if (search != result.end()) {
// The edge is now included twice. Go on with the next
getEdge(startVertex, result, last, eColIdx);
return;
}
}
result.push_back(std::move(next));
} else {
if (_traverser->_iteratorCache.empty()) {
last = nullptr;
return;
}
std::stack<std::string>& tmp = _traverser->_iteratorCache.top();
if (tmp.empty()) {
_traverser->_iteratorCache.pop();
last = nullptr;
eColIdx++;
getEdge(startVertex, result, last, eColIdx);
return;
} else {
std::string next = tmp.top();
tmp.pop();
if (_traverser->_opts.uniqueEdges == TraverserOptions::UniquenessLevel::PATH) {
auto search = std::find(result.begin(), result.end(), next);
if (search != result.end()) {
// The edge would be included twice. Go on with the next
getEdge(startVertex, result, last, eColIdx);
return;
}
}
result.push_back(std::move(next));
}
}
*/
}
/// @brief Collects all edges of `startVertex` at the given depth (edge
///        fetching is currently disabled).
///
/// In this revision the loop that queries the edge collections sits inside
/// the block comment below. As a consequence `result` is never modified and
/// `verticesToFetch` stays empty; the only live effect is the call to
/// _traverser->fetchVertices with that empty set and `depth + 1`.
///
/// @param startVertex vertex whose edges are requested (unused for now)
/// @param result      set that is meant to receive the edges (untouched for now)
/// @param depth       current traversal depth; depth + 1 is passed on
void ClusterTraverser::ClusterEdgeGetter::getAllEdges(
VPackSlice startVertex, std::unordered_set<VPackSlice>& result,
size_t depth) {
// collName, dir and eColIdx are only referenced by the disabled code below.
std::string collName;
TRI_edge_direction_e dir;
size_t eColIdx = 0;
#warning This path fetches Edges from DBServer, honoring conditions. Has to be rewritten.
std::unordered_set<std::string> verticesToFetch;
// Disabled former implementation follows; it is not compiled.
/*
std::vector<TraverserExpression*> expEdges;
auto found = _traverser->_opts.expressions->find(depth);
if (found != _traverser->_opts.expressions->end()) {
expEdges = found->second;
}
arangodb::GeneralResponse::ResponseCode responseCode;
VPackBuilder resultEdges;
while (_traverser->_opts.getCollection(eColIdx++, collName, dir)) {
resultEdges.clear();
resultEdges.openObject();
int res = getFilteredEdgesOnCoordinator(
_traverser->_dbname, collName, startVertex, dir,
expEdges, responseCode, resultEdges);
if (res != TRI_ERROR_NO_ERROR) {
THROW_ARANGO_EXCEPTION(res);
}
resultEdges.close();
VPackSlice resSlice = resultEdges.slice();
VPackSlice edgesSlice = resSlice.get("edges");
VPackSlice statsSlice = resSlice.get("stats");
size_t read = arangodb::basics::VelocyPackHelper::getNumericValue<size_t>(
statsSlice, "scannedIndex", 0);
size_t filter = arangodb::basics::VelocyPackHelper::getNumericValue<size_t>(
statsSlice, "filtered", 0);
_traverser->_readDocuments += read;
_traverser->_filteredPaths += filter;
if (edgesSlice.isNone() || edgesSlice.length() == 0) {
// No edges found here
continue;
}
for (auto const& edge : VPackArrayIterator(edgesSlice)) {
std::string edgeId = arangodb::basics::VelocyPackHelper::getStringValue(
edge, StaticStrings::IdString.c_str(), "");
if (_traverser->_opts.uniqueEdges ==
TraverserOptions::UniquenessLevel::GLOBAL) {
// DO not push this edge on the stack.
if (_traverser->_edges.find(edgeId) != _traverser->_edges.end()) {
continue;
}
}
std::string fromId = arangodb::basics::VelocyPackHelper::getStringValue(
edge, StaticStrings::FromString.c_str(), "");
if (_traverser->_vertices.find(fromId) == _traverser->_vertices.end()) {
verticesToFetch.emplace(std::move(fromId));
}
std::string toId = arangodb::basics::VelocyPackHelper::getStringValue(
edge, StaticStrings::ToString.c_str(), "");
if (_traverser->_vertices.find(toId) == _traverser->_vertices.end()) {
verticesToFetch.emplace(std::move(toId));
}
VPackBuilder tmpBuilder;
tmpBuilder.add(edge);
_traverser->_edges.emplace(edgeId, tmpBuilder.steal());
result.emplace(std::move(edgeId));
}
}
*/
_traverser->fetchVertices(verticesToFetch, depth + 1);
}
/// @brief Prepares the traverser to start a new traversal at vertex `id`.
///
/// Steps:
///  1. reset the vertex getter and clear the _done flag;
///  2. look the id up in the _vertices cache; if it is missing, check that
///     the id contains exactly one '/', request the vertex via fetchVertices
///     and look it up again;
///  3. evaluate the vertex expression for depth 0 on the cached data;
///  4. create the breadth-first or depth-first enumerator.
///
/// Whenever the start vertex is rejected, _done is set to true and no
/// enumerator is created. An invalid or missing start vertex additionally
/// increments _filteredPaths.
///
/// @param id the _id of the start vertex, expected as "collection/key"
void ClusterTraverser::setStartVertex(std::string const& id) {
  _vertexGetter->reset();
  _done = false;
#warning Arraaghghh Who is responsible for the Builder and Slice?
  // tmp and idSlice are only used for cache lookups inside this function;
  // the slice handed to the enumerator below points into the cached entry.
  VPackBuilder tmp;
  tmp.add(VPackValue(id));
  VPackSlice idSlice = tmp.slice();
  auto it = _vertices.find(idSlice);
  if (it == _vertices.end()) {
    size_t firstSlash = id.find('/');
    if (firstSlash == std::string::npos ||
        id.find('/', firstSlash + 1) != std::string::npos) {
      // We can stop here. The start vertex is not a valid _id
      ++_filteredPaths;
      _done = true;
      return;
    }
    std::unordered_set<std::string> vertexToFetch;
    vertexToFetch.emplace(id);
    // fetchVertices is expected to insert the vertex into _vertices.
    // NOTE(review): in this revision its fetch logic is disabled, so the
    // lookup below can only succeed once that is reimplemented.
    fetchVertices(vertexToFetch, 0);
    it = _vertices.find(idSlice);
    if (it == _vertices.end()) {
      // We can stop here. The start vertex does not match condition.
      ++_filteredPaths;
      _done = true;
      return;
    }
  }
  // Abort only when the expression does NOT hold. The check used to be
  // un-negated, which stopped the traversal for matching start vertices and
  // continued for non-matching ones.
  if (!_opts.evaluateVertexExpression(VPackSlice(it->second->data()), 0)) {
    // We can stop here. The start vertex does not match condition
    _done = true;
    return;
  }
  VPackSlice startId(it->second->data());
  if (_opts.useBreadthFirst) {
    _enumerator.reset(
        new arangodb::traverser::BreadthFirstEnumerator(this, startId, &_opts));
    _vertexGetter->setStartVertex(startId);
  } else {
    _enumerator.reset(
        new arangodb::traverser::DepthFirstEnumerator(this, startId, &_opts));
  }
}
/// @brief Forwards the request for the next edge to the configured edge
///        getter; all arguments are passed through unchanged.
void ClusterTraverser::getEdge(std::string const& startVertex,
                               std::vector<std::string>& result, size_t*& last,
                               size_t& eColIdx) {
  _edgeGetter->getEdge(startVertex, result, last, eColIdx);
}
/// @brief Forwards the request for all edges of `startVertex` at `depth` to
///        the configured edge getter; all arguments are passed through
///        unchanged.
void ClusterTraverser::getAllEdges(VPackSlice startVertex,
                                   std::unordered_set<VPackSlice>& result,
                                   size_t depth) {
  _edgeGetter->getAllEdges(startVertex, result, depth);
}
/// @brief Forwards to the configured vertex getter.
///
/// @param edge   the edge to follow
/// @param result vertex path, passed through to the getter
/// @return whatever the vertex getter returns
bool ClusterTraverser::getVertex(VPackSlice edge,
std::vector<VPackSlice>& result) {
return _vertexGetter->getVertex(edge, result);
}
/// @brief Forwards to the configured vertex getter.
///
/// @param edge   the edge to follow
/// @param comp   the vertex the edge is entered from
/// @param depth  current traversal depth, passed through
/// @param result receives the vertex chosen by the getter
/// @return whatever the vertex getter returns
bool ClusterTraverser::getSingleVertex(VPackSlice edge, VPackSlice comp,
size_t depth, VPackSlice& result) {
return _vertexGetter->getSingleVertex(edge, comp, depth, result);
}
/// @brief Fetches the given vertices into the cache (fetching is currently
///        disabled).
///
/// In this revision the only live statement adds the number of requested ids
/// to _readDocuments. The code that loaded the documents and stored them in
/// _vertices is kept inside the block comment below, so neither _vertices
/// nor `verticesToFetch` is modified here.
///
/// @param verticesToFetch ids of the vertices to load
/// @param depth           traversal depth (only used by the disabled code)
void ClusterTraverser::fetchVertices(std::unordered_set<std::string>& verticesToFetch, size_t depth) {
_readDocuments += verticesToFetch.size();
#warning Reimplement this. Fetching Documents Coordinator-Case
// Disabled former implementation follows; it is not compiled.
/*
std::vector<TraverserExpression*> expVertices;
auto found = _opts.expressions->find(depth);
if (found != _opts.expressions->end()) {
expVertices = found->second;
}
int res = getFilteredDocumentsOnCoordinator(_dbname, expVertices,
verticesToFetch, _vertices);
if (res != TRI_ERROR_NO_ERROR &&
res != TRI_ERROR_ARANGO_COLLECTION_NOT_FOUND) {
THROW_ARANGO_EXCEPTION(res);
}
// By convention verticesToFetch now contains all _ids of vertices that
// could not be found.
// Store them as NULL
for (auto const& it : verticesToFetch) {
VPackBuilder builder;
builder.add(VPackValue(VPackValueType::Null));
_vertices.emplace(it, builder.steal());
}
*/
}
/// @brief Checks a vertex against all vertex-related expressions in `exp`.
///
/// Expressions flagged as edge access are skipped. The first remaining
/// expression that fails (or any such expression if `v` is a None slice)
/// increments _filteredPaths and ends the check.
///
/// @param v   the vertex document to test
/// @param exp the expressions to evaluate
/// @return true if no vertex expression rejected `v`, false otherwise
bool ClusterTraverser::vertexMatchesCondition(
    VPackSlice const& v,
    std::vector<arangodb::traverser::TraverserExpression*> const& exp) {
  for (auto* expression : exp) {
    if (expression->isEdgeAccess) {
      // Edge conditions are not evaluated on vertices.
      continue;
    }
    // A None slice can never satisfy a condition; matchesCheck is not called.
    bool const accepted = !v.isNone() && expression->matchesCheck(_trx, v);
    if (!accepted) {
      ++_filteredPaths;
      return false;
    }
  }
  return true;
}
/// @brief Advances the traversal by one step.
///
/// Asserts that the traverser is not marked as done and delegates to the
/// current enumerator.
///
/// @return the value returned by the enumerator's next()
bool ClusterTraverser::next() {
TRI_ASSERT(!_done);
return _enumerator->next();
// Disabled former edge-uniqueness check follows; it sits after the return
// and inside a block comment, so it is not compiled.
/*
if (_opts.useBreadthFirst &&
_opts.uniqueVertices == TraverserOptions::UniquenessLevel::NONE &&
_opts.uniqueEdges == TraverserOptions::UniquenessLevel::PATH) {
// Only if we use breadth first
// and vertex uniqueness is not guaranteed
// We have to validate edges on path uniqueness.
// Otherwise this situation cannot occur.
// If two edges are identical than at least their start or end vertex
// is on the path twice: A -> B <- A
for (size_t i = 0; i < countEdges; ++i) {
for (size_t j = i + 1; j < countEdges; ++j) {
if (path.edges[i] == path.edges[j]) {
// We found two idential edges. Prune.
// Next
_pruneNext = true;
return next();
}
}
}
}
*/
}
/// @brief Returns the cached data of the vertex with the given id as an
///        AqlValue.
///
/// The id must be a string slice and the vertex must already be present in
/// the _vertices cache; both conditions are only checked by assertions.
///
/// @param idString the _id of the vertex
/// @return an AqlValue built from the cached vertex data
aql::AqlValue ClusterTraverser::fetchVertexData(VPackSlice idString) {
  TRI_ASSERT(idString.isString());
  auto const entry = _vertices.find(idString);
  // Every vertex is expected to be in the cache at this point.
  TRI_ASSERT(entry != _vertices.end());
  return aql::AqlValue(entry->second->data());
}
/// @brief Wraps the given edge slice in an AqlValue; no cache lookup is
///        performed.
aql::AqlValue ClusterTraverser::fetchEdgeData(VPackSlice edge) {
return aql::AqlValue(edge);
}
//////////////////////////////////////////////////////////////////////////////
/// @brief Appends the cached document of the vertex identified by `id` to
///        the given velocypack builder. The id must be a string and the
///        vertex must already be cached (checked by assertions only).
//////////////////////////////////////////////////////////////////////////////
void ClusterTraverser::addVertexToVelocyPack(VPackSlice id,
                                             VPackBuilder& result) {
  TRI_ASSERT(id.isString());
  auto const entry = _vertices.find(id);
  // Every vertex is expected to be in the cache at this point.
  TRI_ASSERT(entry != _vertices.end());
  VPackSlice const document(entry->second->data());
  result.add(document);
}
//////////////////////////////////////////////////////////////////////////////
/// @brief Function to add the real data of an edge into a velocypack builder.
///        The given edge slice is added to the builder as-is; no lookup is
///        performed.
//////////////////////////////////////////////////////////////////////////////
void ClusterTraverser::addEdgeToVelocyPack(arangodb::velocypack::Slice edge,
arangodb::velocypack::Builder& result) {
result.add(edge);
}
/// @brief Returns the enumerator's last vertex as an AqlValue by delegating
///        to the current enumerator.
aql::AqlValue ClusterTraverser::lastVertexToAqlValue() {
return _enumerator->lastVertexToAqlValue();
}
/// @brief Returns the enumerator's last edge as an AqlValue by delegating
///        to the current enumerator.
aql::AqlValue ClusterTraverser::lastEdgeToAqlValue() {
return _enumerator->lastEdgeToAqlValue();
}
/// @brief Returns the enumerator's current path as an AqlValue by delegating
///        to the current enumerator.
///
/// @param builder velocypack builder handed through to the enumerator
aql::AqlValue ClusterTraverser::pathToAqlValue(VPackBuilder& builder) {
return _enumerator->pathToAqlValue(builder);
}