mirror of https://gitee.com/bigwinds/arangodb
521 lines
18 KiB
C++
521 lines
18 KiB
C++
////////////////////////////////////////////////////////////////////////////////
/// DISCLAIMER
///
/// Copyright 2014-2016 ArangoDB GmbH, Cologne, Germany
/// Copyright 2004-2014 triAGENS GmbH, Cologne, Germany
///
/// Licensed under the Apache License, Version 2.0 (the "License");
/// you may not use this file except in compliance with the License.
/// You may obtain a copy of the License at
///
///     http://www.apache.org/licenses/LICENSE-2.0
///
/// Unless required by applicable law or agreed to in writing, software
/// distributed under the License is distributed on an "AS IS" BASIS,
/// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
/// See the License for the specific language governing permissions and
/// limitations under the License.
///
/// Copyright holder is ArangoDB GmbH, Cologne, Germany
///
/// @author Michael Hackstein
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
#include "ClusterTraverser.h"
|
|
#include "Basics/VelocyPackHelper.h"
|
|
#include "Cluster/ClusterMethods.h"
|
|
|
|
#include <velocypack/Iterator.h>
|
|
#include <velocypack/velocypack-aliases.h>
|
|
|
|
using namespace arangodb;
|
|
|
|
using ClusterTraverser = arangodb::traverser::ClusterTraverser;
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Appends the next vertex reached via `edge` to the path `result`.
///
/// The last entry of `result` is compared with the edge's
/// StaticStrings::FromString attribute. If they differ, that attribute is
/// appended; otherwise the StaticStrings::ToString attribute is appended.
/// `result` must not be empty, because its last element is read.
///
/// @return always true; no vertex filter is evaluated yet.
////////////////////////////////////////////////////////////////////////////////
bool ClusterTraverser::VertexGetter::getVertex(
    VPackSlice edge, std::vector<VPackSlice>& result) {
  VPackSlice const previous = result.back();
  VPackSlice const source = edge.get(StaticStrings::FromString);
#warning Here we have to execute VertexFilter
  /// Planned behaviour once the filter exists:
  /// If the vertex is not cached in _traverser->_vertices => incr.
  /// _filteredPath, return false;
  /// Else check the condition: if ok => return true, else return false.
  /// When returning false set result = ""
  bool const arrivedFromSource =
      arangodb::basics::VelocyPackHelper::compare(previous, source, false) == 0;
  result.emplace_back(arrivedFromSource ? edge.get(StaticStrings::ToString)
                                        : source);
  return true;
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Stores in `result` the vertex reached via `edge` when coming from
///        `cmp`.
///
/// If `cmp` differs from the edge's StaticStrings::FromString attribute, that
/// attribute is stored; otherwise the StaticStrings::ToString attribute is
/// stored. `depth` is currently not used.
///
/// @return always true; no vertex filter is evaluated yet.
////////////////////////////////////////////////////////////////////////////////
bool ClusterTraverser::VertexGetter::getSingleVertex(VPackSlice edge,
                                                     VPackSlice cmp,
                                                     size_t depth,
                                                     VPackSlice& result) {
  VPackSlice const source = edge.get(StaticStrings::FromString);
#warning Here we have to execute VertexFilter
  /// Planned behaviour once the filter exists:
  /// If the vertex is not cached in _traverser->_vertices => incr.
  /// _filteredPath, return false;
  /// Else check the condition: if ok => return true, else return false.
  /// When returning false set result = ""
  bool const arrivedFromSource =
      arangodb::basics::VelocyPackHelper::compare(cmp, source, false) == 0;
  result = arrivedFromSource ? edge.get(StaticStrings::ToString) : source;
  return true;
}
|
|
|
|
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Resets the getter. This implementation holds nothing to clear.
////////////////////////////////////////////////////////////////////////////////
void ClusterTraverser::VertexGetter::reset() {
  // Intentionally empty. A subclass that records already returned vertices
  // has to clear that list in its own reset().
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Appends the next vertex reached via `edge` to the path `result`,
///        but only if that vertex has not been returned before.
///
/// The candidate is the edge's StaticStrings::FromString attribute, unless it
/// equals the last entry of `result`, in which case the
/// StaticStrings::ToString attribute is used. `result` must not be empty,
/// because its last element is read.
///
/// @return false if the candidate is already in _returnedVertices (the
///         traverser's _filteredPaths counter is incremented and `result` is
///         left unchanged); true if the candidate was recorded and appended.
////////////////////////////////////////////////////////////////////////////////
bool ClusterTraverser::UniqueVertexGetter::getVertex(
    VPackSlice edge, std::vector<VPackSlice>& result) {
  VPackSlice toAdd = edge.get(StaticStrings::FromString);
  VPackSlice cmp = result.back();

  if (arangodb::basics::VelocyPackHelper::compare(toAdd, cmp, false) == 0) {
    toAdd = edge.get(StaticStrings::ToString);
  }

#warning Here we have to execute VertexFilter
  /// Planned behaviour once the filter exists:
  /// If the vertex is not cached in _traverser->_vertices => incr.
  /// _filteredPath, return false;
  /// Else check the condition: if ok => return true, else return false.
  /// When returning false set result = ""
  /// When returning true: _returnedVertices.emplace(result)

  if (_returnedVertices.find(toAdd) != _returnedVertices.end()) {
    // This vertex is not unique.
    ++_traverser->_filteredPaths;
    return false;
  }

  _returnedVertices.emplace(toAdd);
  result.emplace_back(toAdd);
  // The vertex was accepted. Previously control fell through to a trailing
  // `return false`, which reported every accepted vertex as rejected.
  return true;
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Stores in `result` the vertex reached via `edge` when coming from
///        `cmp`, and reports whether it is returned for the first time.
///
/// `result` is set to the edge's StaticStrings::FromString attribute, unless
/// that equals `cmp`, in which case the StaticStrings::ToString attribute is
/// used. `result` is written in both outcomes. `depth` is currently not used.
///
/// @return false if the vertex is already in _returnedVertices (the
///         traverser's _filteredPaths counter is incremented); true after the
///         vertex has been recorded in _returnedVertices.
////////////////////////////////////////////////////////////////////////////////
bool ClusterTraverser::UniqueVertexGetter::getSingleVertex(
    VPackSlice edge, VPackSlice cmp, size_t depth, VPackSlice& result) {
  VPackSlice candidate = edge.get(StaticStrings::FromString);
  if (arangodb::basics::VelocyPackHelper::compare(candidate, cmp, false) == 0) {
    candidate = edge.get(StaticStrings::ToString);
  }
  result = candidate;

#warning Here we have to execute VertexFilter
  /// Planned behaviour once the filter exists:
  /// If the vertex is not cached in _traverser->_vertices => incr.
  /// _filteredPath, return false;
  /// Else check the condition: if ok => return true, else return false.
  /// When returning false set result = ""
  /// When returning true: _returnedVertices.emplace(result)

  bool const alreadyReturned =
      _returnedVertices.find(result) != _returnedVertices.end();
  if (alreadyReturned) {
    // This vertex is not unique.
    ++_traverser->_filteredPaths;
    return false;
  }

  _returnedVertices.emplace(result);
  return true;
}
|
|
|
|
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Forgets all vertices recorded as already returned.
////////////////////////////////////////////////////////////////////////////////
void ClusterTraverser::UniqueVertexGetter::reset() {
  // Empties the set consulted by getVertex() / getSingleVertex().
  _returnedVertices.clear();
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Intended to produce the next edge for `startVertex`.
///
/// Currently a no-op: the entire implementation is disabled and none of the
/// parameters is read or written. The previous implementation is kept below
/// as reference for the pending rewrite.
////////////////////////////////////////////////////////////////////////////////
void ClusterTraverser::ClusterEdgeGetter::getEdge(
    std::string const& startVertex, std::vector<std::string>& result,
    size_t*& last, size_t& eColIdx) {
#warning This path fetches Edges from DBServer, honoring conditions. Has to be rewritten.
  /*
  std::string collName;
  TRI_edge_direction_e dir;
  if (!_traverser->_opts.getCollection(eColIdx, collName, dir)) {
    // Nothing to do, caller has set a defined state already.
    return;
  }
  if (last == nullptr) {
    size_t depth = result.size();
    TRI_ASSERT(_traverser->_iteratorCache.size() == result.size());
    // We have to request the next level
    arangodb::GeneralResponse::ResponseCode responseCode;
    std::vector<TraverserExpression*> expEdges;

    VPackBuilder resultEdges;
    resultEdges.openObject();
    auto found = _traverser->_opts.expressions->find(depth);
    if (found != _traverser->_opts.expressions->end()) {
      expEdges = found->second;
    }

    int res = getFilteredEdgesOnCoordinator(
        _traverser->_dbname, collName, startVertex, dir,
        expEdges, responseCode, resultEdges);
    if (res != TRI_ERROR_NO_ERROR) {
      THROW_ARANGO_EXCEPTION(res);
    }
    resultEdges.close();
    VPackSlice resSlice = resultEdges.slice();
    VPackSlice edgesSlice = resSlice.get("edges");
    VPackSlice statsSlice = resSlice.get("stats");

    size_t read = arangodb::basics::VelocyPackHelper::getNumericValue<size_t>(
        statsSlice, "scannedIndex", 0);
    size_t filter = arangodb::basics::VelocyPackHelper::getNumericValue<size_t>(
        statsSlice, "filtered", 0);
    _traverser->_readDocuments += read;
    _traverser->_filteredPaths += filter;

    if (edgesSlice.isNone() || edgesSlice.length() == 0) {
      last = nullptr;
      eColIdx++;
      getEdge(startVertex, result, last, eColIdx);
      return;
    }
    std::stack<std::string> stack;
    std::unordered_set<std::string> verticesToFetch;
    for (auto const& edge : VPackArrayIterator(edgesSlice)) {
      std::string edgeId = arangodb::basics::VelocyPackHelper::getStringValue(
          edge, StaticStrings::IdString.c_str(), "");
      if (_traverser->_opts.uniqueEdges == TraverserOptions::UniquenessLevel::GLOBAL) {
        // Do not push this edge on the stack.
        if (_traverser->_edges.find(edgeId) != _traverser->_edges.end()) {
          continue;
        }
      }
      std::string fromId = arangodb::basics::VelocyPackHelper::getStringValue(
          edge, StaticStrings::FromString.c_str(), "");
      if (_traverser->_vertices.find(fromId) == _traverser->_vertices.end()) {
        verticesToFetch.emplace(std::move(fromId));
      }
      std::string toId = arangodb::basics::VelocyPackHelper::getStringValue(
          edge, StaticStrings::ToString.c_str(), "");
      if (_traverser->_vertices.find(toId) == _traverser->_vertices.end()) {
        verticesToFetch.emplace(std::move(toId));
      }
      VPackBuilder tmpBuilder;
      tmpBuilder.add(edge);
      _traverser->_edges.emplace(edgeId, tmpBuilder.steal());
      stack.push(std::move(edgeId));
    }

    if (stack.empty()) {
      // We did not find any valid edge here.
      // Try next index
      last = nullptr;
      eColIdx++;
      getEdge(startVertex, result, last, eColIdx);
      return;
    }

    _traverser->fetchVertices(verticesToFetch, depth + 1);

    std::string next = stack.top();
    stack.pop();
    last = &_continueConst;
    _traverser->_iteratorCache.emplace(stack);
    if (_traverser->_opts.uniqueEdges == TraverserOptions::UniquenessLevel::PATH) {
      auto search = std::find(result.begin(), result.end(), next);
      if (search != result.end()) {
        // The edge is now included twice. Go on with the next
        getEdge(startVertex, result, last, eColIdx);
        return;
      }
    }
    result.push_back(std::move(next));
  } else {
    if (_traverser->_iteratorCache.empty()) {
      last = nullptr;
      return;
    }
    std::stack<std::string>& tmp = _traverser->_iteratorCache.top();
    if (tmp.empty()) {
      _traverser->_iteratorCache.pop();
      last = nullptr;
      eColIdx++;
      getEdge(startVertex, result, last, eColIdx);
      return;
    } else {
      std::string next = tmp.top();
      tmp.pop();
      if (_traverser->_opts.uniqueEdges == TraverserOptions::UniquenessLevel::PATH) {
        auto search = std::find(result.begin(), result.end(), next);
        if (search != result.end()) {
          // The edge would be included twice. Go on with the next
          getEdge(startVertex, result, last, eColIdx);
          return;
        }
      }
      result.push_back(std::move(next));
    }
  }
  */
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Intended to collect all edges of `startVertex` into `result`.
///
/// The edge fetching itself is disabled, so `startVertex` and `result` are
/// neither read nor modified. The only effect is a call to
/// _traverser->fetchVertices() with an empty set and `depth + 1`. The
/// previous implementation is kept below as reference for the pending rewrite.
////////////////////////////////////////////////////////////////////////////////
void ClusterTraverser::ClusterEdgeGetter::getAllEdges(
    VPackSlice startVertex, std::unordered_set<VPackSlice>& result,
    size_t depth) {
  // The next three locals are only referenced by the disabled code below.
  std::string collName;
  TRI_edge_direction_e dir;
  size_t eColIdx = 0;
#warning This path fetches Edges from DBServer, honoring conditions. Has to be rewritten.
  // Stays empty as long as the loop below is disabled.
  std::unordered_set<std::string> verticesToFetch;
  /*
  std::vector<TraverserExpression*> expEdges;
  auto found = _traverser->_opts.expressions->find(depth);
  if (found != _traverser->_opts.expressions->end()) {
    expEdges = found->second;
  }

  arangodb::GeneralResponse::ResponseCode responseCode;
  VPackBuilder resultEdges;
  while (_traverser->_opts.getCollection(eColIdx++, collName, dir)) {
    resultEdges.clear();
    resultEdges.openObject();
    int res = getFilteredEdgesOnCoordinator(
        _traverser->_dbname, collName, startVertex, dir,
        expEdges, responseCode, resultEdges);
    if (res != TRI_ERROR_NO_ERROR) {
      THROW_ARANGO_EXCEPTION(res);
    }
    resultEdges.close();
    VPackSlice resSlice = resultEdges.slice();
    VPackSlice edgesSlice = resSlice.get("edges");
    VPackSlice statsSlice = resSlice.get("stats");

    size_t read = arangodb::basics::VelocyPackHelper::getNumericValue<size_t>(
        statsSlice, "scannedIndex", 0);
    size_t filter = arangodb::basics::VelocyPackHelper::getNumericValue<size_t>(
        statsSlice, "filtered", 0);
    _traverser->_readDocuments += read;
    _traverser->_filteredPaths += filter;
    if (edgesSlice.isNone() || edgesSlice.length() == 0) {
      // No edges found here
      continue;
    }
    for (auto const& edge : VPackArrayIterator(edgesSlice)) {
      std::string edgeId = arangodb::basics::VelocyPackHelper::getStringValue(
          edge, StaticStrings::IdString.c_str(), "");
      if (_traverser->_opts.uniqueEdges ==
          TraverserOptions::UniquenessLevel::GLOBAL) {
        // Do not push this edge on the stack.
        if (_traverser->_edges.find(edgeId) != _traverser->_edges.end()) {
          continue;
        }
      }
      std::string fromId = arangodb::basics::VelocyPackHelper::getStringValue(
          edge, StaticStrings::FromString.c_str(), "");
      if (_traverser->_vertices.find(fromId) == _traverser->_vertices.end()) {
        verticesToFetch.emplace(std::move(fromId));
      }
      std::string toId = arangodb::basics::VelocyPackHelper::getStringValue(
          edge, StaticStrings::ToString.c_str(), "");
      if (_traverser->_vertices.find(toId) == _traverser->_vertices.end()) {
        verticesToFetch.emplace(std::move(toId));
      }
      VPackBuilder tmpBuilder;
      tmpBuilder.add(edge);
      _traverser->_edges.emplace(edgeId, tmpBuilder.steal());
      result.emplace(std::move(edgeId));
    }
  }
  */
  _traverser->fetchVertices(verticesToFetch, depth + 1);
}
|
|
|
|
void ClusterTraverser::setStartVertex(std::string const& id) {
|
|
_vertexGetter->reset();
|
|
_done = false;
|
|
#warning Arraaghghh Who is responsible for the Builder and Slice?
|
|
|
|
VPackBuilder tmp;
|
|
tmp.add(VPackValue(id));
|
|
VPackSlice idSlice = tmp.slice();
|
|
|
|
auto it = _vertices.find(idSlice);
|
|
if (it == _vertices.end()) {
|
|
size_t firstSlash = id.find("/");
|
|
if (firstSlash == std::string::npos ||
|
|
id.find("/", firstSlash + 1) != std::string::npos) {
|
|
// We can stop here. The start vertex is not a valid _id
|
|
++_filteredPaths;
|
|
_done = true;
|
|
return;
|
|
}
|
|
std::unordered_set<std::string> vertexToFetch;
|
|
vertexToFetch.emplace(id);
|
|
fetchVertices(vertexToFetch, 0); // this inserts the vertex
|
|
it = _vertices.find(idSlice);
|
|
if (it == _vertices.end()) {
|
|
// We can stop here. The start vertex does not match condition.
|
|
++_filteredPaths;
|
|
_done = true;
|
|
return;
|
|
}
|
|
}
|
|
|
|
if (_opts.evaluateVertexExpression(VPackSlice(it->second->data()), 0)) {
|
|
// We can stop here. The start vertex does not match condition
|
|
_done = true;
|
|
return;
|
|
}
|
|
VPackSlice startId(it->second->data());
|
|
if (_opts.useBreadthFirst) {
|
|
_enumerator.reset(
|
|
new arangodb::traverser::BreadthFirstEnumerator(this, startId, &_opts));
|
|
_vertexGetter->setStartVertex(startId);
|
|
} else {
|
|
_enumerator.reset(
|
|
new arangodb::traverser::DepthFirstEnumerator(this, startId, &_opts));
|
|
}
|
|
}
|
|
|
|
void ClusterTraverser::getEdge(std::string const& startVertex,
|
|
std::vector<std::string>& result, size_t*& last,
|
|
size_t& eColIdx) {
|
|
return _edgeGetter->getEdge(startVertex, result, last, eColIdx);
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Forwards the request for all edges of a vertex to the edge getter.
////////////////////////////////////////////////////////////////////////////////
void ClusterTraverser::getAllEdges(VPackSlice startVertex,
                                   std::unordered_set<VPackSlice>& result,
                                   size_t depth) {
  // Pure delegation; all arguments are passed through unchanged.
  _edgeGetter->getAllEdges(startVertex, result, depth);
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Forwards to the vertex getter's getVertex().
///
/// @return whatever the vertex getter reports for this edge.
////////////////////////////////////////////////////////////////////////////////
bool ClusterTraverser::getVertex(VPackSlice edge,
                                 std::vector<VPackSlice>& result) {
  bool const accepted = _vertexGetter->getVertex(edge, result);
  return accepted;
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Forwards to the vertex getter's getSingleVertex().
///
/// @return whatever the vertex getter reports for this edge.
////////////////////////////////////////////////////////////////////////////////
bool ClusterTraverser::getSingleVertex(VPackSlice edge, VPackSlice comp,
                                       size_t depth, VPackSlice& result) {
  bool const accepted =
      _vertexGetter->getSingleVertex(edge, comp, depth, result);
  return accepted;
}
|
|
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Intended to load the given vertices into the _vertices cache.
///
/// Currently only adds the number of requested vertices to _readDocuments;
/// the fetching itself is disabled, so _vertices and `verticesToFetch` are
/// left unchanged and `depth` is not used. The previous implementation is
/// kept below as reference for the pending rewrite.
////////////////////////////////////////////////////////////////////////////////
void ClusterTraverser::fetchVertices(
    std::unordered_set<std::string>& verticesToFetch, size_t depth) {
  _readDocuments += verticesToFetch.size();

#warning Reimplement this. Fetching Documents Coordinator-Case
  /*
  std::vector<TraverserExpression*> expVertices;
  auto found = _opts.expressions->find(depth);
  if (found != _opts.expressions->end()) {
    expVertices = found->second;
  }

  int res = getFilteredDocumentsOnCoordinator(_dbname, expVertices,
                                              verticesToFetch, _vertices);
  if (res != TRI_ERROR_NO_ERROR &&
      res != TRI_ERROR_ARANGO_COLLECTION_NOT_FOUND) {
    THROW_ARANGO_EXCEPTION(res);
  }

  // By convention verticesToFetch now contains all _ids of vertices that
  // could not be found.
  // Store them as NULL
  for (auto const& it : verticesToFetch) {
    VPackBuilder builder;
    builder.add(VPackValue(VPackValueType::Null));
    _vertices.emplace(it, builder.steal());
  }
  */
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Checks vertex `v` against all non-edge expressions in `exp`.
///
/// Expressions flagged with isEdgeAccess are skipped. The first remaining
/// expression that fails (or any remaining expression at all, if `v` is
/// None) increments _filteredPaths and ends the check.
///
/// @return true if no checked expression failed, false otherwise.
////////////////////////////////////////////////////////////////////////////////
bool ClusterTraverser::vertexMatchesCondition(
    VPackSlice const& v,
    std::vector<arangodb::traverser::TraverserExpression*> const& exp) {
  for (auto const& expression : exp) {
    if (expression->isEdgeAccess) {
      // Edge conditions are not evaluated on vertices.
      continue;
    }
    // A None vertex never matches; matchesCheck() is not called for it.
    bool const matches = !v.isNone() && expression->matchesCheck(_trx, v);
    if (!matches) {
      ++_filteredPaths;
      return false;
    }
  }
  return true;
}
|
|
|
|
bool ClusterTraverser::next() {
|
|
TRI_ASSERT(!_done);
|
|
return _enumerator->next();
|
|
/*
|
|
if (_opts.useBreadthFirst &&
|
|
_opts.uniqueVertices == TraverserOptions::UniquenessLevel::NONE &&
|
|
_opts.uniqueEdges == TraverserOptions::UniquenessLevel::PATH) {
|
|
// Only if we use breadth first
|
|
// and vertex uniqueness is not guaranteed
|
|
// We have to validate edges on path uniqueness.
|
|
// Otherwise this situation cannot occur.
|
|
// If two edges are identical than at least their start or end vertex
|
|
// is on the path twice: A -> B <- A
|
|
for (size_t i = 0; i < countEdges; ++i) {
|
|
for (size_t j = i + 1; j < countEdges; ++j) {
|
|
if (path.edges[i] == path.edges[j]) {
|
|
// We found two idential edges. Prune.
|
|
// Next
|
|
_pruneNext = true;
|
|
return next();
|
|
}
|
|
}
|
|
}
|
|
}
|
|
*/
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Returns the cached data of the vertex with id `idString` as an
///        AqlValue.
///
/// `idString` must be a string slice and the vertex must already be present
/// in _vertices; both conditions are only asserted.
////////////////////////////////////////////////////////////////////////////////
aql::AqlValue ClusterTraverser::fetchVertexData(VPackSlice idString) {
  TRI_ASSERT(idString.isString());
  auto const entry = _vertices.find(idString);
  // All vertices are expected to be cached at this point.
  TRI_ASSERT(entry != _vertices.end());
  return aql::AqlValue(entry->second->data());
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Wraps the given edge slice in an AqlValue; no lookup is performed.
////////////////////////////////////////////////////////////////////////////////
aql::AqlValue ClusterTraverser::fetchEdgeData(VPackSlice edge) {
  aql::AqlValue wrapped(edge);
  return wrapped;
}
|
|
|
|
//////////////////////////////////////////////////////////////////////////////
|
|
/// @brief Function to add the real data of a vertex into a velocypack builder
|
|
//////////////////////////////////////////////////////////////////////////////
|
|
|
|
void ClusterTraverser::addVertexToVelocyPack(VPackSlice id,
|
|
VPackBuilder& result) {
|
|
TRI_ASSERT(id.isString());
|
|
auto cached = _vertices.find(id);
|
|
// All vertices are cached!!
|
|
TRI_ASSERT(cached != _vertices.end());
|
|
result.add(VPackSlice((*cached).second->data()));
|
|
}
|
|
|
|
//////////////////////////////////////////////////////////////////////////////
|
|
/// @brief Function to add the real data of an edge into a velocypack builder
|
|
//////////////////////////////////////////////////////////////////////////////
|
|
|
|
void ClusterTraverser::addEdgeToVelocyPack(arangodb::velocypack::Slice edge,
|
|
arangodb::velocypack::Builder& result) {
|
|
result.add(edge);
|
|
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Returns the enumerator's last vertex as an AqlValue.
////////////////////////////////////////////////////////////////////////////////
aql::AqlValue ClusterTraverser::lastVertexToAqlValue() {
  // Pure delegation to the current enumerator.
  return _enumerator->lastVertexToAqlValue();
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Returns the enumerator's last edge as an AqlValue.
////////////////////////////////////////////////////////////////////////////////
aql::AqlValue ClusterTraverser::lastEdgeToAqlValue() {
  // Pure delegation to the current enumerator.
  return _enumerator->lastEdgeToAqlValue();
}
|
|
|
|
////////////////////////////////////////////////////////////////////////////////
/// @brief Returns the enumerator's current path as an AqlValue; `builder` is
///        handed through to the enumerator.
////////////////////////////////////////////////////////////////////////////////
aql::AqlValue ClusterTraverser::pathToAqlValue(VPackBuilder& builder) {
  // Pure delegation to the current enumerator.
  return _enumerator->pathToAqlValue(builder);
}
|