mirror of https://gitee.com/bigwinds/arangodb
367 lines
13 KiB
C++
367 lines
13 KiB
C++
////////////////////////////////////////////////////////////////////////////////
|
|
/// DISCLAIMER
|
|
///
|
|
/// Copyright 2014-2016 ArangoDB GmbH, Cologne, Germany
|
|
/// Copyright 2004-2014 triAGENS GmbH, Cologne, Germany
|
|
///
|
|
/// Licensed under the Apache License, Version 2.0 (the "License");
|
|
/// you may not use this file except in compliance with the License.
|
|
/// You may obtain a copy of the License at
|
|
///
|
|
/// http://www.apache.org/licenses/LICENSE-2.0
|
|
///
|
|
/// Unless required by applicable law or agreed to in writing, software
|
|
/// distributed under the License is distributed on an "AS IS" BASIS,
|
|
/// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
/// See the License for the specific language governing permissions and
|
|
/// limitations under the License.
|
|
///
|
|
/// Copyright holder is ArangoDB GmbH, Cologne, Germany
|
|
///
|
|
/// @author Jan Steemann
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
#ifndef ARANGOD_INDEXES_INDEX_H
|
|
#define ARANGOD_INDEXES_INDEX_H 1
|
|
|
|
#include "Basics/AttributeNameParser.h"
|
|
#include "Basics/Common.h"
|
|
#include "Basics/Exceptions.h"
|
|
#include "Basics/Result.h"
|
|
#include "Basics/StringRef.h"
|
|
#include "VocBase/LocalDocumentId.h"
|
|
#include "VocBase/voc-types.h"
|
|
#include "VocBase/vocbase.h"
|
|
|
|
#include <iosfwd>
|
|
|
|
namespace arangodb {
|
|
// Forward declarations of types that appear in the Index interface below.
namespace basics {
class LocalTaskQueue;
}  // namespace basics

class IndexIterator;
class LogicalCollection;
class ManagedDocumentResult;
struct IndexIteratorOptions;

namespace velocypack {
class Builder;
class Slice;
}  // namespace velocypack

namespace aql {
struct AstNode;
class SortCondition;
struct Variable;
}  // namespace aql

namespace transaction {
class Methods;
}  // namespace transaction
|
|
|
|
class Index {
|
|
public:
|
|
Index() = delete;
|
|
Index(Index const&) = delete;
|
|
Index& operator=(Index const&) = delete;
|
|
|
|
Index(TRI_idx_iid_t iid, LogicalCollection& collection,
|
|
std::vector<std::vector<arangodb::basics::AttributeName>> const& fields,
|
|
bool unique, bool sparse);
|
|
|
|
Index(TRI_idx_iid_t iid, LogicalCollection& collection,
|
|
arangodb::velocypack::Slice const& slice);
|
|
|
|
virtual ~Index();
|
|
|
|
public:
|
|
/// @brief index types
|
|
enum IndexType {
|
|
TRI_IDX_TYPE_UNKNOWN = 0,
|
|
TRI_IDX_TYPE_PRIMARY_INDEX,
|
|
TRI_IDX_TYPE_GEO_INDEX,
|
|
TRI_IDX_TYPE_GEO1_INDEX,
|
|
TRI_IDX_TYPE_GEO2_INDEX,
|
|
TRI_IDX_TYPE_HASH_INDEX,
|
|
TRI_IDX_TYPE_EDGE_INDEX,
|
|
TRI_IDX_TYPE_FULLTEXT_INDEX,
|
|
TRI_IDX_TYPE_SKIPLIST_INDEX,
|
|
TRI_IDX_TYPE_PERSISTENT_INDEX,
|
|
TRI_IDX_TYPE_IRESEARCH_LINK,
|
|
TRI_IDX_TYPE_NO_ACCESS_INDEX
|
|
};
|
|
|
|
// mode to signal how operation should behave
|
|
enum OperationMode { normal, internal, rollback };
|
|
|
|
public:
|
|
/// @brief return the index id
|
|
inline TRI_idx_iid_t id() const { return _iid; }
|
|
|
|
/// @brief return the index fields
|
|
inline std::vector<std::vector<arangodb::basics::AttributeName>> const& fields() const {
|
|
return _fields;
|
|
}
|
|
|
|
/// @brief return the fields covered by this index.
|
|
/// Typically just the fields, but e.g. EdgeIndex on _from also covers _to
|
|
virtual std::vector<std::vector<arangodb::basics::AttributeName>> const& coveredFields() const {
|
|
return fields();
|
|
}
|
|
|
|
/// @brief return the index fields names
|
|
inline std::vector<std::vector<std::string>> fieldNames() const {
|
|
std::vector<std::vector<std::string>> result;
|
|
|
|
for (auto const& it : _fields) {
|
|
std::vector<std::string> parts;
|
|
parts.reserve(it.size());
|
|
for (auto const& it2 : it) {
|
|
parts.emplace_back(it2.name);
|
|
}
|
|
result.emplace_back(std::move(parts));
|
|
}
|
|
return result;
|
|
}
|
|
|
|
/// @brief whether or not the ith attribute is expanded (somewhere)
|
|
inline bool isAttributeExpanded(size_t i) const {
|
|
if (i >= _fields.size()) {
|
|
return false;
|
|
}
|
|
return TRI_AttributeNamesHaveExpansion(_fields[i]);
|
|
}
|
|
|
|
/// @brief whether or not any attribute is expanded
|
|
inline bool isAttributeExpanded(std::vector<arangodb::basics::AttributeName> const& attribute) const {
|
|
for (auto const& it : _fields) {
|
|
if (!arangodb::basics::AttributeName::namesMatch(attribute, it)) {
|
|
continue;
|
|
}
|
|
return TRI_AttributeNamesHaveExpansion(it);
|
|
}
|
|
return false;
|
|
}
|
|
|
|
/// @brief whether or not any attribute is expanded
|
|
inline bool attributeMatches(std::vector<arangodb::basics::AttributeName> const& attribute) const {
|
|
for (auto const& it : _fields) {
|
|
if (arangodb::basics::AttributeName::isIdentical(attribute, it, true)) {
|
|
return true;
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
/// @brief whether or not any attribute is expanded
|
|
inline bool hasExpansion() const { return _useExpansion; }
|
|
|
|
/// @brief whether or not the index covers all the attributes passed in
|
|
virtual bool covers(std::unordered_set<std::string> const& attributes) const;
|
|
|
|
/// @brief return the underlying collection
|
|
inline LogicalCollection* collection() const { return &_collection; }
|
|
|
|
/// @brief return a contextual string for logging
|
|
std::string context() const;
|
|
|
|
/// @brief whether or not the index is sparse
|
|
inline bool sparse() const { return _sparse; }
|
|
|
|
/// @brief whether or not the index is unique
|
|
inline bool unique() const { return _unique; }
|
|
|
|
/// @brief validate fields from slice
|
|
static void validateFields(velocypack::Slice const& slice);
|
|
|
|
/// @brief return the name of the index
|
|
char const* oldtypeName() const { return oldtypeName(type()); }
|
|
|
|
/// @brief return the index type based on a type name
|
|
static IndexType type(char const* type);
|
|
|
|
static IndexType type(std::string const& type);
|
|
|
|
static bool isGeoIndex(IndexType type) {
|
|
return type == TRI_IDX_TYPE_GEO1_INDEX || type == TRI_IDX_TYPE_GEO2_INDEX ||
|
|
type == TRI_IDX_TYPE_GEO_INDEX;
|
|
}
|
|
|
|
virtual char const* typeName() const = 0;
|
|
|
|
static bool allowExpansion(IndexType type) {
|
|
return (type == TRI_IDX_TYPE_HASH_INDEX || type == TRI_IDX_TYPE_SKIPLIST_INDEX ||
|
|
type == TRI_IDX_TYPE_PERSISTENT_INDEX);
|
|
}
|
|
|
|
virtual IndexType type() const = 0;
|
|
|
|
/// @brief return the name of an index type
|
|
static char const* oldtypeName(IndexType);
|
|
|
|
/// @brief validate an index id
|
|
static bool validateId(char const*);
|
|
|
|
/// @brief validate an index handle (collection name + / + index id)
|
|
static bool validateHandle(char const*, size_t*);
|
|
|
|
/// @brief generate a new index id
|
|
static TRI_idx_iid_t generateId();
|
|
|
|
/// @brief index comparator, used by the coordinator to detect if two index
|
|
/// contents are the same
|
|
static bool Compare(velocypack::Slice const& lhs, velocypack::Slice const& rhs);
|
|
|
|
virtual bool isPersistent() const { return false; }
|
|
virtual bool canBeDropped() const = 0;
|
|
|
|
/// @brief whether or not the index provides an iterator that can extract
|
|
/// attribute values from the index data, without having to refer to the
|
|
/// actual document data
|
|
/// By default, indexes do not have this type of iterator, but they can
|
|
/// add it as a performance optimization
|
|
virtual bool hasCoveringIterator() const { return false; }
|
|
|
|
/// @brief Checks if this index is identical to the given definition
|
|
virtual bool matchesDefinition(arangodb::velocypack::Slice const&) const;
|
|
|
|
/// @brief whether or not the index is sorted
|
|
virtual bool isSorted() const = 0;
|
|
|
|
/// @brief whether or not the index has a selectivity estimate
|
|
virtual bool hasSelectivityEstimate() const = 0;
|
|
|
|
/// @brief return the selectivity estimate of the index
|
|
/// must only be called if hasSelectivityEstimate() returns true
|
|
///
|
|
/// The extra StringRef is only used in the edge index as direction
|
|
/// attribute attribute, a Slice would be more flexible.
|
|
virtual double selectivityEstimate(arangodb::StringRef const& extra = arangodb::StringRef()) const;
|
|
|
|
/// @brief update the cluster selectivity estimate
|
|
virtual void updateClusterSelectivityEstimate(double /*estimate*/) {
|
|
TRI_ASSERT(false); // should never be called except on Coordinator
|
|
}
|
|
|
|
/// @brief whether or not the index is implicitly unique
|
|
/// this can be the case if the index is not declared as unique,
|
|
/// but contains a unique attribute such as _key
|
|
virtual bool implicitlyUnique() const;
|
|
|
|
virtual size_t memory() const = 0;
|
|
|
|
/// @brief serialization flags for indexes.
|
|
/// note that these must be mutually exclusive when bit-ORed
|
|
enum class Serialize : uint8_t {
|
|
/// @brief serialize figures for index
|
|
Basics = 0,
|
|
/// @brief serialize figures for index
|
|
Figures = 2,
|
|
/// @brief serialize object ids for persistence
|
|
ObjectId = 4,
|
|
/// @brief serialize selectivity estimates
|
|
Estimates = 8
|
|
};
|
|
|
|
/// @brief helper for building flags
|
|
template <typename... Args>
|
|
static inline constexpr std::underlying_type<Serialize>::type makeFlags(Serialize flag,
|
|
Args... args) {
|
|
return static_cast<std::underlying_type<Serialize>::type>(flag) + makeFlags(args...);
|
|
}
|
|
|
|
static inline constexpr std::underlying_type<Serialize>::type makeFlags() {
|
|
return static_cast<std::underlying_type<Serialize>::type>(Serialize::Basics);
|
|
}
|
|
|
|
static inline constexpr bool hasFlag(std::underlying_type<Serialize>::type flags,
|
|
Serialize aflag) {
|
|
return (flags & static_cast<std::underlying_type<Serialize>::type>(aflag)) != 0;
|
|
}
|
|
|
|
/// serialize an index to velocypack, using the serialization flags above
|
|
virtual void toVelocyPack(arangodb::velocypack::Builder&,
|
|
std::underlying_type<Index::Serialize>::type flags) const;
|
|
std::shared_ptr<arangodb::velocypack::Builder> toVelocyPack(
|
|
std::underlying_type<Serialize>::type flags) const;
|
|
|
|
virtual void toVelocyPackFigures(arangodb::velocypack::Builder&) const;
|
|
std::shared_ptr<arangodb::velocypack::Builder> toVelocyPackFigures() const;
|
|
|
|
virtual Result insert(transaction::Methods*, LocalDocumentId const& documentId,
|
|
arangodb::velocypack::Slice const&, OperationMode mode) = 0;
|
|
virtual Result remove(transaction::Methods*, LocalDocumentId const& documentId,
|
|
arangodb::velocypack::Slice const&, OperationMode mode) = 0;
|
|
|
|
virtual void batchInsert(transaction::Methods*,
|
|
std::vector<std::pair<LocalDocumentId, arangodb::velocypack::Slice>> const&,
|
|
std::shared_ptr<arangodb::basics::LocalTaskQueue> queue);
|
|
|
|
virtual void load() = 0;
|
|
virtual void unload() = 0;
|
|
|
|
// called when the index is dropped
|
|
virtual int drop();
|
|
|
|
/// @brief called after the collection was truncated
|
|
/// @param tick at which truncate was applied
|
|
virtual void afterTruncate(TRI_voc_tick_t tick){};
|
|
|
|
// give index a hint about the expected size
|
|
virtual int sizeHint(transaction::Methods*, size_t);
|
|
|
|
virtual bool hasBatchInsert() const;
|
|
|
|
virtual bool supportsFilterCondition(std::vector<std::shared_ptr<arangodb::Index>> const& allIndexes,
|
|
arangodb::aql::AstNode const*,
|
|
arangodb::aql::Variable const*, size_t,
|
|
size_t&, double&) const;
|
|
|
|
virtual bool supportsSortCondition(arangodb::aql::SortCondition const*,
|
|
arangodb::aql::Variable const*, size_t,
|
|
double&, size_t&) const;
|
|
|
|
virtual arangodb::aql::AstNode* specializeCondition(arangodb::aql::AstNode*,
|
|
arangodb::aql::Variable const*) const;
|
|
|
|
virtual IndexIterator* iteratorForCondition(transaction::Methods*, ManagedDocumentResult*,
|
|
arangodb::aql::AstNode const*,
|
|
arangodb::aql::Variable const*,
|
|
IndexIteratorOptions const&) {
|
|
return nullptr; // IResearch will never use this
|
|
};
|
|
|
|
bool canUseConditionPart(arangodb::aql::AstNode const* access,
|
|
arangodb::aql::AstNode const* other,
|
|
arangodb::aql::AstNode const* op,
|
|
arangodb::aql::Variable const* reference,
|
|
std::unordered_set<std::string>& nonNullAttributes, bool) const;
|
|
|
|
/// @brief Transform the list of search slices to search values.
|
|
/// This will multiply all IN entries and simply return all other
|
|
/// entries.
|
|
void expandInSearchValues(arangodb::velocypack::Slice const,
|
|
arangodb::velocypack::Builder&) const;
|
|
|
|
virtual void warmup(arangodb::transaction::Methods* trx,
|
|
std::shared_ptr<basics::LocalTaskQueue> queue);
|
|
|
|
static size_t sortWeight(arangodb::aql::AstNode const* node);
|
|
|
|
protected:
|
|
TRI_idx_iid_t const _iid;
|
|
LogicalCollection& _collection;
|
|
std::vector<std::vector<arangodb::basics::AttributeName>> const _fields;
|
|
bool const _useExpansion;
|
|
|
|
mutable bool _unique;
|
|
mutable bool _sparse;
|
|
};
|
|
} // namespace arangodb
|
|
|
|
/// @brief stream output operator for an index passed by pointer
std::ostream& operator<<(std::ostream&, arangodb::Index const*);
/// @brief stream output operator for an index passed by reference
std::ostream& operator<<(std::ostream&, arangodb::Index const&);
|
|
|
|
#endif
|