// Source: arangodb/arangod/Aql/LimitExecutor.h (C++, 183 lines, 5.9 KiB)

////////////////////////////////////////////////////////////////////////////////
/// DISCLAIMER
///
/// Copyright 2018 ArangoDB GmbH, Cologne, Germany
///
/// Licensed under the Apache License, Version 2.0 (the "License");
/// you may not use this file except in compliance with the License.
/// You may obtain a copy of the License at
///
/// http://www.apache.org/licenses/LICENSE-2.0
///
/// Unless required by applicable law or agreed to in writing, software
/// distributed under the License is distributed on an "AS IS" BASIS,
/// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
/// See the License for the specific language governing permissions and
/// limitations under the License.
///
/// Copyright holder is ArangoDB GmbH, Cologne, Germany
///
/// @author Tobias Goedderz
/// @author Michael Hackstein
/// @author Heiko Kernbach
/// @author Jan Christoph Uhde
////////////////////////////////////////////////////////////////////////////////
#ifndef ARANGOD_AQL_LIMIT_EXECUTOR_H
#define ARANGOD_AQL_LIMIT_EXECUTOR_H
#include "Aql/ExecutionBlock.h"
#include "Aql/ExecutionBlockImpl.h"
#include "Aql/ExecutionState.h"
#include "Aql/ExecutorInfos.h"
#include "Aql/LimitStats.h"
#include "Aql/OutputAqlItemRow.h"
#include "Aql/types.h"
#include <memory>
namespace arangodb {
namespace aql {
// Forward declarations.
class InputAqlItemRow;
class ExecutorInfos;
// Row fetcher template; LimitExecutor aliases one instantiation of it as
// LimitExecutor::Fetcher and holds it by reference.
template <bool>
class SingleRowFetcher;
/**
 * @brief Configuration of a LimitExecutor.
 *
 * Extends ExecutorInfos with the three values that describe a limit
 * operation: the offset, the limit and the fullCount flag. All three are
 * constant for the lifetime of the object.
 */
class LimitExecutorInfos : public ExecutorInfos {
 public:
  /**
   * @param nrInputRegisters  see ExecutorInfos
   * @param nrOutputRegisters see ExecutorInfos
   * @param registersToClear  see ExecutorInfos
   * @param registersToKeep   see ExecutorInfos
   * @param offset    value later returned by getOffset()
   *                  (NOTE(review): constructor body is not in this header)
   * @param limit     value later returned by getLimit()
   * @param fullCount value later returned by isFullCountEnabled()
   */
  LimitExecutorInfos(RegisterId nrInputRegisters, RegisterId nrOutputRegisters,
                     std::unordered_set<RegisterId> registersToClear,
                     std::unordered_set<RegisterId> registersToKeep,
                     size_t offset, size_t limit, bool fullCount);

  LimitExecutorInfos() = delete;
  LimitExecutorInfos(LimitExecutorInfos&&) = default;
  LimitExecutorInfos(LimitExecutorInfos const&) = delete;
  ~LimitExecutorInfos() = default;

  /// @brief the configured offset
  size_t getOffset() const noexcept { return _offset; }

  /// @brief the configured limit
  size_t getLimit() const noexcept { return _limit; }

  /**
   * @brief offset + limit, saturated at the maximum value of size_t.
   *
   * A plain `_offset + _limit` wraps around when the sum does not fit into
   * size_t, which yields a bound that is smaller than the offset itself.
   * Clamping keeps "offset <= limit + offset" true for all inputs.
   */
  size_t getLimitPlusOffset() const noexcept {
    size_t const sum = _offset + _limit;
    // Unsigned addition wraps on overflow, and a wrapped sum is always
    // smaller than either operand; static_cast<size_t>(-1) is the maximum
    // value of size_t.
    return sum < _offset ? static_cast<size_t>(-1) : sum;
  }

  /// @brief whether fullCount is enabled
  bool isFullCountEnabled() const noexcept { return _fullCount; }

 private:
  /// @brief the offset (constant; progress is not tracked in this class)
  size_t const _offset;
  /// @brief the limit
  size_t const _limit;
  /// @brief whether or not the node should fully count what it limits
  bool const _fullCount;
};
/**
* @brief Implementation of Limit Node
*/
class LimitExecutor {
public:
struct Properties {
static const bool preservesOrder = true;
// TODO Maybe we can and want to allow passthrough. For this it would be
// necessary to allow the LimitExecutor to skip before ExecutionBlockImpl
// prefetches a block. This is related to the comment on
// inputSizeRestrictsOutputSize.
static const bool allowsBlockPassthrough = false;
//TODO:
// The implementation of this is currently suboptimal for the LimitExecutor.
// ExecutionBlockImpl allocates a block before calling produceRows();
// that means before LimitExecutor had a chance to skip;
// that means we cannot yet call expectedNumberOfRows() on the Fetcher,
// because it would call getSome on the parent when we actually want to
// skip.
// One possible solution is to call skipSome during expectedNumberOfRows(),
// which is more than a little ugly. Perhaps we can find a better way.
// Note that there are corresponding comments in
// ExecutionBlockImpl::requestWrappedBlock() and
// LimitExecutor::expectedNumberOfRows().
static const bool inputSizeRestrictsOutputSize = true;
};
using Fetcher = SingleRowFetcher<Properties::allowsBlockPassthrough>;
using Infos = LimitExecutorInfos;
using Stats = LimitStats;
LimitExecutor() = delete;
LimitExecutor(LimitExecutor&&) = default;
LimitExecutor(LimitExecutor const&) = delete;
LimitExecutor(Fetcher& fetcher, Infos&);
~LimitExecutor();
/**
* @brief produce the next Row of Aql Values.
*
* @return ExecutionState, and if successful exactly one new Row of AqlItems.
*/
std::pair<ExecutionState, Stats> produceRows(OutputAqlItemRow& output);
std::pair<ExecutionState, size_t> expectedNumberOfRows(size_t atMost) const;
private:
Infos const& infos() const noexcept { return _infos; };
size_t maxRowsLeftToFetch() const noexcept {
return infos().getLimitPlusOffset() - _counter;
}
size_t maxRowsLeftToSkip() const noexcept {
return infos().getOffset() - _counter;
}
enum class LimitState {
// state is SKIPPING until the offset is reached
SKIPPING,
// state is RETURNING until the limit is reached
RETURNING,
// state is RETURNING_LAST_ROW only if fullCount is disabled, and we've seen
// the second to last row until the limit is reached
RETURNING_LAST_ROW,
// state is COUNTING when the limit is reached and fullcount is enabled
COUNTING,
// state is LIMIT_REACHED only if fullCount is disabled, and we've seen all
// rows up to limit
LIMIT_REACHED,
};
/**
* @brief Returns the current state of the executor, based on _counter (i.e.
* number of lines seen), limit, offset and fullCount.
* @return See LimitState comments for a description.
*/
LimitState currentState() const noexcept {
// Note that not only offset, but also limit can be zero. Thus the order
// of all following checks is important, even the first two!
if (_counter < infos().getOffset()) {
return LimitState::SKIPPING;
}
if (!infos().isFullCountEnabled() && _counter + 1 == infos().getLimitPlusOffset()) {
return LimitState::RETURNING_LAST_ROW;
}
if (_counter < infos().getLimitPlusOffset()) {
return LimitState::RETURNING;
}
if (infos().isFullCountEnabled()) {
return LimitState::COUNTING;
}
return LimitState::LIMIT_REACHED;
}
private:
Infos const& _infos;
Fetcher& _fetcher;
// Number of input lines seen
size_t _counter = 0;
};
} // namespace aql
} // namespace arangodb
#endif