mirror of https://gitee.com/bigwinds/arangodb
190 lines
5.3 KiB
C++
190 lines
5.3 KiB
C++
////////////////////////////////////////////////////////////////////////////////
/// DISCLAIMER
///
/// Copyright 2016 by EMC Corporation, All Rights Reserved
///
/// Licensed under the Apache License, Version 2.0 (the "License");
/// you may not use this file except in compliance with the License.
/// You may obtain a copy of the License at
///
/// http://www.apache.org/licenses/LICENSE-2.0
///
/// Unless required by applicable law or agreed to in writing, software
/// distributed under the License is distributed on an "AS IS" BASIS,
/// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
/// See the License for the specific language governing permissions and
/// limitations under the License.
///
/// Copyright holder is EMC Corporation
///
/// @author Andrey Abramov
/// @author Vasiliy Nabatchikov
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
// list of statically loaded scorers via init()
|
|
#ifndef IRESEARCH_DLL
|
|
#include "tfidf.hpp"
|
|
#include "bm25.hpp"
|
|
#endif
|
|
|
|
#include "utils/register.hpp"
|
|
#include "scorers.hpp"
|
|
|
|
NS_LOCAL
|
|
|
|
struct entry_key_t {
|
|
const irs::text_format::type_id& args_format_;
|
|
const irs::string_ref name_;
|
|
entry_key_t(
|
|
const irs::string_ref& name, const irs::text_format::type_id& args_format
|
|
): args_format_(args_format), name_(name) {}
|
|
bool operator==(const entry_key_t& other) const NOEXCEPT {
|
|
return &args_format_ == &other.args_format_ && name_ == other.name_;
|
|
}
|
|
};
|
|
|
|
NS_END
|
|
|
|
NS_BEGIN(std)
|
|
|
|
template<>
|
|
struct hash<entry_key_t> {
|
|
size_t operator()(const entry_key_t& value) const {
|
|
return std::hash<irs::string_ref>()(value.name_);
|
|
}
|
|
}; // hash
|
|
|
|
NS_END // std
|
|
|
|
NS_LOCAL
|
|
|
|
// Prefix shared by every dynamically loadable scorer library file name;
// used both to build a file name from a key and to filter files in load_all().
const std::string FILENAME_PREFIX = "libscorer-";
|
|
|
|
class scorer_register:
|
|
public irs::tagged_generic_register<entry_key_t, irs::sort::ptr(*)(const irs::string_ref& args), irs::string_ref, scorer_register> {
|
|
protected:
|
|
virtual std::string key_to_filename(const key_type& key) const override {
|
|
auto& name = key.name_;
|
|
std::string filename(FILENAME_PREFIX.size() + name.size(), 0);
|
|
|
|
std::memcpy(
|
|
&filename[0],
|
|
FILENAME_PREFIX.c_str(),
|
|
FILENAME_PREFIX.size()
|
|
);
|
|
|
|
irs::string_ref::traits_type::copy(
|
|
&filename[0] + FILENAME_PREFIX.size(),
|
|
name.c_str(),
|
|
name.size()
|
|
);
|
|
|
|
return filename;
|
|
}
|
|
};
|
|
|
|
NS_END
|
|
|
|
NS_ROOT
|
|
|
|
/*static*/ bool scorers::exists(
|
|
const string_ref& name,
|
|
const irs::text_format::type_id& args_format
|
|
) {
|
|
return nullptr != scorer_register::instance().get(entry_key_t(name, args_format));
|
|
}
|
|
|
|
// Creates a scorer by looking up the factory for (name, args_format) and
// invoking it with the supplied arguments.
// @param name         scorer name
// @param args_format  text format of 'args' (matched by address)
// @param args         arguments forwarded verbatim to the factory
// @return the factory's result, or nullptr when no factory is found
/*static*/ sort::ptr scorers::get(
    const string_ref& name,
    const irs::text_format::type_id& args_format,
    const string_ref& args
) {
  auto* factory =
    scorer_register::instance().get(entry_key_t(name, args_format));

  if (!factory) {
    return nullptr;  // nothing registered for this key
  }

  return factory(args);
}
|
|
|
|
// Initializes the scorers that are linked statically into the library.
// When built with IRESEARCH_DLL defined this function does nothing.
/*static*/ void scorers::init() {
#if !defined(IRESEARCH_DLL)
  // keep the call order: bm25 first, then tfidf
  irs::bm25_sort::init();
  irs::tfidf_sort::init();
#endif
}
|
|
|
|
// Loads scorer libraries from the given path, passing FILENAME_PREFIX and an
// empty string as the remaining load_libraries() arguments.
// NOTE(review): the second and third arguments look like a file name prefix
// and suffix filter - confirm against load_libraries().
// @param path  location handed to load_libraries()
/*static*/ void scorers::load_all(const std::string& path) {
  load_libraries(
    path,
    FILENAME_PREFIX,
    ""
  );
}
|
|
|
|
/*static*/ bool scorers::visit(
|
|
const std::function<bool(const string_ref&, const irs::text_format::type_id&)>& visitor
|
|
) {
|
|
scorer_register::visitor_t wrapper = [&visitor](const entry_key_t& key)->bool {
|
|
return visitor(key.name_, key.args_format_);
|
|
};
|
|
|
|
return scorer_register::instance().visit(wrapper);
|
|
}
|
|
|
|
// -----------------------------------------------------------------------------
// --SECTION-- scorer registration
// -----------------------------------------------------------------------------
|
|
|
|
// Registers a scorer factory under (type.name(), args_format).
//
// If the key is already taken by a different factory the new registration is
// ignored, a warning describing the collision is logged (mentioning the new
// and/or previously recorded source when they are known) and a stack trace is
// logged. Re-registering the same factory is silent.
//
// @param type         scorer type; its name is used as the key name
// @param args_format  text format of the factory arguments
// @param factory      function creating the scorer from its arguments
// @param source       optional description of where the registration comes
//                     from; stored as the entry's tag when not null
scorer_registrar::scorer_registrar(
    const sort::type_id& type,
    const irs::text_format::type_id& args_format,
    sort::ptr(*factory)(const irs::string_ref& args),
    const char* source /*= nullptr*/
) {
  irs::string_ref source_ref(source);
  auto entry = scorer_register::instance().set(
    entry_key_t(type.name(), args_format),
    factory,
    source_ref.null() ? nullptr : &source_ref
  );

  registered_ = entry.second;

  // nothing to report: either newly registered or the very same factory again
  if (registered_ || factory == entry.first) {
    return;
  }

  auto* registered_source =
    scorer_register::instance().tag(entry_key_t(type.name(), args_format));

  if (source) {
    if (registered_source) {
      IR_FRMT_WARN(
        "type name collision detected while registering scorer, ignoring: type '%s' from %s, previously from %s",
        type.name().c_str(),
        source,
        registered_source->c_str()
      );
    } else {
      IR_FRMT_WARN(
        "type name collision detected while registering scorer, ignoring: type '%s' from %s",
        type.name().c_str(),
        source
      );
    }
  } else if (registered_source) {
    IR_FRMT_WARN(
      "type name collision detected while registering scorer, ignoring: type '%s', previously from %s",
      type.name().c_str(),
      registered_source->c_str()
    );
  } else {
    IR_FRMT_WARN(
      "type name collision detected while registering scorer, ignoring: type '%s'",
      type.name().c_str()
    );
  }

  IR_LOG_STACK_TRACE();
}
|
|
|
|
// Yields the flag stored by the constructor: true when this registrar's
// registration call actually inserted a new entry into the register.
scorer_registrar::operator bool() const NOEXCEPT { return registered_; }
|
|
|
|
NS_END
|
|
|
|
// -----------------------------------------------------------------------------
// --SECTION-- END-OF-FILE
// -----------------------------------------------------------------------------
|