mirror of
https://github.com/scylladb/scylladb.git
synced 2026-05-23 00:02:37 +00:00
Move common description logic into a protected helper `describe_with_target` on `custom_index`, so subclasses can delegate to it when implementing the `describe()` virtual method.
303 lines
11 KiB
C++
303 lines
11 KiB
C++
/*
|
|
* Copyright (C) 2017-present ScyllaDB
|
|
*
|
|
* Modified by ScyllaDB
|
|
*/
|
|
|
|
/*
|
|
* SPDX-License-Identifier: (LicenseRef-ScyllaDB-Source-Available-1.1 and Apache-2.0)
|
|
*/
|
|
|
|
#include <functional>
|
|
#include <map>
|
|
#include <optional>
|
|
#include <ranges>
|
|
#include <seastar/core/shared_ptr.hh>
|
|
#include <string_view>
|
|
#include <unordered_map>
|
|
#include <unordered_set>
|
|
|
|
#include "index/secondary_index_manager.hh"
|
|
#include "index/secondary_index.hh"
|
|
#include "index/fulltext_index.hh"
|
|
#include "index/vector_index.hh"
|
|
|
|
#include "cql3/expr/expression.hh"
|
|
#include "cql3/util.hh"
|
|
#include "index/target_parser.hh"
|
|
#include "schema/schema.hh"
|
|
#include "utils/histogram_metrics_helper.hh"
|
|
|
|
seastar::metrics::label idx{"idx"};
|
|
seastar::metrics::label ks{"ks"};
|
|
|
|
namespace secondary_index {
|
|
|
|
index::index(const sstring& target_column, const index_metadata& im)
|
|
: _im{im}
|
|
, _target_type{cql3::statements::index_target::from_target_string(target_column)}
|
|
, _target_column{cql3::statements::index_target::column_name_from_target_string(target_column)}
|
|
{}
|
|
|
|
bool index::depends_on(const column_definition& cdef) const {
|
|
return cdef.name_as_text() == _target_column;
|
|
}
|
|
|
|
index::supports_expression_v index::supports_expression(const column_definition& cdef, const cql3::expr::oper_t op) const {
|
|
using target_type = cql3::statements::index_target::target_type;
|
|
auto collection_yes = supports_expression_v::from_bool_collection(true);
|
|
if (cdef.name_as_text() != _target_column) {
|
|
return supports_expression_v::from_bool(false);
|
|
}
|
|
|
|
switch (op) {
|
|
case cql3::expr::oper_t::EQ:
|
|
return supports_expression_v::from_bool(_target_type == target_type::regular_values);
|
|
case cql3::expr::oper_t::CONTAINS:
|
|
if (cdef.type->is_set() && _target_type == target_type::keys) {
|
|
return collection_yes;
|
|
}
|
|
if (cdef.type->is_list() && _target_type == target_type::collection_values) {
|
|
return collection_yes;
|
|
}
|
|
if (cdef.type->is_map() && _target_type == target_type::collection_values) {
|
|
return collection_yes;
|
|
}
|
|
return supports_expression_v::from_bool(false);
|
|
case cql3::expr::oper_t::CONTAINS_KEY:
|
|
if (cdef.type->is_map() && _target_type == target_type::keys) {
|
|
return collection_yes;
|
|
}
|
|
return supports_expression_v::from_bool(false);
|
|
default:
|
|
return supports_expression_v::from_bool(false);
|
|
}
|
|
}
|
|
|
|
index::supports_expression_v index::supports_subscript_expression(const column_definition& cdef, const cql3::expr::oper_t op) const {
|
|
using target_type = cql3::statements::index_target::target_type;
|
|
if (cdef.name_as_text() != _target_column) {
|
|
return supports_expression_v::from_bool(false);
|
|
}
|
|
|
|
return supports_expression_v::from_bool_collection(op == cql3::expr::oper_t::EQ && _target_type == target_type::keys_and_values);
|
|
}
|
|
|
|
const index_metadata& index::metadata() const {
|
|
return _im;
|
|
}
|
|
|
|
secondary_index_manager::secondary_index_manager(data_dictionary::table cf)
|
|
: _cf{cf}
|
|
{}
|
|
|
|
void secondary_index_manager::reload() {
|
|
const auto& table_indices = _cf.schema()->all_indices();
|
|
auto it = _indices.begin();
|
|
while (it != _indices.end()) {
|
|
auto index_name = it->first;
|
|
if (!table_indices.contains(index_name)) {
|
|
it = _indices.erase(it);
|
|
if (auto mi = _metrics.find(index_name); mi != _metrics.end()) {
|
|
mi->second->deregister();
|
|
_metrics.erase(mi);
|
|
}
|
|
} else {
|
|
++it;
|
|
}
|
|
}
|
|
for (const auto& index : _cf.schema()->all_indices()) {
|
|
add_index(index.second);
|
|
}
|
|
}
|
|
|
|
void secondary_index_manager::add_index(const index_metadata& im) {
|
|
sstring index_target = im.options().at(cql3::statements::index_target::target_option_name);
|
|
sstring index_target_name = target_parser::get_target_column_name_from_string(index_target);
|
|
_indices.emplace(im.name(), index{index_target_name, im});
|
|
if (!_metrics.contains(im.name())) {
|
|
_metrics.emplace(im.name(), make_lw_shared<stats>(_cf.schema()->ks_name(), im.name()));
|
|
}
|
|
}
|
|
|
|
|
|
sstring index_table_name(const sstring& index_name) {
|
|
return format("{}_index", index_name);
|
|
}
|
|
|
|
sstring index_name_from_table_name(const sstring& table_name) {
|
|
if (table_name.size() < 7 || !table_name.ends_with("_index")) {
|
|
throw std::runtime_error(format("Table {} does not have _index suffix", table_name));
|
|
}
|
|
return table_name.substr(0, table_name.size() - 6); // remove the _index suffix from an index name;
|
|
}
|
|
|
|
std::set<sstring>
|
|
existing_index_names(std::span<const schema_ptr> tables, std::string_view cf_to_exclude) {
|
|
std::set<sstring> names;
|
|
for (auto& schema : tables) {
|
|
if (!cf_to_exclude.empty() && schema->cf_name() == cf_to_exclude) {
|
|
continue;
|
|
}
|
|
for (const auto& index_name : schema->index_names()) {
|
|
names.emplace(index_name);
|
|
}
|
|
}
|
|
return names;
|
|
}
|
|
|
|
sstring get_available_index_name(
|
|
std::string_view ks_name,
|
|
std::string_view cf_name,
|
|
std::optional<sstring> index_name_root,
|
|
const std::set<sstring>& existing_names,
|
|
std::function<bool(std::string_view, std::string_view)> has_schema) {
|
|
auto base_name = index_metadata::get_default_index_name(sstring(cf_name), index_name_root);
|
|
sstring accepted_name = base_name;
|
|
int i = 0;
|
|
auto name_accepted = [&] {
|
|
auto index_table_name = secondary_index::index_table_name(accepted_name);
|
|
return !has_schema(ks_name, index_table_name) && !existing_names.contains(accepted_name);
|
|
};
|
|
while (!name_accepted()) {
|
|
accepted_name = base_name + "_" + std::to_string(++i);
|
|
}
|
|
return accepted_name;
|
|
}
|
|
|
|
std::vector<index_metadata> secondary_index_manager::get_dependent_indices(const column_definition& cdef) const {
|
|
return _indices
|
|
| std::views::values
|
|
| std::views::filter([&] (auto& index) { return index.depends_on(cdef); })
|
|
| std::views::transform([&] (auto& index) { return index.metadata(); })
|
|
| std::ranges::to<std::vector>();
|
|
}
|
|
|
|
std::vector<index> secondary_index_manager::list_indexes() const {
|
|
return _indices | std::views::values | std::ranges::to<std::vector>();
|
|
}
|
|
|
|
bool secondary_index_manager::is_index(view_ptr view) const {
|
|
return is_index(*view);
|
|
}
|
|
|
|
bool secondary_index_manager::is_index(const schema& s) const {
|
|
return std::ranges::any_of(_indices | std::views::values, [&s] (const index& i) {
|
|
return s.cf_name() == index_table_name(i.metadata().name());
|
|
});
|
|
}
|
|
|
|
bool secondary_index_manager::is_global_index(const schema& s) const {
|
|
return std::ranges::any_of(_indices | std::views::values, [&s] (const index& i) {
|
|
return !i.metadata().local() && s.cf_name() == index_table_name(i.metadata().name());
|
|
});
|
|
}
|
|
|
|
std::optional<sstring> secondary_index_manager::custom_index_class(const schema& s) const {
|
|
|
|
auto idx = _indices.find(index_name_from_table_name(s.cf_name()));
|
|
|
|
if (idx == _indices.end() || !(*idx).second.metadata().options().contains(db::index::secondary_index::custom_class_option_name)) {
|
|
return std::nullopt;
|
|
} else {
|
|
return (*idx).second.metadata().options().at(db::index::secondary_index::custom_class_option_name);
|
|
}
|
|
}
|
|
|
|
// This function returns a factory, as the custom index class should be lightweight, preferably not holding any state.
|
|
// We prefer this over a static custom index class instance, as it allows us to avoid any issues with thread safety.
|
|
//
|
|
// Note: SAI class names (StorageAttachedIndex, sai) are not listed here
|
|
// because maybe_rewrite_sai_to_vector_index() in create_index_statement.cc
|
|
// rewrites them to "vector_index" before the index metadata is persisted.
|
|
std::optional<std::function<std::unique_ptr<custom_index>()>> secondary_index_manager::get_custom_class_factory(const sstring& class_name) {
|
|
sstring lower_class_name = class_name;
|
|
std::transform(lower_class_name.begin(), lower_class_name.end(), lower_class_name.begin(), ::tolower);
|
|
|
|
const static std::unordered_map<std::string_view, std::function<std::unique_ptr<custom_index>()>> classes = {
|
|
{"fulltext_index", fulltext_index_factory},
|
|
{"vector_index", vector_index_factory},
|
|
};
|
|
|
|
if (auto class_it = classes.find(lower_class_name); class_it != classes.end()) {
|
|
return class_it->second;
|
|
} else {
|
|
return std::nullopt;
|
|
}
|
|
}
|
|
|
|
std::optional<std::unique_ptr<custom_index>> secondary_index_manager::get_custom_class(const index_metadata& im) {
|
|
auto it = im.options().find(db::index::secondary_index::custom_class_option_name);
|
|
if (it == im.options().end()) {
|
|
return std::nullopt;
|
|
}
|
|
auto custom_class_factory = secondary_index::secondary_index_manager::get_custom_class_factory(it->second);
|
|
if (!custom_class_factory) {
|
|
return std::nullopt;
|
|
}
|
|
return (*custom_class_factory)();
|
|
}
|
|
|
|
std::optional<cql3::description> custom_index::describe_with_target(
|
|
const index_metadata& im,
|
|
const schema& base_schema,
|
|
const sstring& target_cql) const {
|
|
static const std::unordered_set<sstring> system_options = {
|
|
cql3::statements::index_target::target_option_name,
|
|
db::index::secondary_index::custom_class_option_name,
|
|
db::index::secondary_index::index_version_option_name,
|
|
};
|
|
|
|
fragmented_ostringstream os;
|
|
os << "CREATE CUSTOM INDEX " << cql3::util::maybe_quote(im.name()) << " ON "
|
|
<< cql3::util::maybe_quote(base_schema.ks_name()) << "."
|
|
<< cql3::util::maybe_quote(base_schema.cf_name()) << "(" << target_cql << ")"
|
|
<< " USING '" << index_type_name() << "_index'";
|
|
|
|
std::map<sstring, sstring> user_options;
|
|
for (const auto& [key, value] : im.options()) {
|
|
if (!system_options.contains(key)) {
|
|
user_options.emplace(key, value);
|
|
}
|
|
}
|
|
if (!user_options.empty()) {
|
|
os << " WITH OPTIONS = {";
|
|
bool first = true;
|
|
for (const auto& [key, value] : user_options) {
|
|
if (!first) {
|
|
os << ", ";
|
|
}
|
|
os << "'" << key << "': '" << value << "'";
|
|
first = false;
|
|
}
|
|
os << "}";
|
|
}
|
|
|
|
return cql3::description{
|
|
.keyspace = base_schema.ks_name(),
|
|
.type = "index",
|
|
.name = im.name(),
|
|
.create_statement = std::move(os).to_managed_string(),
|
|
};
|
|
}
|
|
|
|
stats::stats(const sstring& ks_name, const sstring& index_name) {
|
|
metrics.add_group("index",
|
|
{seastar::metrics::make_histogram("query_latencies", seastar::metrics::description("Index query latencies"), {idx(index_name), ks(ks_name)},
|
|
[this]() {
|
|
return to_metrics_histogram(query_latency);
|
|
})
|
|
.aggregate({seastar::metrics::shard_label})
|
|
.set_skip_when_empty()});
|
|
}
|
|
|
|
void stats::deregister() {
|
|
metrics.clear();
|
|
}
|
|
|
|
void stats::add_latency(std::chrono::steady_clock::duration d) {
|
|
query_latency.add(d);
|
|
}
|
|
|
|
}
|