Files
scylladb/cql3/expr/restrictions.cc
Avi Kivity f3eade2f62 treewide: relicense to ScyllaDB-Source-Available-1.0
Drop the AGPL license in favor of a source-available license.
See the blog post [1] for details.

[1] https://www.scylladb.com/2024/12/18/why-were-moving-to-a-source-available-license/
2024-12-18 17:45:13 +02:00

258 lines
12 KiB
C++

/*
* Copyright (C) 2022-present ScyllaDB
*/
/*
* SPDX-License-Identifier: LicenseRef-ScyllaDB-Source-Available-1.0
*/
#include "cql3/statements/request_validations.hh"
#include "exceptions/exceptions.hh"
#include "schema/schema.hh"
#include <seastar/util/defer.hh>
#include "cql3/prepare_context.hh"
#include "cql3/expr/expr-utils.hh"
#include "types/list.hh"
#include <iterator>
#include <ranges>
namespace cql3 {
namespace expr {
extern logging::logger expr_logger;
namespace {
bool is_legal_relation_for_non_frozen_collection(oper_t oper, bool is_lhs_col_indexed) {
return oper == oper_t::CONTAINS_KEY || oper == oper_t::CONTAINS || (oper == oper_t::EQ && is_lhs_col_indexed);
}
void validate_single_column_relation(const column_value& lhs, oper_t oper, const schema& schema, bool is_lhs_subscripted) {
using namespace statements::request_validations; // used for check_false and check_true
const abstract_type& lhs_col_type = lhs.col->column_specification->type->without_reversed();
const ::shared_ptr<column_identifier>& lhs_col_name = lhs.col->column_specification->name;
if (schema.is_dense() && lhs.col->is_regular()) {
throw exceptions::invalid_request_exception(
format("Predicates on the non-primary-key column ({}) of a COMPACT table are not yet supported",
lhs.col->name_as_text()));
}
if (is_lhs_subscripted) {
check_true(lhs_col_type.is_map() || lhs_col_type.is_list(), "Column {} cannot be subscripted", lhs_col_name);
check_true(!lhs_col_type.is_map() || lhs_col_type.is_multi_cell(),
"Map-entry equality predicates on frozen map column {} are not supported",
lhs_col_name);
check_true(!lhs_col_type.is_list() || lhs_col_type.is_multi_cell(),
"List element equality predicates on frozen list column {} are not supported",
lhs_col_name);
check_true(oper == oper_t::EQ, "Only EQ relations are supported on map/list entries");
}
if (lhs_col_type.is_collection()) {
// We don't support relations against entire collections (unless they're frozen), like "numbers = {1, 2, 3}"
check_false(lhs_col_type.is_multi_cell()
&& !is_legal_relation_for_non_frozen_collection(oper, is_lhs_subscripted),
"Collection column '{}' ({}) cannot be restricted by a '{}' relation",
lhs_col_name,
lhs_col_type.as_cql3_type(),
oper);
}
}
std::vector<const column_definition*> to_column_definitions(const std::vector<expression>& cols) {
std::vector<const column_definition*> result;
result.reserve(cols.size());
for (const expression& col : cols) {
if (auto col_val = as_if<column_value>(&col)) {
result.push_back(col_val->col);
} else {
on_internal_error(expr_logger, format("to_column_definitions bad expression: {}", col));
}
}
return result;
}
void validate_multi_column_relation(const std::vector<const column_definition*>& lhs, oper_t oper) {
using namespace statements::request_validations;
int previous_position = -1;
for (const column_definition* col_def : lhs) {
check_true(col_def->is_clustering_key(),
"Multi-column relations can only be applied to clustering columns but was applied to: {}",
col_def->name_as_text());
// FIXME: the following restriction should be removed (CASSANDRA-8613)
if (col_def->position() != unsigned(previous_position + 1)) {
check_false(previous_position == -1, "Clustering columns may not be skipped in multi-column relations. "
"They should appear in the PRIMARY KEY order"); // TODO: More detailed messages?
throw exceptions::invalid_request_exception(format("Clustering columns must appear in the PRIMARY KEY order in multi-column relations"));
}
previous_position = col_def->position();
}
}
void validate_token_relation(const std::vector<const column_definition*> column_defs, oper_t oper, const schema& schema) {
auto pk = schema.partition_key_columns();
if (!std::equal(column_defs.begin(), column_defs.end(), pk.begin(),
pk.end(), [](auto* c1, auto& c2) {
return c1 == &c2; // same, not "equal".
})) {
std::vector<const column_definition*> unique_columns;
std::ranges::unique_copy(column_defs, std::back_inserter(unique_columns));
if (unique_columns.size() < column_defs.size()) {
throw exceptions::invalid_request_exception(
"The token() function contains duplicate partition key components");
}
if (unique_columns.size() < pk.size()) {
throw exceptions::invalid_request_exception(
"The token() function must be applied to all partition key components or none of them");
}
throw exceptions::invalid_request_exception(
seastar::format("The token function arguments must be in the partition key order: {}",
fmt::join(pk | std::views::transform(std::mem_fn(&column_definition::name_as_text)), ", ")));
}
}
void preliminary_binop_vaidation_checks(const binary_operator& binop) {
if (binop.op == oper_t::NEQ) {
throw exceptions::invalid_request_exception(format("Unsupported \"!=\" relation: {:user}", binop));
}
if (binop.op == oper_t::IS_NOT) {
bool rhs_is_null = (is<untyped_constant>(binop.rhs) && as<untyped_constant>(binop.rhs).partial_type == untyped_constant::type_class::null)
|| (is<constant>(binop.rhs) && as<constant>(binop.rhs).is_null());
if (!rhs_is_null) {
throw exceptions::invalid_request_exception(format("Unsupported \"IS NOT\" relation: {:user}", binop));
}
}
if (auto lhs_tup = as_if<tuple_constructor>(&binop.lhs)) {
if (binop.op == oper_t::CONTAINS) {
throw exceptions::invalid_request_exception("CONTAINS cannot be used for Multi-column relations");
}
if (binop.op == oper_t::CONTAINS_KEY) {
throw exceptions::invalid_request_exception("CONTAINS_KEY cannot be used for Multi-column relations");
}
if (binop.op == oper_t::LIKE) {
throw exceptions::invalid_request_exception("LIKE cannot be used for Multi-column relations");
}
if (auto rhs_tup = as_if<tuple_constructor>(&binop.rhs)) {
if (lhs_tup->elements.size() != rhs_tup->elements.size()) {
throw exceptions::invalid_request_exception(
format("Expected {} elements in value tuple, but got {}: {}",
lhs_tup->elements.size(), rhs_tup->elements.size(), *rhs_tup));
}
}
}
// Right now a token() on the LHS means that there's a partition token there.
// In the future with relaxed grammar this might no longer be true and this check will have to be revisisted.
// Moving the check after preparation would break tests and cassandra compatibility.
if (is_token_function(binop.lhs)) {
if (binop.op == oper_t::IN) {
throw exceptions::invalid_request_exception("IN cannot be used with the token function");
}
if (binop.op == oper_t::LIKE) {
throw exceptions::invalid_request_exception("LIKE cannot be used with the token function");
}
if (binop.op == oper_t::CONTAINS) {
throw exceptions::invalid_request_exception("CONTAINS cannot be used with the token function");
}
if (binop.op == oper_t::CONTAINS_KEY) {
throw exceptions::invalid_request_exception("CONTAINS_KEY cannot be used with the token function");
}
}
}
} // anonymous namespace
binary_operator validate_and_prepare_new_restriction(const binary_operator& restriction,
data_dictionary::database db,
schema_ptr schema,
prepare_context& ctx) {
// Perform basic initial checks
preliminary_binop_vaidation_checks(restriction);
// Prepare the restriction
binary_operator prepared_binop = prepare_binary_operator(restriction, db, *schema);
expr::verify_no_aggregate_functions(prepared_binop, "WHERE clause");
// Fill prepare context
const column_value* lhs_pk_col_search_res = find_in_expression<column_value>(prepared_binop.lhs,
[](const column_value& col) {
return col.col->is_partition_key();
}
);
auto reset_processing_pk_column = defer([&ctx] () noexcept { ctx.set_processing_pk_restrictions(false); });
if (lhs_pk_col_search_res != nullptr) {
ctx.set_processing_pk_restrictions(true);
}
fill_prepare_context(prepared_binop.lhs, ctx);
fill_prepare_context(prepared_binop.rhs, ctx);
// Perform more throughout validation depending on restriction type
if (auto col_val = as_if<column_value>(&prepared_binop.lhs)) {
// Simple single column restriction
validate_single_column_relation(*col_val, prepared_binop.op, *schema, false);
} else if (auto sub = as_if<subscript>(&prepared_binop.lhs)) {
// Subscripted single column restriction
const column_value& sub_col = get_subscripted_column(*sub);
validate_single_column_relation(sub_col, prepared_binop.op, *schema, true);
} else if (auto multi_col_tuple = as_if<tuple_constructor>(&prepared_binop.lhs)) {
// Multi column restriction
std::vector<const column_definition*> lhs_cols = to_column_definitions(multi_col_tuple->elements);
std::vector<lw_shared_ptr<column_specification>> lhs_col_specs;
lhs_col_specs.reserve(multi_col_tuple->elements.size());
for (const column_definition* col_def : lhs_cols) {
lhs_col_specs.push_back(col_def->column_specification);
}
validate_multi_column_relation(lhs_cols, prepared_binop.op);
} else if (is_token_function(prepared_binop.lhs)) {
// Token restriction
std::vector<const column_definition*> column_defs = to_column_definitions(as<function_call>(prepared_binop.lhs).args);
validate_token_relation(column_defs, prepared_binop.op, *schema);
} else {
// Anything else
throw exceptions::invalid_request_exception(
format("expr::validate_and_prepare_new_restriction unhandled restriction: {}", prepared_binop));
}
// Convert single element IN relation to an EQ relation
if (prepared_binop.op == oper_t::IN) {
if (is<collection_constructor>(prepared_binop.rhs)) {
const std::vector<expression>& elements = as<collection_constructor>(prepared_binop.rhs).elements;
if (elements.size() == 1) {
prepared_binop.op = oper_t::EQ;
prepared_binop.rhs = elements[0];
}
}
if(is<constant>(prepared_binop.rhs) && as<constant>(prepared_binop.rhs).type->without_reversed().is_list()) {
const constant& rhs_constant = as<constant>(prepared_binop.rhs);
const list_type_impl* rhs_list_type =
dynamic_cast<const list_type_impl*>(&rhs_constant.type->without_reversed());
utils::chunked_vector<managed_bytes_opt> elements = get_list_elements(rhs_constant.value);
if (elements.size() == 1) {
prepared_binop.op = oper_t::EQ;
prepared_binop.rhs = constant(cql3::raw_value::make_value(elements[0]),
rhs_list_type->get_elements_type());
}
}
}
return prepared_binop;
}
} // namespace expr
} // namespace cql3