/* * Copyright (C) 2020 ScyllaDB */ /* * This file is part of Scylla. * * Scylla is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * Scylla is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with Scylla. If not, see . */ #pragma once #include #include #include #include #include #include "bytes.hh" #include "cql3/query_options.hh" #include "cql3/selection/selection.hh" #include "cql3/statements/bound.hh" #include "cql3/term.hh" #include "database_fwd.hh" #include "gc_clock.hh" #include "mutation_partition.hh" #include "query-result-reader.hh" #include "range.hh" #include "seastarx.hh" #include "utils/overloaded_functor.hh" namespace secondary_index { class index; class secondary_index_manager; } // namespace secondary_index namespace cql3 { namespace expr { struct allow_local_index_tag {}; using allow_local_index = bool_class; class binary_operator; class conjunction; /// A restriction expression -- union of all possible restriction types. bool means a Boolean constant. using expression = std::variant; /// A column, optionally subscripted by a term (eg, c1 or c2['abc']). struct column_value { const column_definition* col; ::shared_ptr sub; ///< If present, this LHS is col[sub], otherwise just col. /// For easy creation of vector from vector. column_value(const column_definition* col) : col(col) {} /// The compiler doesn't auto-generate this due to the other constructor's existence. column_value(const column_definition* col, ::shared_ptr sub) : col(col), sub(sub) {} }; /// A tuple of column selectors. Usually used for range constraints on clustering keys. struct column_value_tuple { std::vector elements; explicit column_value_tuple(std::vector); template requires requires (Range r) { { r.begin() } -> std::input_iterator; { r.end() } -> std::input_iterator; { *r.begin() } -> std::convertible_to; } explicit column_value_tuple(Range r); }; /// Represents token function on LHS of an operator relation. No need to list column definitions /// here -- token takes exactly the partition key as its argument. struct token {}; enum class oper_t { EQ, NEQ, LT, LTE, GTE, GT, IN, CONTAINS, CONTAINS_KEY, IS_NOT, LIKE }; /// Describes the nature of clustering-key comparisons. Useful for implementing SCYLLA_CLUSTERING_BOUND. enum class comparison_order : char { cql, ///< CQL order. (a,b)>(1,1) is equivalent to a>1 OR (a=1 AND b>1). clustering, ///< Table's clustering order. (a,b)>(1,1) means any row past (1,1) in storage. }; /// Operator restriction: LHS op RHS. struct binary_operator { std::variant lhs; oper_t op; ::shared_ptr rhs; comparison_order order = comparison_order::cql; }; /// A conjunction of restrictions. struct conjunction { std::vector children; }; /// Creates a conjunction of a and b. If either a or b is itself a conjunction, its children are inserted /// directly into the resulting conjunction's children, flattening the expression tree. extern expression make_conjunction(expression a, expression b); extern std::ostream& operator<<(std::ostream&, oper_t); /// True iff restr is satisfied with respect to the row provided from a partition slice. extern bool is_satisfied_by( const expression& restr, const std::vector& partition_key, const std::vector& clustering_key, const query::result_row_view& static_row, const query::result_row_view* row, const selection::selection&, const query_options&); /// True iff restr is satisfied with respect to the row provided from a mutation. extern bool is_satisfied_by( const expression& restr, const schema& schema, const partition_key& key, const clustering_key_prefix& ckey, const row& cells, const query_options& options, gc_clock::time_point now); /// Finds the first binary_operator in restr that represents a bound and returns its RHS as a tuple. If no /// such binary_operator exists, returns an empty vector. The search is depth first. extern std::vector first_multicolumn_bound(const expression&, const query_options&, statements::bound); /// A set of discrete values. using value_list = std::vector; // Sorted and deduped using value comparator. /// General set of values. Empty set and single-element sets are always value_list. nonwrapping_range is /// never singular and never has start > end. Universal set is a nonwrapping_range with both bounds null. using value_set = std::variant>; /// A set of all column values that would satisfy an expression. If column is null, a set of all token values /// that satisfy. /// /// An expression restricts possible values of a column or token: /// - `A>5` restricts A from below /// - `A>5 AND A>6 AND B<10 AND A=12 AND B>0` restricts A to 12 and B to between 0 and 10 /// - `A IN (1, 3, 5)` restricts A to 1, 3, or 5 /// - `A IN (1, 3, 5) AND A>3` restricts A to just 5 /// - `A=1 AND A<=0` restricts A to an empty list; no value is able to satisfy the expression /// - `A>=NULL` also restricts A to an empty list; all comparisons to NULL are false /// - an expression without A "restricts" A to unbounded range extern value_set possible_lhs_values(const column_definition*, const expression&, const query_options&); /// Turns value_set into a range, unless it's a multi-valued list (in which case this throws). extern nonwrapping_range to_range(const value_set&); /// A range of all X such that X op val. nonwrapping_range to_range(oper_t op, const clustering_key_prefix& val); /// True iff the index can support the entire expression. extern bool is_supported_by(const expression&, const secondary_index::index&); /// True iff any of the indices from the manager can support the entire expression. If allow_local, use all /// indices; otherwise, use only global indices. extern bool has_supporting_index( const expression&, const secondary_index::secondary_index_manager&, allow_local_index allow_local); extern sstring to_string(const expression&); extern std::ostream& operator<<(std::ostream&, const column_value&); extern std::ostream& operator<<(std::ostream&, const expression&); /// If there is a binary_operator atom b for which f(b) is true, returns it. Otherwise returns null. template requires std::regular_invocable const binary_operator* find_atom(const expression& e, Fn f) { return std::visit(overloaded_functor{ [&] (const binary_operator& op) { return f(op) ? &op : nullptr; }, [] (bool) -> const binary_operator* { return nullptr; }, [&] (const conjunction& conj) -> const binary_operator* { for (auto& child : conj.children) { if (auto found = find_atom(child, f)) { return found; } } return nullptr; }, }, e); } /// Counts binary_operator atoms b for which f(b) is true. template requires std::regular_invocable size_t count_if(const expression& e, Fn f) { return std::visit(overloaded_functor{ [&] (const binary_operator& op) -> size_t { return f(op) ? 1 : 0; }, [&] (const conjunction& conj) { return std::accumulate(conj.children.cbegin(), conj.children.cend(), size_t{0}, [&] (size_t acc, const expression& c) { return acc + count_if(c, f); }); }, [] (bool) -> size_t { return 0; }, }, e); } inline const binary_operator* find(const expression& e, oper_t op) { return find_atom(e, [&] (const binary_operator& o) { return o.op == op; }); } inline bool needs_filtering(oper_t op) { return (op == oper_t::CONTAINS) || (op == oper_t::CONTAINS_KEY) || (op == oper_t::LIKE) || (op == oper_t::IS_NOT) || (op == oper_t::NEQ) ; } inline auto find_needs_filtering(const expression& e) { return find_atom(e, [] (const binary_operator& bo) { return needs_filtering(bo.op); }); } inline bool is_slice(oper_t op) { return (op == oper_t::LT) || (op == oper_t::LTE) || (op == oper_t::GT) || (op == oper_t::GTE); } inline bool has_slice(const expression& e) { return find_atom(e, [] (const binary_operator& bo) { return is_slice(bo.op); }); } inline bool is_compare(oper_t op) { switch (op) { case oper_t::EQ: case oper_t::LT: case oper_t::LTE: case oper_t::GT: case oper_t::GTE: case oper_t::NEQ: return true; default: return false; } } inline bool is_multi_column(const binary_operator& op) { return holds_alternative(op.lhs); } inline bool has_token(const expression& e) { return find_atom(e, [] (const binary_operator& o) { return std::holds_alternative(o.lhs); }); } inline bool has_slice_or_needs_filtering(const expression& e) { return find_atom(e, [] (const binary_operator& o) { return is_slice(o.op) || needs_filtering(o.op); }); } inline bool is_clustering_order(const binary_operator& op) { return op.order == comparison_order::clustering; } inline auto find_clustering_order(const expression& e) { return find_atom(e, is_clustering_order); } /// True iff binary_operator involves a collection. extern bool is_on_collection(const binary_operator&); /// Replaces every column_definition in an expression with this one. Throws if any LHS is not a single /// column_value. extern expression replace_column_def(const expression&, const column_definition*); inline oper_t pick_operator(statements::bound b, bool inclusive) { return is_start(b) ? (inclusive ? oper_t::GTE : oper_t::GT) : (inclusive ? oper_t::LTE : oper_t::LT); } inline column_value_tuple::column_value_tuple(std::vector e) : elements(std::move(e)) { } template requires requires (Range r) { { r.begin() } -> std::input_iterator; { r.end() } -> std::input_iterator; { *r.begin() } -> std::convertible_to; } column_value_tuple::column_value_tuple(Range r) : column_value_tuple(std::vector(r.begin(), r.end())) { } } // namespace expr } // namespace cql3 /// Required for fmt::join() to work on expression. template <> struct fmt::formatter; /// Required for fmt::join() to work on column_value. template <> struct fmt::formatter;