From c4ab0ddb85baecb9753cf004f0fbe8e951583e86 Mon Sep 17 00:00:00 2001
From: Avi Kivity <avi@scylladb.com>
Date: Sun, 3 Nov 2024 19:24:17 +0200
Subject: [PATCH] cql3: statement_restrictions: pre-analyze single-column
 clustering key restrictions

Change _clustering_prefix_restrictions and _idx_tbl_ck_prefix
(the latter is the equivalent of the former, for indexed queries),
to use predicate instead of expressions. This lets us do
more of the work of solving restrictions during prepare time.

We only handle single-column restrictions here. Multi-column
restrictions use the existing path.

We introduce two helpers:
 - value_set_to_singleton() converts a restriction solution to a singleton
   when we know that's the only possible answer
 - replace_column_def() overload for predicate, similar to the
   existing overload for expressions

There is a wart in get_single_column_clustering_bounds(): we arrive at
this point with the two vectors possibly pointing at different
columns. Previously, possible_lhs_values() did this check while solving.
We now check for it here.

The predicate::on variant gets another member, for clustering key prefixes.
Since everything is still handled by the legacy paths, we mostly
error out.
---
 cql3/restrictions/statement_restrictions.cc | 180 ++++++++++++++++----
 cql3/restrictions/statement_restrictions.hh |  13 +-
 2 files changed, 153 insertions(+), 40 deletions(-)

diff --git a/cql3/restrictions/statement_restrictions.cc b/cql3/restrictions/statement_restrictions.cc
index 04a41ec3e7..e9a9b3cdc0 100644
--- a/cql3/restrictions/statement_restrictions.cc
+++ b/cql3/restrictions/statement_restrictions.cc
@@ -148,6 +148,9 @@ solve(const predicate& ac, const query_options& options) {
             [&] (const on_partition_key_token& pkt) {
                 return possible_partition_token_values(ac.filter, options, *pkt.schema);
             },
+            [&] (const on_clustering_key_prefix& ockp) -> value_set {
+                on_internal_error(rlogger, "asked to directly solve for clustering key prefix");
+            },
         },
         ac.on);
 }
@@ -185,6 +188,18 @@ value_set intersection(value_set a, value_set b, const abstract_type* type) {
     return std::visit(intersection_visitor{type}, std::move(a), std::move(b));
 }
 
+static
+managed_bytes
+value_set_to_singleton(const value_set& vs) { // Extracts the only element of a one-element value_list.
+    if (std::holds_alternative<value_list>(vs)) {
+        const auto& vl = std::get<value_list>(vs);
+        if (vl.size() == 1) {
+            return vl.front();
+        }
+    }
+    throw std::logic_error("value_set_to_singleton: value_set is not a singleton"); // not a value_list, or size() != 1
+}
+}
+
 template<std::ranges::forward_range Range>
 value_list to_sorted_vector(Range r, const serialized_compare& comparator) {
     value_list tmp(r.begin(), r.end()); // Need random-access range to sort (r is not necessarily random-access).
@@ -245,6 +260,7 @@ type(const predicate& p) {
         overloaded_functor{
             [] (const on_column& oc) { return oc.column->type->without_reversed().shared_from_this(); },
             [] (const on_partition_key_token&) { return long_type; },
+            [] (const on_clustering_key_prefix&) -> data_type { on_internal_error(rlogger, "type: asked for clustering key prefix type"); },
         },
         p.on);
 }
@@ -495,6 +511,17 @@ interval<managed_bytes> to_range(const value_set& s) {
         }, s);
 }
 
+/// Rebinds predicate `p` to `col`: rewrites every column in p.filter and sets p.on to on_column{col}.
+/// Throws if any LHS in p.filter is not a single column_value. p.solve_for is left untouched.
+static
+predicate
+replace_column_def(predicate p, const column_definition* col) {
+    // Note: does not replace any `col` embedded in p.solve_for; a solver bound to the old column keeps using it
+    p.filter = expr::replace_column_def(p.filter, col);
+    p.on = on_column{col};
+    return p;
+}
+
 namespace {
 constexpr inline secondary_index::index::supports_expression_v operator&&(secondary_index::index::supports_expression_v v1, secondary_index::index::supports_expression_v v2) {
     using namespace secondary_index;
@@ -991,7 +1018,7 @@ static partition_range_restrictions extract_partition_range(
 /// Extracts where_clause atoms with clustering-column LHS and copies them to a vector.  These elements define the
 /// boundaries of any clustering slice that can possibly meet where_clause.  This vector can be calculated before
 /// binding expression markers, since LHS and operator are always known.
-static std::vector<expr::expression> extract_clustering_prefix_restrictions(
+static std::vector<predicate> extract_clustering_prefix_restrictions(
         const expr::expression& where_clause, schema_ptr schema) {
     using namespace expr;
 
@@ -999,10 +1026,10 @@ static std::vector<expr::expression> extract_clustering_prefix_restrictions(
     /// conjunction to combine subexpressions.
     struct visitor {
         schema_ptr table_schema;
-        std::vector<expression> multi; ///< All multi-column restrictions.
+        std::vector<predicate> multi; ///< All multi-column restrictions.
         /// All single-clustering-column restrictions, grouped by column.  Each value is either an atom or a
         /// conjunction of atoms.
-        std::unordered_map<const column_definition*, expression> single;
+        std::unordered_map<const column_definition*, predicate> single;
         const binary_operator* current_binary_operator = nullptr;
 
         void operator()(const conjunction& c) {
@@ -1019,13 +1046,21 @@ static std::vector<expr::expression> extract_clustering_prefix_restrictions(
         }
 
         void operator()(const tuple_constructor& tc) {
+            std::vector<const column_definition*> prefix;
             for (auto& e : tc.elements) {
-                if (!expr::is<column_value>(e)) {
+                if (auto cv = expr::as_if<column_value>(&e)) {
+                    prefix.push_back(cv->col);
+                } else {
                     on_internal_error(rlogger, fmt::format("extract_clustering_prefix_restrictions: tuple of non-column_value: {}", tc));
                 }
             }
             with_current_binary_operator(*this, [&] (const binary_operator& b) {
-                multi.push_back(b);
+                multi.push_back(predicate{
+                    .solve_for = nullptr, // FIXME: implement
+                    .filter = b,
+                    .on = on_clustering_key_prefix{prefix},
+                    .is_singleton = false,
+                });
             });
         }
 
@@ -1033,9 +1068,15 @@ static std::vector<expr::expression> extract_clustering_prefix_restrictions(
             auto s = &cv;
             with_current_binary_operator(*this, [&] (const binary_operator& b) {
                 if (s->col->is_clustering_key()) {
-                    const auto [it, inserted] = single.try_emplace(s->col, b);
+                    auto a = predicate{
+                        .solve_for = std::bind_front(possible_column_values, s->col, b),
+                        .filter = b,
+                        .on  = on_column{s->col},
+                        .is_singleton = b.op == oper_t::EQ,
+                    };
+                    const auto [it, inserted] = single.try_emplace(s->col, std::move(a));
                     if (!inserted) {
-                        it->second = make_conjunction(std::move(it->second), b);
+                        it->second = make_conjunction(std::move(it->second), std::move(a));
                     }
                 }
             });
@@ -1046,9 +1087,15 @@ static std::vector<expr::expression> extract_clustering_prefix_restrictions(
 
             with_current_binary_operator(*this, [&] (const binary_operator& b) {
                 if (cval.col->is_clustering_key()) {
-                    const auto [it, inserted] = single.try_emplace(cval.col, b);
+                    auto a = predicate{
+                        .solve_for = std::bind_front(possible_column_values, cval.col, b),
+                        .filter = b,
+                        .on  = on_column{cval.col},
+                        .is_singleton = b.op == oper_t::EQ,
+                    };
+                    const auto [it, inserted] = single.try_emplace(cval.col, std::move(a));
                     if (!inserted) {
-                        it->second = make_conjunction(std::move(it->second), b);
+                        it->second = make_conjunction(std::move(it->second), std::move(a));
                     }
                 }
             });
@@ -1111,19 +1158,19 @@ static std::vector<expr::expression> extract_clustering_prefix_restrictions(
         return std::move(v.multi);
     }
 
-    std::vector<expression> prefix;
+    std::vector<predicate> prefix;
     for (const auto& col : schema->clustering_key_columns()) {
         const auto found = v.single.find(&col);
         if (found == v.single.end()) { // Any further restrictions are skipping the CK order.
             break;
         }
-        if (find_needs_filtering(found->second)) { // This column's restriction doesn't define a clear bound.
+        if (find_needs_filtering(found->second.filter)) { // This column's restriction doesn't define a clear bound.
             // TODO: if this is a conjunction of filtering and non-filtering atoms, we could split them and add the
             // latter to the prefix.
             break;
         }
         prefix.push_back(found->second);
-        if (has_slice(found->second)) {
+        if (has_slice(found->second.filter)) {
             break;
         }
     }
@@ -2323,9 +2370,9 @@ struct multi_column_range_accumulator {
 std::vector<query::clustering_range> get_multi_column_clustering_bounds(
         const query_options& options,
         schema_ptr schema,
-        const std::vector<expression>& multi_column_restrictions) {
+        const std::vector<predicate>& multi_column_restrictions) {
     multi_column_range_accumulator acc{options, schema};
-    for (const auto& restr : multi_column_restrictions) {
+    for (const auto& restr : multi_column_restrictions | std::views::transform(&predicate::filter)) {
         expr::visit(acc, restr);
     }
     return acc.ranges;
@@ -2340,14 +2387,16 @@ query::clustering_range reverse_if_reqd(query::clustering_range r, const abstrac
 std::vector<query::clustering_range> get_single_column_clustering_bounds(
         const query_options& options,
         const schema& schema,
-        const std::vector<expression>& single_column_restrictions) {
+        const std::vector<predicate>& single_column_restrictions) {
     const size_t size_limit =
             options.get_cql_config().restrictions.clustering_key_restrictions_max_cartesian_product_size;
     size_t product_size = 1;
     std::vector<std::vector<managed_bytes>> prior_column_values; // Equality values of columns seen so far.
     for (size_t i = 0; i < single_column_restrictions.size(); ++i) {
-        auto values = possible_column_values(
-                &schema.clustering_column_at(i), // This should be the LHS of restrictions[i].
+        if (&schema.clustering_column_at(i) != require_on_single_column(single_column_restrictions[i])) {
+            break;
+        }
+        auto values = solve(
                 single_column_restrictions[i],
                 options);
         if (auto list = std::get_if<value_list>(&values)) {
@@ -2414,7 +2463,7 @@ std::vector<query::clustering_range> get_single_column_clustering_bounds(
 static std::vector<query::clustering_range> get_index_v1_token_range_clustering_bounds(
         const query_options& options,
         const column_definition& token_column,
-        const expression& token_restriction) {
+        const predicate& token_restriction) {
 
     // A workaround in order to make possible_column_values work properly.
     // possible_column_values looks at the column type and uses this type's comparator.
@@ -2425,10 +2474,10 @@ static std::vector<query::clustering_range> get_index_v1_token_range_clustering_
     // and use this restriction to calculate possible lhs values.
     column_definition token_column_bigint = token_column;
     token_column_bigint.type = long_type;
-    expression new_token_restrictions = replace_column_def(token_restriction, &token_column_bigint);
+    predicate new_token_restrictions = replace_column_def(token_restriction, &token_column_bigint);
 
     std::variant<value_list, interval<managed_bytes>> values =
-        possible_column_values(&token_column_bigint, new_token_restrictions, options);
+        new_token_restrictions.solve_for(options);
 
     return std::visit(overloaded_functor {
         [](const value_list& list) {
@@ -2618,9 +2667,9 @@ std::vector<query::clustering_range> get_equivalent_ranges(
 
 /// Extracts raw multi-column bounds from exprs; last one wins.
 query::clustering_range range_from_raw_bounds(
-        const std::vector<expression>& exprs, const query_options& options, const schema& schema) {
+        const std::vector<predicate>& exprs, const query_options& options, const schema& schema) {
     opt_bound lb, ub;
-    for (const auto& e : exprs) {
+    for (const auto& e : exprs | std::views::transform(&predicate::filter)) {
         if (auto b = find_clustering_order(e)) {
             cql3::raw_value tup_val = expr::evaluate(b->rhs, options);
             if (tup_val.is_null()) {
@@ -2649,10 +2698,10 @@ statement_restrictions::build_get_clustering_bounds_fn() const {
         return {query::clustering_range::make_open_ended_both_sides()};
       };
     }
-    if (find_binop(_clustering_prefix_restrictions[0], is_multi_column)) {
+    if (find_binop(_clustering_prefix_restrictions[0].filter, is_multi_column)) { // FIXME: adjust for solve_for
       return [&] (const query_options& options) -> std::vector<query::clustering_range> {
         bool all_natural = true, all_reverse = true; ///< Whether column types are reversed or natural.
-        for (auto& r : _clustering_prefix_restrictions) { // TODO: move to constructor, do only once.
+        for (auto& r : _clustering_prefix_restrictions | std::views::transform(&predicate::filter)) { // TODO: move to constructor, do only once.
             using namespace expr;
             const auto& binop = expr::as<binary_operator>(r);
             if (is_clustering_order(binop)) {
@@ -2798,45 +2847,89 @@ void statement_restrictions::prepare_indexed_global(const schema& idx_tbl_schema
         // This means that p1 and p2 can have many different values (token is a hash, can have collisions).
         // Clustering prefix ends after token_restriction, all further restrictions have to be filtered.
         expr::expression token_restriction = replace_partition_token(_partition_key_restrictions, token_column, *_schema);
-        _idx_tbl_ck_prefix = std::vector{std::move(token_restriction)};
+        _idx_tbl_ck_prefix = std::vector{predicate{
+            .solve_for = nullptr, // FIXME: adjust for solve_for
+            .filter = std::move(token_restriction),
+            .on = on_column{token_column},
+            .is_singleton = false, // FIXME: could be a singleton token. Not very important.
+        }};
 
         return;
     }
 
     // If we're here, it means the index cannot be on a partition column: process_partition_key_restrictions()
     // avoids indexing when _partition_range_is_simple.  See _idx_tbl_ck_prefix blurb for its composition.
-    _idx_tbl_ck_prefix = std::vector<expr::expression>(1 + _schema->partition_key_size(), expr::conjunction({}));
+    _idx_tbl_ck_prefix = std::vector<predicate>(1 + _schema->partition_key_size(), predicate{
+        .solve_for = nullptr,  // FIXME: this is all overwritten later. Should be refactored.
+        .filter = expr::expression(expr::conjunction{}),
+        .on = on_column{nullptr}, // Illegal but will be overwritten
+        .is_singleton = false,
+    });
     _idx_tbl_ck_prefix->reserve(_idx_tbl_ck_prefix->size() + idx_tbl_schema.clustering_key_size());
     auto *single_column_partition_key_restrictions = std::get_if<single_column_partition_range_restrictions>(&_partition_range_restrictions);
     if (single_column_partition_key_restrictions) {
       for (const auto& e : single_column_partition_key_restrictions->per_column_restrictions) {
-        const auto col = expr::as<column_value>(find(e.filter, oper_t::EQ)->lhs).col;
+        const auto col = require_on_single_column(e);
         const auto pos = _schema->position(*col) + 1;
-        (*_idx_tbl_ck_prefix)[pos] = replace_column_def(e.filter, &idx_tbl_schema.clustering_column_at(pos));
+        (*_idx_tbl_ck_prefix)[pos] = replace_column_def(e, &idx_tbl_schema.clustering_column_at(pos));
       }
     }
 
-    if (std::ranges::any_of(*_idx_tbl_ck_prefix | std::views::drop(1), is_empty_restriction)) {
+    if (std::ranges::any_of(*_idx_tbl_ck_prefix | std::views::drop(1) | std::views::transform(&predicate::filter), is_empty_restriction)) {
         // If the partition key is not fully restricted, the index clustering key is of no use.
-        (*_idx_tbl_ck_prefix) = std::vector<expr::expression>();
+        (*_idx_tbl_ck_prefix) = std::vector<predicate>();
         return;
     }
 
     add_clustering_restrictions_to_idx_ck_prefix(idx_tbl_schema);
 
     auto pk_expressions = (*_idx_tbl_ck_prefix)
+            | std::views::transform(&predicate::filter)
             | std::views::drop(1)   // skip the token restriction
             | std::views::take(_schema->partition_key_size()) // take only the partition key restrictions
             | std::views::transform(expr::as<expr::binary_operator>) // we know it's an EQ
             | std::views::transform(std::mem_fn(&expr::binary_operator::rhs)) // "solve" for the column value
             | std::ranges::to<std::vector>();
 
+    auto pk_solvers = (*_idx_tbl_ck_prefix)
+            | std::views::drop(1) // skip the token restriction
+            | std::views::take(_schema->partition_key_size()) // take only the partition key restrictions
+            | std::views::transform(&predicate::solve_for)
+            | std::ranges::to<std::vector>();
+
+    auto is_singleton = std::ranges::all_of(
+            (*_idx_tbl_ck_prefix)
+            | std::views::drop(1)
+            | std::views::take(_schema->partition_key_size()),
+            &predicate::is_singleton);
+
+    if (!is_singleton) {
+        on_internal_error(rlogger, "Inconsistency in singleton calculation in indexed query");
+    }
+
     auto token_func = make_shared<cql3::functions::token_fct>(_schema);
 
-    (*_idx_tbl_ck_prefix)[0] = binary_operator(
+    auto token_expr = binary_operator(
             column_value(token_column),
             oper_t::EQ,
             expr::function_call{.func = std::move(token_func), .args = std::move(pk_expressions)});
+
+    auto token_solver = [this, pk_solvers = std::move(pk_solvers)] (const query_options& options) -> value_set {
+        auto pk_values = pk_solvers
+            | std::views::transform([&] (auto&& solver) { return solver(options); })
+            | std::views::transform(value_set_to_singleton)
+            | std::ranges::to<utils::small_vector<managed_bytes, 4>>();
+        auto pk = partition_key::from_exploded(pk_values);
+        auto tok = dht::get_token(*_schema, pk);
+        return value_list{managed_bytes(serialized(dht::token::to_int64(tok)))};
+    };
+
+    (*_idx_tbl_ck_prefix)[0] = predicate{
+        .solve_for = std::move(token_solver),
+        .filter = std::move(token_expr),
+        .on = on_column{token_column},
+        .is_singleton = is_singleton,
+    };
 }
 
 void statement_restrictions::prepare_indexed_local(const schema& idx_tbl_schema) {
@@ -2845,7 +2938,7 @@ void statement_restrictions::prepare_indexed_local(const schema& idx_tbl_schema)
     }
 
     // Local index clustering key is (indexed column, base clustering key)
-    _idx_tbl_ck_prefix = std::vector<expr::expression>();
+    _idx_tbl_ck_prefix = std::vector<predicate>();
     _idx_tbl_ck_prefix->reserve(1 + _clustering_prefix_restrictions.size());
 
     const column_definition& indexed_column = idx_tbl_schema.column_at(column_kind::clustering_key, 0);
@@ -2858,7 +2951,12 @@ void statement_restrictions::prepare_indexed_local(const schema& idx_tbl_schema)
 
     // Translate the restriction to use column from the index schema and add it
     expr::expression replaced_idx_restriction = replace_column_def(idx_col_restriction_expr, &indexed_column);
-    _idx_tbl_ck_prefix->push_back(replaced_idx_restriction);
+    _idx_tbl_ck_prefix->push_back(predicate{
+        .solve_for = std::bind_front(possible_column_values, &indexed_column, replaced_idx_restriction),
+        .filter = replaced_idx_restriction,
+        .on = on_column{&indexed_column},
+        .is_singleton = false, // Could be true, but not important.
+    });
 
     // Add restrictions for the clustering key
     add_clustering_restrictions_to_idx_ck_prefix(idx_tbl_schema);
@@ -2866,16 +2964,24 @@ void statement_restrictions::prepare_indexed_local(const schema& idx_tbl_schema)
 
 void statement_restrictions::add_clustering_restrictions_to_idx_ck_prefix(const schema& idx_tbl_schema) {
     for (const auto& e : _clustering_prefix_restrictions) {
-        if (find_binop(_clustering_prefix_restrictions[0], is_multi_column)) {
+        if (find_binop(_clustering_prefix_restrictions[0].filter, is_multi_column)) {
             // TODO: We could handle single-element tuples, eg. `(c)>=(123)`.
             break;
         }
-        const auto any_binop = find_binop(e, [] (auto&&) { return true; });
+        const auto any_binop = find_binop(e.filter, [] (auto&&) { return true; });
         if (!any_binop) {
             break;
         }
         const auto col = expr::as<column_value>(any_binop->lhs).col;
-        _idx_tbl_ck_prefix->push_back(replace_column_def(e, idx_tbl_schema.get_column_definition(col->name())));
+        auto col_in_index = idx_tbl_schema.get_column_definition(col->name()); // same-named column in the index table
+        auto replaced = replace_column_def(e.filter, col_in_index); // expression overload: e.filter rebound to col_in_index
+        auto a = predicate{
+            .solve_for = std::bind_front(possible_column_values, col_in_index, replaced),
+            .filter = replaced,
+            .on = on_column{col_in_index},
+            .is_singleton = false, // FIXME: not a token here; could presumably reuse e.is_singleton. Not very important.
+        };
+        _idx_tbl_ck_prefix->push_back(std::move(a));
     }
 }
 
@@ -3024,7 +3130,7 @@ void statement_restrictions::validate_primary_key(const query_options& options)
             validate_primary_key_restrictions(options, r.per_column_restrictions | std::views::transform(&predicate::filter));
         }
     }, _partition_range_restrictions);
-    validate_primary_key_restrictions(options, _clustering_prefix_restrictions);
+    validate_primary_key_restrictions(options, _clustering_prefix_restrictions | std::views::transform(&predicate::filter));
 }
 
 
diff --git a/cql3/restrictions/statement_restrictions.hh b/cql3/restrictions/statement_restrictions.hh
index a9345452a3..babec09b5a 100644
--- a/cql3/restrictions/statement_restrictions.hh
+++ b/cql3/restrictions/statement_restrictions.hh
@@ -48,6 +48,12 @@ struct on_partition_key_token {
     bool operator==(const on_partition_key_token&) const = default;
 };
 
+struct on_clustering_key_prefix {
+    std::vector<const column_definition*> columns; // columns of the LHS tuple, in the order they appear in it
+
+    bool operator==(const on_clustering_key_prefix&) const = default;
+};
+
 // A predicate on a column or a combination of columns. The WHERE clause analyzer
 // will attempt to convert predicates (that return true or false for a particular row)
 // to solvers (that return the set of column values that satisfy the predicate) when possible.
@@ -60,7 +66,8 @@ struct predicate {
     // What column the predicate can be solved for
     std::variant<
             on_column,                     // solving for a single column: e.g. c1 = 3
-            on_partition_key_token         // solving for the token, e.g. token(pk1, pk2) >= :var
+            on_partition_key_token,        // solving for the token, e.g. token(pk1, pk2) >= :var
+            on_clustering_key_prefix       // solving for a clustering key prefix: e.g. (ck1, ck2) >= (3, 4)
     > on;
     // Whether the returned value_set will resolve to a single value.
     bool is_singleton = false;
@@ -167,7 +174,7 @@ private:
     ///   4.4 elements other than the last have only EQ or IN atoms
     ///   4.5 the last element has only EQ, IN, or is_slice() atoms
     /// 5. if multi-column, then each element is a binary_operator
-    std::vector<expr::expression> _clustering_prefix_restrictions;
+    std::vector<predicate> _clustering_prefix_restrictions;
 
     /// Like _clustering_prefix_restrictions, but for the indexing table (if this is an index-reading statement).
     /// Recall that the index-table CK is (token, PK, CK) of the base table for a global index and (indexed column,
@@ -176,7 +183,7 @@ private:
     /// Elements are conjunctions of single-column binary operators with the same LHS.
     /// Element order follows the indexing-table clustering key.
     /// In case of a global index the first element's (token restriction) RHS is a dummy value, it is filled later.
-    std::optional<std::vector<expr::expression>> _idx_tbl_ck_prefix;
+    std::optional<std::vector<predicate>> _idx_tbl_ck_prefix;
 
     /// Parts of _where defining the partition range.
     ///