Files
scylladb/schema/schema.hh
Michael Litvak 9172cc172e schema: add logstor cf property
add a schema property for tables with logstor storage
2026-03-18 19:24:26 +01:00

1122 lines
41 KiB
C++

/*
* Copyright (C) 2015-present ScyllaDB
*/
/*
* SPDX-License-Identifier: LicenseRef-ScyllaDB-Source-Available-1.0
*/
#pragma once
#include "cql3/description.hh"
#include "utils/assert.hh"
#include <functional>
#include <optional>
#include <unordered_map>
#include <ranges>
#include <boost/dynamic_bitset.hpp>
#include "cql3/column_specification.hh"
#include <seastar/core/shared_ptr.hh>
#include <seastar/util/backtrace.hh>
#include <seastar/core/sstring.hh>
#include "types/types.hh"
#include "keys/compound.hh"
#include "gc_clock.hh"
#include "sstables/compressor.hh"
#include "compaction/compaction_strategy_type.hh"
#include "caching_options.hh"
#include "column_computation.hh"
#include "mutation/timestamp.hh"
#include "tombstone_gc_options.hh"
#include "db/per_partition_rate_limit_options.hh"
#include "db/tablet_options.hh"
#include "schema_fwd.hh"
#include "db/view/base_info.hh"
namespace dht {
class i_partitioner;
class sharder;
class static_sharder;
}
namespace cdc {
class options;
}
namespace replica {
class table;
}
using column_count_type = uint32_t;
// Column ID, unique within column_kind
using column_id = column_count_type;
// Column ID unique within a schema. Enum class to avoid
// mixing with column id.
enum class ordinal_column_id: column_count_type {};
// Maintains a set of columns used in a query. The columns are
// identified by ordinal_id.
//
// @sa column_definition::ordinal_id.
class column_set {
public:
using bitset = boost::dynamic_bitset<uint64_t>;
using size_type = bitset::size_type;
// column_count_type is more narrow than size_type, but truncating a size_type max value does
// give column_count_type max value. This is used to avoid extra branching in
// find_first()/find_next().
static_assert(static_cast<column_count_type>(boost::dynamic_bitset<uint64_t>::npos) == ~static_cast<column_count_type>(0));
static constexpr ordinal_column_id npos = static_cast<ordinal_column_id>(bitset::npos);
explicit column_set(column_count_type num_bits = 0)
: _mask(num_bits)
{
}
void resize(column_count_type num_bits) {
_mask.resize(num_bits);
}
// Set the appropriate bit for column id.
void set(ordinal_column_id id) {
column_count_type bit = static_cast<column_count_type>(id);
_mask.set(bit);
}
// Test the mask for use of a given column id.
bool test(ordinal_column_id id) const {
column_count_type bit = static_cast<column_count_type>(id);
return _mask.test(bit);
}
// @sa boost::dynamic_bistet docs
size_type count() const { return _mask.count(); }
ordinal_column_id find_first() const {
return static_cast<ordinal_column_id>(_mask.find_first());
}
ordinal_column_id find_next(ordinal_column_id pos) const {
return static_cast<ordinal_column_id>(_mask.find_next(static_cast<column_count_type>(pos)));
}
// Logical or
void union_with(const column_set& with) {
_mask |= with._mask;
}
private:
bitset _mask;
};
class schema_registry_entry;
class schema_builder;
// Useful functions to manipulate the schema's comparator field
namespace cell_comparator {
sstring to_sstring(const schema& s);
bool check_compound(sstring comparator);
void read_collections(schema_builder& builder, sstring comparator);
}
namespace db {
class extensions;
}
// make sure these match the order we like columns back from schema
enum class column_kind { partition_key, clustering_key, static_column, regular_column };
enum class column_view_virtual { no, yes };
sstring to_sstring(column_kind k);
bool is_compatible(column_kind k1, column_kind k2);
enum class cf_type : uint8_t {
standard,
super,
};
inline sstring cf_type_to_sstring(cf_type t) {
if (t == cf_type::standard) {
return "Standard";
} else if (t == cf_type::super) {
return "Super";
}
throw std::invalid_argument(format("unknown type: {:d}\n", uint8_t(t)));
}
inline cf_type sstring_to_cf_type(sstring name) {
if (name == "Standard") {
return cf_type::standard;
} else if (name == "Super") {
return cf_type::super;
}
throw std::invalid_argument(format("unknown type: {}\n", name));
}
struct speculative_retry {
enum class type {
NONE, CUSTOM, PERCENTILE, ALWAYS
};
private:
type _t;
double _v;
public:
speculative_retry(type t, double v) : _t(t), _v(v) {}
sstring to_sstring() const;
static speculative_retry from_sstring(sstring str);
type get_type() const {
return _t;
}
double get_value() const {
return _v;
}
bool operator==(const speculative_retry& other) const = default;
};
enum class storage_engine_type {
normal,
logstor,
};
inline sstring storage_engine_type_to_sstring(storage_engine_type t) {
switch (t) {
case storage_engine_type::normal:
return "normal";
case storage_engine_type::logstor:
return "logstor";
}
throw std::invalid_argument(format("unknown storage engine type: {:d}\n", uint8_t(t)));
}
using index_options_map = std::unordered_map<sstring, sstring>;
enum class index_metadata_kind {
keys,
custom,
composites,
};
class index_metadata final {
public:
struct is_local_index_tag {};
using is_local_index = bool_class<is_local_index_tag>;
private:
table_id _id;
sstring _name;
index_metadata_kind _kind;
index_options_map _options;
bool _local;
public:
index_metadata(const sstring& name, const index_options_map& options, index_metadata_kind kind, is_local_index local);
bool operator==(const index_metadata& other) const;
bool equals_noname(const index_metadata& other) const;
const table_id& id() const;
const sstring& name() const;
index_metadata_kind kind() const;
const index_options_map& options() const;
bool local() const;
static sstring get_default_index_name(const sstring& cf_name, std::optional<sstring> root);
};
class column_definition final {
public:
struct name_comparator {
data_type type;
name_comparator(data_type type) : type(type) {}
bool operator()(const column_definition& cd1, const column_definition& cd2) const {
return type->less(cd1.name(), cd2.name());
}
};
private:
bytes _name;
api::timestamp_type _dropped_at;
bool _is_atomic;
bool _is_counter;
column_view_virtual _is_view_virtual;
column_computation_ptr _computation;
struct thrift_bits {
thrift_bits()
: is_on_all_components(0)
{}
uint8_t is_on_all_components : 1;
// more...?
};
thrift_bits _thrift_bits;
friend class schema;
public:
column_definition(bytes name, data_type type, column_kind kind,
column_id component_index = 0,
column_view_virtual view_virtual = column_view_virtual::no,
column_computation_ptr = nullptr,
api::timestamp_type dropped_at = api::missing_timestamp);
data_type type;
// Unique within (kind, schema instance).
// schema::position() and component_index() depend on the fact that for PK columns this is
// equivalent to component index.
column_id id;
// Unique within schema instance
ordinal_column_id ordinal_id;
column_kind kind;
lw_shared_ptr<cql3::column_specification> column_specification;
// NOTICE(sarna): This copy constructor is hand-written instead of default,
// because it involves deep copying of the computation object.
// Computation has a strict ownership policy provided by
// unique_ptr, and as such cannot rely on default copying.
column_definition(const column_definition& other)
: _name(other._name)
, _dropped_at(other._dropped_at)
, _is_atomic(other._is_atomic)
, _is_counter(other._is_counter)
, _is_view_virtual(other._is_view_virtual)
, _computation(other.get_computation_ptr())
, type(other.type)
, id(other.id)
, ordinal_id(other.ordinal_id)
, kind(other.kind)
, column_specification(other.column_specification)
{}
column_definition& operator=(const column_definition& other) {
if (this == &other) {
return *this;
}
column_definition tmp(other);
*this = std::move(tmp);
return *this;
}
column_definition& operator=(column_definition&& other) = default;
bool is_static() const { return kind == column_kind::static_column; }
bool is_regular() const { return kind == column_kind::regular_column; }
bool is_partition_key() const { return kind == column_kind::partition_key; }
bool is_clustering_key() const { return kind == column_kind::clustering_key; }
bool is_primary_key() const { return kind == column_kind::partition_key || kind == column_kind::clustering_key; }
bool is_atomic() const { return _is_atomic; }
bool is_multi_cell() const { return !_is_atomic; }
bool is_counter() const { return _is_counter; }
// "virtual columns" appear in a materialized view as placeholders for
// unselected columns, with liveness information but without data, and
// allow view rows to remain alive despite having no data (issue #3362).
// These columns should be hidden from the user's SELECT queries.
bool is_view_virtual() const { return _is_view_virtual == column_view_virtual::yes; }
column_view_virtual view_virtual() const { return _is_view_virtual; }
// Computed column values are generated from other columns (and possibly other sources) during updates.
// Their values are still stored on disk, same as a regular columns.
bool is_computed() const { return bool(_computation); }
const column_computation& get_computation() const { return *_computation; }
column_computation_ptr get_computation_ptr() const {
return _computation ? _computation->clone() : nullptr;
}
void set_computed(column_computation_ptr computation) { _computation = std::move(computation); }
// Columns hidden from CQL cannot be in any way retrieved by the user,
// either explicitly or via the '*' operator, or functions, aggregates, etc.
bool is_hidden_from_cql() const { return is_view_virtual(); }
const sstring& name_as_text() const;
const bytes& name() const;
sstring name_as_cql_string() const;
friend fmt::formatter<column_definition>;
bool has_component_index() const {
return is_primary_key();
}
uint32_t component_index() const {
SCYLLA_ASSERT(has_component_index());
return id;
}
uint32_t position() const {
if (has_component_index()) {
return component_index();
}
return 0;
}
bool is_on_all_components() const;
bool is_part_of_cell_name() const {
return is_regular() || is_static();
}
api::timestamp_type dropped_at() const { return _dropped_at; }
friend bool operator==(const column_definition&, const column_definition&);
};
class schema_builder;
bool operator==(const column_definition&, const column_definition&);
static constexpr int DEFAULT_MIN_COMPACTION_THRESHOLD = 4;
static constexpr int DEFAULT_MAX_COMPACTION_THRESHOLD = 32;
static constexpr int DEFAULT_MIN_INDEX_INTERVAL = 128;
static constexpr int DEFAULT_GC_GRACE_SECONDS = 864000;
// Unsafe to access across shards.
// Safe to copy across shards.
class column_mapping_entry {
bytes _name;
data_type _type;
bool _is_atomic;
public:
column_mapping_entry(bytes name, data_type type)
: _name(std::move(name)), _type(std::move(type)), _is_atomic(_type->is_atomic()) { }
column_mapping_entry(bytes name, sstring type_name);
column_mapping_entry(const column_mapping_entry&);
column_mapping_entry& operator=(const column_mapping_entry&);
column_mapping_entry(column_mapping_entry&&) = default;
column_mapping_entry& operator=(column_mapping_entry&&) = default;
const bytes& name() const { return _name; }
const data_type& type() const { return _type; }
const sstring& type_name() const { return _type->name(); }
bool is_atomic() const { return _is_atomic; }
};
bool operator==(const column_mapping_entry& lhs, const column_mapping_entry& rhs);
// Encapsulates information needed for converting mutations between different schema versions.
//
// Unsafe to access across shards.
// Safe to copy across shards.
class column_mapping {
private:
// Contains _n_static definitions for static columns followed by definitions for regular columns,
// both ordered by consecutive column_ids.
// Primary key column sets are not mutable so we don't need to map them.
std::vector<column_mapping_entry> _columns;
column_count_type _n_static = 0;
public:
column_mapping() {}
column_mapping(std::vector<column_mapping_entry> columns, column_count_type n_static)
: _columns(std::move(columns))
, _n_static(n_static)
{ }
const std::vector<column_mapping_entry>& columns() const { return _columns; }
column_count_type n_static() const { return _n_static; }
const column_mapping_entry& column_at(column_kind kind, column_id id) const;
const column_mapping_entry& static_column_at(column_id id) const;
const column_mapping_entry& regular_column_at(column_id id) const;
};
bool operator==(const column_mapping& lhs, const column_mapping& rhs);
/**
* Augments a schema with fields related to materialized views.
* Effectively immutable.
*/
class raw_view_info final {
table_id _base_id;
sstring _base_name;
bool _include_all_columns;
sstring _where_clause;
public:
raw_view_info(table_id base_id, sstring base_name, bool include_all_columns, sstring where_clause);
const table_id& base_id() const {
return _base_id;
}
const sstring& base_name() const {
return _base_name;
}
bool include_all_columns() const {
return _include_all_columns;
}
const sstring& where_clause() const {
return _where_clause;
}
friend bool operator==(const raw_view_info&, const raw_view_info&);
friend fmt::formatter<raw_view_info>;
};
bool operator==(const raw_view_info&, const raw_view_info&);
class view_info;
// Represents a column set which is compactible with Cassandra 3.x.
//
// This layout differs from the layout Scylla uses in schema/schema_builder for static compact tables.
// For such tables, Scylla expects all columns to be of regular type and no clustering columns,
// whereas in v3 those columns are static and there is a clustering column with type matching the
// cell name comparator and a regular column with type matching the default validator.
// See issues #2555 and #1474.
class v3_columns {
bool _is_dense = false;
bool _is_compound = false;
std::vector<column_definition> _columns;
std::unordered_map<bytes, const column_definition*> _columns_by_name;
public:
v3_columns(std::vector<column_definition> columns, bool is_dense, bool is_compound);
v3_columns() = default;
v3_columns(v3_columns&&) = default;
v3_columns& operator=(v3_columns&&) = default;
v3_columns(const v3_columns&) = delete;
static v3_columns from_v2_schema(const schema&);
public:
const std::vector<column_definition>& all_columns() const;
const std::unordered_map<bytes, const column_definition*>& columns_by_name() const;
bool is_static_compact() const;
bool is_compact() const;
void apply_to(schema_builder&) const;
};
namespace query {
class partition_slice;
}
/**
* Schema extension. An opaque type representing
* entries in the "extensions" part of a table/view (see schema_tables).
*
* An extension has a name (the mapping key), and it can re-serialize
* itself to bytes again, when we write back into schema tables.
*
* Code using a particular extension can locate it by name in the schema map,
* and barring the "is_placeholder" says true, cast it to whatever might
* be the expected implementation.
*
* We allow placeholder object since an extension written to schema tables
* might be unavailable on next boot/other node. To avoid losing the config data,
* a placeholder object is put into schema map, which at least can
* re-serialize the data back.
*
*/
class schema_extension {
public:
virtual ~schema_extension() {};
[[deprecated("Use dedicated columns in system_schema.scylla_tables instead")]]
schema_extension() = default;
virtual future<> validate(const schema&) const {
return make_ready_future<>();
}
virtual bytes serialize() const = 0;
virtual bool is_placeholder() const {
return false;
}
using default_map_type = std::map<sstring, sstring>;
// default impl assumes options are in a map.
// implementations should override if not
virtual std::string options_to_string() const;
};
/**
* Schema static properties
*
* Represents internal table properties not visible to users.
* Their values are derived solely from keyspace/table names (thereby "static").
* Despite their name, they are NOT part of the schema (i.e., they do not map to
* user-visible schema fields) and they are NOT persisted in system tables.
* The reason they are carried along with in-memory `schema` objects is just
* convenience, see:
* https://github.com/scylladb/scylladb/pull/13170#issuecomment-1469848086
*/
struct schema_static_props {
bool use_null_sharder = false; // use a sharder that puts everything on shard 0
bool wait_for_sync_to_commitlog = false; // true if all writes using this schema have to be synced immediately by commitlog
bool use_schema_commitlog = false;
void enable_schema_commitlog() {
use_schema_commitlog = true;
use_null_sharder = true; // schema commitlog lives only on the null shard
}
bool is_group0_table = false; // the table is a group 0 table
};
struct schema_describe_helper {
enum class type { table, view, index };
type type;
bool is_global_index;
std::optional<sstring> custom_index_class;
schema_ptr base_schema; // relevant for view and index
};
/*
* Effectively immutable.
* Not safe to access across cores because of shared_ptr's.
* Use global_schema_ptr for safe across-shard access.
*/
class schema final : public enable_lw_shared_from_this<schema> {
friend class v3_columns;
public:
struct dropped_column {
data_type type;
api::timestamp_type timestamp;
bool operator==(const dropped_column& rhs) const {
return type == rhs.type && timestamp == rhs.timestamp;
}
};
using extensions_map = std::map<sstring, ::shared_ptr<schema_extension>>;
/// This structure represents the properties of schema entities that the user
/// can directly set or modify via CREATE/ALTER statements.
///
/// Note that ID is absent. That's because it cannot be changed.
struct user_properties {
sstring comment;
gc_clock::duration default_time_to_live = gc_clock::duration::zero();
double bloom_filter_fp_chance = 0.01;
compression_parameters compressor_params;
extensions_map extensions;
int32_t gc_grace_seconds = DEFAULT_GC_GRACE_SECONDS;
std::optional<int32_t> _paxos_grace_seconds;
double crc_check_chance = 1;
int32_t min_compaction_threshold = DEFAULT_MIN_COMPACTION_THRESHOLD;
int32_t max_compaction_threshold = DEFAULT_MAX_COMPACTION_THRESHOLD;
int32_t min_index_interval = DEFAULT_MIN_INDEX_INTERVAL;
int32_t max_index_interval = 2048;
int32_t memtable_flush_period = 0;
::speculative_retry speculative_retry = ::speculative_retry(speculative_retry::type::PERCENTILE, 0.99);
// This is the compaction strategy that will be used by default on tables which don't have one explicitly specified.
compaction::compaction_strategy_type compaction_strategy = compaction::compaction_strategy_type::incremental;
std::map<sstring, sstring> compaction_strategy_options;
bool compaction_enabled = true;
storage_engine_type storage_engine = storage_engine_type::normal;
::caching_options caching_options;
std::optional<std::map<sstring, sstring>> tablet_options;
const cdc::options& get_cdc_options() const;
gc_clock::duration get_paxos_grace_seconds() const;
const ::tombstone_gc_options& get_tombstone_gc_options() const;
};
private:
// More complex fields are derived from these inside rebuild().
// Contains only fields which can be safely default-copied.
struct raw_schema {
raw_schema(table_id id);
table_id _id;
sstring _ks_name;
sstring _cf_name;
// regular columns are sorted by name
// static columns are sorted by name, but present only when there's any clustering column
std::vector<column_definition> _columns;
data_type _regular_column_name_type;
data_type _default_validation_class = bytes_type;
bool _is_dense = false;
bool _is_compound = true;
bool _is_counter = false;
cf_type _type = cf_type::standard;
db::per_partition_rate_limit_options _per_partition_rate_limit_options;
table_schema_version _version;
std::unordered_map<sstring, dropped_column> _dropped_columns;
std::map<bytes, data_type> _collections;
std::unordered_map<sstring, index_metadata> _indices_by_name;
std::reference_wrapper<const dht::i_partitioner> _partitioner;
// Sharding info is not stored in the schema mutation and does not affect
// schema digest. It is also not set locally on a schema tables.
std::reference_wrapper<const dht::static_sharder> _sharder;
bool _in_memory = false;
std::optional<raw_view_info> _view_info;
user_properties _props;
};
raw_schema _raw;
schema_static_props _static_props;
v3_columns _v3_columns;
mutable schema_registry_entry* _registry_entry = nullptr;
std::unique_ptr<::view_info> _view_info;
mutable schema_ptr _cdc_schema;
const std::array<column_count_type, 3> _offsets;
inline column_count_type column_offset(column_kind k) const {
return k == column_kind::partition_key ? 0 : _offsets[column_count_type(k) - 1];
}
std::unordered_map<bytes, const column_definition*> _columns_by_name;
lw_shared_ptr<compound_type<allow_prefixes::no>> _partition_key_type;
lw_shared_ptr<compound_type<allow_prefixes::yes>> _clustering_key_type;
column_mapping _column_mapping;
shared_ptr<query::partition_slice> _full_slice;
column_count_type _clustering_key_size;
column_count_type _regular_column_count;
column_count_type _static_column_count;
std::vector<const column_definition*> _all_columns_in_select_order;
extensions_map& extensions() {
return _raw._props.extensions;
}
friend class db::extensions;
friend class schema_builder;
public:
using row_column_ids_are_ordered_by_name = std::true_type;
typedef std::vector<column_definition> columns_type;
typedef typename columns_type::iterator iterator;
typedef typename columns_type::const_iterator const_iterator;
typedef std::ranges::subrange<iterator> iterator_range_type;
typedef std::ranges::subrange<const_iterator> const_iterator_range_type;
// The maximum allowed length for any schema name (table, keyspace, view, or index).
// This limit is primarily determined by the maximum table name length.
//
// When a new table is created, sstables::init_table_storage() generates a directory name
// by concatenating the full table name, a dash ('-'), and a 32-byte UUID. Since most Linux
// filesystems restrict a single filename component to 255 bytes, any table name longer than
// 222 bytes would result in a directory name exceeding this limit, causing mkdir() to fail.
//
// Additionally, we reserve 15 bytes for the "_scylla_cdc_log" suffix, which is appended to
// CDC-enabled table names (see cdc_log_suffix in cdc/log.cc). While this suffix
// only applies to table names, for simplicity, the same length restriction is enforced for
// keyspace, view, and index names as well.
// We also reserve 15 bytes for future use, allowing for potential future extensions without
// breaking existing schemas.
// Hence the length is: 255 - 32 (UUID) - 1 (dash) - 15 (CDC suffix) - 15 (reserved) = 192.
static constexpr size_t NAME_LENGTH = 192;
struct column {
bytes name;
data_type type;
};
private:
struct reversed_tag { };
struct with_cdc_schema_tag { };
lw_shared_ptr<cql3::column_specification> make_column_specification(const column_definition& def) const;
void rebuild();
void compute_all_columns_in_select_order();
schema(const schema&, const std::function<void(schema&)>&);
class private_tag{};
public:
schema(private_tag, const raw_schema&, const schema_static_props& props, schema_ptr cdc_schema, std::optional<std::variant<schema_ptr, db::view::base_dependent_view_info>> base = std::nullopt);
schema(const schema&);
// See \ref make_reversed().
schema(reversed_tag, const schema&);
schema(with_cdc_schema_tag, const schema&, schema_ptr cdc_schema);
~schema();
const schema_static_props& static_props() const {
return _static_props;
}
table_schema_version version() const {
return _raw._version;
}
double bloom_filter_fp_chance() const {
return _raw._props.bloom_filter_fp_chance;
}
const compression_parameters& get_compressor_params() const {
return _raw._props.compressor_params;
}
const extensions_map& extensions() const {
return _raw._props.extensions;
}
bool is_dense() const {
return _raw._is_dense;
}
bool is_compound() const {
return _raw._is_compound;
}
bool is_cql3_table() const {
return !is_super() && !is_dense() && is_compound();
}
bool is_compact_table() const {
return !is_cql3_table();
}
bool is_static_compact_table() const {
return !is_super() && !is_dense() && !is_compound();
}
const table_id& id() const {
return _raw._id;
}
const sstring& comment() const {
return _raw._props.comment;
}
bool is_counter() const {
return _raw._is_counter;
}
cf_type type() const {
return _raw._type;
}
bool is_super() const {
return _raw._type == cf_type::super;
}
gc_clock::duration gc_grace_seconds() const {
auto seconds = std::chrono::seconds(_raw._props.gc_grace_seconds);
return std::chrono::duration_cast<gc_clock::duration>(seconds);
}
gc_clock::duration paxos_grace_seconds() const {
return _raw._props.get_paxos_grace_seconds();
}
double crc_check_chance() const {
return _raw._props.crc_check_chance;
}
int32_t min_compaction_threshold() const {
return _raw._props.min_compaction_threshold;
}
int32_t max_compaction_threshold() const {
return _raw._props.max_compaction_threshold;
}
int32_t min_index_interval() const {
return _raw._props.min_index_interval;
}
int32_t max_index_interval() const {
return _raw._props.max_index_interval;
}
int32_t memtable_flush_period() const {
return _raw._props.memtable_flush_period;
}
compaction::compaction_strategy_type configured_compaction_strategy() const {
return _raw._props.compaction_strategy;
}
compaction::compaction_strategy_type compaction_strategy() const {
return _raw._props.compaction_enabled ? _raw._props.compaction_strategy : compaction::compaction_strategy_type::null;
}
const std::map<sstring, sstring>& compaction_strategy_options() const {
return _raw._props.compaction_strategy_options;
}
bool compaction_enabled() const {
return _raw._props.compaction_enabled;
}
storage_engine_type storage_engine() const {
return _raw._props.storage_engine;
}
bool logstor_enabled() const {
return _raw._props.storage_engine == storage_engine_type::logstor;
}
const cdc::options& cdc_options() const {
return _raw._props.get_cdc_options();
}
const ::tombstone_gc_options& tombstone_gc_options() const {
return _raw._props.get_tombstone_gc_options();
}
const db::per_partition_rate_limit_options& per_partition_rate_limit_options() const {
return _raw._per_partition_rate_limit_options;
}
const ::speculative_retry& speculative_retry() const {
return _raw._props.speculative_retry;
}
const ::caching_options& caching_options() const {
return _raw._props.caching_options;
}
// Returns true iff the _tablet_options are initialized.
// They may still be empty, e.g. after ALTER TABLE.
bool has_tablet_options() const noexcept;
db::tablet_options tablet_options() const;
const db::tablet_options::map_type& raw_tablet_options() const noexcept;
static void set_default_partitioner(const sstring& class_name, unsigned ignore_msb = 0);
const dht::i_partitioner& get_partitioner() const;
// Returns a sharder for this table.
// Use only for tables which use vnode-based replication strategy, that is for which
// table::uses_static_sharding() is true.
// To obtain a sharder which is valid for all kinds of tables, use table::get_effective_replication_map()->get_sharder()
const dht::static_sharder& get_sharder() const;
// Returns a sharder for this table, but only if it is a static sharder (token->shard mappings
// don't change while the node is up)
const dht::static_sharder* try_get_static_sharder() const;
// Returns a pointer to the table if the local database has a table which this object references by id().
// The table pointer is not guaranteed to be stable, schema_ptr doesn't keep the table alive.
replica::table* maybe_table() const;
// Like maybe_table() but throws replica::no_such_column_family if the table is not set.
replica::table& table() const;
bool has_custom_partitioner() const;
bool is_in_memory() const {
return _raw._in_memory;
}
const user_properties& get_properties() const {
return _raw._props;
}
const column_definition* get_column_definition(const bytes& name) const;
const column_definition& column_at(column_kind, column_id) const;
// Find a column definition given column ordinal id in the schema
const column_definition& column_at(ordinal_column_id ordinal_id) const;
const_iterator regular_begin() const;
const_iterator regular_end() const;
const_iterator regular_lower_bound(const bytes& name) const;
const_iterator regular_upper_bound(const bytes& name) const;
const_iterator static_begin() const;
const_iterator static_end() const;
const_iterator static_lower_bound(const bytes& name) const;
const_iterator static_upper_bound(const bytes& name) const;
static data_type column_name_type(const column_definition& def, const data_type& regular_column_name_type);
data_type column_name_type(const column_definition& def) const;
const column_definition& clustering_column_at(column_id id) const;
const column_definition& regular_column_at(column_id id) const;
const column_definition& static_column_at(column_id id) const;
bool is_last_partition_key(const column_definition& def) const;
bool has_multi_cell_collections() const;
bool has_static_columns() const;
column_count_type columns_count(column_kind kind) const;
column_count_type partition_key_size() const;
column_count_type clustering_key_size() const { return _clustering_key_size; }
column_count_type static_columns_count() const { return _static_column_count; }
column_count_type regular_columns_count() const { return _regular_column_count; }
column_count_type all_columns_count() const { return _raw._columns.size(); }
// Returns a range of column definitions
const_iterator_range_type partition_key_columns() const;
// Returns a range of column definitions
const_iterator_range_type clustering_key_columns() const;
// Returns a range of column definitions
const_iterator_range_type static_columns() const;
// Returns a range of column definitions
const_iterator_range_type regular_columns() const;
// Returns a range of column definitions
const_iterator_range_type columns(column_kind) const;
// Returns a range of column definitions
const_iterator_range_type primary_key_columns() const;
const_iterator_range_type static_and_regular_columns() const;
std::ranges::range auto all_columns_in_select_order() const {
return _all_columns_in_select_order | std::views::transform([] (const column_definition* def) -> const column_definition& { return *def; });
}
uint32_t position(const column_definition& column) const;
const columns_type& all_columns() const {
return _raw._columns;
}
const std::unordered_map<bytes, const column_definition*>& columns_by_name() const {
return _columns_by_name;
}
const auto& dropped_columns() const {
return _raw._dropped_columns;
}
const auto& collections() const {
return _raw._collections;
}
gc_clock::duration default_time_to_live() const {
return _raw._props.default_time_to_live;
}
data_type make_legacy_default_validator() const;
const sstring& ks_name() const {
return _raw._ks_name;
}
const sstring& cf_name() const {
return _raw._cf_name;
}
const lw_shared_ptr<compound_type<allow_prefixes::no>>& partition_key_type() const {
return _partition_key_type;
}
const lw_shared_ptr<compound_type<allow_prefixes::yes>>& clustering_key_type() const {
return _clustering_key_type;
}
const lw_shared_ptr<compound_type<allow_prefixes::yes>>& clustering_key_prefix_type() const {
return _clustering_key_type;
}
const data_type& regular_column_name_type() const {
return _raw._regular_column_name_type;
}
const data_type& static_column_name_type() const {
return utf8_type;
}
const std::unique_ptr<::view_info>& view_info() const {
return _view_info;
}
bool is_view() const {
return bool(_view_info);
}
schema_ptr cdc_schema() const {
return _cdc_schema;
}
const query::partition_slice& full_slice() const {
return *_full_slice;
}
// Returns all index names of this schema.
std::vector<sstring> index_names() const;
// Returns all indices of this schema.
std::vector<index_metadata> indices() const;
const std::unordered_map<sstring, index_metadata>& all_indices() const;
// Search for an index with a given name.
bool has_index(const sstring& index_name) const;
// Search for an existing index with same kind and options.
std::optional<index_metadata> find_index_noname(const index_metadata& target) const;
friend fmt::formatter<schema>;
/*!
* \brief generate the CQL DESCRIBE output.
*
* The output of DESCRIBE is the CQL command to create the described table with its indexes and views.
*
* For tables with Indexes or Materialized Views, the CQL DESCRIBE is split between the base and view tables.
* Calling the describe method on the base table schema would result with the CQL "CREATE TABLE"
* command for creating that table only.
*
* Calling the describe method on a view schema would result with the appropriate "CREATE MATERIALIZED VIEW"
* or "CREATE INDEX" depends on the type of index that schema describes (ie. Materialized View, Global
* Index or Local Index).
*
* When `cql3::describe_option::WITH_STMTS_AND_INTERNALS` is used, the description is extended with
* table's id and dropped columns. The dropped columns are present in column definitions and also the `ALTER DROP`
* statement (and `ALTER ADD` if the column has been re-added) to the description.
*/
cql3::description describe(const schema_describe_helper& helper, cql3::describe_option) const;
// Generate ALTER TABLE/MATERIALIZED VIEW statement containing all properties with current values.
// The method cannot be used on index, as indexes don't support alter statement.
fragmented_ostringstream& describe_alter_with_properties(const schema_describe_helper& helper, fragmented_ostringstream& os) const;
friend bool operator==(const schema&, const schema&);
const column_mapping& get_column_mapping() const;
friend class schema_registry_entry;
friend class schema_registry;
// May be called from different shard
schema_registry_entry* registry_entry() const noexcept;
// Returns true iff this schema version was synced with on current node.
// Schema version is said to be synced with when its mutations were merged
// into current node's schema, so that current node's schema is at least as
// recent as this version.
bool is_synced() const;
bool equal_columns(const schema&) const;
bool wait_for_sync_to_commitlog() const {
return _static_props.wait_for_sync_to_commitlog;
}
// The calculated version should be machine-independent, so that all nodes
// arrive at the same version for the same schema definition.
static table_schema_version calculate_digest(const raw_schema& r);
private:
// Print all schema properties in CQL syntax
fragmented_ostringstream& schema_properties(const schema_describe_helper& helper, fragmented_ostringstream& os) const;
managed_string get_create_statement(const schema_describe_helper& helper, bool with_internals) const;
public:
const v3_columns& v3() const {
return _v3_columns;
}
// Make a copy of the schema with reversed clustering order.
//
// The reversing is revertible, so that:
//
// s->make_reversed()->make_reversed()->version() == s->version()
//
// But note that: `s != s->make_reversed()->make_reversed()` (they are two
// different C++ objects).
// The schema's version is also reversed using UUID_gen::negate().
schema_ptr make_reversed() const;
schema_ptr make_with_cdc(schema_ptr cdc_schema) const;
// Get the reversed counterpart of this schema from the schema registry.
//
// If not present in the registry, create one (via \ref make_reversed()) and
// load it. Unlike \ref make_reversed(), this method guarantees that double
// reversing will return the very same C++ object:
//
// auto schema = make_schema();
// auto reverse_schema = schema->get_reversed();
// SCYLLA_ASSERT(reverse_schema->get_reversed().get() == schema.get());
// SCYLLA_ASSERT(schema->get_reversed().get() == reverse_schema.get());
//
schema_ptr get_reversed() const;
};
bool operator==(const schema&, const schema&);
/**
* Wrapper for schema_ptr used by functions that expect an engaged view_info field.
*/
class view_ptr final {
schema_ptr _schema;
public:
explicit view_ptr(schema_ptr schema) noexcept : _schema(schema) {
if (schema) {
SCYLLA_ASSERT(_schema->is_view());
}
}
const schema& operator*() const noexcept { return *_schema; }
const schema* operator->() const noexcept { return _schema.operator->(); }
const schema* get() const noexcept { return _schema.get(); }
operator schema_ptr() const noexcept {
return _schema;
}
explicit operator bool() const noexcept {
return bool(_schema);
}
};
std::ostream& operator<<(std::ostream& os, const view_ptr& view);
table_id generate_legacy_id(const sstring& ks_name, const sstring& cf_name);
// Thrown when attempted to access a schema-dependent object using
// an incompatible version of the schema object.
class schema_mismatch_error : public std::runtime_error {
public:
schema_mismatch_error(table_schema_version expected, const schema& access);
};
// Throws schema_mismatch_error when a schema-dependent object of "expected" version
// cannot be accessed using "access" schema.
inline void check_schema_version(table_schema_version expected, const schema& access) {
if (expected != access.version()) {
throw_with_backtrace<schema_mismatch_error>(expected, access);
}
}
template <> struct fmt::formatter<ordinal_column_id> : fmt::formatter<string_view> {
auto format(ordinal_column_id id, fmt::format_context& ctx) const {
return fmt::format_to(ctx.out(), "{}", static_cast<column_count_type>(id));
}
};
template <> struct fmt::formatter<column_definition> : fmt::formatter<string_view> {
auto format(const column_definition&, fmt::format_context& ctx) const -> decltype(ctx.out());
};
template <> struct fmt::formatter<column_mapping> : fmt::formatter<string_view> {
auto format(const column_mapping&, fmt::format_context& ctx) const -> decltype(ctx.out());
};
template <> struct fmt::formatter<raw_view_info> : fmt::formatter<string_view> {
auto format(const raw_view_info&, fmt::format_context& ctx) const -> decltype(ctx.out());
};
template <> struct fmt::formatter<schema> : fmt::formatter<string_view> {
auto format(const schema&, fmt::format_context& ctx) const -> decltype(ctx.out());
};
std::ostream& operator<<(std::ostream& os, const schema& s);
template <> struct fmt::formatter<view_ptr> : fmt::formatter<string_view> {
auto format(const view_ptr& view, fmt::format_context& ctx) const -> decltype(ctx.out());
};