// scylladb/streamed_mutation.hh
/*
* Copyright (C) 2016 ScyllaDB
*/
/*
* This file is part of Scylla.
*
* Scylla is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Scylla is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Scylla. If not, see <http://www.gnu.org/licenses/>.
*/
#pragma once
#include "mutation_partition.hh"
#include "utils/optimized_optional.hh"
#include <experimental/optional>
namespace stdx = std::experimental;
// mutation_fragments are the objects that a streamed_mutation is going to
// stream. They can represent:
// - a static row
// - a clustering row
// - a range tombstone
//
// There exists an ordering (implemented in the position_in_partition class)
// between mutation_fragment objects. It reflects the order in which the
// content of a partition appears in the sstables.
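//
// A minimal construction sketch (illustrative only; some_ck and some_rt stand
// for a clustering_key_prefix and a range_tombstone built elsewhere):
//
//   mutation_fragment f1 = static_row();             // sorts before all others
//   mutation_fragment f2 = clustering_row(some_ck);  // ordered by clustering key
//   mutation_fragment f3 = std::move(some_rt);       // ordered by its start bound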
class position_in_partition_view;
class clustering_row {
clustering_key_prefix _ck;
tombstone _t;
row_marker _marker;
row _cells;
public:
explicit clustering_row(clustering_key_prefix ck) : _ck(std::move(ck)) { }
clustering_row(clustering_key_prefix ck, tombstone t, row_marker marker, row cells)
: _ck(std::move(ck)), _t(t), _marker(std::move(marker)), _cells(std::move(cells)) { }
clustering_row(const rows_entry& re)
: _ck(re.key()), _t(re.row().deleted_at()), _marker(re.row().marker()), _cells(re.row().cells()) { }
clustering_row(rows_entry&& re)
: _ck(std::move(re.key())), _t(re.row().deleted_at()), _marker(re.row().marker()), _cells(std::move(re.row().cells())) { }
clustering_key_prefix& key() { return _ck; }
const clustering_key_prefix& key() const { return _ck; }
tombstone tomb() const { return _t; }
void remove_tombstone() { _t = tombstone(); }
const row_marker& marker() const { return _marker; }
row_marker& marker() { return _marker; }
const row& cells() const { return _cells; }
row& cells() { return _cells; }
bool empty() const {
return !_t && _marker.is_missing() && _cells.empty();
}
void apply(const schema& s, clustering_row&& cr) {
_t.apply(cr._t);
_marker.apply(std::move(cr._marker));
_cells.apply(s, column_kind::regular_column, std::move(cr._cells));
maybe_shadow_deletion(s);
}
void apply(const schema& s, const clustering_row& cr) {
_t.apply(cr._t);
_marker.apply(cr._marker);
_cells.apply(s, column_kind::regular_column, cr._cells);
maybe_shadow_deletion(s);
}
void set_cell(const column_definition& def, atomic_cell_or_collection&& value) {
_cells.apply(def, std::move(value));
}
void apply(row_marker rm) { _marker.apply(std::move(rm)); }
void apply(tombstone t) { _t.apply(t); }
void apply(const schema& s, const rows_entry& r) {
_t.apply(r.row().deleted_at());
_marker.apply(r.row().marker());
_cells.apply(s, column_kind::regular_column, r.row().cells());
maybe_shadow_deletion(s);
}
position_in_partition_view position() const;
size_t external_memory_usage() const {
return _ck.external_memory_usage() + _cells.external_memory_usage();
}
size_t memory_usage() const {
return sizeof(clustering_row) + external_memory_usage();
}
friend std::ostream& operator<<(std::ostream& os, const clustering_row& row);
private:
void maybe_shadow_deletion(const schema& s) {
if (row_tombstone_is_shadowed(s, _t, _marker)) {
_t = tombstone();
}
}
};
class static_row {
row _cells;
public:
static_row() = default;
explicit static_row(const row& r) : _cells(r) { }
explicit static_row(row&& r) : _cells(std::move(r)) { }
row& cells() { return _cells; }
const row& cells() const { return _cells; }
bool empty() const {
return _cells.empty();
}
void apply(const schema& s, const row& r) {
_cells.apply(s, column_kind::static_column, r);
}
void apply(const schema& s, static_row&& sr) {
_cells.apply(s, column_kind::static_column, std::move(sr._cells));
}
void set_cell(const column_definition& def, atomic_cell_or_collection&& value) {
_cells.apply(def, std::move(value));
}
position_in_partition_view position() const;
size_t external_memory_usage() const {
return _cells.external_memory_usage();
}
size_t memory_usage() const {
return sizeof(static_row) + external_memory_usage();
}
friend std::ostream& operator<<(std::ostream& os, const static_row& row);
};
class mutation_fragment {
public:
enum class kind {
static_row,
clustering_row,
range_tombstone,
};
private:
struct data {
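// The lifetime of the union members below is managed manually (see
// destroy_data()), hence the empty user-provided constructor and destructor.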
data() { }
~data() { }
stdx::optional<size_t> _size_in_bytes;
union {
static_row _static_row;
clustering_row _clustering_row;
range_tombstone _range_tombstone;
};
};
private:
kind _kind;
std::unique_ptr<data> _data;
mutation_fragment() = default;
explicit operator bool() const noexcept { return bool(_data); }
void destroy_data() noexcept;
friend class optimized_optional<mutation_fragment>;
friend class position_in_partition;
public:
mutation_fragment(static_row&& r);
mutation_fragment(clustering_row&& r);
mutation_fragment(range_tombstone&& r);
mutation_fragment(const mutation_fragment&) = delete;
mutation_fragment(mutation_fragment&& other) = default;
mutation_fragment& operator=(const mutation_fragment&) = delete;
mutation_fragment& operator=(mutation_fragment&& other) noexcept {
if (this != &other) {
this->~mutation_fragment();
new (this) mutation_fragment(std::move(other));
}
return *this;
}
~mutation_fragment() {
if (_data) {
destroy_data();
}
}
position_in_partition_view position() const;
// Checks whether this fragment may be relevant for any range starting at the given position.
bool relevant_for_range(const schema& s, position_in_partition_view pos) const;
// Like relevant_for_range(), but assumes that pos is greater
// than the starting position of this fragment.
bool relevant_for_range_assuming_after(const schema& s, position_in_partition_view pos) const;
bool has_key() const { return !is_static_row(); }
// Requirements: has_key() == true
const clustering_key_prefix& key() const;
kind mutation_fragment_kind() const { return _kind; }
bool is_static_row() const { return _kind == kind::static_row; }
bool is_clustering_row() const { return _kind == kind::clustering_row; }
bool is_range_tombstone() const { return _kind == kind::range_tombstone; }
static_row& as_mutable_static_row() {
_data->_size_in_bytes = stdx::nullopt;
return _data->_static_row;
}
clustering_row& as_mutable_clustering_row() {
_data->_size_in_bytes = stdx::nullopt;
return _data->_clustering_row;
}
range_tombstone& as_mutable_range_tombstone() {
_data->_size_in_bytes = stdx::nullopt;
return _data->_range_tombstone;
}
static_row&& as_static_row() && { return std::move(_data->_static_row); }
clustering_row&& as_clustering_row() && { return std::move(_data->_clustering_row); }
range_tombstone&& as_range_tombstone() && { return std::move(_data->_range_tombstone); }
const static_row& as_static_row() const & { return _data->_static_row; }
const clustering_row& as_clustering_row() const & { return _data->_clustering_row; }
const range_tombstone& as_range_tombstone() const & { return _data->_range_tombstone; }
// Requirements: mutation_fragment_kind() == mf.mutation_fragment_kind() && !is_range_tombstone()
void apply(const schema& s, mutation_fragment&& mf);
/*
template<typename T, typename ReturnType>
concept bool MutationFragmentConsumer() {
return requires(T t, static_row sr, clustering_row cr, range_tombstone rt) {
{ t.consume(std::move(sr)) } -> ReturnType;
{ t.consume(std::move(cr)) } -> ReturnType;
{ t.consume(std::move(rt)) } -> ReturnType;
};
}
*/
template<typename Consumer>
decltype(auto) consume(Consumer& consumer) && {
switch (_kind) {
case kind::static_row:
return consumer.consume(std::move(_data->_static_row));
case kind::clustering_row:
return consumer.consume(std::move(_data->_clustering_row));
case kind::range_tombstone:
return consumer.consume(std::move(_data->_range_tombstone));
}
abort();
}
/*
template<typename T, typename ReturnType>
concept bool MutationFragmentVisitor() {
return requires(T t, const static_row& sr, const clustering_row& cr, const range_tombstone& rt) {
{ t(sr) } -> ReturnType;
{ t(cr) } -> ReturnType;
{ t(rt) } -> ReturnType;
};
}
*/
template<typename Visitor>
decltype(auto) visit(Visitor&& visitor) const {
switch (_kind) {
case kind::static_row:
return visitor(as_static_row());
case kind::clustering_row:
return visitor(as_clustering_row());
case kind::range_tombstone:
return visitor(as_range_tombstone());
}
abort();
}
size_t memory_usage() const {
if (!_data->_size_in_bytes) {
_data->_size_in_bytes = sizeof(data) + visit([] (auto& mf) { return mf.external_memory_usage(); });
}
return *_data->_size_in_bytes;
}
friend std::ostream& operator<<(std::ostream&, const mutation_fragment& mf);
};
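// Example (an illustrative sketch, not part of this header): a visitor
// satisfying the MutationFragmentVisitor concept above; kind_name_visitor
// and fragment_kind_name are hypothetical names.
//
//   struct kind_name_visitor {
//       const char* operator()(const static_row&) const { return "static row"; }
//       const char* operator()(const clustering_row&) const { return "clustering row"; }
//       const char* operator()(const range_tombstone&) const { return "range tombstone"; }
//   };
//
//   const char* fragment_kind_name(const mutation_fragment& mf) {
//       return mf.visit(kind_name_visitor());
//   }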
std::ostream& operator<<(std::ostream&, mutation_fragment::kind);
std::ostream& operator<<(std::ostream&, const mutation_fragment& mf);
class position_in_partition;
inline
lexicographical_relation relation_for_lower_bound(composite_view v) {
switch (v.last_eoc()) {
case composite::eoc::start:
case composite::eoc::none:
return lexicographical_relation::before_all_prefixed;
case composite::eoc::end:
return lexicographical_relation::after_all_prefixed;
default:
assert(0);
abort(); // unreachable; avoids falling off the end of a non-void function
}
}
inline
lexicographical_relation relation_for_upper_bound(composite_view v) {
switch (v.last_eoc()) {
case composite::eoc::start:
return lexicographical_relation::before_all_prefixed;
case composite::eoc::none:
return lexicographical_relation::before_all_strictly_prefixed;
case composite::eoc::end:
return lexicographical_relation::after_all_prefixed;
default:
assert(0);
abort(); // unreachable; avoids falling off the end of a non-void function
}
}
class position_in_partition_view {
friend class position_in_partition;
int _bound_weight = 0;
const clustering_key_prefix* _ck; // nullptr for static row
private:
position_in_partition_view(int bound_weight, const clustering_key_prefix* ck)
: _bound_weight(bound_weight)
, _ck(ck)
{ }
// Returns placement of this position_in_partition relative to *_ck,
// or lexicographical_relation::at_prefix if !_ck.
lexicographical_relation relation() const {
// FIXME: Currently position_range cannot represent a range end bound which
// includes just the prefix key or a range start which excludes just a prefix key.
// In both cases we should return lexicographical_relation::before_all_strictly_prefixed here.
// Refs #1446.
if (_bound_weight <= 0) {
return lexicographical_relation::before_all_prefixed;
} else {
return lexicographical_relation::after_all_prefixed;
}
}
public:
struct static_row_tag_t { };
struct clustering_row_tag_t { };
struct range_tag_t { };
using range_tombstone_tag_t = range_tag_t;
explicit position_in_partition_view(static_row_tag_t) : _ck(nullptr) { }
position_in_partition_view(clustering_row_tag_t, const clustering_key_prefix& ck)
: _ck(&ck) { }
position_in_partition_view(range_tag_t, bound_view bv)
: _bound_weight(weight(bv.kind)), _ck(&bv.prefix) { }
static position_in_partition_view for_range_start(const query::clustering_range&);
static position_in_partition_view for_range_end(const query::clustering_range&);
bool is_static_row() const { return !_ck; }
friend std::ostream& operator<<(std::ostream&, position_in_partition_view);
};
inline
position_in_partition_view position_in_partition_view::for_range_start(const query::clustering_range& r) {
return {position_in_partition_view::range_tag_t(), bound_view::from_range_start(r)};
}
inline
position_in_partition_view position_in_partition_view::for_range_end(const query::clustering_range& r) {
return {position_in_partition_view::range_tag_t(), bound_view::from_range_end(r)};
}
class position_in_partition {
int _bound_weight = 0;
stdx::optional<clustering_key_prefix> _ck;
public:
struct static_row_tag_t { };
struct after_static_row_tag_t { };
struct clustering_row_tag_t { };
struct after_clustering_row_tag_t { };
struct range_tag_t { };
using range_tombstone_tag_t = range_tag_t;
explicit position_in_partition(static_row_tag_t) { }
position_in_partition(clustering_row_tag_t, clustering_key_prefix ck)
: _ck(std::move(ck)) { }
position_in_partition(after_clustering_row_tag_t, clustering_key_prefix ck)
// FIXME: Use lexicographical_relation::before_strictly_prefixed here. Refs #1446
: _bound_weight(1), _ck(std::move(ck)) { }
position_in_partition(range_tag_t, bound_view bv)
: _bound_weight(weight(bv.kind)), _ck(bv.prefix) { }
position_in_partition(after_static_row_tag_t) :
position_in_partition(range_tag_t(), bound_view::bottom()) { }
explicit position_in_partition(position_in_partition_view view)
: _bound_weight(view._bound_weight)
{
if (view._ck) {
_ck = *view._ck;
}
}
static position_in_partition before_all_clustered_rows() {
return {position_in_partition::range_tag_t(), bound_view::bottom()};
}
static position_in_partition after_all_clustered_rows() {
return {position_in_partition::range_tag_t(), bound_view::top()};
}
static position_in_partition after_key(clustering_key ck) {
return {after_clustering_row_tag_t(), std::move(ck)};
}
static position_in_partition for_key(clustering_key ck) {
return {clustering_row_tag_t(), std::move(ck)};
}
bool is_static_row() const { return !_ck; }
bool is_clustering_row() const { return _ck && !_bound_weight; }
template<typename Hasher>
void feed_hash(Hasher& hasher, const schema& s) const {
::feed_hash(hasher, _bound_weight);
if (_ck) {
::feed_hash(hasher, true);
_ck->feed_hash(hasher, s);
} else {
::feed_hash(hasher, false);
}
}
clustering_key_prefix& key() {
return *_ck;
}
const clustering_key_prefix& key() const {
return *_ck;
}
operator position_in_partition_view() const {
return { _bound_weight, _ck ? &*_ck : nullptr };
}
// Defines a total order on the union of position_in_partition and composite objects.
//
// The ordering is compatible with position_range (r). The following is satisfied for
// all cells with name c included by the range:
//
//   r.start() <= c < r.end()
//
// The ordering on composites given by this is compatible with but weaker than the cell name order.
//
// The ordering on position_in_partition given by this is compatible with but weaker than
// the ordering given by position_in_partition::tri_compare.
//
class composite_tri_compare {
const schema& _s;
public:
composite_tri_compare(const schema& s) : _s(s) {}
int operator()(position_in_partition_view a, position_in_partition_view b) const {
if (a.is_static_row() || b.is_static_row()) {
return b.is_static_row() - a.is_static_row();
}
auto&& types = _s.clustering_key_type()->types();
auto cmp = [&] (const data_type& t, bytes_view c1, bytes_view c2) { return t->compare(c1, c2); };
return lexicographical_tri_compare(types.begin(), types.end(),
a._ck->begin(_s), a._ck->end(_s),
b._ck->begin(_s), b._ck->end(_s),
cmp, a.relation(), b.relation());
}
int operator()(position_in_partition_view a, composite_view b) const {
if (b.empty()) {
return 1; // a cannot be empty.
}
if (a.is_static_row() || b.is_static()) {
return b.is_static() - a.is_static_row();
}
auto&& types = _s.clustering_key_type()->types();
auto b_values = b.values();
auto cmp = [&] (const data_type& t, bytes_view c1, bytes_view c2) { return t->compare(c1, c2); };
return lexicographical_tri_compare(types.begin(), types.end(),
a._ck->begin(_s), a._ck->end(_s),
b_values.begin(), b_values.end(),
cmp, a.relation(), relation_for_lower_bound(b));
}
int operator()(composite_view a, position_in_partition_view b) const {
return -(*this)(b, a);
}
int operator()(composite_view a, composite_view b) const {
if (a.is_static() != b.is_static()) {
return a.is_static() ? -1 : 1;
}
auto&& types = _s.clustering_key_type()->types();
auto a_values = a.values();
auto b_values = b.values();
auto cmp = [&] (const data_type& t, bytes_view c1, bytes_view c2) { return t->compare(c1, c2); };
return lexicographical_tri_compare(types.begin(), types.end(),
a_values.begin(), a_values.end(),
b_values.begin(), b_values.end(),
cmp,
relation_for_lower_bound(a),
relation_for_lower_bound(b));
}
};
// Less comparator giving the same order as composite_tri_compare.
class composite_less_compare {
composite_tri_compare _cmp;
public:
composite_less_compare(const schema& s) : _cmp(s) {}
template<typename T, typename U>
bool operator()(const T& a, const U& b) const {
return _cmp(a, b) < 0;
}
};
class tri_compare {
bound_view::tri_compare _cmp;
private:
template<typename T, typename U>
int compare(const T& a, const U& b) const {
bool a_rt_weight = bool(a._ck);
bool b_rt_weight = bool(b._ck);
if (!a_rt_weight || !b_rt_weight) {
return a_rt_weight - b_rt_weight;
}
return _cmp(*a._ck, a._bound_weight, *b._ck, b._bound_weight);
}
public:
tri_compare(const schema& s) : _cmp(s) { }
int operator()(const position_in_partition& a, const position_in_partition& b) const {
return compare(a, b);
}
int operator()(const position_in_partition_view& a, const position_in_partition_view& b) const {
return compare(a, b);
}
int operator()(const position_in_partition& a, const position_in_partition_view& b) const {
return compare(a, b);
}
int operator()(const position_in_partition_view& a, const position_in_partition& b) const {
return compare(a, b);
}
};
class less_compare {
tri_compare _cmp;
public:
less_compare(const schema& s) : _cmp(s) { }
bool operator()(const position_in_partition& a, const position_in_partition& b) const {
return _cmp(a, b) < 0;
}
bool operator()(const position_in_partition_view& a, const position_in_partition_view& b) const {
return _cmp(a, b) < 0;
}
bool operator()(const position_in_partition& a, const position_in_partition_view& b) const {
return _cmp(a, b) < 0;
}
bool operator()(const position_in_partition_view& a, const position_in_partition& b) const {
return _cmp(a, b) < 0;
}
};
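// Example (illustrative sketch): for any clustering key ck, less_compare
// orders the factory-produced positions as below, which is what makes
// after_key() usable as an exclusive lower bound:
//
//   void check_order(const schema& s, const clustering_key& ck) {
//       position_in_partition::less_compare less(s);
//       assert(less(position_in_partition::before_all_clustered_rows(),
//                   position_in_partition::for_key(ck)));
//       assert(less(position_in_partition::for_key(ck),
//                   position_in_partition::after_key(ck)));
//       assert(less(position_in_partition::after_key(ck),
//                   position_in_partition::after_all_clustered_rows()));
//   }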
class equal_compare {
clustering_key_prefix::equality _equal;
template<typename T, typename U>
bool compare(const T& a, const U& b) const {
bool a_rt_weight = bool(a._ck);
bool b_rt_weight = bool(b._ck);
return a_rt_weight == b_rt_weight
&& (!a_rt_weight || (_equal(*a._ck, *b._ck)
&& a._bound_weight == b._bound_weight));
}
public:
equal_compare(const schema& s) : _equal(s) { }
bool operator()(const position_in_partition& a, const position_in_partition& b) const {
return compare(a, b);
}
bool operator()(const position_in_partition_view& a, const position_in_partition_view& b) const {
return compare(a, b);
}
bool operator()(const position_in_partition_view& a, const position_in_partition& b) const {
return compare(a, b);
}
bool operator()(const position_in_partition& a, const position_in_partition_view& b) const {
return compare(a, b);
}
};
friend std::ostream& operator<<(std::ostream&, const position_in_partition&);
};
// Includes all position_in_partition objects p for which start <= p < end,
// and only those.
class position_range {
private:
position_in_partition _start;
position_in_partition _end;
public:
static position_range from_range(const query::clustering_range&);
static position_range for_static_row() {
return {
position_in_partition(position_in_partition::static_row_tag_t()),
position_in_partition(position_in_partition::after_static_row_tag_t())
};
}
static position_range full() {
return {
position_in_partition(position_in_partition::static_row_tag_t()),
position_in_partition::after_all_clustered_rows()
};
}
static position_range all_clustered_rows() {
return {
position_in_partition::before_all_clustered_rows(),
position_in_partition::after_all_clustered_rows()
};
}
position_range(position_range&&) = default;
position_range& operator=(position_range&&) = default;
position_range(const position_range&) = default;
position_range& operator=(const position_range&) = default;
// Constructs a position_range which covers the same rows as the given clustering_range.
// A position_range includes a fragment if it includes the position of that fragment.
position_range(const query::clustering_range&);
position_range(query::clustering_range&&);
position_range(position_in_partition start, position_in_partition end)
: _start(std::move(start))
, _end(std::move(end))
{ }
const position_in_partition& start() const { return _start; }
const position_in_partition& end() const { return _end; }
bool contains(const schema& s, position_in_partition_view pos) const;
bool overlaps(const schema& s, position_in_partition_view start, position_in_partition_view end) const;
friend std::ostream& operator<<(std::ostream&, const position_range&);
};
inline
bool position_range::contains(const schema& s, position_in_partition_view pos) const {
position_in_partition::less_compare less(s);
return !less(pos, _start) && less(pos, _end);
}
inline
bool position_range::overlaps(const schema& s, position_in_partition_view start, position_in_partition_view end) const {
position_in_partition::less_compare less(s);
return !less(end, _start) && less(start, _end);
}
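// Example (illustrative sketch): position_range is half-open, so a range built
// from two row positions includes its start row but excludes its end row
// (assuming k1 sorts before k2):
//
//   void check_half_open(const schema& s, clustering_key k1, clustering_key k2) {
//       position_range r(position_in_partition::for_key(k1),
//                        position_in_partition::for_key(k2));
//       assert(r.contains(s, position_in_partition::for_key(k1)));  // start included
//       assert(!r.contains(s, position_in_partition::for_key(k2))); // end excluded
//   }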
inline position_in_partition_view static_row::position() const
{
return position_in_partition_view(position_in_partition_view::static_row_tag_t());
}
inline position_in_partition_view clustering_row::position() const
{
return position_in_partition_view(position_in_partition_view::clustering_row_tag_t(), _ck);
}
template<>
struct move_constructor_disengages<mutation_fragment> {
enum { value = true };
};
using mutation_fragment_opt = optimized_optional<mutation_fragment>;
// streamed_mutation represents a mutation in the form of a stream of
// mutation_fragments. streamed_mutation emits mutation fragments in the order
// they should appear in the sstables, i.e. the static row is always the first
// one, then clustering rows and range tombstones are emitted according to the
// lexicographical ordering of their clustering keys and range tombstone bounds.
//
// The ordering of mutation_fragments also guarantees that by the time the
// consumer sees a clustering row it has already received all relevant tombstones.
//
// The partition key and the partition tombstone are not streamed; they are
// part of the streamed_mutation itself.
class streamed_mutation {
public:
// Determines whether streamed_mutation is in forwarding mode or not.
//
// In forwarding mode the stream does not return all fragments right away,
// but only those belonging to the current clustering range. Initially
// current range only covers the static row. The stream can be forwarded
// (even before end-of-stream) to a later range with fast_forward_to().
// Forwarding doesn't change the initial restrictions of the stream; it can
// only be used to skip over data.
//
// Monotonicity of positions is preserved by forwarding. That is, fragments
// emitted after forwarding will have greater positions than any fragments
// emitted before forwarding.
//
// For any range, all range tombstones relevant for that range which are
// present in the original stream will be emitted. Range tombstones
// emitted before forwarding which overlap with the new range are not
// necessarily re-emitted.
//
// When streamed_mutation is not in forwarding mode, fast_forward_to()
// cannot be used.
//
using forwarding = bool_class<class forwarding_tag>;
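// Example (illustrative sketch): reading two disjoint clustering ranges from
// a stream created in forwarding mode; consume_all_fragments() is a
// hypothetical helper which keeps calling the stream until it yields a
// disengaged optional.
//
//   future<> read_two_ranges(streamed_mutation& sm, query::clustering_range r1,
//                            query::clustering_range r2) {
//       return consume_all_fragments(sm) // initially: static row only
//         .then([&sm, r1] { return sm.fast_forward_to(position_range(r1)); })
//         .then([&sm] { return consume_all_fragments(sm); })
//         .then([&sm, r2] { return sm.fast_forward_to(position_range(r2)); })
//         .then([&sm] { return consume_all_fragments(sm); });
//   }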
// streamed_mutation uses batching. Implementations are supposed to fill the
// buffer with mutation fragments until is_buffer_full() returns true or the
// end of the stream is reached (see the sketch after the impl class below).
class impl {
circular_buffer<mutation_fragment> _buffer;
size_t _buffer_size = 0;
protected:
static constexpr size_t max_buffer_size_in_bytes = 8 * 1024;
schema_ptr _schema;
dht::decorated_key _key;
tombstone _partition_tombstone;
bool _end_of_stream = false;
friend class streamed_mutation;
protected:
template<typename... Args>
void push_mutation_fragment(Args&&... args) {
auto mf = mutation_fragment(std::forward<Args>(args)...);
_buffer_size += mf.memory_usage();
_buffer.emplace_back(std::move(mf));
}
public:
explicit impl(schema_ptr s, dht::decorated_key dk, tombstone pt)
: _schema(std::move(s)), _key(std::move(dk)), _partition_tombstone(pt)
{ }
virtual ~impl() { }
virtual future<> fill_buffer() = 0;
// See streamed_mutation::fast_forward_to().
virtual future<> fast_forward_to(position_range) {
throw std::bad_function_call(); // FIXME: make pure virtual after implementing everywhere.
}
bool is_end_of_stream() const { return _end_of_stream; }
bool is_buffer_empty() const { return _buffer.empty(); }
bool is_buffer_full() const { return _buffer_size >= max_buffer_size_in_bytes; }
mutation_fragment pop_mutation_fragment() {
auto mf = std::move(_buffer.front());
_buffer.pop_front();
_buffer_size -= mf.memory_usage();
return mf;
}
future<mutation_fragment_opt> operator()() {
if (is_buffer_empty()) {
if (is_end_of_stream()) {
return make_ready_future<mutation_fragment_opt>();
}
return fill_buffer().then([this] { return operator()(); });
}
return make_ready_future<mutation_fragment_opt>(pop_mutation_fragment());
}
// Removes all fragments from the buffer which are not relevant for any range
// starting at the given position. It is assumed that pos is greater than the
// positions of the fragments already in the buffer.
void forward_buffer_to(const position_in_partition& pos);
};
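// Example (illustrative sketch): a minimal impl which streams fragments from
// a pre-built vector, in the spirit of streamed_mutation_returning() declared
// below; vector_streamed_mutation is a hypothetical name.
//
//   class vector_streamed_mutation : public streamed_mutation::impl {
//       std::vector<mutation_fragment> _fragments;
//       size_t _next = 0;
//   public:
//       vector_streamed_mutation(schema_ptr s, dht::decorated_key dk, tombstone pt,
//                                std::vector<mutation_fragment> fs)
//           : impl(std::move(s), std::move(dk), pt), _fragments(std::move(fs)) { }
//       virtual future<> fill_buffer() override {
//           while (_next < _fragments.size() && !is_buffer_full()) {
//               push_mutation_fragment(std::move(_fragments[_next++]));
//           }
//           _end_of_stream = (_next == _fragments.size());
//           return make_ready_future<>();
//       }
//   };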
private:
std::unique_ptr<impl> _impl;
streamed_mutation() = default;
explicit operator bool() const { return bool(_impl); }
friend class optimized_optional<streamed_mutation>;
public:
explicit streamed_mutation(std::unique_ptr<impl> i)
: _impl(std::move(i)) { }
const partition_key& key() const { return _impl->_key.key(); }
const dht::decorated_key& decorated_key() const { return _impl->_key; }
const schema_ptr& schema() const { return _impl->_schema; }
tombstone partition_tombstone() const { return _impl->_partition_tombstone; }
bool is_end_of_stream() const { return _impl->is_end_of_stream(); }
bool is_buffer_empty() const { return _impl->is_buffer_empty(); }
bool is_buffer_full() const { return _impl->is_buffer_full(); }
mutation_fragment pop_mutation_fragment() { return _impl->pop_mutation_fragment(); }
future<> fill_buffer() { return _impl->fill_buffer(); }
// Skips to a later range of rows.
// The new range must not overlap with the current range.
//
// See docs of streamed_mutation::forwarding for semantics.
future<> fast_forward_to(position_range pr) {
return _impl->fast_forward_to(std::move(pr));
}
future<mutation_fragment_opt> operator()() {
return _impl->operator()();
}
};
// Adapts a streamed_mutation into one which is in forwarding mode.
streamed_mutation make_forwardable(streamed_mutation);
std::ostream& operator<<(std::ostream& os, const streamed_mutation& sm);
template<typename Impl, typename... Args>
streamed_mutation make_streamed_mutation(Args&&... args) {
return streamed_mutation(std::make_unique<Impl>(std::forward<Args>(args)...));
}
template<>
struct move_constructor_disengages<streamed_mutation> {
enum { value = true };
};
using streamed_mutation_opt = optimized_optional<streamed_mutation>;
/*
template<typename T>
concept bool StreamedMutationConsumer() {
return MutationFragmentConsumer<T, stop_iteration>
&& requires(T t, tombstone tomb)
{
{ t.consume(tomb) } -> stop_iteration;
t.consume_end_of_stream();
};
}
*/
template<typename Consumer>
auto consume(streamed_mutation& m, Consumer consumer) {
return do_with(std::move(consumer), [&m] (Consumer& c) {
if (c.consume(m.partition_tombstone()) == stop_iteration::yes) {
return make_ready_future().then([&] { return c.consume_end_of_stream(); });
}
return repeat([&m, &c] {
if (m.is_buffer_empty()) {
if (m.is_end_of_stream()) {
return make_ready_future<stop_iteration>(stop_iteration::yes);
}
return m.fill_buffer().then([] { return stop_iteration::no; });
}
return make_ready_future<stop_iteration>(m.pop_mutation_fragment().consume(c));
}).then([&c] {
return c.consume_end_of_stream();
});
});
}
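// Example (illustrative sketch): a consumer satisfying the
// StreamedMutationConsumer concept above, counting clustering rows;
// row_counter and count_rows are hypothetical names.
//
//   struct row_counter {
//       size_t count = 0;
//       stop_iteration consume(tombstone) { return stop_iteration::no; }
//       stop_iteration consume(static_row&&) { return stop_iteration::no; }
//       stop_iteration consume(clustering_row&&) { ++count; return stop_iteration::no; }
//       stop_iteration consume(range_tombstone&&) { return stop_iteration::no; }
//       size_t consume_end_of_stream() const { return count; }
//   };
//
//   future<size_t> count_rows(streamed_mutation& sm) {
//       return consume(sm, row_counter());
//   }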
class mutation;
streamed_mutation streamed_mutation_from_mutation(mutation, streamed_mutation::forwarding fwd = streamed_mutation::forwarding::no);
streamed_mutation streamed_mutation_returning(schema_ptr, dht::decorated_key, std::vector<mutation_fragment>, tombstone t = {});
// Requires all streamed_mutations to have the same schema.
streamed_mutation merge_mutations(std::vector<streamed_mutation>);
streamed_mutation reverse_streamed_mutation(streamed_mutation);
// range_tombstone_stream is a helper object that simplifies producing a stream
// of range tombstones and merging it with a stream of clustering rows.
// Tombstones are added using apply() and retrieved using get_next().
//
// get_next(const rows_entry&) and get_next(const mutation_fragment&) allow
// merging the stream of tombstones with a stream of clustering rows. If these
// overloads return a disengaged optional, it means that there is no tombstone
// in the stream that should be emitted before the object given as an argument
// (and, consequently, if the optional is engaged, that tombstone should be
// emitted first). After calling any of these overloads with a mutation_fragment
// at some position P in the partition, no range tombstone whose start bound is
// before P can be added to the stream.
//
// The get_next() overload which doesn't take any arguments is used to return
// the remaining tombstones. After it has been called, no new tombstones can be
// added to the stream.
class range_tombstone_stream {
const schema& _schema;
position_in_partition::less_compare _cmp;
range_tombstone_list _list;
bool _inside_range_tombstone = false;
private:
mutation_fragment_opt do_get_next();
public:
range_tombstone_stream(const schema& s) : _schema(s), _cmp(s), _list(s) { }
mutation_fragment_opt get_next(const rows_entry&);
mutation_fragment_opt get_next(const mutation_fragment&);
// Returns the next fragment with position before upper_bound, or a disengaged optional if no such fragments are left.
mutation_fragment_opt get_next(position_in_partition_view upper_bound);
mutation_fragment_opt get_next();
// Forgets all tombstones which are not relevant for any range starting at the given position.
void forward_to(position_in_partition_view);
void apply(range_tombstone&& rt) {
_list.apply(_schema, std::move(rt));
}
void apply(const range_tombstone_list& list) {
_list.apply(_schema, list);
}
void apply(const range_tombstone_list&, const query::clustering_range&);
void reset();
};
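// Example (illustrative sketch): merging buffered range tombstones with a
// sorted sequence of rows; emit() is a hypothetical output function.
//
//   void merge_with_rows(range_tombstone_stream& rts, std::deque<rows_entry>& rows) {
//       for (auto&& re : rows) {
//           while (auto mf = rts.get_next(re)) {
//               emit(std::move(*mf)); // tombstones positioned before this row
//           }
//           emit(mutation_fragment(clustering_row(std::move(re))));
//       }
//       while (auto mf = rts.get_next()) {
//           emit(std::move(*mf)); // remaining tombstones
//       }
//   }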
// mutation_hasher is an equivalent of hashing_partition_visitor for
// streamed mutations.
//
// mutation_hasher *IS NOT* compatible with hashing_partition_visitor.
//
// streamed_mutations do not guarantee that the emitted range tombstones are
// disjoint, so they need to be made disjoint before they are hashed; only in
// that form is the hash independent of unpredictable factors (e.g. which
// sstables contain which parts of the mutation).
template<typename Hasher>
class mutation_hasher {
const schema& _schema;
Hasher& _hasher;
bound_view::compare _cmp;
range_tombstone_list _rt_list;
bool _inside_range_tombstone = false;
private:
void consume_cell(const column_definition& col, const atomic_cell_or_collection& cell) {
feed_hash(_hasher, col.name());
feed_hash(_hasher, col.type->name());
cell.feed_hash(_hasher, col);
}
void consume_range_tombstone_start(const range_tombstone& rt) {
rt.start.feed_hash(_hasher, _schema);
feed_hash(_hasher, rt.start_kind);
feed_hash(_hasher, rt.tomb);
}
void consume_range_tombstone_end(const range_tombstone& rt) {
rt.end.feed_hash(_hasher, _schema);
feed_hash(_hasher, rt.end_kind);
}
void pop_rt_front() {
auto& rt = *_rt_list.tombstones().begin();
_rt_list.tombstones().erase(_rt_list.begin());
current_deleter<range_tombstone>()(&rt);
}
void consume_range_tombstones_until(const clustering_row& cr) {
while (!_rt_list.empty()) {
auto it = _rt_list.begin();
if (_inside_range_tombstone) {
if (_cmp(it->end_bound(), cr.key())) {
consume_range_tombstone_end(*it);
_inside_range_tombstone = false;
pop_rt_front();
} else {
break;
}
} else {
if (_cmp(it->start_bound(), cr.key())) {
consume_range_tombstone_start(*it);
_inside_range_tombstone = true;
} else {
break;
}
}
}
}
void consume_range_tombstones_until_end() {
if (_inside_range_tombstone) {
consume_range_tombstone_end(*_rt_list.begin());
pop_rt_front();
}
for (auto&& rt : _rt_list) {
consume_range_tombstone_start(rt);
consume_range_tombstone_end(rt);
}
}
public:
mutation_hasher(const schema& s, Hasher& h)
: _schema(s), _hasher(h), _cmp(s), _rt_list(s) { }
stop_iteration consume(tombstone t) {
feed_hash(_hasher, t);
return stop_iteration::no;
}
stop_iteration consume(const static_row& sr) {
sr.cells().for_each_cell([&] (column_id id, const atomic_cell_or_collection& cell) {
auto&& col = _schema.static_column_at(id);
consume_cell(col, cell);
});
return stop_iteration::no;
}
stop_iteration consume(const clustering_row& cr) {
consume_range_tombstones_until(cr);
cr.key().feed_hash(_hasher, _schema);
feed_hash(_hasher, cr.tomb());
feed_hash(_hasher, cr.marker());
cr.cells().for_each_cell([&] (column_id id, const atomic_cell_or_collection& cell) {
auto&& col = _schema.regular_column_at(id);
consume_cell(col, cell);
});
return stop_iteration::no;
}
stop_iteration consume(range_tombstone&& rt) {
_rt_list.apply(_schema, std::move(rt));
return stop_iteration::no;
}
void consume_end_of_stream() {
consume_range_tombstones_until_end();
}
};
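// Example (illustrative sketch): hashing a whole streamed_mutation with the
// consume() helper above; my_hasher stands for any hasher type usable with
// feed_hash() and is not defined in this header.
//
//   future<> hash_mutation(streamed_mutation& sm, my_hasher& h) {
//       return consume(sm, mutation_hasher<my_hasher>(*sm.schema(), h));
//   }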