We have added the finished percentage for repair based node operations.
This patch adds the finished percentage for node ops using the old
streaming.
Example output:
scylla_streaming_finished_percentage{ops="bootstrap",shard="0"} 1.000000
scylla_streaming_finished_percentage{ops="decommission",shard="0"} 1.000000
scylla_streaming_finished_percentage{ops="rebuild",shard="0"} 0.561945
scylla_streaming_finished_percentage{ops="removenode",shard="0"} 1.000000
scylla_streaming_finished_percentage{ops="repair",shard="0"} 1.000000
scylla_streaming_finished_percentage{ops="replace",shard="0"} 1.000000
In addition to the metrics, log shows the percentage is added.
[shard 0] range_streamer - Finished 2698 out of 2817 ranges for rebuild, finished percentage=0.95775646
Fixes #11600
Closes #11601
195 lines
7.1 KiB
C++
195 lines
7.1 KiB
C++
/*
|
|
*
|
|
* Modified by ScyllaDB
|
|
* Copyright (C) 2015-present ScyllaDB
|
|
*/
|
|
|
|
/*
|
|
* SPDX-License-Identifier: (AGPL-3.0-or-later and Apache-2.0)
|
|
*/
|
|
|
|
#pragma once
|
|
#include "streaming/stream_fwd.hh"
|
|
#include "streaming/progress_info.hh"
|
|
#include "streaming/stream_reason.hh"
|
|
#include <seastar/core/shared_ptr.hh>
|
|
#include <seastar/core/distributed.hh>
|
|
#include "utils/updateable_value.hh"
|
|
#include "utils/serialized_action.hh"
|
|
#include "gms/i_endpoint_state_change_subscriber.hh"
|
|
#include "gms/inet_address.hh"
|
|
#include "gms/endpoint_state.hh"
|
|
#include "gms/application_state.hh"
|
|
#include <seastar/core/semaphore.hh>
|
|
#include <seastar/core/metrics_registration.hh>
|
|
#include <map>
|
|
|
|
namespace db {
|
|
class config;
|
|
class system_distributed_keyspace;
|
|
namespace view {
|
|
class view_update_generator;
|
|
}
|
|
}
|
|
|
|
namespace service {
|
|
class migration_manager;
|
|
};
|
|
|
|
namespace netw {
|
|
class messaging_service;
|
|
};
|
|
|
|
namespace gms {
|
|
class gossiper;
|
|
}
|
|
|
|
namespace streaming {
|
|
|
|
struct stream_bytes {
|
|
int64_t bytes_sent = 0;
|
|
int64_t bytes_received = 0;
|
|
friend stream_bytes operator+(const stream_bytes& x, const stream_bytes& y) {
|
|
stream_bytes ret(x);
|
|
ret += y;
|
|
return ret;
|
|
}
|
|
friend bool operator!=(const stream_bytes& x, const stream_bytes& y) {
|
|
return x.bytes_sent != y.bytes_sent && x.bytes_received != y.bytes_received;
|
|
}
|
|
friend bool operator==(const stream_bytes& x, const stream_bytes& y) {
|
|
return x.bytes_sent == y.bytes_sent && x.bytes_received == y.bytes_received;
|
|
}
|
|
stream_bytes& operator+=(const stream_bytes& x) {
|
|
bytes_sent += x.bytes_sent;
|
|
bytes_received += x.bytes_received;
|
|
return *this;
|
|
}
|
|
};
|
|
|
|
/**
|
|
* StreamManager manages currently running {@link StreamResultFuture}s and provides status of all operation invoked.
|
|
*
|
|
* All stream operation should be created through this class to track streaming status and progress.
|
|
*/
|
|
class stream_manager : public gms::i_endpoint_state_change_subscriber, public enable_shared_from_this<stream_manager>, public peering_sharded_service<stream_manager> {
|
|
using inet_address = gms::inet_address;
|
|
using endpoint_state = gms::endpoint_state;
|
|
using application_state = gms::application_state;
|
|
using versioned_value = gms::versioned_value;
|
|
/*
|
|
* Currently running streams. Removed after completion/failure.
|
|
* We manage them in two different maps to distinguish plan from initiated ones to
|
|
* receiving ones withing the same JVM.
|
|
*/
|
|
private:
|
|
sharded<replica::database>& _db;
|
|
sharded<db::system_distributed_keyspace>& _sys_dist_ks;
|
|
sharded<db::view::view_update_generator>& _view_update_generator;
|
|
sharded<netw::messaging_service>& _ms;
|
|
sharded<service::migration_manager>& _mm;
|
|
gms::gossiper& _gossiper;
|
|
|
|
std::unordered_map<plan_id, shared_ptr<stream_result_future>> _initiated_streams;
|
|
std::unordered_map<plan_id, shared_ptr<stream_result_future>> _receiving_streams;
|
|
std::unordered_map<plan_id, std::unordered_map<gms::inet_address, stream_bytes>> _stream_bytes;
|
|
uint64_t _total_incoming_bytes{0};
|
|
uint64_t _total_outgoing_bytes{0};
|
|
semaphore _mutation_send_limiter{256};
|
|
seastar::metrics::metric_groups _metrics;
|
|
std::unordered_map<streaming::stream_reason, float> _finished_percentage;
|
|
|
|
utils::updateable_value<uint32_t> _io_throughput_mbs;
|
|
serialized_action _io_throughput_updater = serialized_action([this] { return update_io_throughput(_io_throughput_mbs()); });
|
|
std::optional<utils::observer<uint32_t>> _io_throughput_option_observer;
|
|
|
|
public:
|
|
stream_manager(db::config& cfg, sharded<replica::database>& db,
|
|
sharded<db::system_distributed_keyspace>& sys_dist_ks,
|
|
sharded<db::view::view_update_generator>& view_update_generator,
|
|
sharded<netw::messaging_service>& ms,
|
|
sharded<service::migration_manager>& mm,
|
|
gms::gossiper& gossiper);
|
|
|
|
future<> start();
|
|
future<> stop();
|
|
|
|
semaphore& mutation_send_limiter() { return _mutation_send_limiter; }
|
|
|
|
void register_sending(shared_ptr<stream_result_future> result);
|
|
|
|
void register_receiving(shared_ptr<stream_result_future> result);
|
|
|
|
shared_ptr<stream_result_future> get_sending_stream(streaming::plan_id plan_id) const;
|
|
|
|
shared_ptr<stream_result_future> get_receiving_stream(streaming::plan_id plan_id) const;
|
|
|
|
std::vector<shared_ptr<stream_result_future>> get_all_streams() const;
|
|
|
|
replica::database& db() noexcept { return _db.local(); }
|
|
netw::messaging_service& ms() noexcept { return _ms.local(); }
|
|
|
|
const std::unordered_map<plan_id, shared_ptr<stream_result_future>>& get_initiated_streams() const {
|
|
return _initiated_streams;
|
|
}
|
|
|
|
const std::unordered_map<plan_id, shared_ptr<stream_result_future>>& get_receiving_streams() const {
|
|
return _receiving_streams;
|
|
}
|
|
|
|
void remove_stream(streaming::plan_id plan_id);
|
|
|
|
void show_streams() const;
|
|
|
|
future<> shutdown() {
|
|
fail_all_sessions();
|
|
return make_ready_future<>();
|
|
}
|
|
|
|
void update_progress(streaming::plan_id plan_id, gms::inet_address peer, progress_info::direction dir, size_t fm_size);
|
|
future<> update_all_progress_info();
|
|
|
|
void remove_progress(streaming::plan_id plan_id);
|
|
|
|
stream_bytes get_progress(streaming::plan_id plan_id, gms::inet_address peer) const;
|
|
|
|
stream_bytes get_progress(streaming::plan_id plan_id) const;
|
|
|
|
future<> remove_progress_on_all_shards(streaming::plan_id plan_id);
|
|
|
|
future<stream_bytes> get_progress_on_all_shards(streaming::plan_id plan_id, gms::inet_address peer) const;
|
|
|
|
future<stream_bytes> get_progress_on_all_shards(streaming::plan_id plan_id) const;
|
|
|
|
future<stream_bytes> get_progress_on_all_shards(gms::inet_address peer) const;
|
|
|
|
future<stream_bytes> get_progress_on_all_shards() const;
|
|
|
|
stream_bytes get_progress_on_local_shard() const;
|
|
|
|
shared_ptr<stream_session> get_session(streaming::plan_id plan_id, gms::inet_address from, const char* verb, std::optional<table_id> cf_id = {});
|
|
|
|
public:
|
|
virtual future<> on_join(inet_address endpoint, endpoint_state ep_state) override { return make_ready_future(); }
|
|
virtual future<> before_change(inet_address endpoint, endpoint_state current_state, application_state new_state_key, const versioned_value& new_value) override { return make_ready_future(); }
|
|
virtual future<> on_change(inet_address endpoint, application_state state, const versioned_value& value) override { return make_ready_future(); }
|
|
virtual future<> on_alive(inet_address endpoint, endpoint_state state) override { return make_ready_future(); }
|
|
virtual future<> on_dead(inet_address endpoint, endpoint_state state) override;
|
|
virtual future<> on_remove(inet_address endpoint) override;
|
|
virtual future<> on_restart(inet_address endpoint, endpoint_state ep_state) override;
|
|
|
|
private:
|
|
void fail_all_sessions();
|
|
void fail_sessions(inet_address endpoint);
|
|
bool has_peer(inet_address endpoint) const;
|
|
|
|
void init_messaging_service_handler();
|
|
future<> uninit_messaging_service_handler();
|
|
future<> update_io_throughput(uint32_t value_mbs);
|
|
|
|
public:
|
|
void update_finished_percentage(streaming::stream_reason reason, float percentage);
|
|
};
|
|
|
|
} // namespace streaming
|