Files
scylladb/service/storage_proxy_stats.hh
Petr Gusev 819d59eeba storage_proxy_stats: add fenced_out_requests metric
We have to drop const qualifiers because now check_fence
needs to mutate this metric.
2025-09-15 11:24:53 +02:00

232 lines
7.8 KiB
C++

/*
* Copyright (C) 2018-present ScyllaDB
*/
/*
* SPDX-License-Identifier: LicenseRef-ScyllaDB-Source-Available-1.0
*/
#pragma once
#include "utils/estimated_histogram.hh"
#include "utils/histogram.hh"
#include <seastar/core/metrics.hh>
#include "locator/host_id.hh"
namespace locator { class topology; }
namespace service {
namespace storage_proxy_stats {
// split statistics counters
struct split_stats {
static seastar::metrics::label datacenter_label;
private:
struct stats_counter {
uint64_t val = 0;
};
// counter of operations performed on a local Node
stats_counter _local;
// counters of operations performed on external Nodes aggregated per Nodes' DCs
std::unordered_map<sstring, stats_counter> _dc_stats;
// collectd registrations container
seastar::metrics::metric_groups _metrics;
// a prefix string that will be used for a collectd counters' description
sstring _short_description_prefix;
sstring _long_description_prefix;
// a statistics category, e.g. "client" or "replica"
sstring _category;
// type of operation (data/digest/mutation_data)
sstring _op_type;
// whether to register per-endpoint metrics automatically
bool _auto_register_metrics;
scheduling_group _sg;
public:
/**
* @param category a statistics category, e.g. "client" or "replica"
* @param short_description_prefix a short description prefix
* @param long_description_prefix a long description prefix
*/
split_stats(const sstring& category, const sstring& short_description_prefix, const sstring& long_description_prefix, const sstring& op_type, bool auto_register_metrics = true);
void register_metrics_local();
void register_metrics_for(sstring dc, locator::host_id ep);
/**
* Get a reference to the statistics counter corresponding to the given
* destination.
*
* @param ep address of a destination
*
* @return a reference to the requested counter
*/
uint64_t& get_ep_stat(const locator::topology& topo, locator::host_id ep) noexcept;
};
struct write_stats {
// total write attempts
split_stats writes_attempts;
split_stats writes_errors;
split_stats background_replica_writes_failed;
// write attempts due to Read Repair logic
split_stats read_repair_write_attempts;
utils::timed_rate_moving_average write_unavailables;
utils::timed_rate_moving_average write_timeouts;
utils::timed_rate_moving_average write_rate_limited_by_replicas;
utils::timed_rate_moving_average write_rate_limited_by_coordinator;
utils::timed_rate_moving_average_summary_and_histogram write;
utils::timed_rate_moving_average cas_write_unavailables;
utils::timed_rate_moving_average cas_write_timeouts;
utils::timed_rate_moving_average_summary_and_histogram cas_write;
utils::estimated_histogram cas_write_contention;
uint64_t writes = 0;
// A CQL write query arrived to a non-replica node and was
// forwarded by a coordinator to a replica
uint64_t writes_coordinator_outside_replica_set = 0;
// A CQL read query arrived to a non-replica node and was
// forwarded by a coordinator to a replica
uint64_t reads_coordinator_outside_replica_set = 0;
uint64_t background_writes = 0; // client no longer waits for the write
uint64_t throttled_writes = 0; // total number of writes ever delayed due to throttling
uint64_t throttled_base_writes = 0; // current number of base writes delayed due to view update backlog
uint64_t total_throttled_base_writes = 0; // total number of base writes delayed due to view update backlog
uint64_t background_writes_failed = 0;
uint64_t writes_failed_due_to_too_many_in_flight_hints = 0;
uint64_t cas_write_unfinished_commit = 0;
uint64_t cas_write_condition_not_met = 0;
uint64_t cas_write_timeout_due_to_uncertainty = 0;
uint64_t cas_failed_read_round_optimization = 0;
uint16_t cas_now_pruning = 0;
uint64_t cas_prune = 0;
uint64_t cas_coordinator_dropped_prune = 0;
uint64_t cas_replica_dropped_prune = 0;
seastar::metrics::metric_groups _metrics;
std::chrono::microseconds last_mv_flow_control_delay; // delay added for MV flow control in the last request
uint64_t mv_flow_control_delay = 0; // total delay added for MV flow control (in microseconds)
public:
write_stats();
write_stats(const sstring& category, bool auto_register_stats);
void register_stats();
void register_split_metrics_local();
};
struct stats : public write_stats {
seastar::metrics::metric_groups _metrics;
utils::timed_rate_moving_average read_timeouts;
utils::timed_rate_moving_average read_unavailables;
utils::timed_rate_moving_average read_rate_limited_by_replicas;
utils::timed_rate_moving_average read_rate_limited_by_coordinator;
utils::timed_rate_moving_average range_slice_timeouts;
utils::timed_rate_moving_average range_slice_unavailables;
utils::timed_rate_moving_average cas_read_timeouts;
utils::timed_rate_moving_average cas_read_unavailables;
utils::estimated_histogram cas_read_contention;
uint64_t read_repair_attempts = 0;
uint64_t read_repair_repaired_blocking = 0;
uint64_t read_repair_repaired_background = 0;
uint64_t global_read_repairs_canceled_due_to_concurrent_write = 0;
// number of mutations received as a coordinator
uint64_t received_mutations = 0;
// number of counter updates received as a leader
uint64_t received_counter_updates = 0;
// number of forwarded mutations
uint64_t forwarded_mutations = 0;
uint64_t forwarding_errors = 0;
// number of read requests received as a replica
uint64_t replica_data_reads = 0;
uint64_t replica_digest_reads = 0;
uint64_t replica_mutation_data_reads = 0;
uint64_t replica_cross_shard_ops = 0;
// number of requests that resulted in a stale_topology_exception
uint64_t replica_fenced_out_requests = 0;
utils::timed_rate_moving_average_summary_and_histogram read;
utils::timed_rate_moving_average_summary_and_histogram range;
utils::timed_rate_moving_average_summary_and_histogram cas_read;
uint64_t reads = 0;
uint64_t foreground_reads = 0; // client still waits for the read
uint64_t read_retries = 0; // read is retried with new limit
uint64_t speculative_digest_reads = 0;
uint64_t speculative_data_reads = 0;
uint64_t cas_read_unfinished_commit = 0;
uint64_t cas_foreground = 0;
uint64_t cas_total_running = 0;
uint64_t cas_total_operations = 0;
// Data read attempts
split_stats data_read_attempts;
split_stats data_read_completed;
split_stats data_read_errors;
// Digest read attempts
split_stats digest_read_attempts;
split_stats digest_read_completed;
split_stats digest_read_errors;
// Mutation data read attempts
split_stats mutation_data_read_attempts;
split_stats mutation_data_read_completed;
split_stats mutation_data_read_errors;
// Received hints
uint64_t received_hints_total = 0;
uint64_t received_hints_bytes_total = 0;
public:
stats();
void register_stats();
void register_split_metrics_local();
};
/*** This struct represents stats that has meaning (only or also)
* globally. For example background_write_bytes are used to decide
* if to throttle requests and it make little sense to check it
* per scheduling group, on the other hand this statistic has value
* in figuring out how much load each scheduling group generates
* on the system, this statistic should be handled elsewhere, i.e:
* in the write_stats struct.
*/
struct global_write_stats {
seastar::metrics::metric_groups _metrics;
uint64_t background_write_bytes = 0;
uint64_t queued_write_bytes = 0;
void register_stats();
};
/***
* Following the convention of stats and write_stats
*/
struct global_stats : public global_write_stats {
void register_stats();
};
}
}