Files
scylladb/test/boost/advanced_rpc_compressor_test.cc
Michał Chojnowski 0fd1050784 utils: add advanced_rpc_compressor
Adds glue needed to pass lz4 and zstd with streaming and/or dictionaries
as the network traffic compressors for Seastar's RPC servers.

The main jobs of this glue are:
1. Implementing the API expected by Seastar from RPC compressors.
2. Expose metrics about the effectiveness of the compression.
3. Allow dynamically switching algorithms and dictionaries on a running
   connection, without any extra waits.

The biggest design decision here is that the choice of algorithm and dictionary
is negotiated by both sides of the connection, not dictated unilaterally by the
sender.

The negotiation algorithm is fairly complicated (a TLA+ model validating
it is included in the commit). Unilateral compression choice would be much simpler.
However, negotiation avoids re-sending the same dictionary over every
connection in the cluster after dictionary updates (with one-way communication,
it's the only reliable way to ensure that our receiver possesses the dictionary
we are about to start using), lets receivers ask for a cheaper compression mode
if they want, and lets them refuse to update a dictionary if they don't think
they have enough free memory for that.

In hindsight, those properties probably weren't worth the extra complexity and
extra development effort.

Zstd can be quite expensive, so this patch also includes a mechanism which
temporarily downgrades the compressor from zstd to lz4 if zstd has been
using too much CPU in a given slice of time. But it should be noted that
this can't be treated as a reliable "protection" from negative performance
effects of zstd, since a downgrade can happen on the sender side,
and receivers are at the mercy of senders.
2024-12-23 23:37:02 +01:00

292 lines
13 KiB
C++

/*
* Copyright (C) 2023-present ScyllaDB
*/
/*
* SPDX-License-Identifier: LicenseRef-ScyllaDB-Source-Available-1.0
*/
#include "seastar/core/manual_clock.hh"
#include "seastar/util/closeable.hh"
#include "test/lib/random_utils.hh"
#include "test/lib/scylla_test_case.hh"
#include "utils/advanced_rpc_compressor.hh"
#include "utils/advanced_rpc_compressor_protocol.hh"
using namespace seastar;
using namespace std::chrono_literals;
static utils::dict_ptr make_dict(uint64_t timestamp, std::vector<std::byte> content = {}) {
return make_lw_shared(make_foreign(make_lw_shared(utils::shared_dict(std::move(content), timestamp, {}))));
}
SEASTAR_THREAD_TEST_CASE(test_control_protocol_sanity) {
condition_variable cv;
auto dict_1 = make_dict(1);
auto dict_2 = make_dict(2);
utils::control_protocol alice(cv);
utils::control_protocol bob(cv);
auto settle = [&] {
bool run = true;
while (run) {
run = false;
if (auto msg = alice.produce_control_header()) {
bob.consume_control_header(*msg);
run = true;
}
if (auto msg = bob.produce_control_header()) {
alice.consume_control_header(*msg);
run = true;
}
}
};
alice.announce_dict(dict_1);
bob.announce_dict(dict_2);
settle();
BOOST_REQUIRE(alice.sender_current_dict().id == utils::shared_dict::dict_id());
BOOST_REQUIRE(bob.sender_current_dict().id == utils::shared_dict::dict_id());
alice.announce_dict(dict_2);
settle();
BOOST_REQUIRE(alice.sender_current_dict().id == (**dict_2).id);
BOOST_REQUIRE(bob.sender_current_dict().id == (**dict_2).id);
alice.announce_dict(nullptr);
settle();
BOOST_REQUIRE(alice.sender_current_dict().id == (**dict_2).id);
BOOST_REQUIRE(bob.sender_current_dict().id == (**dict_2).id);
bob.announce_dict(nullptr);
settle();
BOOST_REQUIRE(alice.sender_current_dict().id == utils::shared_dict::dict_id());
BOOST_REQUIRE(bob.sender_current_dict().id == utils::shared_dict::dict_id());
}
temporary_buffer<char> bytes_view_to_temporary_buffer(bytes_view bv) {
return temporary_buffer<char>(reinterpret_cast<const char*>(bv.data()), bv.size());
}
template<class T>
concept RpcBuf = std::same_as<T, rpc::rcv_buf> || std::same_as<T, rpc::snd_buf>;
template <RpcBuf Buf>
bytes rpc_buf_to_bytes(const Buf& data) {
if (auto src = std::get_if<temporary_buffer<char>>(&data.bufs)) {
return bytes(reinterpret_cast<const bytes::value_type*>(src->get()), src->size());
}
auto src = std::get<std::vector<temporary_buffer<char>>>(data.bufs).data();
auto out = bytes(bytes::initialized_later{}, data.size);
size_t i = 0;
while (i < data.size) {
std::memcpy(&out[i], src->get(), src->size());
i += src->size();
++src;
}
return out;
}
template <RpcBuf Buf, RpcBuf BufFrom>
Buf convert_rpc_buf(BufFrom data) {
Buf b;
b.size = data.size;
b.bufs = std::move(data.bufs);
return b;
}
class tracker_without_clock final : public utils::advanced_rpc_compressor::tracker {
virtual uint64_t get_steady_nanos() const override {
return 0;
}
public:
using tracker::tracker;
};
SEASTAR_THREAD_TEST_CASE(test_tracker_basic_sanity) {
for (const bool checksumming : {false, true})
for (const auto& zstd_cpu_limit : {0.0, 1.0}) {
auto cfg = utils::advanced_rpc_compressor::tracker::config{
.zstd_quota_fraction{zstd_cpu_limit},
.algo_config = utils::updateable_value<utils::algo_config>{
{utils::compression_algorithm::type::ZSTD, utils::compression_algorithm::type::LZ4},
},
.checksumming = utils::updateable_value<bool>{checksumming},
};
tracker_without_clock tracker{cfg};
auto feature_string = tracker.supported();
auto server_compressor = tracker.negotiate(feature_string, true, [] { return make_ready_future<>(); });
auto close_server_compressor = deferred_close(*server_compressor);
auto client_compressor = tracker.negotiate(server_compressor->name(), false, [] { return make_ready_future<>(); });
auto close_client_compressor = deferred_close(*client_compressor);
for (const auto [a, b] : {
std::make_pair(std::ref(server_compressor), std::ref(client_compressor)),
std::make_pair(std::ref(client_compressor), std::ref(server_compressor)),
})
for (int repeat = 0; repeat < 10; ++repeat) {
auto message = tests::random::get_bytes(100000) + bytes(size_t(100000), bytes::value_type(0));
constexpr int head_space = 4;
auto compressed = a->compress(head_space, rpc::snd_buf{bytes_view_to_temporary_buffer(message)});
compressed.front().trim_front(head_space);
compressed.size -= head_space;
// Mess with the header deserializer by prepending an empty fragment to `compressed`.
if (auto src = std::get_if<temporary_buffer<char>>(&compressed.bufs)) {
auto vec = std::vector<temporary_buffer<char>>();
vec.push_back(std::move(*src));
compressed.bufs = std::move(vec);
}
auto &vec = std::get<std::vector<temporary_buffer<char>>>(compressed.bufs);
vec.insert(vec.begin(), temporary_buffer<char>());
auto decompressed = b->decompress(convert_rpc_buf<rpc::rcv_buf>(std::move(compressed)));
BOOST_REQUIRE_EQUAL(message, rpc_buf_to_bytes(decompressed));
}
}
}
SEASTAR_THREAD_TEST_CASE(test_tracker_dict_sanity) {
for (const auto& algo : {utils::compression_algorithm::type::ZSTD, utils::compression_algorithm::type::LZ4}) {
auto cfg = utils::advanced_rpc_compressor::tracker::config{
.zstd_quota_fraction{1.0},
.algo_config = utils::updateable_value<utils::algo_config>{
{utils::compression_algorithm::type::RAW},
},
};
tracker_without_clock tracker{cfg};
auto feature_string = tracker.supported();
auto server_compressor = tracker.negotiate(feature_string, true, [] { return make_ready_future<>(); });
auto close_server_compressor = deferred_close(*server_compressor);
auto client_compressor = tracker.negotiate(server_compressor->name(), false, [] { return make_ready_future<>(); });
auto close_client_compressor = deferred_close(*client_compressor);
auto message = tests::random::get_bytes(8192);
auto message_view = std::span<const std::byte>(reinterpret_cast<const std::byte*>(message.data()), message.size());
// We will send messages which perfectly match the dict.
// If dict negotiation succeeds as expected, this should result in very small messages.
auto dict = make_dict(1, {message_view.begin(), message_view.end()});
tracker.announce_dict(dict);
tracker.set_supported_algos(utils::compression_algorithm_set::singleton(algo));
// Arbitrary number of repeats.
for (int repeat = 0; repeat < 10; ++repeat)
for (const auto [a, b] : {
std::make_pair(std::ref(server_compressor), std::ref(client_compressor)),
std::make_pair(std::ref(client_compressor), std::ref(server_compressor)),
}) {
constexpr int head_space = 4;
auto compressed = a->compress(head_space, rpc::snd_buf{bytes_view_to_temporary_buffer(message)});
// The dict negotiation should have settled after a few repeats.
if (repeat >= 5) {
// `100` here is an arbitrary "small size".
BOOST_REQUIRE_LE(compressed.size, 100);
}
compressed.front().trim_front(head_space);
compressed.size -= head_space;
auto decompressed = b->decompress(convert_rpc_buf<rpc::rcv_buf>(std::move(compressed)));
BOOST_REQUIRE_EQUAL(message, rpc_buf_to_bytes(decompressed));
}
}
}
SEASTAR_THREAD_TEST_CASE(test_tracker_cpu_limit_shortterm) {
constexpr int quota = 10;
constexpr int quota_refresh = 128;
auto cfg = utils::advanced_rpc_compressor::tracker::config{
.zstd_quota_fraction{float(quota) / quota_refresh},
.zstd_quota_refresh_ms{quota_refresh},
.algo_config = utils::updateable_value<utils::algo_config>{
{utils::compression_algorithm::type::ZSTD, utils::compression_algorithm::type::LZ4},
},
};
struct manual_clock_tracker : utils::advanced_rpc_compressor::tracker_with_clock<manual_clock, manual_clock> {
using tracker_with_clock::tracker_with_clock;
virtual uint64_t get_steady_nanos() const override {
manual_clock::advance(std::chrono::milliseconds(1));
return std::chrono::nanoseconds(manual_clock::now().time_since_epoch()).count();
}
};
manual_clock_tracker tracker{cfg};
auto feature_string = tracker.supported();
auto server_compressor = tracker.negotiate(feature_string, true, [] { return make_ready_future<>(); });
auto close_server_compressor = deferred_close(*server_compressor);
auto client_compressor = tracker.negotiate(server_compressor->name(), false, [] { return make_ready_future<>(); });
auto close_client_compressor = deferred_close(*client_compressor);
// Settle negotiations
for (int i = 0; i < 3; ++i) {
auto msg = server_compressor->compress(0, rpc::snd_buf{0});
client_compressor->decompress(convert_rpc_buf<rpc::rcv_buf>(std::move(msg)));
msg = client_compressor->compress(0, rpc::snd_buf{0});
server_compressor->decompress(convert_rpc_buf<rpc::rcv_buf>(std::move(msg)));
}
// Refresh quotas.
manual_clock::advance(std::chrono::milliseconds(1000));
for (int repeat = 0; repeat < 5; ++repeat) {
auto before = tracker.get_stats()[utils::compression_algorithm(utils::compression_algorithm::type::ZSTD).idx()];
// Do many compressions.
for (int i = 0; i < 30; ++i) {
client_compressor->compress(0, rpc::snd_buf{0});
}
// Check that the quota is respected.
auto after = tracker.get_stats()[utils::compression_algorithm(utils::compression_algorithm::type::ZSTD).idx()];
BOOST_REQUIRE_EQUAL(std::chrono::nanoseconds(after.compression_cpu_nanos - before.compression_cpu_nanos), std::chrono::milliseconds(quota));
// Refresh quotas.
manual_clock::advance(std::chrono::milliseconds(1000));
}
}
SEASTAR_THREAD_TEST_CASE(test_tracker_cpu_limit_longterm) {
constexpr static auto step = std::chrono::milliseconds(10);
constexpr static auto limit = 0.1;
auto cfg = utils::advanced_rpc_compressor::tracker::config{
.zstd_quota_fraction{1},
.zstd_quota_refresh_ms{1},
.zstd_longterm_quota_fraction{limit},
.zstd_longterm_quota_refresh_ms{1000},
.algo_config = utils::updateable_value<utils::algo_config>{
{utils::compression_algorithm::type::ZSTD, utils::compression_algorithm::type::LZ4},
},
};
struct manual_clock_tracker : utils::advanced_rpc_compressor::tracker_with_clock<manual_clock, manual_clock> {
using tracker_with_clock::tracker_with_clock;
virtual uint64_t get_steady_nanos() const override {
manual_clock::advance(step);
return std::chrono::nanoseconds(manual_clock::now().time_since_epoch()).count();
}
};
manual_clock_tracker tracker{cfg};
auto feature_string = tracker.supported();
auto server_compressor = tracker.negotiate(feature_string, true, [] { return make_ready_future<>(); });
auto close_server_compressor = deferred_close(*server_compressor);
auto client_compressor = tracker.negotiate(server_compressor->name(), false, [] { return make_ready_future<>(); });
auto close_client_compressor = deferred_close(*client_compressor);
// Settle negotiations
for (int i = 0; i < 3; ++i) {
auto msg = server_compressor->compress(0, rpc::snd_buf{0});
client_compressor->decompress(convert_rpc_buf<rpc::rcv_buf>(std::move(msg)));
msg = client_compressor->compress(0, rpc::snd_buf{0});
server_compressor->decompress(convert_rpc_buf<rpc::rcv_buf>(std::move(msg)));
}
constexpr int n_compressions = 1000;
auto used_before = tracker.get_stats()[utils::compression_algorithm(utils::compression_algorithm::type::ZSTD).idx()];
auto clock_before = manual_clock::now();
// Do many compressions.
for (int i = 0; i < n_compressions; ++i) {
client_compressor->compress(0, rpc::snd_buf{0});
}
// Check that the quota is respected.
auto used_after = tracker.get_stats()[utils::compression_algorithm(utils::compression_algorithm::type::ZSTD).idx()];
auto clock_after = manual_clock::now();
auto used = std::chrono::nanoseconds(used_after.compression_cpu_nanos - used_before.compression_cpu_nanos);
auto elapsed = clock_after - clock_before;
BOOST_REQUIRE_GE(used, elapsed * limit * 0.9);
BOOST_REQUIRE_LE(used, elapsed * limit * 1.1);
}