Files
scylladb/test/boost/continuous_data_consumer_test.cc
Botond Dénes 936619a8d3 sstables/continuous_data_consumer: track buffers used for parsing
Based on heap profiling, buffers used for storing half-parsed fields are
a major contributor to the overall memory consumption of reads. This
memory was completely "under the radar" before. Track it by using
tracked `temporary_buffer` instances everywhere in
`continuous_data_consumer`. As `continuous_data_consumer` is the basis
for parsing all index and data files, adding the tracking here
automatically covers all data, index and promoted index parsing.

I'm almost convinced that there is a better place to store the `permit`
than the three places used now, but so far I have been unable to completely
decipher our data/index file parsing class hierarchy.
2020-01-28 08:13:16 +02:00

117 lines
3.4 KiB
C++

/*
* Copyright (C) 2018 ScyllaDB
*/
/*
* This file is part of Scylla.
*
* Scylla is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Scylla is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Scylla. If not, see <http://www.gnu.org/licenses/>.
*/
#include "vint-serialization.hh"
#include "sstables/consumer.hh"
#include "bytes.hh"
#include "utils/buffer_input_stream.hh"
#include <boost/test/unit_test.hpp>
#include <seastar/core/iostream.hh>
#include <seastar/core/temporary_buffer.hh>
#include <seastar/core/thread.hh>
#include <seastar/testing/test_case.hh>
#include <seastar/testing/thread_test_case.hh>
#include <random>
namespace {

/// Consumer used to exercise unsigned vint parsing.
///
/// The input stream holds the same value serialized MULTIPLIER times back to
/// back; every value read from the stream is compared against the value that
/// was written.
class test_consumer final : public data_consumer::continuous_data_consumer<test_consumer> {
    /// Number of copies of the tested value written to the input stream.
    static const int MULTIPLIER = 10;

    /// The value every parsed vint is expected to equal.
    uint64_t _tested_value;
    /// 0: start reading the next vint,
    /// 1: the previous read_unsigned_vint() call did not report `ready`,
    /// 2: all MULTIPLIER values have been checked.
    int _state = 0;
    /// How many values have been checked so far.
    int _count = 0;

    /// Fails the test unless `actual` equals the value under test.
    void check(uint64_t actual) {
        BOOST_REQUIRE_EQUAL(_tested_value, actual);
    }

    /// Total size of the input: MULTIPLIER serialized copies of `tested_value`.
    static uint64_t calculate_length(uint64_t tested_value) {
        return unsigned_vint::serialized_size(tested_value) * MULTIPLIER;
    }

    /// Builds the input stream: a single buffer filled with MULTIPLIER
    /// serialized copies of `tested_value`.
    static input_stream<char> prepare_stream(uint64_t tested_value) {
        temporary_buffer<char> storage(calculate_length(tested_value));
        // Write cursor; each serialize() call reports how far to advance it.
        bytes::value_type* cursor = reinterpret_cast<bytes::value_type*>(storage.get_write());
        for (int remaining = MULTIPLIER; remaining > 0; --remaining) {
            cursor += unsigned_vint::serialize(tested_value, cursor);
        }
        // NOTE(review): the callback returning 1 presumably makes the stream
        // hand out one byte at a time, so multi-byte vints straddle buffers --
        // confirm against utils/buffer_input_stream.hh.
        return make_buffer_input_stream(std::move(storage), [] { return 1; });
    }

public:
    /// Creates a consumer over a freshly prepared stream for `tested_value`.
    test_consumer(uint64_t tested_value)
        : continuous_data_consumer(no_reader_permit(), prepare_stream(tested_value), 0, calculate_length(tested_value))
        , _tested_value(tested_value)
    { }

    // NOTE(review): these two look like hooks required by the CRTP base class;
    // confirm against sstables/consumer.hh.
    bool non_consuming() { return false; }

    void verify_end_state() {}

    /// Advances the state machine by one step.
    ///
    /// Returns proceed::no once all MULTIPLIER values have been checked and
    /// proceed::yes otherwise.
    data_consumer::processing_result process_state(temporary_buffer<char>& data) {
        const bool starting_read = _state == 0;
        const bool resuming_read = _state == 1;

        if (!starting_read && !resuming_read) {
            BOOST_FAIL("wrong consumer state");
        } else if (starting_read && read_unsigned_vint(data) != read_status::ready) {
            // The value is not available yet. NOTE(review): presumably the
            // base class completes it into _u64 before calling us again --
            // confirm against sstables/consumer.hh.
            _state = 1;
        } else {
            // Either the read completed right away or we were called again
            // after an incomplete read; in both cases _u64 is checked now.
            check(_u64);
            ++_count;
            if (_count < MULTIPLIER) {
                _state = 0;
            } else {
                _state = 2;
            }
        }
        return _state == 2 ? data_consumer::proceed::no : data_consumer::proceed::yes;
    }

    /// Consumes the whole input, blocking until done.
    void run() {
        consume_input().get();
    }
};

}
// Checks unsigned vint parsing for zero and, for every possible position of
// the highest set bit (0..63), for a batch of random values having exactly
// that highest bit.
SEASTAR_THREAD_TEST_CASE(test_read_unsigned_vint) {
    static std::random_device rd;
    // A 64-bit engine is required here: std::mt19937 only produces 32-bit
    // values, so `rng() % tested_value` could never set bits 32 and above and
    // wide values would always have those bits (below the highest one) zero.
    static std::mt19937_64 rng(rd());
    // Number of random values per bit position; reduced when SEASTAR_DEBUG
    // is defined.
    auto nr_tests =
#ifdef SEASTAR_DEBUG
            10
#else
            1000
#endif
            ;
    test_consumer(0).run();
    for (int highest_bit = 0; highest_bit < 64; ++highest_bit) {
        uint64_t tested_value = uint64_t{1} << highest_bit;
        for (int i = 0; i < nr_tests; ++i) {
            // The offset is in [0, tested_value), so the sum keeps
            // `highest_bit` as its top bit and cannot overflow 64 bits.
            test_consumer(tested_value + (rng() % tested_value)).run();
        }
    }
}