Files
scylladb/sstables/random_access_reader.cc
Taras Veretilnyk 478c1eaec5 sstables: add digest_file_random_access_reader for CRC32 digest computation
Add a new reader that wraps file_random_access_reader and computes a
running CRC32 digest over the data as it is read. The digest accumulates
across sequential read_exactly() calls and is reset on seek(), since a
non-sequential read invalidates the running checksum.
2026-03-10 19:24:05 +01:00

98 lines
2.9 KiB
C++

/*
* Copyright (C) 2020-present ScyllaDB
*/
/*
* SPDX-License-Identifier: LicenseRef-ScyllaDB-Source-Available-1.0
*/
#include <exception>
#include "sstables/random_access_reader.hh"
#include "utils/disk-error-handler.hh"
#include "utils/log.hh"
namespace sstables {
extern logging::logger sstlog;
future <temporary_buffer<char>> random_access_reader::read_exactly(size_t n) noexcept {
try {
return _in->read_exactly(n);
} catch (...) {
return current_exception_as_future<temporary_buffer<char>>();
}
}
static future<> close_if_needed(std::unique_ptr<input_stream<char>> in) {
if (!in) {
return make_ready_future<>();
}
return in->close().finally([in = std::move(in)] {});
}
future<> random_access_reader::seek(uint64_t pos) noexcept {
try {
auto tmp = std::make_unique<input_stream<char>>(open_at(pos));
std::swap(tmp, _in);
return close_if_needed(std::move(tmp));
} catch (...) {
return current_exception_as_future();
}
}
future<> random_access_reader::close() noexcept {
return futurize_invoke(close_if_needed, std::move(_in));
}
file_random_access_reader::file_random_access_reader(file f, uint64_t file_size, size_t buffer_size, unsigned read_ahead)
: _file(std::move(f)), _buffer_size(buffer_size), _read_ahead(read_ahead), _file_size(file_size) {
set(open_at(0));
}
input_stream<char> file_random_access_reader::open_at(uint64_t pos) {
auto len = _file_size - pos;
file_input_stream_options options;
options.buffer_size = _buffer_size;
options.read_ahead = _read_ahead;
return make_file_input_stream(_file, pos, len, std::move(options));
}
future<> file_random_access_reader::close() noexcept {
return random_access_reader::close().finally([this] {
return _file.close().handle_exception([save = _file](auto ep) {
sstlog.warn("sstable close failed: {}", ep);
general_disk_error();
});
});
}
digest_file_random_access_reader::digest_file_random_access_reader(file f, uint64_t file_size, size_t buffer_size, unsigned read_ahead)
: file_random_access_reader(std::move(f), file_size, buffer_size, read_ahead) {
_digest = crc32_utils::init_checksum();
}
future<temporary_buffer<char>> digest_file_random_access_reader::read_exactly(size_t n) noexcept {
return random_access_reader::read_exactly(n).then([this] (temporary_buffer<char> buf) {
_pos += buf.size();
if (_digest) {
uint32_t per_chunk_checksum = crc32_utils::init_checksum();
per_chunk_checksum = crc32_utils::checksum(per_chunk_checksum, buf.begin(), buf.size());
_digest = checksum_combine_or_feed<crc32_utils>(*_digest, per_chunk_checksum, buf.begin(), buf.size());
}
return buf;
});
}
future<> digest_file_random_access_reader::seek(uint64_t pos) noexcept {
_pos = pos;
return random_access_reader::seek(pos).then([this] {
_digest.reset();
});
}
}