Files
scylladb/sstables/open_info.hh
Taras Veretilnyk c123f637ea sstables: add option to ignore component digest mismatches
Add `ignore_component_digest_mismatch` option to `sstable_open_config`
that logs a warning instead of throwing `malformed_sstable_exception`
on component digest mismatch. This is useful for recovering sstables
with corrupted non-vital components or working around bugs in digest
calculation.

Expose the option in scylla-sstable via the
`--ignore-component-digest-mismatch` flag for the upgrade operation.
2026-03-10 19:24:05 +01:00

95 lines
3.7 KiB
C++

/*
* Copyright (C) 2020-present ScyllaDB
*
*/
/*
* SPDX-License-Identifier: LicenseRef-ScyllaDB-Source-Available-1.0
*/
#pragma once
#include <seastar/core/sstring.hh>
#include <seastar/core/file.hh>
#include <seastar/core/sharded.hh>
#include <vector>
#include "sstables/version.hh"
#include "sstables/component_type.hh"
#include "sstables/shareable_components.hh"
#include "sstables/generation_type.hh"
#include <seastar/core/shared_ptr.hh>
namespace sstables {
// States an sstable can be tagged with. The exact meaning of each state is
// defined by the code that consumes this enum (NOTE(review): the names look
// like they mirror sstable directory kinds -- confirm against users).
// The enumerators carry no explicit values, so declaration order determines
// their underlying values.
enum class sstable_state {
    normal,
    staging,
    quarantine,
    upload,
};
// Bundles the identifying properties of an sstable component file:
// generation, version, format and component type, plus an optional
// sstable_state. This is the type produced by parse_path().
struct entry_descriptor {
    generation_type generation;
    sstable_version_types version;
    sstable_format_types format;
    component_type component;
    // Empty unless a state was supplied at construction time.
    std::optional<sstable_state> state;

    // Member-wise constructor. `state` may be omitted, in which case it is
    // left as an empty optional.
    entry_descriptor(generation_type generation,
            sstable_version_types version,
            sstable_format_types format,
            component_type component,
            std::optional<sstable_state> state = {})
        : generation(generation)
        , version(version)
        , format(format)
        , component(component)
        , state(state)
    {}
};
// Parses an sstable file path and extracts an entry_descriptor from it.
// Returns a tuple holding the descriptor followed by two strings: the
// keyspace name and the table name.
std::tuple<entry_descriptor, sstring, sstring> parse_path(const std::filesystem::path& sst_path);
// Overload that uses the caller-supplied ks and cf instead of attempting to
// extract them from the directory part of the path.
// This allows loading sstables from any path, but the filename still has to be valid.
entry_descriptor parse_path(const std::filesystem::path& sst_path, sstring ks, sstring cf);
// Contains the data needed to load an sstable using components shared by a
// single shard; can be moved across shards.
struct foreign_sstable_open_info {
// Shared components, held through a foreign_ptr.
foreign_ptr<lw_shared_ptr<shareable_components>> components;
// Shards listed as owners of the sstable.
std::vector<shard_id> owners;
// Handle of the data file; always present.
seastar::file_handle data;
// The three handles below are optional and may each be empty.
// NOTE(review): which of them is set presumably depends on the sstable's
// index layout -- confirm against the code that fills in this struct.
std::optional<seastar::file_handle> index;
std::optional<seastar::file_handle> partitions;
std::optional<seastar::file_handle> rows;
generation_type generation;
sstable_version_types version;
sstable_format_types format;
// Size figures carried along with the handles (units presumably bytes -- TODO confirm).
uint64_t uncompressed_data_size;
uint64_t metadata_size_on_disk;
};
// Options controlling how an sstable is opened. Every option has a default,
// so a default-constructed config is ready to use.
struct sstable_open_config {
    // Whether to load the first and last position in partition, which
    // populates the `_first_partition_first_position` and
    // `_last_partition_last_position` fields respectively. Loading may fail
    // for problematic sstables; set this to false to be able to read such
    // sstables anyway. Disabling is meant for diagnostics purposes only.
    // FIXME: Enable it by default once the root cause of large allocation when reading sstable in reverse is fixed.
    // Ref: https://github.com/scylladb/scylladb/issues/11642
    bool load_first_and_last_position_metadata = false;

    // Whether to load the bloom filter. Without it the SSTable falls back to
    // an always-present filter, which means the SSTable gets opened on every
    // single-partition read.
    bool load_bloom_filter = true;

    // Mimics the behavior of an SSTable being streamed to a given shard,
    // where the SSTable writer treats the shard that created the SSTable as
    // its owner.
    bool current_shard_as_sstable_owner = false;

    // Keep the sharding metadata in the scylla metadata instead of moving it
    // to the sharder.
    bool keep_sharding_metadata = false;

    // Allow loading an unsealed sstable; its components must then be read
    // from the temporary TOC.
    bool unsealed_sstable = false;

    // On component digest mismatch, log a warning rather than throwing.
    // Helps when recovering sstables whose non-vital components are
    // corrupted, or when working around bugs in digest calculation.
    bool ignore_component_digest_mismatch = false;
};
}