Add `ignore_component_digest_mismatch` option to `sstable_open_config` that logs a warning instead of throwing `malformed_sstable_exception` on component digest mismatch. This is useful for recovering sstables with corrupted non-vital components or working around bugs in digest calculation. Expose the option in scylla-sstable via the `--ignore-component-digest-mismatch` flag for the upgrade operation.
95 lines
3.7 KiB
C++
95 lines
3.7 KiB
C++
/*
 * Copyright (C) 2020-present ScyllaDB
 *
 */

/*
 * SPDX-License-Identifier: LicenseRef-ScyllaDB-Source-Available-1.0
 */
|
|
|
|
#pragma once
|
|
|
|
#include <seastar/core/sstring.hh>
|
|
#include <seastar/core/file.hh>
|
|
#include <seastar/core/sharded.hh>
|
|
#include <vector>
|
|
#include "sstables/version.hh"
|
|
#include "sstables/component_type.hh"
|
|
#include "sstables/shareable_components.hh"
|
|
#include "sstables/generation_type.hh"
|
|
#include <seastar/core/shared_ptr.hh>
|
|
|
|
namespace sstables {
|
|
|
|
// State tag that can be attached to an sstable; entry_descriptor carries it
// as an optional field.
// Enumerators take the implicit values 0..3 in declaration order, so new
// states should be appended rather than inserted.
enum class sstable_state {
    normal,
    staging,
    quarantine,
    upload,
};
|
|
|
|
struct entry_descriptor {
|
|
generation_type generation;
|
|
sstable_version_types version;
|
|
sstable_format_types format;
|
|
component_type component;
|
|
std::optional<sstable_state> state;
|
|
|
|
entry_descriptor(generation_type generation,
|
|
sstable_version_types version, sstable_format_types format,
|
|
component_type component, std::optional<sstable_state> state = {})
|
|
: generation(generation), version(version), format(format), component(component), state(state) {}
|
|
};
|
|
|
|
// Parses sstable file path extracting entry_descriptor from it. Returns the descriptor
|
|
// and the keyspace.table pair of strings.
|
|
std::tuple<entry_descriptor, sstring, sstring> parse_path(const std::filesystem::path& sst_path);
|
|
|
|
// Use the given ks and cf and don't attempt to extract it from the dir path.
|
|
// This allows loading sstables from any path, but the filename still has to be valid.
|
|
entry_descriptor parse_path(const std::filesystem::path& sst_path, sstring ks, sstring cf);
|
|
|
|
// contains data for loading a sstable using components shared by a single shard;
|
|
// can be moved across shards
|
|
struct foreign_sstable_open_info {
|
|
foreign_ptr<lw_shared_ptr<shareable_components>> components;
|
|
std::vector<shard_id> owners;
|
|
seastar::file_handle data;
|
|
std::optional<seastar::file_handle> index;
|
|
std::optional<seastar::file_handle> partitions;
|
|
std::optional<seastar::file_handle> rows;
|
|
generation_type generation;
|
|
sstable_version_types version;
|
|
sstable_format_types format;
|
|
uint64_t uncompressed_data_size;
|
|
uint64_t metadata_size_on_disk;
|
|
};
|
|
|
|
// Options controlling how an sstable is opened. Every field has a default,
// so a default-constructed config selects the regular behavior and callers
// only override the flags they need.
struct sstable_open_config {
    // Load the first and last position in partition, populating the
    // `_first_partition_first_position` and `_last_partition_last_position`
    // fields respectively. Problematic sstables might fail to load. Set to
    // false if you want to disable this, to be able to read such sstables.
    // Should only be disabled for diagnostics purposes.
    // FIXME: Enable it by default once the root cause of large allocation when reading sstable in reverse is fixed.
    // Ref: https://github.com/scylladb/scylladb/issues/11642
    bool load_first_and_last_position_metadata = false;
    // If the bloom filter is not loaded, the SSTable will use an always-present
    // filter, meaning that the SSTable will be opened on every single-partition
    // read.
    bool load_bloom_filter = true;
    // Mimics behavior when an SSTable is streamed to a given shard, where the
    // SSTable writer considers the shard that created the SSTable as its owner.
    bool current_shard_as_sstable_owner = false;
    // Do not move the sharding metadata to the sharder, keeping it in the
    // scylla metadata.
    bool keep_sharding_metadata = false;
    // Allows an unsealed sstable to be loaded, since it must read components
    // from the temporary TOC instead.
    bool unsealed_sstable = false;
    // When true, log a warning instead of throwing on component digest mismatch.
    // Useful for recovering sstables with corrupted non-vital components or
    // working around bugs in digest calculation.
    bool ignore_component_digest_mismatch = false;
};
|
|
|
|
}
|