Files
scylladb/test/boost/gcp_object_storage_test.cc
Avi Kivity 0ae22a09d4 LICENSE: Update to version 1.1
Updated terms of non-commercial use (must be a never-customer).
2026-04-12 19:46:33 +03:00

281 lines
10 KiB
C++

/*
* Copyright (C) 2025-present ScyllaDB
*/
/*
* SPDX-License-Identifier: LicenseRef-ScyllaDB-Source-Available-1.1
*/
#include "utils/gcp/object_storage.hh"
#include "utils/gcp/gcp_credentials.hh"
#include <unordered_set>
#include <filesystem>
#include <boost/test/unit_test.hpp>
#include <boost/algorithm/string/split.hpp>
#include <boost/algorithm/string/classification.hpp>
#include <seastar/core/thread.hh>
#include <seastar/core/reactor.hh>
#include <seastar/core/file.hh>
#include <seastar/core/sleep.hh>
#include <seastar/core/with_timeout.hh>
#include "test/lib/scylla_test_case.hh"
#include "test/lib/log.hh"
#include "test/lib/random_utils.hh"
#include "test/lib/test_utils.hh"
#include "test/lib/tmpdir.hh"
#include "test/lib/gcs_fixture.hh"
#include "test/lib/test_utils.hh"
#include "utils/assert.hh"
#include "utils/UUID_gen.hh"
#include "utils/io-wrappers.hh"
#include <seastar/testing/test_fixture.hh>
using namespace std::string_view_literals;
using namespace std::chrono_literals;
using namespace utils::gcp;
/*
Simple test of GCP object storage provider. Uses either a real or a local (fake) endpoint.
Note: the above text blobs are service account credentials, including private keys.
_Never_ give any real privileges to these accounts, as we are obviously exposing them here.
User1 is assumed to have permissions to read/write the bucket
User2 is assumed to only have permissions to read the bucket, but permission to
impersonate User1.
Note: fake gcp storage does not have any credentials or permissions, so
for testing with such, leave them unset to skip those tests.
This test is parameterized with env vars:
* ENABLE_GCP_STORAGE_TEST - set to non-zero (1/true) to run
* GCP_STORAGE_ENDPOINT - set to endpoint host. default is https://storage.googleapis.com
* GCP_STORAGE_PROJECT - project in which to create bucket (if not specified)
* GCP_STORAGE_USER_1_CREDENTIALS - set to credentials file for user1
* GCP_STORAGE_USER_2_CREDENTIALS - set to credentials file for user2
* GCP_STORAGE_BUCKET - set to test bucket
*/
// Builds the Boost.Test decorator attached to every test case in this file.
// Delegates to tests::check_run_test_decorator, keyed on the
// ENABLE_GCP_STORAGE_TEST environment variable.
// NOTE(review): the second argument (`true`) is presumably the default used
// when the variable is unset - confirm against test/lib/test_utils.hh.
static auto check_gcp_storage_test_enabled() {
return tests::check_run_test_decorator("ENABLE_GCP_STORAGE_TEST", true);
}
// Uploads an object of exactly `dest_size` random bytes to `bucket`/`name`
// through an upload sink obtained from `c`.
//
// c                    - storage client used to create the upload sink
// bucket, name         - destination of the object
// dest_size            - total number of bytes to write
// buffer_store         - optional; when non-null, a share() of every chunk
//                        written is appended, in write order
// specific_buffer_size - optional fixed chunk size; when unset each chunk
//                        gets a random size in [1, 4MiB]
//
// The final chunk is truncated so the object never exceeds `dest_size`.
static future<> create_object_of_size(storage::client& c
    , std::string_view bucket
    , std::string_view name
    , size_t dest_size
    , std::vector<temporary_buffer<char>>* buffer_store = nullptr
    , std::optional<size_t> specific_buffer_size = std::nullopt
    )
{
    constexpr size_t max_random_chunk = 4*1024*1024;

    auto sink = c.create_upload_sink(bucket, name);

    for (size_t written = 0; written < dest_size; ) {
        const size_t remaining = dest_size - written;
        // The random size is drawn on every iteration, even when a fixed
        // chunk size was requested, so the random sequence consumed does
        // not depend on specific_buffer_size.
        const size_t random_chunk = tests::random::get_int(size_t(1), max_random_chunk);
        const size_t chunk = std::min(remaining, specific_buffer_size.value_or(random_chunk));

        auto payload = tests::random::get_bytes(chunk);
        temporary_buffer<char> buf(reinterpret_cast<char*>(payload.data()), payload.size());
        if (buffer_store != nullptr) {
            // Keep a handle on the data so callers can verify it later.
            buffer_store->emplace_back(buf.share());
        }

        co_await sink.put(std::move(buf));
        written += chunk;
    }

    co_await sink.flush();
    co_await sink.close();
}
// Downloads `object_name` from env.bucket and verifies that its content is
// byte-for-byte the concatenation of `bufs`.
//
// env         - fixture wrapper providing the client and the bucket name
// object_name - name of the object to download
// bufs        - expected content, in order; consumed by this call
//
// Fails the current test (BOOST_REQUIRE_*) on the first differing chunk, or
// if the number of bytes downloaded differs from the total size of `bufs`.
// Both input streams are closed before returning, also when a check or a
// read throws.
static future<> compare_object_data(const local_gcs_wrapper& env, std::string_view object_name, std::vector<temporary_buffer<char>>&& bufs) {
    auto& c = env.client();
    // Must be computed before `bufs` is moved into the memory source below.
    auto total = std::accumulate(bufs.begin(), bufs.end(), size_t{}, [](size_t s, auto& buf) {
        return s + buf.size();
    });
    auto source = c.create_download_source(env.bucket, object_name);
    auto is1 = seastar::input_stream<char>(std::move(source));
    auto is2 = seastar::input_stream<char>(create_memory_source(std::move(bufs)));
    uint64_t read = 0;
    // co_await is not allowed inside a catch handler, so remember the failure,
    // close the streams, and rethrow afterwards.
    std::exception_ptr p;
    try {
        while (!is1.eof()) {
            auto buf = co_await is1.read();
            if (buf.empty()) {
                break;
            }
            // Pull exactly as many expected bytes as the download produced.
            auto buf2 = co_await is2.read_exactly(buf.size());
            BOOST_REQUIRE_EQUAL(buf, buf2);
            read += buf.size();
        }
    } catch (...) {
        p = std::current_exception();
    }
    co_await is1.close();
    co_await is2.close();
    if (p) {
        std::rethrow_exception(p);
    }
    BOOST_REQUIRE_EQUAL(read, total);
}
// Brings the `s` std::string literal suffix into scope for `prefix` below.
using namespace std::string_literals;
// Common prefix that make_name() prepends to every generated object name.
static constexpr auto prefix = "bork/ninja/"s;
// #28398 include a prefix in all names.
// Returns a fresh object name: `prefix` followed by a newly generated
// time-based UUID.
static std::string make_name() {
    const auto uuid = utils::UUID_gen::get_time_UUID();
    return fmt::format("{}{}", prefix, uuid);
}
// Round-trip check: uploads a freshly named object of `dest_size` random
// bytes, then downloads it and compares against what was written.
//
// env                  - fixture wrapper (client, bucket, cleanup list)
// dest_size            - size of the object to create, in bytes
// specific_buffer_size - optional fixed upload chunk size, forwarded to
//                        create_object_of_size
static future<> test_read_write_helper(const local_gcs_wrapper& env, size_t dest_size, std::optional<size_t> specific_buffer_size = std::nullopt) {
    auto& client = env.client();
    const auto object_name = make_name();

    // Register the name before uploading so the object gets removed even
    // if a later step fails.
    env.objects_to_delete.emplace_back(object_name);

    std::vector<temporary_buffer<char>> uploaded;
    co_await create_object_of_size(client, env.bucket, object_name, dest_size, &uploaded, specific_buffer_size);
    co_await compare_object_data(env, object_name, std::move(uploaded));
}
BOOST_AUTO_TEST_SUITE(gcs_tests, *seastar::testing::async_fixture<gcs_fixture>())
// Round-trips a tiny (32 byte) object using randomly sized upload chunks.
SEASTAR_FIXTURE_TEST_CASE(test_gcp_storage_create_small_object, local_gcs_wrapper, *check_gcp_storage_test_enabled()) {
    constexpr size_t object_size = 8*4;
    co_await test_read_write_helper(*this, object_size);
}
// Round-trips a large object (a bit over 32MiB, deliberately not a round
// size) using randomly sized upload chunks.
SEASTAR_FIXTURE_TEST_CASE(test_gcp_storage_create_large_object, local_gcs_wrapper, *check_gcp_storage_test_enabled()) {
    constexpr size_t object_size = 32*1024*1024 + 357 + 1022*67;
    co_await test_read_write_helper(*this, object_size);
}
// Round-trips a 618480 byte object uploaded in fixed 64KiB chunks (the last
// chunk is shorter).
SEASTAR_FIXTURE_TEST_CASE(test_gcp_storage_create_small_object_64kbuf, local_gcs_wrapper, *check_gcp_storage_test_enabled()) {
    constexpr size_t object_size = 618480;
    constexpr size_t chunk_size = 64*1024;
    co_await test_read_write_helper(*this, object_size, chunk_size);
}
// Round-trips a large object (a bit over 32MiB, deliberately not a round
// size) uploaded in fixed 64KiB chunks.
SEASTAR_FIXTURE_TEST_CASE(test_gcp_storage_create_large_object_64kbuf, local_gcs_wrapper, *check_gcp_storage_test_enabled()) {
    constexpr size_t object_size = 32*1024*1024 + 357 + 1022*67;
    constexpr size_t chunk_size = 64*1024;
    co_await test_read_write_helper(*this, object_size, chunk_size);
}
// Creates ten objects of random size (1 byte .. 2MiB), then pages through a
// listing of the bucket and checks that every created object shows up with
// the size that was written. Objects in the listing that this test did not
// create are ignored.
SEASTAR_FIXTURE_TEST_CASE(test_gcp_storage_list_objects, local_gcs_wrapper, *check_gcp_storage_test_enabled()) {
    auto& env = *this;
    auto& c = env.client();

    constexpr size_t object_count = 10;
    constexpr size_t max_object_size = 2*1024*1024;

    // name -> size of every object created by this test
    std::unordered_map<std::string, uint64_t> expected_sizes;
    for (size_t n = 0; n != object_count; ++n) {
        auto name = make_name();
        auto size = tests::random::get_int(size_t(1), max_object_size);
        env.objects_to_delete.emplace_back(name);
        co_await create_object_of_size(c, env.bucket, name, size);
        expected_sizes.emplace(name, size);
    }

    // The same paging object is passed to every call; an empty page ends
    // the listing.
    utils::gcp::storage::bucket_paging paging;
    size_t matched = 0;
    while (true) {
        auto page = co_await c.list_objects(env.bucket, "", paging);
        if (page.empty()) {
            break;
        }
        for (auto& entry : page) {
            if (auto it = expected_sizes.find(entry.name); it != expected_sizes.end()) {
                BOOST_REQUIRE_EQUAL(entry.size, it->second);
                ++matched;
            }
        }
    }

    BOOST_REQUIRE_EQUAL(matched, expected_sizes.size());
}
// Creates a 128 byte object, checks it is listed, deletes it and checks
// that listing with its name as prefix no longer returns anything.
SEASTAR_FIXTURE_TEST_CASE(test_gcp_storage_delete_object, local_gcs_wrapper, *check_gcp_storage_test_enabled()) {
    auto& env = *this;
    auto& c = env.client();

    auto name = make_name();
    env.objects_to_delete.emplace_back(name);
    co_await create_object_of_size(c, env.bucket, name, 128);

    // validate object was created.
    {
        auto before = co_await c.list_objects(env.bucket, name);
        const bool created = std::any_of(before.begin(), before.end(), [&](auto& info) {
            return info.name == name;
        });
        BOOST_REQUIRE(created);
    }

    co_await c.delete_object(env.bucket, name);

    auto after = co_await c.list_objects(env.bucket, name);
    BOOST_REQUIRE(after.empty());
}
// Verifies skip() + read_exactly() on a download stream: creates one object
// of `file_size` bytes, then 20 times walks it with random skips and short
// reads, comparing each read against an in-memory stream over the same data
// that is skipped/read in lockstep.
SEASTAR_FIXTURE_TEST_CASE(test_gcp_storage_skip_read, local_gcs_wrapper, *check_gcp_storage_test_enabled()) {
    auto& env = *this;
    auto& c = env.client();
    auto name = make_name();
    std::vector<temporary_buffer<char>> bufs;
    // Deliberately not a round size.
    constexpr size_t file_size = 12*1024*1024 + 384*7 + 31;
    // ensure we remove the object
    env.objects_to_delete.emplace_back(name);
    // The object must be exactly file_size bytes: the loop below uses
    // file_size as the end position for its skips and reads.
    co_await create_object_of_size(c, env.bucket, name, file_size, &bufs);
    for (size_t i = 0; i < 20; ++i) {
        auto source = c.create_download_source(env.bucket, name);
        // Fresh shares of the written buffers for each pass; `bufs` itself
        // stays intact for the next iteration.
        auto copy = bufs | std::views::transform([](auto& buf) { return buf.share(); });
        auto is1 = seastar::input_stream<char>(std::move(source));
        auto is2 = seastar::input_stream<char>(create_memory_source(std::vector<temporary_buffer<char>>(copy.begin(), copy.end())));
        // co_await is not allowed inside a catch handler, so remember the
        // failure, close both streams, and rethrow afterwards.
        std::exception_ptr p;
        try {
            size_t pos = 0;
            while (pos < file_size) {
                auto rem = file_size - pos;
                // Skip at least 100 bytes (or all that remains), at most to the end.
                auto skip = tests::random::get_int(std::min(rem, size_t(100)), rem);
                // Then read 31..2048 bytes, clamped to what is left after the skip.
                auto read = std::min(rem - skip, size_t(tests::random::get_int(31, 2048)));
                co_await is1.skip(skip);
                co_await is2.skip(skip);
                auto b1 = co_await is1.read_exactly(read);
                auto b2 = co_await is2.read_exactly(read);
                BOOST_REQUIRE_EQUAL(b1.size(), b2.size());
                if (b1 != b2) {
                    // Log where the data diverges before the check below fails.
                    BOOST_TEST_MESSAGE(fmt::format("diff at {} ({} bytes)", pos + skip, read));
                    auto i = std::mismatch(b1.begin(), b1.end(), b2.begin());
                    BOOST_TEST_MESSAGE(fmt::format("offset {}", std::distance(b1.begin(), i.first)));
                }
                BOOST_REQUIRE_EQUAL(b1, b2);
                pos += (skip + read);
            }
        } catch (...) {
            p = std::current_exception();
        }
        co_await is1.close();
        co_await is2.close();
        if (p) {
            std::rethrow_exception(p);
        }
    }
}
// Creates 32 objects of random size (1 byte .. 2MiB), merges them into a
// single new object and checks the merged object's reported name and size
// and that its content is the concatenation of the parts, in creation order.
SEASTAR_FIXTURE_TEST_CASE(test_merge_objects, local_gcs_wrapper, *check_gcp_storage_test_enabled()) {
    auto& env = *this;
    auto& c = env.client();

    constexpr size_t part_count = 32;
    constexpr size_t max_part_size = 2*1024*1024;

    std::vector<temporary_buffer<char>> expected_data;
    std::vector<std::string> part_names;
    size_t expected_size = 0;

    for (size_t n = 0; n != part_count; ++n) {
        auto part = make_name();
        auto part_size = tests::random::get_int(size_t(1), max_part_size);
        env.objects_to_delete.emplace_back(part);
        // All parts append to the same buffer list, so it ends up holding
        // the expected content of the merged object.
        co_await create_object_of_size(c, env.bucket, part, part_size, &expected_data);
        expected_size += part_size;
        part_names.emplace_back(std::move(part));
    }

    auto merged_name = make_name();
    env.objects_to_delete.emplace_back(merged_name);

    auto merged = co_await c.merge_objects(env.bucket, merged_name, part_names);
    BOOST_REQUIRE_EQUAL(merged.name, merged_name);
    BOOST_REQUIRE_EQUAL(merged.size, expected_size);

    co_await compare_object_data(env, merged_name, std::move(expected_data));
}
BOOST_AUTO_TEST_SUITE_END()