Files
scylladb/tests/partitioner_test.cc
Asias He 9c27b5c46e byte_ordered_partitioner: Implement missing describe_ownership and midpoint
In order to support ByteOrderedPartitioner, we need to implement the
missing describe_ownership and midpoint function in
byte_ordered_partitioner class.

As a starter, this path uses a simple node token distance based method
to calculate ownership. C* uses a complicated key samples based method.
We can switch to what C* does later.

Tests are added to tests/partitioner_test.cc.

Fixes #1378
2016-07-08 17:44:55 +08:00

321 lines
14 KiB
C++

/*
* Copyright (C) 2015 ScyllaDB
*/
/*
* This file is part of Scylla.
*
* Scylla is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Scylla is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Scylla. If not, see <http://www.gnu.org/licenses/>.
*/
#define BOOST_TEST_DYN_LINK
#define BOOST_TEST_MODULE core
#include <boost/test/unit_test.hpp>
#include "dht/i_partitioner.hh"
#include "dht/murmur3_partitioner.hh"
#include "dht/byte_ordered_partitioner.hh"
#include "schema.hh"
#include "types.hh"
#include "schema_builder.hh"
#include "disk-error-handler.hh"
thread_local disk_error_signal_type commit_error;
thread_local disk_error_signal_type general_disk_error;
static dht::token token_from_long(uint64_t value) {
auto t = net::hton(value);
bytes b(bytes::initialized_later(), 8);
std::copy_n(reinterpret_cast<int8_t*>(&t), 8, b.begin());
return { dht::token::kind::key, std::move(b) };
}
BOOST_AUTO_TEST_CASE(test_decorated_key_is_compatible_with_origin) {
auto s = schema_builder("ks", "cf")
.with_column("c1", int32_type, column_kind::partition_key)
.with_column("c2", int32_type, column_kind::partition_key)
.with_column("v", int32_type)
.build();
dht::murmur3_partitioner partitioner;
auto key = partition_key::from_deeply_exploded(*s, {143, 234});
auto dk = partitioner.decorate_key(*s, key);
// Expected value was taken from Origin
BOOST_REQUIRE_EQUAL(dk._token, token_from_long(4958784316840156970));
BOOST_REQUIRE(dk._key.equal(*s, key));
}
BOOST_AUTO_TEST_CASE(test_token_wraparound_1) {
auto t1 = token_from_long(0x7000'0000'0000'0000);
auto t2 = token_from_long(0xa000'0000'0000'0000);
dht::murmur3_partitioner partitioner;
BOOST_REQUIRE(t1 > t2);
// Even without knowing what the midpoint is, it needs to be inside the
// wrapped range, i.e., between t1 and inf, OR between -inf and t2
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 || midpoint < t2);
// We can also calculate the actual value the midpoint should have:
BOOST_REQUIRE_EQUAL(midpoint, token_from_long(0x8800'0000'0000'0000));
}
BOOST_AUTO_TEST_CASE(test_token_wraparound_2) {
auto t1 = token_from_long(0x6000'0000'0000'0000);
auto t2 = token_from_long(0x9000'0000'0000'0000);
dht::murmur3_partitioner partitioner;
BOOST_REQUIRE(t1 > t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 || midpoint < t2);
BOOST_REQUIRE_EQUAL(midpoint, token_from_long(0x7800'0000'0000'0000));
}
BOOST_AUTO_TEST_CASE(test_ring_position_is_comparable_with_decorated_key) {
auto s = schema_builder("ks", "cf")
.with_column("pk", bytes_type, column_kind::partition_key)
.with_column("v", int32_type)
.build();
std::vector<dht::decorated_key> keys = {
dht::global_partitioner().decorate_key(*s,
partition_key::from_single_value(*s, "key1")),
dht::global_partitioner().decorate_key(*s,
partition_key::from_single_value(*s, "key2")),
};
std::sort(keys.begin(), keys.end(), dht::decorated_key::less_comparator(s));
auto& k1 = keys[0];
auto& k2 = keys[1];
BOOST_REQUIRE(k1._token != k2._token); // The rest of the test assumes that.
BOOST_REQUIRE(k1.tri_compare(*s, dht::ring_position::starting_at(k1._token)) > 0);
BOOST_REQUIRE(k1.tri_compare(*s, dht::ring_position::ending_at(k1._token)) < 0);
BOOST_REQUIRE(k1.tri_compare(*s, dht::ring_position(k1)) == 0);
BOOST_REQUIRE(k1.tri_compare(*s, dht::ring_position::starting_at(k2._token)) < 0);
BOOST_REQUIRE(k1.tri_compare(*s, dht::ring_position::ending_at(k2._token)) < 0);
BOOST_REQUIRE(k1.tri_compare(*s, dht::ring_position(k2)) < 0);
BOOST_REQUIRE(k2.tri_compare(*s, dht::ring_position::starting_at(k1._token)) > 0);
BOOST_REQUIRE(k2.tri_compare(*s, dht::ring_position::ending_at(k1._token)) > 0);
BOOST_REQUIRE(k2.tri_compare(*s, dht::ring_position(k1)) > 0);
}
BOOST_AUTO_TEST_CASE(test_token_no_wraparound_1) {
auto t1 = token_from_long(0x5000'0000'0000'0000);
auto t2 = token_from_long(0x7000'0000'0000'0000);
dht::murmur3_partitioner partitioner;
BOOST_REQUIRE(t1 < t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 && midpoint < t2);
BOOST_REQUIRE_EQUAL(midpoint, token_from_long(0x6000'0000'0000'0000));
}
BOOST_AUTO_TEST_CASE(test_bop_token_nowraparound_1) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("03");
auto t2 = partitioner.from_sstring("09");
BOOST_REQUIRE(t1 < t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 && midpoint < t2);
BOOST_REQUIRE_EQUAL(midpoint, partitioner.from_sstring("06"));
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_nowraparound_2) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("20000000000000000000000000000003");
auto t2 = partitioner.from_sstring("A0000000000000000000000000000009");
BOOST_REQUIRE(t1 < t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 && midpoint < t2);
BOOST_REQUIRE_EQUAL(midpoint, partitioner.from_sstring("60000000000000000000000000000006"));
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_nowraparound_3) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("2000000000000000000000000000000320000000000000000000000000000003");
auto t2 = partitioner.from_sstring("A0000000000000000000000000000009A0000000000000000000000000000009");
BOOST_REQUIRE(t1 < t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 && midpoint < t2);
BOOST_REQUIRE_EQUAL(midpoint, partitioner.from_sstring("6000000000000000000000000000000660000000000000000000000000000006"));
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_nowraparound_4) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("");
auto t2 = partitioner.from_sstring("2000");
BOOST_REQUIRE(t1 < t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 && midpoint < t2);
BOOST_REQUIRE_EQUAL(midpoint, partitioner.from_sstring("1000"));
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_nowraparound_5) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("00");
auto t2 = partitioner.from_sstring("2000");
BOOST_REQUIRE(t1 < t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 && midpoint < t2);
BOOST_REQUIRE_EQUAL(midpoint, partitioner.from_sstring("1000"));
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_nowraparound_6) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring(sstring());
auto t2 = partitioner.from_sstring(sstring());
BOOST_REQUIRE(t1 <= t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint >= t1 && midpoint <= t2);
BOOST_REQUIRE_EQUAL(midpoint, partitioner.from_sstring(""));
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_wraparound_1) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("00000000000000000000000000000009");
auto t2 = partitioner.from_sstring("00000000000000000000000000000003");
BOOST_REQUIRE(t1 > t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 || midpoint < t2);
BOOST_REQUIRE_EQUAL(midpoint, partitioner.from_sstring("80000000000000000000000000000006"));
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_wraparound_2) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("A0000000000000000000000000000009");
auto t2 = partitioner.from_sstring("20000000000000000000000000000003");
BOOST_REQUIRE(t1 > t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 || midpoint < t2);
BOOST_REQUIRE_EQUAL(midpoint, partitioner.from_sstring("E0000000000000000000000000000006"));
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_wraparound_3) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("A000000000000000000000000000000900000000000000000000000000000009");
auto t2 = partitioner.from_sstring("2000000000000000000000000000000300000000000000000000000000000003");
BOOST_REQUIRE(t1 > t2);
auto midpoint = partitioner.midpoint(t1, t2);
BOOST_REQUIRE(midpoint > t1 || midpoint < t2);
BOOST_REQUIRE_EQUAL(midpoint, partitioner.from_sstring("E000000000000000000000000000000600000000000000000000000000000006"));
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_describe_ownership) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("10000000000000000000000000000000");
auto t2 = partitioner.from_sstring("30000000000000000000000000000000");
auto t3 = partitioner.from_sstring("A0000000000000000000000000000000");
auto t4 = partitioner.from_sstring("F0000000000000000000000000000000");
auto sorted_tokens = std::vector<dht::token>{t1, t2, t3, t4};
auto own_map = partitioner.describe_ownership(sorted_tokens);
BOOST_REQUIRE_EQUAL(own_map[t1], 0.1250);
BOOST_REQUIRE_EQUAL(own_map[t2], 0.1250);
BOOST_REQUIRE_EQUAL(own_map[t3], 0.4375);
BOOST_REQUIRE_EQUAL(own_map[t4], 0.3125);
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_order) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("123456");
auto t2 = partitioner.from_sstring("12345678");
BOOST_REQUIRE(t1 < t2);
t1 = partitioner.from_sstring("22");
t2 = partitioner.from_sstring("12345678");
BOOST_REQUIRE(t1 > t2);
t1 = partitioner.from_sstring("123456");
t2 = partitioner.from_sstring("123457");
BOOST_REQUIRE(t1 < t2);
t1 = partitioner.from_sstring("123456");
t2 = partitioner.from_sstring("A23456");
BOOST_REQUIRE(t1 < t2);
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_midpoint1) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("010000");
auto t2 = partitioner.from_sstring("20");
auto mid = partitioner.midpoint(t1, t2);
// The length of the midpoint token is supposed to be 3 bytes, filled with one zero byte
auto mid_expected = partitioner.from_sstring("008010");
BOOST_REQUIRE(t1 < t2);
BOOST_REQUIRE(mid_expected._data.size() == 3);
BOOST_REQUIRE(mid._data.size() == 3);
BOOST_REQUIRE(mid == mid_expected);
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_midpoint2) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("020001");
auto t2 = partitioner.from_sstring("60");
auto mid = partitioner.midpoint(t1, t2);
// The length of the midpoint token is supposed to be 3 bytes, filled with one zero byte
auto mid_expected = partitioner.from_sstring("01003080");
BOOST_REQUIRE(t1 < t2);
BOOST_REQUIRE(mid == mid_expected);
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}
BOOST_AUTO_TEST_CASE(test_bop_token_midpoint3) {
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.ByteOrderedPartitioner"));
dht::byte_ordered_partitioner partitioner;
auto t1 = partitioner.from_sstring("20");
auto t2 = partitioner.from_sstring("81");
auto mid = partitioner.midpoint(t1, t2);
auto mid_expected = partitioner.from_sstring("5080");
BOOST_REQUIRE(t1 < t2);
BOOST_REQUIRE(mid == mid_expected);
dht::set_global_partitioner(to_sstring("org.apache.cassandra.dht.Murmur3Partitioner"));
}