/* * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.facebook.presto.raptor.metadata; import com.facebook.presto.client.NodeVersion; import com.facebook.presto.metadata.PrestoNode; import com.facebook.presto.raptor.NodeSupplier; import com.facebook.presto.raptor.RaptorColumnHandle; import com.facebook.presto.raptor.util.DaoSupplier; import com.facebook.presto.spi.Node; import com.facebook.presto.spi.PrestoException; import com.facebook.presto.spi.predicate.Domain; import com.facebook.presto.spi.predicate.Range; import com.facebook.presto.spi.predicate.TupleDomain; import com.facebook.presto.spi.predicate.ValueSet; import com.facebook.presto.spi.type.Type; import com.google.common.base.Ticker; import com.google.common.collect.HashMultimap; import com.google.common.collect.ImmutableList; import com.google.common.collect.ImmutableMap; import com.google.common.collect.ImmutableSet; import com.google.common.collect.Multimap; import com.google.common.io.Files; import io.airlift.slice.Slice; import io.airlift.testing.FileUtils; import io.airlift.testing.TestingTicker; import io.airlift.units.Duration; import org.skife.jdbi.v2.DBI; import org.skife.jdbi.v2.Handle; import org.skife.jdbi.v2.IDBI; import org.skife.jdbi.v2.ResultIterator; import org.testng.annotations.AfterMethod; import org.testng.annotations.BeforeMethod; import org.testng.annotations.Test; import java.io.File; import java.net.URI; import java.sql.ResultSet; import java.sql.SQLException; import java.sql.Statement; import java.time.LocalDate; import java.time.ZonedDateTime; import java.util.Collection; import java.util.HashMap; import java.util.HashSet; import java.util.List; import java.util.Map; import java.util.Optional; import java.util.OptionalInt; import java.util.OptionalLong; import java.util.Set; import java.util.UUID; import static com.facebook.presto.raptor.RaptorErrorCode.RAPTOR_EXTERNAL_BATCH_ALREADY_EXISTS; import static com.facebook.presto.raptor.metadata.DatabaseShardManager.shardIndexTable; import static com.facebook.presto.raptor.metadata.SchemaDaoUtil.createTablesWithRetry; import static com.facebook.presto.raptor.storage.ShardStats.MAX_BINARY_INDEX_SIZE; import static com.facebook.presto.spi.StandardErrorCode.SERVER_STARTING_UP; import static com.facebook.presto.spi.StandardErrorCode.TRANSACTION_CONFLICT; import static com.facebook.presto.spi.predicate.Range.greaterThan; import static com.facebook.presto.spi.predicate.Range.greaterThanOrEqual; import static com.facebook.presto.spi.predicate.Range.lessThan; import static com.facebook.presto.spi.type.BigintType.BIGINT; import static com.facebook.presto.spi.type.BooleanType.BOOLEAN; import static com.facebook.presto.spi.type.DateType.DATE; import static com.facebook.presto.spi.type.DoubleType.DOUBLE; import static com.facebook.presto.spi.type.TimestampType.TIMESTAMP; import static com.facebook.presto.spi.type.VarbinaryType.VARBINARY; import static com.facebook.presto.spi.type.VarcharType.createVarcharType; import static com.google.common.base.Strings.repeat; import static com.google.common.base.Ticker.systemTicker; import static com.google.common.collect.Iterables.getOnlyElement; import static com.google.common.collect.Iterators.concat; import static com.google.common.collect.Iterators.transform; import static io.airlift.slice.Slices.utf8Slice; import static java.lang.String.format; import static java.time.ZoneOffset.UTC; import static java.util.concurrent.TimeUnit.DAYS; import static java.util.stream.Collectors.toSet; import static org.testng.Assert.assertEquals; import static org.testng.Assert.assertFalse; import static org.testng.Assert.fail; @Test(singleThreaded = true) public class TestDatabaseShardManager { private IDBI dbi; private Handle dummyHandle; private File dataDir; private ShardManager shardManager; @BeforeMethod public void setup() { dbi = new DBI("jdbc:h2:mem:test" + System.nanoTime()); dummyHandle = dbi.open(); createTablesWithRetry(dbi); dataDir = Files.createTempDir(); shardManager = createShardManager(dbi); } @AfterMethod public void teardown() { dummyHandle.close(); FileUtils.deleteRecursively(dataDir); } @Test public void testCommit() throws Exception { long tableId = createTable("test"); List<ShardInfo> shards = ImmutableList.<ShardInfo>builder() .add(shardInfo(UUID.randomUUID(), "node1")) .add(shardInfo(UUID.randomUUID(), "node1")) .add(shardInfo(UUID.randomUUID(), "node2")) .build(); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, shards, Optional.empty(), 0); Set<ShardNodes> actual = getShardNodes(tableId, TupleDomain.all()); assertEquals(actual, toShardNodes(shards)); } @Test public void testRollback() { long tableId = createTable("test"); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); List<ShardInfo> shards = ImmutableList.of(shardInfo(UUID.randomUUID(), "node1")); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.rollbackTransaction(transactionId); try { shardManager.commitShards(transactionId, tableId, columns, shards, Optional.empty(), 0); fail("expected exception"); } catch (PrestoException e) { assertEquals(e.getErrorCode(), TRANSACTION_CONFLICT.toErrorCode()); } } @Test public void testAssignShard() { long tableId = createTable("test"); UUID shard = UUID.randomUUID(); List<ShardInfo> shardNodes = ImmutableList.of(shardInfo(shard, "node1")); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, shardNodes, Optional.empty(), 0); ShardNodes actual = getOnlyElement(getShardNodes(tableId, TupleDomain.all())); assertEquals(actual, new ShardNodes(shard, ImmutableSet.of("node1"))); try { shardManager.assignShard(tableId, shard, "node2", true); fail("expected exception"); } catch (PrestoException e) { assertEquals(e.getErrorCode(), SERVER_STARTING_UP.toErrorCode()); } shardManager.assignShard(tableId, shard, "node2", false); // assign shard to another node actual = getOnlyElement(getShardNodes(tableId, TupleDomain.all())); assertEquals(actual, new ShardNodes(shard, ImmutableSet.of("node1", "node2"))); // assigning a shard should be idempotent shardManager.assignShard(tableId, shard, "node2", false); // remove assignment from first node shardManager.unassignShard(tableId, shard, "node1"); actual = getOnlyElement(getShardNodes(tableId, TupleDomain.all())); assertEquals(actual, new ShardNodes(shard, ImmutableSet.of("node2"))); // removing an assignment should be idempotent shardManager.unassignShard(tableId, shard, "node1"); } @Test public void testGetNodeBytes() { long tableId = createTable("test"); OptionalInt bucketNumber = OptionalInt.empty(); UUID shard1 = UUID.randomUUID(); UUID shard2 = UUID.randomUUID(); List<ShardInfo> shardNodes = ImmutableList.of( new ShardInfo(shard1, bucketNumber, ImmutableSet.of("node1"), ImmutableList.of(), 3, 33, 333), new ShardInfo(shard2, bucketNumber, ImmutableSet.of("node1"), ImmutableList.of(), 5, 55, 555)); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, shardNodes, Optional.empty(), 0); assertEquals(getShardNodes(tableId, TupleDomain.all()), ImmutableSet.of( new ShardNodes(shard1, ImmutableSet.of("node1")), new ShardNodes(shard2, ImmutableSet.of("node1")))); assertEquals(shardManager.getNodeBytes(), ImmutableMap.of("node1", 88L)); shardManager.assignShard(tableId, shard1, "node2", false); assertEquals(getShardNodes(tableId, TupleDomain.all()), ImmutableSet.of( new ShardNodes(shard1, ImmutableSet.of("node1", "node2")), new ShardNodes(shard2, ImmutableSet.of("node1")))); assertEquals(shardManager.getNodeBytes(), ImmutableMap.of("node1", 88L, "node2", 33L)); } @Test public void testGetNodeTableShards() throws Exception { long tableId = createTable("test"); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); List<String> nodes = ImmutableList.of("node1", "node2", "node3"); ImmutableList.Builder<ShardInfo> inputShards = ImmutableList.builder(); Multimap<String, UUID> nodeShardMap = HashMultimap.create(); for (String node : nodes) { UUID uuid = UUID.randomUUID(); nodeShardMap.put(node, uuid); inputShards.add(shardInfo(uuid, node)); } shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, inputShards.build(), Optional.empty(), 0); for (String node : nodes) { Set<ShardMetadata> shardMetadata = shardManager.getNodeShards(node); Set<UUID> expectedUuids = ImmutableSet.copyOf(nodeShardMap.get(node)); Set<UUID> actualUuids = shardMetadata.stream().map(ShardMetadata::getShardUuid).collect(toSet()); assertEquals(actualUuids, expectedUuids); } } @Test public void testGetExistingShards() throws Exception { long tableId = createTable("test"); UUID shard1 = UUID.randomUUID(); UUID shard2 = UUID.randomUUID(); List<ShardInfo> shardNodes = ImmutableList.of(shardInfo(shard1, "node1"), shardInfo(shard2, "node1")); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, shardNodes, Optional.empty(), 0); Set<UUID> actual = shardManager.getExistingShardUuids(tableId, ImmutableSet.of(shard1, shard2, UUID.randomUUID())); Set<UUID> expected = ImmutableSet.of(shard1, shard2); assertEquals(actual, expected); } @Test public void testReplaceShardUuids() throws Exception { long tableId = createTable("test"); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); List<String> nodes = ImmutableList.of("node1", "node2", "node3"); List<UUID> originalUuids = ImmutableList.of(UUID.randomUUID(), UUID.randomUUID(), UUID.randomUUID()); List<ShardInfo> oldShards = ImmutableList.<ShardInfo>builder() .add(shardInfo(originalUuids.get(0), nodes.get(0))) .add(shardInfo(originalUuids.get(1), nodes.get(1))) .add(shardInfo(originalUuids.get(2), nodes.get(2))) .build(); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, oldShards, Optional.empty(), 0); List<UUID> expectedUuids = ImmutableList.of(UUID.randomUUID(), UUID.randomUUID()); List<ShardInfo> newShards = ImmutableList.<ShardInfo>builder() .add(shardInfo(expectedUuids.get(0), nodes.get(0))) .add(shardInfo(expectedUuids.get(1), nodes.get(0))) .build(); Set<ShardMetadata> shardMetadata = shardManager.getNodeShards(nodes.get(0)); Set<UUID> replacedUuids = shardMetadata.stream().map(ShardMetadata::getShardUuid).collect(toSet()); transactionId = shardManager.beginTransaction(); shardManager.replaceShardUuids(transactionId, tableId, columns, replacedUuids, newShards, OptionalLong.of(0)); shardMetadata = shardManager.getNodeShards(nodes.get(0)); Set<UUID> actualUuids = shardMetadata.stream().map(ShardMetadata::getShardUuid).collect(toSet()); assertEquals(actualUuids, ImmutableSet.copyOf(expectedUuids)); // Compute expected all uuids for this table Set<UUID> expectedAllUuids = new HashSet<>(originalUuids); expectedAllUuids.removeAll(replacedUuids); expectedAllUuids.addAll(expectedUuids); // check that shards are replaced in index table as well Set<BucketShards> shardNodes = ImmutableSet.copyOf(shardManager.getShardNodes(tableId, TupleDomain.all())); Set<UUID> actualAllUuids = shardNodes.stream() .map(BucketShards::getShards) .flatMap(Collection::stream) .map(ShardNodes::getShardUuid) .collect(toSet()); assertEquals(actualAllUuids, expectedAllUuids); // verify that conflicting updates are handled newShards = ImmutableList.of(shardInfo(UUID.randomUUID(), nodes.get(0))); try { transactionId = shardManager.beginTransaction(); shardManager.replaceShardUuids(transactionId, tableId, columns, replacedUuids, newShards, OptionalLong.of(0)); fail("expected exception"); } catch (PrestoException e) { assertEquals(e.getErrorCode(), TRANSACTION_CONFLICT.toErrorCode()); } } @Test public void testExternalBatches() throws Exception { long tableId = createTable("test"); Optional<String> externalBatchId = Optional.of("foo"); List<ShardInfo> shards = ImmutableList.of(shardInfo(UUID.randomUUID(), "node1")); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, shards, externalBatchId, 0); shards = ImmutableList.of(shardInfo(UUID.randomUUID(), "node1")); try { transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, shards, externalBatchId, 0); fail("expected external batch exception"); } catch (PrestoException e) { assertEquals(e.getErrorCode(), RAPTOR_EXTERNAL_BATCH_ALREADY_EXISTS.toErrorCode()); } } @Test public void testBucketAssignments() { Node node1 = createTestingNode(); Node node2 = createTestingNode(); Node node3 = createTestingNode(); TestingTicker ticker = new TestingTicker(); MetadataDao metadataDao = dbi.onDemand(MetadataDao.class); int bucketCount = 13; long distributionId = metadataDao.insertDistribution(null, "test", bucketCount); Set<Node> originalNodes = ImmutableSet.of(node1, node2); ShardManager shardManager = createShardManager(dbi, () -> originalNodes, ticker); shardManager.createBuckets(distributionId, bucketCount); Map<Integer, String> assignments = shardManager.getBucketAssignments(distributionId); assertEquals(assignments.size(), bucketCount); assertEquals(ImmutableSet.copyOf(assignments.values()), nodeIds(originalNodes)); Set<Node> newNodes = ImmutableSet.of(node1, node3); shardManager = createShardManager(dbi, () -> newNodes, ticker); try { shardManager.getBucketAssignments(distributionId); fail("expected exception"); } catch (PrestoException e) { assertEquals(e.getErrorCode(), SERVER_STARTING_UP.toErrorCode()); } ticker.increment(2, DAYS); assignments = shardManager.getBucketAssignments(distributionId); assertEquals(assignments.size(), bucketCount); assertEquals(ImmutableSet.copyOf(assignments.values()), nodeIds(newNodes)); } @Test public void testEmptyTable() { long tableId = createTable("test"); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); try (ResultIterator<BucketShards> iterator = shardManager.getShardNodes(tableId, TupleDomain.all())) { assertFalse(iterator.hasNext()); } } @Test public void testEmptyTableBucketed() { long tableId = createTable("test"); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); shardManager.createTable(tableId, columns, true, OptionalLong.empty()); try (ResultIterator<BucketShards> iterator = shardManager.getShardNodesBucketed(tableId, true, ImmutableMap.of(), TupleDomain.all())) { assertFalse(iterator.hasNext()); } } @Test public void testTemporalColumnTableCreation() throws Exception { long tableId = createTable("test"); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, TIMESTAMP)); shardManager.createTable(tableId, columns, false, OptionalLong.of(1)); long tableId2 = createTable("test2"); List<ColumnInfo> columns2 = ImmutableList.of(new ColumnInfo(1, TIMESTAMP)); shardManager.createTable(tableId2, columns2, true, OptionalLong.of(1)); } @Test public void testShardPruning() throws Exception { ShardInfo shard1 = shardInfo( UUID.randomUUID(), "node1", ImmutableList.<ColumnStats>builder() .add(new ColumnStats(1, 5, 10)) .add(new ColumnStats(2, -20.0, 20.0)) .add(new ColumnStats(3, date(2013, 5, 11), date(2013, 6, 13))) .add(new ColumnStats(4, timestamp(2013, 5, 11, 4, 5, 6), timestamp(2013, 6, 13, 7, 8, 9))) .add(new ColumnStats(5, "hello", "world")) .add(new ColumnStats(6, false, true)) .build()); ShardInfo shard2 = shardInfo( UUID.randomUUID(), "node2", ImmutableList.<ColumnStats>builder() .add(new ColumnStats(1, 2, 8)) .add(new ColumnStats(2, null, 50.0)) .add(new ColumnStats(3, date(2012, 1, 1), date(2012, 12, 31))) .add(new ColumnStats(4, timestamp(2012, 1, 1, 2, 3, 4), timestamp(2012, 12, 31, 5, 6, 7))) .add(new ColumnStats(5, "cat", "dog")) .add(new ColumnStats(6, true, true)) .build()); ShardInfo shard3 = shardInfo( UUID.randomUUID(), "node3", ImmutableList.<ColumnStats>builder() .add(new ColumnStats(1, 15, 20)) .add(new ColumnStats(2, null, null)) .add(new ColumnStats(3, date(2013, 4, 1), date(2013, 6, 1))) .add(new ColumnStats(4, timestamp(2013, 4, 1, 8, 7, 6), timestamp(2013, 6, 1, 6, 5, 4))) .add(new ColumnStats(5, "grape", "orange")) .add(new ColumnStats(6, false, false)) .build()); List<ShardInfo> shards = ImmutableList.<ShardInfo>builder() .add(shard1) .add(shard2) .add(shard3) .build(); List<ColumnInfo> columns = ImmutableList.<ColumnInfo>builder() .add(new ColumnInfo(1, BIGINT)) .add(new ColumnInfo(2, DOUBLE)) .add(new ColumnInfo(3, DATE)) .add(new ColumnInfo(4, TIMESTAMP)) .add(new ColumnInfo(5, createVarcharType(10))) .add(new ColumnInfo(6, BOOLEAN)) .add(new ColumnInfo(7, VARBINARY)) .build(); RaptorColumnHandle c1 = new RaptorColumnHandle("raptor", "c1", 1, BIGINT); RaptorColumnHandle c2 = new RaptorColumnHandle("raptor", "c2", 2, DOUBLE); RaptorColumnHandle c3 = new RaptorColumnHandle("raptor", "c3", 3, DATE); RaptorColumnHandle c4 = new RaptorColumnHandle("raptor", "c4", 4, TIMESTAMP); RaptorColumnHandle c5 = new RaptorColumnHandle("raptor", "c5", 5, createVarcharType(10)); RaptorColumnHandle c6 = new RaptorColumnHandle("raptor", "c6", 6, BOOLEAN); long tableId = createTable("test"); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, shards, Optional.empty(), 0); shardAssertion(tableId).expected(shards); shardAssertion(tableId).equal(c1, BIGINT, 3L).expected(shard2); shardAssertion(tableId).equal(c1, BIGINT, 8L).expected(shard1, shard2); shardAssertion(tableId).equal(c1, BIGINT, 9L).expected(shard1); shardAssertion(tableId).equal(c1, BIGINT, 13L).expected(); shardAssertion(tableId).between(c1, BIGINT, 8L, 14L).expected(shard1, shard2); shardAssertion(tableId).between(c1, BIGINT, 8L, 15L).expected(shards); shardAssertion(tableId).between(c1, BIGINT, 8L, 16L).expected(shards); shardAssertion(tableId).between(c1, BIGINT, 12L, 14L).expected(); shardAssertion(tableId).between(c1, BIGINT, 5L, 10L).expected(shard1, shard2); shardAssertion(tableId).between(c1, BIGINT, 16L, 18L).expected(shard3); shardAssertion(tableId).between(c1, BIGINT, 1L, 25L).expected(shards); shardAssertion(tableId).between(c1, BIGINT, 4L, 12L).expected(shard1, shard2); shardAssertion(tableId).range(c1, lessThan(BIGINT, 5L)).expected(shard1, shard2); shardAssertion(tableId).range(c1, lessThan(BIGINT, 4L)).expected(shard2); shardAssertion(tableId).range(c1, lessThan(BIGINT, 11L)).expected(shard1, shard2); shardAssertion(tableId).range(c1, lessThan(BIGINT, 25L)).expected(shards); shardAssertion(tableId).range(c1, greaterThan(BIGINT, 1L)).expected(shards); shardAssertion(tableId).range(c1, greaterThan(BIGINT, 8L)).expected(shards); shardAssertion(tableId).range(c1, greaterThan(BIGINT, 9L)).expected(shard1, shard3); shardAssertion(tableId) .between(c1, BIGINT, -25L, 25L) .between(c2, DOUBLE, -1000.0, 1000.0) .between(c3, BIGINT, 0L, 50000L) .between(c4, TIMESTAMP, 0L, timestamp(2015, 1, 2, 3, 4, 5)) .between(c5, createVarcharType(10), utf8Slice("a"), utf8Slice("zzzzz")) .between(c6, BOOLEAN, false, true) .expected(shards); shardAssertion(tableId) .between(c1, BIGINT, 4L, 12L) .between(c3, DATE, date(2013, 3, 3), date(2013, 5, 25)) .expected(shard1); shardAssertion(tableId).equal(c2, DOUBLE, 25.0).expected(shard2, shard3); shardAssertion(tableId).equal(c2, DOUBLE, 50.1).expected(shard3); shardAssertion(tableId).equal(c3, DATE, date(2013, 5, 12)).expected(shard1, shard3); shardAssertion(tableId).range(c4, greaterThan(TIMESTAMP, timestamp(2013, 1, 1, 0, 0, 0))).expected(shard1, shard3); shardAssertion(tableId).between(c5, createVarcharType(10), utf8Slice("cow"), utf8Slice("milk")).expected(shards); shardAssertion(tableId).equal(c5, createVarcharType(10), utf8Slice("fruit")).expected(); shardAssertion(tableId).equal(c5, createVarcharType(10), utf8Slice("pear")).expected(shard1); shardAssertion(tableId).equal(c5, createVarcharType(10), utf8Slice("cat")).expected(shard2); shardAssertion(tableId).range(c5, greaterThan(createVarcharType(10), utf8Slice("gum"))).expected(shard1, shard3); shardAssertion(tableId).range(c5, lessThan(createVarcharType(10), utf8Slice("air"))).expected(); shardAssertion(tableId).equal(c6, BOOLEAN, true).expected(shard1, shard2); shardAssertion(tableId).equal(c6, BOOLEAN, false).expected(shard1, shard3); shardAssertion(tableId).range(c6, greaterThanOrEqual(BOOLEAN, false)).expected(shards); shardAssertion(tableId).range(c6, lessThan(BOOLEAN, true)).expected(shards); shardAssertion(tableId).range(c6, lessThan(BOOLEAN, false)).expected(shard1, shard3); // TODO: support multiple ranges shardAssertion(tableId) .domain(c1, createDomain(lessThan(BIGINT, 0L), greaterThan(BIGINT, 25L))) .expected(shards); } @Test public void testShardPruningTruncatedValues() throws Exception { String prefix = repeat("x", MAX_BINARY_INDEX_SIZE); ColumnStats stats = new ColumnStats(1, prefix + "a", prefix + "z"); ShardInfo shard = shardInfo(UUID.randomUUID(), "node", ImmutableList.of(stats)); List<ShardInfo> shards = ImmutableList.of(shard); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, createVarcharType(10))); RaptorColumnHandle c1 = new RaptorColumnHandle("raptor", "c1", 1, createVarcharType(10)); long tableId = createTable("test"); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, shards, Optional.empty(), 0); shardAssertion(tableId).expected(shards); shardAssertion(tableId).equal(c1, createVarcharType(10), utf8Slice(prefix)).expected(shards); shardAssertion(tableId).equal(c1, createVarcharType(10), utf8Slice(prefix + "c")).expected(shards); shardAssertion(tableId).range(c1, lessThan(createVarcharType(10), utf8Slice(prefix + "c"))).expected(shards); shardAssertion(tableId).range(c1, greaterThan(createVarcharType(10), utf8Slice(prefix + "zzz"))).expected(shards); shardAssertion(tableId).between(c1, createVarcharType(10), utf8Slice("w"), utf8Slice("y")).expected(shards); shardAssertion(tableId).range(c1, greaterThan(createVarcharType(10), utf8Slice("x"))).expected(shards); shardAssertion(tableId).between(c1, createVarcharType(10), utf8Slice("x"), utf8Slice("x")).expected(); shardAssertion(tableId).range(c1, lessThan(createVarcharType(10), utf8Slice("w"))).expected(); shardAssertion(tableId).range(c1, lessThan(createVarcharType(10), utf8Slice("x"))).expected(); shardAssertion(tableId).range(c1, greaterThan(createVarcharType(10), utf8Slice("y"))).expected(); Slice shorter = utf8Slice(prefix.substring(0, prefix.length() - 1)); shardAssertion(tableId).equal(c1, createVarcharType(10), shorter).expected(); shardAssertion(tableId).range(c1, lessThan(createVarcharType(10), shorter)).expected(); shardAssertion(tableId).range(c1, greaterThan(createVarcharType(10), shorter)).expected(shards); } @Test public void testShardPruningNoStats() throws Exception { ShardInfo shard = shardInfo(UUID.randomUUID(), "node"); List<ShardInfo> shards = ImmutableList.of(shard); long tableId = createTable("test"); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); RaptorColumnHandle c1 = new RaptorColumnHandle("raptor", "c1", 1, BIGINT); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); long transactionId = shardManager.beginTransaction(); shardManager.commitShards(transactionId, tableId, columns, shards, Optional.empty(), 0); shardAssertion(tableId).expected(shards); shardAssertion(tableId).equal(c1, BIGINT, 3L).expected(shards); } @Test public void testAddNewColumn() throws Exception { long tableId = createTable("test"); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); int before = columnCount(tableId); ColumnInfo newColumn = new ColumnInfo(2, BIGINT); shardManager.addColumn(tableId, newColumn); int after = columnCount(tableId); // should be 2 more: min and max columns assertEquals(after, before + 2); } @Test public void testAddDuplicateColumn() throws Exception { long tableId = createTable("test"); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); shardManager.createTable(tableId, columns, false, OptionalLong.empty()); int before = columnCount(tableId); shardManager.addColumn(tableId, columns.get(0)); int after = columnCount(tableId); // no error, no columns added assertEquals(after, before); } @Test public void testMaintenanceBlocked() { long tableId = createTable("test"); List<ColumnInfo> columns = ImmutableList.of(new ColumnInfo(1, BIGINT)); Set<UUID> oldShards = ImmutableSet.of(UUID.randomUUID()); dbi.onDemand(MetadataDao.class).blockMaintenance(tableId); long transactionId = shardManager.beginTransaction(); try { shardManager.replaceShardUuids(transactionId, tableId, columns, oldShards, ImmutableSet.of(), OptionalLong.empty()); fail("expected exception"); } catch (PrestoException e) { assertEquals(e.getErrorCode(), TRANSACTION_CONFLICT.toErrorCode()); assertEquals(e.getMessage(), "Maintenance is blocked for table"); } } private Set<ShardNodes> getShardNodes(long tableId, TupleDomain<RaptorColumnHandle> predicate) { try (ResultIterator<BucketShards> iterator = shardManager.getShardNodes(tableId, predicate)) { return ImmutableSet.copyOf(concat(transform(iterator, i -> i.getShards().iterator()))); } } private long createTable(String name) { return dbi.onDemand(MetadataDao.class).insertTable("test", name, false, false, null, 0); } public static ShardInfo shardInfo(UUID shardUuid, String nodeIdentifier) { return shardInfo(shardUuid, nodeIdentifier, ImmutableList.of()); } public static ShardInfo shardInfo(UUID shardUuid, String nodeId, List<ColumnStats> columnStats) { return new ShardInfo(shardUuid, OptionalInt.empty(), ImmutableSet.of(nodeId), columnStats, 0, 0, 0); } private static Set<ShardNodes> toShardNodes(List<ShardInfo> shards) { return shards.stream() .map(shard -> new ShardNodes(shard.getShardUuid(), shard.getNodeIdentifiers())) .collect(toSet()); } public static ShardManager createShardManager(IDBI dbi) { return createShardManager(dbi, ImmutableSet::of, systemTicker()); } public static ShardManager createShardManager(IDBI dbi, NodeSupplier nodeSupplier) { return createShardManager(dbi, nodeSupplier, systemTicker()); } public static ShardManager createShardManager(IDBI dbi, NodeSupplier nodeSupplier, Ticker ticker) { DaoSupplier<ShardDao> shardDaoSupplier = new DaoSupplier<>(dbi, H2ShardDao.class); AssignmentLimiter assignmentLimiter = new AssignmentLimiter(nodeSupplier, ticker, new MetadataConfig()); return new DatabaseShardManager(dbi, shardDaoSupplier, nodeSupplier, assignmentLimiter, ticker, new Duration(1, DAYS)); } private static Domain createDomain(Range first, Range... ranges) { return Domain.create(ValueSet.ofRanges(first, ranges), false); } private ShardAssertion shardAssertion(long tableId) { return new ShardAssertion(tableId); } private class ShardAssertion { private final Map<RaptorColumnHandle, Domain> domains = new HashMap<>(); private final long tableId; public ShardAssertion(long tableId) { this.tableId = tableId; } public ShardAssertion domain(RaptorColumnHandle column, Domain domain) { domains.put(column, domain); return this; } public ShardAssertion range(RaptorColumnHandle column, Range range) { return domain(column, createDomain(range)); } public ShardAssertion equal(RaptorColumnHandle column, Type type, Object value) { return domain(column, Domain.singleValue(type, value)); } public ShardAssertion between(RaptorColumnHandle column, Type type, Object low, Object high) { return range(column, Range.range(type, low, true, high, true)); } public void expected(ShardInfo... shards) { expected(ImmutableList.copyOf(shards)); } public void expected(List<ShardInfo> shards) { TupleDomain<RaptorColumnHandle> predicate = TupleDomain.withColumnDomains(domains); Set<ShardNodes> actual = getShardNodes(tableId, predicate); assertEquals(actual, toShardNodes(shards)); } } private static long date(int year, int month, int day) { return LocalDate.of(year, month, day).toEpochDay(); } private static long timestamp(int year, int month, int day, int hour, int minute, int second) { return ZonedDateTime.of(year, month, day, hour, minute, second, 0, UTC).toInstant().toEpochMilli(); } private static Set<String> nodeIds(Collection<Node> nodes) { return nodes.stream().map(Node::getNodeIdentifier).collect(toSet()); } private static Node createTestingNode() { return new PrestoNode(UUID.randomUUID().toString(), URI.create("http://test"), NodeVersion.UNKNOWN, false); } private int columnCount(long tableId) throws SQLException { try (Statement statement = dummyHandle.getConnection().createStatement()) { try (ResultSet rs = statement.executeQuery(format("SELECT * FROM %s LIMIT 0", shardIndexTable(tableId)))) { return rs.getMetaData().getColumnCount(); } } } }