/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.ignite.internal.managers.checkpoint; import java.io.Serializable; import java.util.Arrays; import java.util.Collection; import java.util.Collections; import java.util.List; import java.util.concurrent.CountDownLatch; import java.util.concurrent.atomic.AtomicInteger; import org.apache.ignite.Ignite; import org.apache.ignite.IgniteException; import org.apache.ignite.compute.ComputeJob; import org.apache.ignite.compute.ComputeJobAdapter; import org.apache.ignite.compute.ComputeJobResult; import org.apache.ignite.compute.ComputeTaskFuture; import org.apache.ignite.compute.ComputeTaskSession; import org.apache.ignite.compute.ComputeTaskSessionFullSupport; import org.apache.ignite.compute.ComputeTaskSplitAdapter; import org.apache.ignite.configuration.CacheConfiguration; import org.apache.ignite.configuration.IgniteConfiguration; import org.apache.ignite.events.CheckpointEvent; import org.apache.ignite.events.Event; import org.apache.ignite.internal.IgniteInterruptedCheckedException; import org.apache.ignite.internal.IgniteKernal; import org.apache.ignite.internal.util.lang.GridAbsClosure; import org.apache.ignite.internal.util.lang.GridAbsClosureX; import org.apache.ignite.internal.util.typedef.G; import org.apache.ignite.internal.util.typedef.X; import org.apache.ignite.lang.IgnitePredicate; import org.apache.ignite.lang.IgniteUuid; import org.apache.ignite.mxbean.IgniteMXBean; import org.apache.ignite.resources.IgniteInstanceResource; import org.apache.ignite.resources.TaskSessionResource; import org.apache.ignite.spi.checkpoint.cache.CacheCheckpointSpi; import org.apache.ignite.spi.checkpoint.jdbc.JdbcCheckpointSpi; import org.apache.ignite.spi.discovery.tcp.TcpDiscoverySpi; import org.apache.ignite.spi.discovery.tcp.ipfinder.TcpDiscoveryIpFinder; import org.apache.ignite.spi.discovery.tcp.ipfinder.vm.TcpDiscoveryVmIpFinder; import org.apache.ignite.testframework.GridTestUtils; import org.apache.ignite.testframework.junits.common.GridCommonAbstractTest; import org.hsqldb.jdbc.jdbcDataSource; import org.jetbrains.annotations.Nullable; import static org.apache.ignite.cache.CacheWriteSynchronizationMode.FULL_SYNC; import static org.apache.ignite.compute.ComputeTaskSessionScope.GLOBAL_SCOPE; import static org.apache.ignite.compute.ComputeTaskSessionScope.SESSION_SCOPE; import static org.apache.ignite.events.EventType.EVT_CHECKPOINT_LOADED; import static org.apache.ignite.events.EventType.EVT_CHECKPOINT_REMOVED; import static org.apache.ignite.events.EventType.EVT_CHECKPOINT_SAVED; /** * */ public abstract class GridCheckpointManagerAbstractSelfTest extends GridCommonAbstractTest { /** */ private static volatile CountDownLatch startLatch; /** */ private static volatile CountDownLatch read1Latch; /** */ private static volatile CountDownLatch read1FinishedLatch; /** */ private static volatile CountDownLatch read2Latch; /** */ private static volatile CountDownLatch read2FinishedLatch; /** */ private static volatile CountDownLatch read3Latch; /** */ private static volatile CountDownLatch read3FinishedLatch; /** */ private static volatile CountDownLatch rmvLatch; /** */ private static final String GLOBAL_KEY = "test-checkpoint-globalKey"; /** */ private static final String GLOBAL_VAL = "test-checkpoint-globalVal"; /** */ private static final String GLOBAL_VAL_OVERWRITTEN = GLOBAL_VAL + "-overwritten"; /** */ private static final String SES_KEY = "test-checkpoint-sesKey"; /** */ private static final String SES_VAL = "test-checkpoint-sesVal"; /** */ private static final String SES_VAL_OVERWRITTEN = SES_VAL + "-overwritten"; /** IP finder. */ private static final TcpDiscoveryIpFinder IP_FINDER = new TcpDiscoveryVmIpFinder(true); /** * Static variable to control whether test should retry checkpoint read attempts. * It is needed for s3-based tests because of weak s3 consistency model. */ @SuppressWarnings("RedundantFieldInitialization") protected static int retries = 0; /** * Returns checkpoint manager instance for given Grid. * * @param ignite Grid instance. * @return Checkpoint manager. */ private GridCheckpointManager checkpoints(Ignite ignite) { assert ignite != null; return ((IgniteKernal) ignite).context().checkpoint(); } /** {@inheritDoc} */ @Override protected IgniteConfiguration getConfiguration(String igniteInstanceName) throws Exception { assert igniteInstanceName != null; IgniteConfiguration cfg = super.getConfiguration(igniteInstanceName); TcpDiscoverySpi discoSpi = new TcpDiscoverySpi(); discoSpi.setIpFinder(IP_FINDER); cfg.setDiscoverySpi(discoSpi); if (igniteInstanceName.contains("cache")) { String cacheName = "test-checkpoints"; CacheConfiguration cacheCfg = defaultCacheConfiguration(); cacheCfg.setName(cacheName); cacheCfg.setWriteSynchronizationMode(FULL_SYNC); CacheCheckpointSpi spi = new CacheCheckpointSpi(); spi.setCacheName(cacheName); cfg.setCacheConfiguration(cacheCfg); cfg.setCheckpointSpi(spi); } else if (igniteInstanceName.contains("jdbc")) { JdbcCheckpointSpi spi = new JdbcCheckpointSpi(); jdbcDataSource ds = new jdbcDataSource(); ds.setDatabase("jdbc:hsqldb:mem:gg_test_" + getClass().getSimpleName()); ds.setUser("sa"); ds.setPassword(""); spi.setDataSource(ds); spi.setCheckpointTableName("test_checkpoints"); spi.setKeyFieldName("key"); spi.setValueFieldName("value"); spi.setValueFieldType("longvarbinary"); spi.setExpireDateFieldName("expire_date"); cfg.setCheckpointSpi(spi); } return cfg; } /** * @param igniteInstanceName Ignite instance name. * @throws Exception If test failed. */ protected void doTest(String igniteInstanceName) throws Exception { final AtomicInteger savedCnt = new AtomicInteger(); final AtomicInteger loadedCnt = new AtomicInteger(); final AtomicInteger rmvCnt = new AtomicInteger(); try { Ignite ignite = startGrid(igniteInstanceName); ignite.events().localListen(new IgnitePredicate<Event>() { @Override public boolean apply(Event evt) { assert evt instanceof CheckpointEvent; CheckpointEvent e = (CheckpointEvent) evt; info("Checkpoint event: " + e); switch (evt.type()) { case EVT_CHECKPOINT_SAVED: { savedCnt.incrementAndGet(); break; } case EVT_CHECKPOINT_LOADED: { loadedCnt.incrementAndGet(); break; } case EVT_CHECKPOINT_REMOVED: { rmvCnt.incrementAndGet(); break; } } return true; } }, EVT_CHECKPOINT_SAVED, EVT_CHECKPOINT_LOADED, EVT_CHECKPOINT_REMOVED); executeAsync(ignite.compute(), GridTestCheckpointTask.class, null).get(2 * 60 * 1000); assert checkCheckpointManager(ignite) : "Session IDs got stuck after task completion: " + checkpoints(ignite).sessionIds(); } finally { stopGrid(igniteInstanceName); } assertEquals(8, savedCnt.get()); assertEquals(10, loadedCnt.get()); if ("jdbc".equals(igniteInstanceName)) assertEquals(5, rmvCnt.get()); else assertEquals(6, rmvCnt.get()); } /** * @param igniteInstanceName Ignite instance name. * @throws Exception If test failed. */ protected void doMultiNodeTest(String igniteInstanceName) throws Exception { startLatch = new CountDownLatch(3); read1Latch = new CountDownLatch(1); read1FinishedLatch = new CountDownLatch(2); read2Latch = new CountDownLatch(1); read2FinishedLatch = new CountDownLatch(2); read3Latch = new CountDownLatch(1); read3FinishedLatch = new CountDownLatch(2); rmvLatch = new CountDownLatch(1); try { startGrid(igniteInstanceName + 1); Ignite ignite = startGrid(igniteInstanceName); ComputeTaskFuture fut = executeAsync(ignite.compute(), new GridMultiNodeGlobalConsumerTask(), null); executeAsync(ignite.compute(), GridMultiNodeTestCheckPointTask.class, null).get(2 * 60 * 1000); fut.get(); for (Ignite g : G.allGrids()) { assert checkCheckpointManager(g) : "Session IDs got stuck after task completion [igniteInstanceName=" + g.name() + ", sesIds=" + checkpoints(g).sessionIds() + ']'; } } finally { stopAllGrids(); } } /** * @param g Grid. * @return {@code True} if checkpoint manager is OK. * @throws Exception If failed. */ @SuppressWarnings( {"BusyWait"}) private boolean checkCheckpointManager(Ignite g) throws Exception { int i = 0; while (true) { Collection<IgniteUuid> sesIds = checkpoints(g).sessionIds(); if (sesIds.isEmpty()) return true; if (++i == 3) return false; Thread.sleep(1000); } } /** * Test job. */ private static class GridTestCheckpointJob extends ComputeJobAdapter { /** */ @IgniteInstanceResource private Ignite ignite; /** */ @TaskSessionResource private ComputeTaskSession taskSes; /** {@inheritDoc} */ @SuppressWarnings({"TooBroadScope"}) @Override public String execute() { assert ignite != null; assert taskSes != null; final String key1 = "test-checkpoint-key1"; final String val1 = "test-checkpoint-value1"; final String key2 = "test-checkpoint-key2"; final String val2 = "test-checkpoint-value2"; String key3 = "test-checkpoint-key3"; String val3 = "test-checkpoint-value3"; taskSes.saveCheckpoint(key1, val1, GLOBAL_SCOPE, 0); taskSes.saveCheckpoint(key2, val2, SESSION_SCOPE, 0); assertWithRetries(new GridAbsClosureX() { @Override public void applyx() { assert val1.equals(taskSes.loadCheckpoint(key1)); assert val2.equals(taskSes.loadCheckpoint(key2)); } }); // Don't overwrite. taskSes.saveCheckpoint(key1, val2, GLOBAL_SCOPE, 0, false); taskSes.saveCheckpoint(key2, val1, SESSION_SCOPE, 0, false); assertWithRetries(new GridAbsClosureX() { @Override public void applyx() { assert val1.equals(taskSes.loadCheckpoint(key1)); assert val2.equals(taskSes.loadCheckpoint(key2)); } }); taskSes.saveCheckpoint(key1, val2, GLOBAL_SCOPE, 0, true); taskSes.saveCheckpoint(key2, val1, SESSION_SCOPE, 0, true); assertWithRetries(new GridAbsClosureX() { @Override public void applyx() { assert val2.equals(taskSes.loadCheckpoint(key1)); assert val1.equals(taskSes.loadCheckpoint(key2)); } }); assert taskSes.removeCheckpoint(key1); assert taskSes.removeCheckpoint(key2); assert !taskSes.removeCheckpoint(key1); assert !taskSes.removeCheckpoint(key2); assertWithRetries(new GridAbsClosureX() { @Override public void applyx() { assert taskSes.loadCheckpoint(key1) == null; assert taskSes.loadCheckpoint(key2) == null; } }); taskSes.saveCheckpoint(key1, val1, GLOBAL_SCOPE, 0); ((IgniteMXBean) ignite).removeCheckpoint(key1); // This checkpoint will not be automatically removed for cache SPI. taskSes.saveCheckpoint(key1, val1, GLOBAL_SCOPE, 5000); // This will be automatically removed by cache SPI. taskSes.saveCheckpoint(key2, val2, SESSION_SCOPE, 5000); try { Thread.sleep(6000); } catch (InterruptedException e) { throw new IgniteException(e); } assertWithRetries(new GridAbsClosureX() { @Override public void applyx() { assert taskSes.loadCheckpoint(key1) == null; assert taskSes.loadCheckpoint(key2) == null; } }); // This checkpoint will be removed when task session end. taskSes.saveCheckpoint(key3, val3, SESSION_SCOPE, 0); return null; } } /** * Test task. */ @ComputeTaskSessionFullSupport private static class GridTestCheckpointTask extends ComputeTaskSplitAdapter<Object, Object> { /** {@inheritDoc} */ @Override protected Collection<? extends ComputeJob> split(int gridSize, Object arg) { return Collections.singleton(new GridTestCheckpointJob()); } /** {@inheritDoc} */ @Override public Serializable reduce(List<ComputeJobResult> results) { return null; } } /** * Multi-node test consumer job. */ private static class GridMultiNodeTestCheckpointProducerJob extends ComputeJobAdapter { /** */ @IgniteInstanceResource private Ignite ignite; /** */ @TaskSessionResource private ComputeTaskSession taskSes; /** {@inheritDoc} */ @Override public String execute() { assert ignite != null; assert taskSes != null; assert startLatch != null; assert read1Latch != null; assert read2Latch != null; assert read3Latch != null; assert read1FinishedLatch != null; assert read2FinishedLatch != null; assert read3FinishedLatch != null; assert rmvLatch != null; startLatch.countDown(); try { startLatch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } X.println(">>> Producer started."); taskSes.saveCheckpoint(GLOBAL_KEY, GLOBAL_VAL, GLOBAL_SCOPE, 0); taskSes.saveCheckpoint(SES_KEY, SES_VAL, SESSION_SCOPE, 0); read1Latch.countDown(); try { read1FinishedLatch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } // No retries here as other thread should have seen checkpoint already. assert GLOBAL_VAL.equals(taskSes.loadCheckpoint(GLOBAL_KEY)); assert SES_VAL.equals(taskSes.loadCheckpoint(SES_KEY)); taskSes.saveCheckpoint(GLOBAL_KEY, SES_VAL + "-notoverwritten", GLOBAL_SCOPE, 0, false); taskSes.saveCheckpoint(SES_KEY, GLOBAL_VAL + "-notoverwritten", SESSION_SCOPE, 0, false); read2Latch.countDown(); try { read2FinishedLatch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } assert GLOBAL_VAL.equals(taskSes.loadCheckpoint(GLOBAL_KEY)); assert SES_VAL.equals(taskSes.loadCheckpoint(SES_KEY)); // Swap values. taskSes.saveCheckpoint(GLOBAL_KEY, SES_VAL_OVERWRITTEN, GLOBAL_SCOPE, 0, true); taskSes.saveCheckpoint(SES_KEY, GLOBAL_VAL_OVERWRITTEN, SESSION_SCOPE, 0, true); read3Latch.countDown(); try { read3FinishedLatch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } assert SES_VAL_OVERWRITTEN.equals(taskSes.loadCheckpoint(GLOBAL_KEY)); assert GLOBAL_VAL_OVERWRITTEN.equals(taskSes.loadCheckpoint(SES_KEY)); // Remove checkpoints. assert taskSes.removeCheckpoint(GLOBAL_KEY); assert taskSes.removeCheckpoint(SES_KEY); // Check checkpoints are actually removed. assert !taskSes.removeCheckpoint(GLOBAL_KEY); assert !taskSes.removeCheckpoint(SES_KEY); rmvLatch.countDown(); assertWithRetries(new GridAbsClosureX() { @Override public void applyx() { assert taskSes.loadCheckpoint(GLOBAL_KEY) == null; assert taskSes.loadCheckpoint(SES_KEY) == null; } }); return null; } } /** * Multi-node test consumer job. */ private static class GridMultiNodeTestCheckpointConsumerJob extends ComputeJobAdapter { /** */ @TaskSessionResource private ComputeTaskSession taskSes; /** {@inheritDoc} */ @Override public String execute() { assert taskSes != null; assert startLatch != null; assert read1Latch != null; assert read2Latch != null; assert read3Latch != null; assert read1FinishedLatch != null; assert read2FinishedLatch != null; assert read3FinishedLatch != null; assert rmvLatch != null; startLatch.countDown(); try { startLatch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } X.println(">>> Consumer started."); try { read1Latch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } // Test that checkpoints were saved properly. assertWithRetries(new GridAbsClosureX() { @Override public void applyx() { assert GLOBAL_VAL.equals(taskSes.loadCheckpoint(GLOBAL_KEY)); assert SES_VAL.equals(taskSes.loadCheckpoint(SES_KEY)); } }); read1FinishedLatch.countDown(); try { read2Latch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } // Test that checkpoints were not overwritten. assertWithRetries(new GridAbsClosureX() { @Override public void applyx() { assert GLOBAL_VAL.equals(taskSes.loadCheckpoint(GLOBAL_KEY)); assert SES_VAL.equals(taskSes.loadCheckpoint(SES_KEY)); } }); read2FinishedLatch.countDown(); try { read3Latch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } assertWithRetries(new GridAbsClosureX() { @Override public void applyx() { assertEquals(SES_VAL_OVERWRITTEN, taskSes.loadCheckpoint(GLOBAL_KEY)); assertEquals(GLOBAL_VAL_OVERWRITTEN, taskSes.loadCheckpoint(SES_KEY)); } }); read3FinishedLatch.countDown(); try { rmvLatch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } // Check checkpoints are actually removed. assert !taskSes.removeCheckpoint(GLOBAL_KEY); assert !taskSes.removeCheckpoint(SES_KEY); assertWithRetries(new GridAbsClosureX() { @Override public void applyx() { assert taskSes.loadCheckpoint(GLOBAL_KEY) == null; assert taskSes.loadCheckpoint(SES_KEY) == null; } }); return null; } } /** * Multi-node test task. */ @ComputeTaskSessionFullSupport private static class GridMultiNodeTestCheckPointTask extends ComputeTaskSplitAdapter<Object, Object> { /** {@inheritDoc} */ @Override protected Collection<? extends ComputeJob> split(int gridSize, Object arg) { assert gridSize == 2; return Arrays.asList( new GridMultiNodeTestCheckpointProducerJob(), new GridMultiNodeTestCheckpointConsumerJob() ); } /** {@inheritDoc} */ @Override public Object reduce(List<ComputeJobResult> results) { return null; } } /** */ @ComputeTaskSessionFullSupport private static class GridMultiNodeGlobalConsumerTask extends ComputeTaskSplitAdapter<Object, Integer> { /** */ @TaskSessionResource private ComputeTaskSession taskSes; /** {@inheritDoc} */ @Override protected Collection<? extends ComputeJob> split(int gridSize, Object arg) { return Collections.singleton(new ComputeJobAdapter() { @Nullable @Override public Object execute() { assert taskSes != null; assert startLatch != null; assert read1Latch != null; assert read2Latch != null; assert read3Latch != null; assert read1FinishedLatch != null; assert read2FinishedLatch != null; assert read3FinishedLatch != null; assert rmvLatch != null; startLatch.countDown(); try { startLatch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } X.println(">>> Global consumer started."); try { read1Latch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } // Test that checkpoints were saved properly. assert GLOBAL_VAL.equals(taskSes.loadCheckpoint(GLOBAL_KEY)); assert SES_VAL.equals(taskSes.loadCheckpoint(SES_KEY)); read1FinishedLatch.countDown(); try { read2Latch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } // Test that checkpoints were not overwritten. assert GLOBAL_VAL.equals(taskSes.loadCheckpoint(GLOBAL_KEY)); assert SES_VAL.equals(taskSes.loadCheckpoint(SES_KEY)); read2FinishedLatch.countDown(); try { read3Latch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } assert GLOBAL_VAL_OVERWRITTEN.equals(taskSes.loadCheckpoint(SES_KEY)); assert SES_VAL_OVERWRITTEN.equals(taskSes.loadCheckpoint(GLOBAL_KEY)); read3FinishedLatch.countDown(); try { rmvLatch.await(); } catch (InterruptedException e) { throw new IgniteException("Thread has been interrupted.", e); } // Check checkpoints are actually removed. assert !taskSes.removeCheckpoint(GLOBAL_KEY); assert !taskSes.removeCheckpoint(SES_KEY); assert taskSes.loadCheckpoint(GLOBAL_KEY) == null; assert taskSes.loadCheckpoint(SES_KEY) == null; return 0; } }); } /** {@inheritDoc} */ @Nullable @Override public Integer reduce(List<ComputeJobResult> results) { int sum = 0; for (ComputeJobResult res : results) sum += res.<Integer>getData(); return sum; } } /** * Wrapper around {@link GridTestUtils#retryAssert(org.apache.ignite.IgniteLogger, int, long, GridAbsClosure)}. * For the given closure provides count of retries, configured by {@link #retries} attribute. * @param assertion Closure with assertion inside. */ private static void assertWithRetries(GridAbsClosureX assertion) { try { GridTestUtils.retryAssert(null, retries, 5000, assertion); } catch (IgniteInterruptedCheckedException e) { throw new IgniteException(e); } } }