/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.ignite.internal.processors.cache.distributed; import java.util.ArrayList; import java.util.Collection; import java.util.Collections; import java.util.HashMap; import java.util.HashSet; import java.util.Map; import java.util.Set; import java.util.UUID; import java.util.concurrent.Callable; import java.util.concurrent.TimeUnit; import org.apache.ignite.Ignite; import org.apache.ignite.IgniteCache; import org.apache.ignite.IgniteException; import org.apache.ignite.Ignition; import org.apache.ignite.cache.CacheMode; import org.apache.ignite.cluster.ClusterNode; import org.apache.ignite.configuration.CacheConfiguration; import org.apache.ignite.configuration.IgniteConfiguration; import org.apache.ignite.internal.IgniteEx; import org.apache.ignite.internal.IgniteKernal; import org.apache.ignite.internal.managers.communication.GridIoMessage; import org.apache.ignite.internal.processors.cache.GridCacheAbstractSelfTest; import org.apache.ignite.internal.processors.cache.GridCacheAdapter; import org.apache.ignite.internal.processors.cache.distributed.near.GridNearCacheAdapter; import org.apache.ignite.internal.processors.cache.distributed.near.GridNearTxLocal; import org.apache.ignite.internal.processors.cache.transactions.IgniteTxManager; import org.apache.ignite.internal.processors.cache.transactions.TransactionProxyImpl; import org.apache.ignite.internal.util.lang.GridAbsPredicate; import org.apache.ignite.internal.util.typedef.F; import org.apache.ignite.internal.util.typedef.G; import org.apache.ignite.lang.IgniteCallable; import org.apache.ignite.lang.IgniteFuture; import org.apache.ignite.lang.IgniteFutureTimeoutException; import org.apache.ignite.lang.IgniteInClosure; import org.apache.ignite.plugin.extensions.communication.Message; import org.apache.ignite.resources.IgniteInstanceResource; import org.apache.ignite.spi.IgniteSpiException; import org.apache.ignite.spi.communication.tcp.TcpCommunicationSpi; import org.apache.ignite.testframework.GridTestUtils; import org.apache.ignite.transactions.Transaction; import static org.apache.ignite.transactions.TransactionConcurrency.PESSIMISTIC; /** * Abstract test for originating node failure. */ public abstract class IgniteTxPessimisticOriginatingNodeFailureAbstractSelfTest extends GridCacheAbstractSelfTest { /** */ protected static final int GRID_CNT = 5; /** Ignore node ID. */ private volatile Collection<UUID> ignoreMsgNodeIds; /** Ignore message class. */ private Collection<Class<?>> ignoreMsgCls; /** Failing node ID. */ private UUID failingNodeId; /** * @throws Exception If failed. */ public void testManyKeysCommit() throws Exception { Collection<Integer> keys = new ArrayList<>(200); for (int i = 0; i < 200; i++) keys.add(i); testTxOriginatingNodeFails(keys, false); } /** * @throws Exception If failed. */ public void testManyKeysRollback() throws Exception { Collection<Integer> keys = new ArrayList<>(200); for (int i = 0; i < 200; i++) keys.add(i); testTxOriginatingNodeFails(keys, true); } /** * @throws Exception If failed. */ public void testPrimaryNodeFailureCommit() throws Exception { checkPrimaryNodeCrash(true); } /** * @throws Exception If failed. */ public void testPrimaryNodeFailureRollback() throws Exception { checkPrimaryNodeCrash(false); } /** * @return Index of node starting transaction. */ protected int originatingNode() { return 0; } /** * Ignores messages to given node of given type. * * @param dstNodeIds Destination node IDs. * @param msgCls Message type. */ protected void ignoreMessages(Collection<Class<?>> msgCls, Collection<UUID> dstNodeIds) { ignoreMsgNodeIds = dstNodeIds; ignoreMsgCls = msgCls; } /** * Gets ignore message class to simulate partial prepare message. * * @return Ignore message class. */ protected abstract Collection<Class<?>> ignoreMessageClasses(); /** * @param keys Keys to update. * @param fullFailure Flag indicating whether to simulate rollback state. * @throws Exception If failed. */ protected void testTxOriginatingNodeFails(Collection<Integer> keys, final boolean fullFailure) throws Exception { assertFalse(keys.isEmpty()); final Collection<IgniteKernal> grids = new ArrayList<>(); ClusterNode txNode = grid(originatingNode()).localNode(); for (int i = 1; i < gridCount(); i++) grids.add((IgniteKernal)grid(i)); failingNodeId = grid(0).localNode().id(); final Map<Integer, String> map = new HashMap<>(); final String initVal = "initialValue"; for (Integer key : keys) { grid(originatingNode()).cache(DEFAULT_CACHE_NAME).put(key, initVal); map.put(key, String.valueOf(key)); } Map<Integer, Collection<ClusterNode>> nodeMap = new HashMap<>(); info("Node being checked: " + grid(1).localNode().id()); for (Integer key : keys) { Collection<ClusterNode> nodes = new ArrayList<>(); nodes.addAll(grid(1).affinity(DEFAULT_CACHE_NAME).mapKeyToPrimaryAndBackups(key)); nodes.remove(txNode); nodeMap.put(key, nodes); } info("Starting tx [values=" + map + ", topVer=" + ((IgniteKernal)grid(1)).context().discovery().topologyVersion() + ']'); if (fullFailure) ignoreMessages(ignoreMessageClasses(), F.asList(grid(1).localNode().id())); final IgniteEx originatingNodeGrid = grid(originatingNode()); GridTestUtils.runAsync(new Callable<Void>() { @Override public Void call() throws Exception { IgniteCache<Integer, String> cache = originatingNodeGrid.cache(DEFAULT_CACHE_NAME); assertNotNull(cache); Transaction tx = originatingNodeGrid.transactions().txStart(); assertEquals(PESSIMISTIC, tx.concurrency()); try { cache.putAll(map); info("Before commitAsync"); IgniteFuture<?> fut = tx.commitAsync(); info("Got future for commitAsync()."); fut.get(3, TimeUnit.SECONDS); } catch (IgniteFutureTimeoutException ignored) { info("Failed to wait for commit future completion [fullFailure=" + fullFailure + ']'); } return null; } }).get(); info(">>> Stopping originating node " + txNode); G.stop(grid(originatingNode()).name(), true); ignoreMessages(Collections.<Class<?>>emptyList(), Collections.<UUID>emptyList()); info(">>> Stopped originating node: " + txNode.id()); boolean txFinished = GridTestUtils.waitForCondition(new GridAbsPredicate() { @Override public boolean apply() { for (IgniteKernal g : grids) { GridCacheAdapter<?, ?> cache = g.internalCache(DEFAULT_CACHE_NAME); IgniteTxManager txMgr = cache.isNear() ? ((GridNearCacheAdapter)cache).dht().context().tm() : cache.context().tm(); int txNum = txMgr.idMapSize(); if (txNum != 0) return false; } return true; } }, 10000); assertTrue(txFinished); info("Transactions finished."); for (Map.Entry<Integer, Collection<ClusterNode>> e : nodeMap.entrySet()) { final Integer key = e.getKey(); final String val = map.get(key); assertFalse(e.getValue().isEmpty()); for (ClusterNode node : e.getValue()) { final UUID checkNodeId = node.id(); compute(G.ignite(checkNodeId).cluster().forNode(node)).call(new IgniteCallable<Void>() { /** */ @IgniteInstanceResource private Ignite ignite; @Override public Void call() throws Exception { IgniteCache<Integer, String> cache = ignite.cache(DEFAULT_CACHE_NAME); assertNotNull(cache); assertEquals("Failed to check entry value on node: " + checkNodeId, fullFailure ? initVal : val, cache.localPeek(key)); return null; } }); } } for (Map.Entry<Integer, String> e : map.entrySet()) { for (Ignite g : G.allGrids()) assertEquals(fullFailure ? initVal : e.getValue(), g.cache(DEFAULT_CACHE_NAME).get(e.getKey())); } } /** * Checks tx data consistency in case when primary node crashes. * * @param commmit Whether to commit or rollback a transaction. * @throws Exception If failed. */ private void checkPrimaryNodeCrash(final boolean commmit) throws Exception { Set<Integer> keys = new HashSet<>(); for (int i = 0; i < 20; i++) keys.add(i); final Collection<IgniteKernal> grids = new ArrayList<>(); ClusterNode primaryNode = grid(1).localNode(); for (int i = 0; i < gridCount(); i++) { if (i != 1) grids.add((IgniteKernal)grid(i)); } failingNodeId = primaryNode.id(); final Map<Integer, String> map = new HashMap<>(); final String initVal = "initialValue"; for (Integer key : keys) { grid(originatingNode()).cache(DEFAULT_CACHE_NAME).put(key, initVal); map.put(key, String.valueOf(key)); } Map<Integer, Collection<ClusterNode>> nodeMap = new HashMap<>(); IgniteCache<Integer, String> cache = grid(0).cache(DEFAULT_CACHE_NAME); info("Failing node ID: " + grid(1).localNode().id()); for (Integer key : keys) { Collection<ClusterNode> nodes = new ArrayList<>(); nodes.addAll(affinity(cache).mapKeyToPrimaryAndBackups(key)); nodes.remove(primaryNode); nodeMap.put(key, nodes); } info("Starting tx [values=" + map + ", topVer=" + grid(1).context().discovery().topologyVersion() + ']'); assertNotNull(cache); try (Transaction tx = grid(0).transactions().txStart()) { cache.getAll(keys); // Should not send any messages. cache.putAll(map); TransactionProxyImpl txProxy = (TransactionProxyImpl)tx; GridNearTxLocal txEx = txProxy.tx(); assertTrue(txEx.pessimistic()); if (commmit) { txEx.prepare(); // Fail the node in the middle of transaction. info(">>> Stopping primary node " + primaryNode); G.stop(Ignition.ignite(primaryNode.id()).name(), true); info(">>> Stopped originating node, finishing transaction: " + primaryNode.id()); tx.commit(); } else { // Fail the node in the middle of transaction. info(">>> Stopping primary node " + primaryNode); G.stop(G.ignite(primaryNode.id()).name(), true); info(">>> Stopped originating node, finishing transaction: " + primaryNode.id()); tx.rollback(); } } boolean txFinished = GridTestUtils.waitForCondition(new GridAbsPredicate() { @Override public boolean apply() { for (IgniteKernal g : grids) { GridCacheAdapter<?, ?> cache = g.internalCache(DEFAULT_CACHE_NAME); IgniteTxManager txMgr = cache.isNear() ? ((GridNearCacheAdapter)cache).dht().context().tm() : cache.context().tm(); int txNum = txMgr.idMapSize(); if (txNum != 0) return false; } return true; } }, 10000); assertTrue(txFinished); info("Transactions finished."); for (Map.Entry<Integer, Collection<ClusterNode>> e : nodeMap.entrySet()) { final Integer key = e.getKey(); final String val = map.get(key); assertFalse(e.getValue().isEmpty()); for (ClusterNode node : e.getValue()) { final UUID checkNodeId = node.id(); compute(G.ignite(checkNodeId).cluster().forNode(node)).call(new IgniteCallable<Void>() { /** */ @IgniteInstanceResource private Ignite ignite; @Override public Void call() throws Exception { IgniteCache<Integer, String> cache = ignite.cache(DEFAULT_CACHE_NAME); assertNotNull(cache); assertEquals("Failed to check entry value on node: " + checkNodeId, !commmit ? initVal : val, cache.localPeek(key)); return null; } }); } } for (Map.Entry<Integer, String> e : map.entrySet()) { for (Ignite g : G.allGrids()) assertEquals(!commmit ? initVal : e.getValue(), g.cache(DEFAULT_CACHE_NAME).get(e.getKey())); } } /** * @return All node IDs. */ private Collection<UUID> allNodeIds() { Collection<UUID> nodeIds = new ArrayList<>(gridCount()); for (int i = 0; i < gridCount(); i++) nodeIds.add(grid(i).localNode().id()); return nodeIds; } /** {@inheritDoc} */ @Override protected IgniteConfiguration getConfiguration(String igniteInstanceName) throws Exception { IgniteConfiguration cfg = super.getConfiguration(igniteInstanceName); cfg.setCommunicationSpi(new TcpCommunicationSpi() { @Override public void sendMessage(ClusterNode node, Message msg, IgniteInClosure<IgniteException> ackClosure) throws IgniteSpiException { if (getSpiContext().localNode().id().equals(failingNodeId)) { if (ignoredMessage((GridIoMessage)msg) && ignoreMsgNodeIds != null) { for (UUID ignored : ignoreMsgNodeIds) { if (node.id().equals(ignored)) return; } } } super.sendMessage(node, msg, ackClosure); } }); cfg.getTransactionConfiguration().setDefaultTxConcurrency(PESSIMISTIC); return cfg; } /** {@inheritDoc} */ @Override protected CacheConfiguration cacheConfiguration(String igniteInstanceName) throws Exception { CacheConfiguration cfg = super.cacheConfiguration(igniteInstanceName); cfg.setCacheStoreFactory(null); cfg.setReadThrough(false); cfg.setWriteThrough(false); return cfg; } /** {@inheritDoc} */ @Override protected int gridCount() { return GRID_CNT; } /** {@inheritDoc} */ @Override protected abstract CacheMode cacheMode(); /** {@inheritDoc} */ @Override protected void beforeTestsStarted() throws Exception { // No-op. } /** {@inheritDoc} */ @Override protected void beforeTest() throws Exception { startGridsMultiThreaded(GRID_CNT); } /** {@inheritDoc} */ @Override protected void afterTestsStopped() throws Exception { // No-op } /** {@inheritDoc} */ @Override protected void afterTest() throws Exception { stopAllGrids(); ignoreMsgCls = null; ignoreMsgNodeIds = null; } /** * Checks if message should be ignored. * * @param msg Message. * @return {@code True} if message should be ignored. */ private boolean ignoredMessage(GridIoMessage msg) { Collection<Class<?>> ignoreClss = ignoreMsgCls; if (ignoreClss != null) { for (Class<?> ignoreCls : ignoreClss) { if (ignoreCls.isAssignableFrom(msg.message().getClass())) return true; } return false; } else return false; } }