/*
* JBoss, Home of Professional Open Source
* Copyright 2011 Red Hat Inc. and/or its affiliates and other
* contributors as indicated by the @author tags. All rights reserved.
* See the copyright.txt in the distribution for a full listing of
* individual contributors.
*
* This is free software; you can redistribute it and/or modify it
* under the terms of the GNU Lesser General Public License as
* published by the Free Software Foundation; either version 2.1 of
* the License, or (at your option) any later version.
*
* This software is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this software; if not, write to the Free
* Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
* 02110-1301 USA, or see the FSF site: http://www.fsf.org.
*/
package org.infinispan.distribution.rehash;
import org.infinispan.Cache;
import org.infinispan.config.Configuration;
import org.infinispan.config.GlobalConfiguration;
import org.infinispan.context.Flag;
import org.infinispan.distribution.DistributionTestHelper;
import org.infinispan.distribution.ch.AbstractWheelConsistentHash;
import org.infinispan.manager.EmbeddedCacheManager;
import org.infinispan.remoting.transport.Address;
import org.infinispan.test.MultipleCacheManagersTest;
import org.infinispan.test.TestingUtil;
import org.infinispan.transaction.lookup.DummyTransactionManagerLookup;
import org.infinispan.util.concurrent.IsolationLevel;
import org.infinispan.util.concurrent.TimeoutException;
import org.infinispan.util.logging.Log;
import org.infinispan.util.logging.LogFactory;
import org.testng.annotations.Test;
import javax.transaction.HeuristicMixedException;
import javax.transaction.HeuristicRollbackException;
import javax.transaction.NotSupportedException;
import javax.transaction.RollbackException;
import javax.transaction.SystemException;
import javax.transaction.TransactionManager;
import java.util.Collections;
import java.util.HashMap;
import java.util.HashSet;
import java.util.LinkedList;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.concurrent.Callable;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.Future;
import java.util.concurrent.ThreadFactory;
import static java.lang.String.format;
import static org.infinispan.test.TestingUtil.sleepRandom;
import static org.infinispan.test.fwk.TestCacheManagerFactory.createCacheManager;
// As this is a SLOW stress test, leave it disabled by default. Only run it manually.
/**
 * Stress test that writes a large number of keys transactionally from several worker threads
 * per node, then kills one node and verifies that every successfully written key is still
 * present on the owners reported by the consistent hash of a surviving node.
 * <p>
 * Each worker writes {@link #NUM_ITERATIONS} keys of the form {@code __<node>_<worker>_<iteration>__}
 * (see {@link #keyFor(int, int, int)}), all mapped to the string {@code "value"}.
 */
@Test(groups = "stress", testName = "distribution.rehash.ConsistencyStressTest", enabled = false)
public class ConsistencyStressTest extends MultipleCacheManagersTest {
   /** Number of cache managers (cluster nodes) started for the test. */
   private static final int NUM_NODES = 10;
   /** Number of concurrent stressor threads writing through each node's cache. */
   private static final int WORKERS_PER_NODE = 2;
   /** Number of keys each stressor writes. */
   private static final int NUM_ITERATIONS = 5000;
   /**
    * When {@code true}, a key whose transaction failed is recorded and skipped during verification;
    * when {@code false}, the failure is rethrown from the stressor as a {@link RuntimeException}.
    */
   private static final boolean IGNORE_TX_FAILURES = true;
   private static final Log log = LogFactory.getLog(ConsistencyStressTest.class);

   /**
    * Creates and registers {@link #NUM_NODES} cache managers sharing one cache configuration
    * (synchronous distribution, L1 disabled, eager single-node locking, dummy transaction manager).
    */
   @Override
   protected void createCacheManagers() throws Throwable {
      Configuration c = new Configuration();
      c.setIsolationLevel(IsolationLevel.READ_COMMITTED);
      c.setLockAcquisitionTimeout(60000);
      c.setUseLockStriping(false);
      c.setCacheMode(Configuration.CacheMode.DIST_SYNC);
      c.setL1CacheEnabled(false);
      c.setSyncReplTimeout(30000);
      c.setUseEagerLocking(true);
      c.setEagerLockSingleNode(true);
      c.setTransactionManagerLookupClass(DummyTransactionManagerLookup.class.getName());
      c.setSyncCommitPhase(true);
      c.setSyncRollbackPhase(true);

      GlobalConfiguration gc = GlobalConfiguration.getClusteredDefault();
      gc.setDistributedSyncTimeout(60000);

      // Deliberately NOT named "cacheManagers": that would shadow the inherited field of the
      // same name which testConsistency() reads.
      List<EmbeddedCacheManager> managers = new LinkedList<EmbeddedCacheManager>();
      for (int i = 0; i < NUM_NODES; i++)
         managers.add(createCacheManager(gc, c));
      registerCacheManager(managers.toArray(new EmbeddedCacheManager[NUM_NODES]));
   }

   /**
    * Runs all stressors to completion, kills node 0, waits for the surviving nodes to settle and
    * then asserts that no successfully written key was lost.
    *
    * @throws Throwable any stressor failure, wait/timeout failure, or assertion failure
    */
   @SuppressWarnings("unchecked")
   public void testConsistency() throws Throwable, InterruptedException {
      // One thread per stressor, named Worker-0, Worker-1, ... for readable logs.
      ExecutorService executorService = Executors.newFixedThreadPool(NUM_NODES * WORKERS_PER_NODE, new ThreadFactory() {
         int i = 0;

         @Override
         public synchronized Thread newThread(Runnable r) {
            return new Thread(r, "Worker-" + i++);
         }
      });

      try {
         Set<String> keysToIgnore = runStressors(executorService);

         // Now shut down a node:
         TestingUtil.killCacheManagers(cacheManagers.get(0));

         // ... and ensure no data is lost. Only the surviving nodes (1..NUM_NODES-1) are inspected.
         Map<Address, Cache<Object, Object>> cacheMap = new HashMap<Address, Cache<Object, Object>>();
         for (int i = 1; i < NUM_NODES; i++) {
            Cache<Object, Object> c = cache(i);
            cacheMap.put(address(c), c);
         }

         // Let's enforce a quiet period to allow queued up transactions to complete.
         Thread.sleep(25000);

         // lets make sure any rehashing work has completed
         TestingUtil.blockUntilViewsReceived(60000, false, cacheMap.values());
         TestingUtil.waitForRehashToComplete(cacheMap.values());

         AbstractWheelConsistentHash hash = (AbstractWheelConsistentHash) cache(1).getAdvancedCache().getDistributionManager().getConsistentHash();
         assertKeysPresentOnOwners(hash, cacheMap, keysToIgnore);
      } finally {
         // Always release the worker threads, including when a stressor or an assertion fails.
         executorService.shutdownNow();
      }
   }

   /**
    * Submits {@link #WORKERS_PER_NODE} stressors for each node and blocks until all have finished.
    *
    * @param executorService pool the stressors are submitted to
    * @return the keys whose write transaction failed; the set is synchronized because every
    *         stressor thread may add to it concurrently
    * @throws Throwable if submitting, pausing, or waiting on a stressor fails
    */
   private Set<String> runStressors(ExecutorService executorService) throws Throwable {
      Set<Future<Void>> futures = new HashSet<Future<Void>>(NUM_NODES * WORKERS_PER_NODE);
      Set<String> keysToIgnore = Collections.synchronizedSet(new HashSet<String>());

      for (int i = 0; i < NUM_NODES; i++) {
         Cache<String, String> c = cache(i);
         for (int j = 0; j < WORKERS_PER_NODE; j++) {
            futures.add(executorService.submit(new Stressor(c, i, j, keysToIgnore)));
            // presumably a random pause of up to 500ms to stagger stressor start-up - confirm in TestingUtil
            sleepRandom(500);
         }
      }

      // stressors are now running, generating a lot of data.
      // wait for all stressors to finish.
      log.info("Waiting for stressors to finish");
      for (Future<Void> f : futures) f.get();
      return keysToIgnore;
   }

   /**
    * Checks, for every key the stressors wrote (except those in {@code keysToIgnore}), that each
    * owner located by {@code hash} which is also a surviving node holds the key.
    * Non-owners are not checked since invalidations caused by rehashing are async.
    *
    * @param hash         consistent hash used to locate the two owners of each key
    * @param cacheMap     surviving caches, keyed by their address
    * @param keysToIgnore keys whose write failed and which are therefore skipped
    * @throws Throwable the original assertion failure, after logging the key, hash and owners
    */
   private void assertKeysPresentOnOwners(AbstractWheelConsistentHash hash,
                                          Map<Address, Cache<Object, Object>> cacheMap,
                                          Set<String> keysToIgnore) throws Throwable {
      for (int i = 0; i < NUM_NODES; i++) {
         for (int j = 0; j < WORKERS_PER_NODE; j++) {
            for (int k = 0; k < NUM_ITERATIONS; k++) {
               String key = keyFor(i, j, k);
               if (keysToIgnore.contains(key)) {
                  log.infof("Skipping test on failing key %s", key);
                  continue;
               }

               List<Address> owners = hash.locate(key, 2);
               try {
                  // Look each owner up directly instead of scanning every surviving cache.
                  for (Address owner : owners) {
                     Cache<Object, Object> ownerCache = cacheMap.get(owner);
                     if (ownerCache != null) DistributionTestHelper.assertIsInContainerImmortal(ownerCache, key);
                  }
               } catch (Throwable th) {
                  log.fatalf("Key %s (hash %s) should be on owners %s according to %s", key, hash.getNormalizedHash(key), owners, hash);
                  throw th;
               }
            }
         }
      }
   }

   /**
    * Builds the key a given worker writes on a given iteration.
    *
    * @return a string of the form {@code __<nodeId>_<workerId>_<iterationId>__}
    */
   private static String keyFor(int nodeId, int workerId, int iterationId) {
      return format("__%s_%s_%s__", nodeId, workerId, iterationId);
   }

   /**
    * Worker that writes {@link #NUM_ITERATIONS} keys to one cache, each in its own transaction.
    */
   private static class Stressor implements Callable<Void> {
      private final Cache<String, String> cache;
      private final TransactionManager tm;
      private final int cacheId, workerId;
      /** Shared across all stressors; collects keys whose transaction failed. */
      private final Set<String> keysToIgnore;

      /**
       * @param cache        cache to write through
       * @param cacheId      index of the node owning {@code cache}; first component of every key
       * @param workerId     index of this worker on that node; second component of every key
       * @param keysToIgnore shared sink for keys whose write failed; must tolerate concurrent adds
       */
      private Stressor(Cache<String, String> cache, int cacheId, int workerId, Set<String> keysToIgnore) {
         this.cache = cache;
         tm = TestingUtil.getTransactionManager(cache);
         this.cacheId = cacheId;
         this.workerId = workerId;
         this.keysToIgnore = keysToIgnore;
      }

      /**
       * Writes each key inside a begin/put/commit transaction. On a transactional failure the
       * transaction is rolled back (best effort) and, depending on {@link #IGNORE_TX_FAILURES},
       * the key is recorded as failed or the failure is rethrown wrapped in a RuntimeException.
       *
       * @return always {@code null}
       */
      @Override
      public Void call() {
         for (int iterationId = 0; iterationId < NUM_ITERATIONS; iterationId++) {
            if (iterationId % 500 == 0)
               log.infof("  >> Stressor %s Worker %s Iteration %s", cacheId, workerId, iterationId);

            String key = keyFor(cacheId, workerId, iterationId);
            Exception failure = null;
            try {
               tm.begin();
               cache.getAdvancedCache().withFlags(Flag.SKIP_REMOTE_LOOKUP).put(key, "value");
               tm.commit();
            } catch (HeuristicRollbackException e) {
               failure = e;
            } catch (RollbackException e) {
               failure = e;
            } catch (SystemException e) {
               failure = e;
            } catch (HeuristicMixedException e) {
               failure = e;
            } catch (NotSupportedException e) {
               failure = e;
            } catch (TimeoutException e) {
               failure = e;
            }

            if (failure == null) continue;

            // first try and roll back the tx, but only if one is still associated with this thread;
            // otherwise rollback() itself would fail and produce a misleading log entry.
            try {
               if (tm.getTransaction() != null) tm.rollback();
            } catch (Exception rollbackFailure) {
               // Best effort only: keep going, but do not lose the cause.
               log.error("  >> Rollback failed", rollbackFailure);
            }

            if (IGNORE_TX_FAILURES) {
               keysToIgnore.add(key);
               log.errorf("  >> Saw a %s when trying to process key %s", failure.getClass().getSimpleName(), key);
            } else {
               throw new RuntimeException(failure);
            }
         }
         return null;
      }
   }
}