/** * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.zookeeper.test; import java.io.IOException; import java.util.ArrayList; import java.util.Arrays; import java.util.List; import java.util.concurrent.Semaphore; import java.util.concurrent.TimeUnit; import org.apache.zookeeper.AsyncCallback; import org.apache.zookeeper.CreateMode; import org.apache.zookeeper.KeeperException; import org.apache.zookeeper.Op; import org.apache.zookeeper.OpResult; import org.apache.zookeeper.WatchedEvent; import org.apache.zookeeper.Watcher; import org.apache.zookeeper.Watcher.Event.KeeperState; import org.apache.zookeeper.ZKTestCase; import org.apache.zookeeper.ZooDefs; import org.apache.zookeeper.ZooDefs.Ids; import org.apache.zookeeper.ZooKeeper; import org.apache.zookeeper.data.Stat; import org.apache.zookeeper.server.quorum.Leader; import org.apache.zookeeper.server.quorum.LearnerHandler; import org.apache.zookeeper.test.ClientBase.CountdownWatcher; import org.junit.After; import org.junit.Assert; import org.junit.Before; import org.junit.Ignore; import org.junit.Test; import org.slf4j.Logger; import org.slf4j.LoggerFactory; public class QuorumTest extends ZKTestCase { private static final Logger LOG = LoggerFactory.getLogger(QuorumTest.class); public static final long CONNECTION_TIMEOUT = ClientTest.CONNECTION_TIMEOUT; private final QuorumBase qb = new QuorumBase(); private final ClientTest ct = new ClientTest(); @Before public void setUp() throws Exception { qb.setUp(); ct.hostPort = qb.hostPort; ct.setUpAll(); } @After public void tearDown() throws Exception { ct.tearDownAll(); qb.tearDown(); } @Test public void testDeleteWithChildren() throws Exception { ct.testDeleteWithChildren(); } @Test public void testPing() throws Exception { ct.testPing(); } @Test public void testSequentialNodeNames() throws IOException, InterruptedException, KeeperException { ct.testSequentialNodeNames(); } @Test public void testACLs() throws Exception { ct.testACLs(); } @Test public void testClientwithoutWatcherObj() throws IOException, InterruptedException, KeeperException { ct.testClientwithoutWatcherObj(); } @Test public void testClientWithWatcherObj() throws IOException, InterruptedException, KeeperException { ct.testClientWithWatcherObj(); } @Test public void testGetView() { Assert.assertEquals(5,qb.s1.getView().size()); Assert.assertEquals(5,qb.s2.getView().size()); Assert.assertEquals(5,qb.s3.getView().size()); Assert.assertEquals(5,qb.s4.getView().size()); Assert.assertEquals(5,qb.s5.getView().size()); } @Test public void testViewContains() { // Test view contains self Assert.assertTrue(qb.s1.viewContains(qb.s1.getId())); // Test view contains other servers Assert.assertTrue(qb.s1.viewContains(qb.s2.getId())); // Test view does not contain non-existant servers Assert.assertFalse(qb.s1.viewContains(-1L)); } volatile int counter = 0; volatile int errors = 0; @Test public void testLeaderShutdown() throws IOException, InterruptedException, KeeperException { ZooKeeper zk = new DisconnectableZooKeeper(qb.hostPort, ClientBase.CONNECTION_TIMEOUT, new Watcher() { public void process(WatchedEvent event) { }}); zk.create("/blah", new byte[0], ZooDefs.Ids.OPEN_ACL_UNSAFE, CreateMode.PERSISTENT); zk.create("/blah/blah", new byte[0], ZooDefs.Ids.OPEN_ACL_UNSAFE, CreateMode.PERSISTENT); Leader leader = qb.s1.leader; if (leader == null) leader = qb.s2.leader; if (leader == null) leader = qb.s3.leader; if (leader == null) leader = qb.s4.leader; if (leader == null) leader = qb.s5.leader; Assert.assertNotNull(leader); for(int i = 0; i < 5000; i++) { zk.setData("/blah/blah", new byte[0], -1, new AsyncCallback.StatCallback() { public void processResult(int rc, String path, Object ctx, Stat stat) { counter++; if (rc != 0) { errors++; } } }, null); } ArrayList<LearnerHandler> fhs = new ArrayList<LearnerHandler>(leader.forwardingFollowers); for(LearnerHandler f: fhs) { f.getSocket().shutdownInput(); } for(int i = 0; i < 5000; i++) { zk.setData("/blah/blah", new byte[0], -1, new AsyncCallback.StatCallback() { public void processResult(int rc, String path, Object ctx, Stat stat) { counter++; if (rc != 0) { errors++; } } }, null); } // check if all the followers are alive Assert.assertTrue(qb.s1.isAlive()); Assert.assertTrue(qb.s2.isAlive()); Assert.assertTrue(qb.s3.isAlive()); Assert.assertTrue(qb.s4.isAlive()); Assert.assertTrue(qb.s5.isAlive()); zk.close(); } @Test public void testMultipleWatcherObjs() throws IOException, InterruptedException, KeeperException { ct.testMutipleWatcherObjs(); } /** * Make sure that we can change sessions * from follower to leader. * * @throws IOException * @throws InterruptedException * @throws KeeperException */ @Test public void testSessionMoved() throws Exception { String hostPorts[] = qb.hostPort.split(","); DisconnectableZooKeeper zk = new DisconnectableZooKeeper(hostPorts[0], ClientBase.CONNECTION_TIMEOUT, new Watcher() { public void process(WatchedEvent event) { }}); zk.create("/sessionMoveTest", new byte[0], Ids.OPEN_ACL_UNSAFE, CreateMode.EPHEMERAL); // we want to loop through the list twice for(int i = 0; i < hostPorts.length*2; i++) { zk.dontReconnect(); // This should stomp the zk handle DisconnectableZooKeeper zknew = new DisconnectableZooKeeper(hostPorts[(i+1)%hostPorts.length], ClientBase.CONNECTION_TIMEOUT, new Watcher() {public void process(WatchedEvent event) { }}, zk.getSessionId(), zk.getSessionPasswd()); zknew.setData("/", new byte[1], -1); final int result[] = new int[1]; result[0] = Integer.MAX_VALUE; zknew.sync("/", new AsyncCallback.VoidCallback() { public void processResult(int rc, String path, Object ctx) { synchronized(result) { result[0] = rc; result.notify(); } } }, null); synchronized(result) { if(result[0] == Integer.MAX_VALUE) { result.wait(5000); } } LOG.info(hostPorts[(i+1)%hostPorts.length] + " Sync returned " + result[0]); Assert.assertTrue(result[0] == KeeperException.Code.OK.intValue()); try { zk.setData("/", new byte[1], -1); Assert.fail("Should have lost the connection"); } catch(KeeperException.ConnectionLossException e) { } zk = zknew; } zk.close(); } private static class DiscoWatcher implements Watcher { volatile boolean zkDisco = false; public void process(WatchedEvent event) { if (event.getState() == KeeperState.Disconnected) { zkDisco = true; } } } /** * Connect to two different servers with two different handles using the same session and * make sure we cannot do any changes. */ @Test @Ignore public void testSessionMove() throws Exception { String hps[] = qb.hostPort.split(","); DiscoWatcher oldWatcher = new DiscoWatcher(); DisconnectableZooKeeper zk = new DisconnectableZooKeeper(hps[0], ClientBase.CONNECTION_TIMEOUT, oldWatcher); zk.create("/t1", new byte[0], ZooDefs.Ids.OPEN_ACL_UNSAFE, CreateMode.EPHEMERAL); zk.dontReconnect(); // This should stomp the zk handle DiscoWatcher watcher = new DiscoWatcher(); DisconnectableZooKeeper zknew = new DisconnectableZooKeeper(hps[1], ClientBase.CONNECTION_TIMEOUT, watcher, zk.getSessionId(), zk.getSessionPasswd()); zknew.create("/t2", new byte[0], ZooDefs.Ids.OPEN_ACL_UNSAFE, CreateMode.EPHEMERAL); try { zk.create("/t3", new byte[0], ZooDefs.Ids.OPEN_ACL_UNSAFE, CreateMode.EPHEMERAL); Assert.fail("Should have lost the connection"); } catch(KeeperException.ConnectionLossException e) { // wait up to 30 seconds for the disco to be delivered for (int i = 0; i < 30; i++) { if (oldWatcher.zkDisco) { break; } Thread.sleep(1000); } Assert.assertTrue(oldWatcher.zkDisco); } ArrayList<ZooKeeper> toClose = new ArrayList<ZooKeeper>(); toClose.add(zknew); // Let's just make sure it can still move for(int i = 0; i < 10; i++) { zknew.dontReconnect(); zknew = new DisconnectableZooKeeper(hps[1], ClientBase.CONNECTION_TIMEOUT, new DiscoWatcher(), zk.getSessionId(), zk.getSessionPasswd()); toClose.add(zknew); zknew.create("/t-"+i, new byte[0], ZooDefs.Ids.OPEN_ACL_UNSAFE, CreateMode.EPHEMERAL); } for (ZooKeeper z: toClose) { z.close(); } zk.close(); } /** * See ZOOKEEPER-790 for details * */ @Test public void testFollowersStartAfterLeader() throws Exception { QuorumUtil qu = new QuorumUtil(1); CountdownWatcher watcher = new CountdownWatcher(); qu.startQuorum(); int index = 1; while(qu.getPeer(index).peer.leader == null) index++; ZooKeeper zk = new ZooKeeper( "127.0.0.1:" + qu.getPeer((index == 1)?2:1).peer.getClientPort(), ClientBase.CONNECTION_TIMEOUT, watcher); watcher.waitForConnected(CONNECTION_TIMEOUT); // break the quorum qu.shutdown(index); // try to reestablish the quorum qu.start(index); Assert.assertTrue("quorum reestablishment failed", QuorumBase.waitForServerUp( "127.0.0.1:" + qu.getPeer(2).clientPort, CONNECTION_TIMEOUT)); for (int i = 0; i < 30; i++) { try { zk.create("/test", "test".getBytes(), ZooDefs.Ids.OPEN_ACL_UNSAFE, CreateMode.PERSISTENT); break; } catch(KeeperException.ConnectionLossException e) { Thread.sleep(1000); } // test fails if we still can't connect to the quorum after 30 seconds. Assert.fail("client could not connect to reestablished quorum: giving up after 30+ seconds."); } zk.close(); } /** * Tests if closeSession can be logged before a leader gets established, which * could lead to a locked-out follower (see ZOOKEEPER-790). * * The test works as follows. It has a client connecting to a follower f and * sending batches of 1,000 updates. The goal is that f has a zxid higher than * all other servers in the initial leader election. This way we can crash and * recover the follower so that the follower believes it is the leader once it * recovers (LE optimization: once a server receives a message from all other * servers, it picks a leader. * * It also makes the session timeout very short so that we force the false * leader to close the session and write it to the log in the buggy code (before * ZOOKEEPER-790). Once f drops leadership and finds the current leader, its epoch * is higher, and it rejects the leader. Now, if we prevent the leader from closing * the session by only starting up (see Leader.lead()) once it obtains a quorum of * supporters, then f will find the current leader and support it because it won't * have a highe epoch. * */ @Test public void testNoLogBeforeLeaderEstablishment () throws IOException, InterruptedException, KeeperException{ final Semaphore sem = new Semaphore(0); QuorumUtil qu = new QuorumUtil(2); qu.startQuorum(); int index = 1; while(qu.getPeer(index).peer.leader == null) index++; Leader leader = qu.getPeer(index).peer.leader; Assert.assertNotNull(leader); /* * Reusing the index variable to select a follower to connect to */ index = (index == 1) ? 2 : 1; ZooKeeper zk = new DisconnectableZooKeeper("127.0.0.1:" + qu.getPeer(index).peer.getClientPort(), 1000, new Watcher() { public void process(WatchedEvent event) { }}); zk.create("/blah", new byte[0], ZooDefs.Ids.OPEN_ACL_UNSAFE, CreateMode.PERSISTENT); for(int i = 0; i < 50000; i++) { zk.setData("/blah", new byte[0], -1, new AsyncCallback.StatCallback() { public void processResult(int rc, String path, Object ctx, Stat stat) { counter++; if (rc != 0) { errors++; } if(counter == 20000){ sem.release(); } } }, null); if(i == 5000){ qu.shutdown(index); LOG.info("Shutting down s1"); } if(i == 12000){ qu.start(index); LOG.info("Setting up server: " + index); } if((i % 1000) == 0){ Thread.sleep(500); } } // Wait until all updates return sem.tryAcquire(15000, TimeUnit.MILLISECONDS); // Verify that server is following and has the same epoch as the leader Assert.assertTrue("Not following", qu.getPeer(index).peer.follower != null); long epochF = (qu.getPeer(index).peer.getActiveServer().getZxid() >> 32L); long epochL = (leader.getEpoch() >> 32L); Assert.assertTrue("Zxid: " + qu.getPeer(index).peer.getActiveServer().getZxid() + "Current epoch: " + epochF, epochF == epochL); } // skip superhammer and clientcleanup as they are too expensive for quorum /** * Tests if a multiop submitted to a non-leader propagates to the leader properly * (see ZOOKEEPER-1124). * * The test works as follows. It has a client connect to a follower and submit a multiop * to the follower. It then verifies that the multiop successfully gets committed by the leader. * * Without the fix in ZOOKEEPER-1124, this fails with a ConnectionLoss KeeperException. */ @Test public void testMultiToFollower() throws Exception { QuorumUtil qu = new QuorumUtil(1); CountdownWatcher watcher = new CountdownWatcher(); qu.startQuorum(); int index = 1; while(qu.getPeer(index).peer.leader == null) index++; ZooKeeper zk = new ZooKeeper( "127.0.0.1:" + qu.getPeer((index == 1)?2:1).peer.getClientPort(), ClientBase.CONNECTION_TIMEOUT, watcher); watcher.waitForConnected(CONNECTION_TIMEOUT); List<OpResult> results = new ArrayList<OpResult>(); results = zk.multi(Arrays.asList( Op.create("/multi0", new byte[0], Ids.OPEN_ACL_UNSAFE, CreateMode.PERSISTENT), Op.create("/multi1", new byte[0], Ids.OPEN_ACL_UNSAFE, CreateMode.PERSISTENT), Op.create("/multi2", new byte[0], Ids.OPEN_ACL_UNSAFE, CreateMode.PERSISTENT) )); zk.getData("/multi0", false, null); zk.getData("/multi1", false, null); zk.getData("/multi2", false, null); zk.close(); } }