/* Copyright (C) SYSTAP, LLC DBA Blazegraph 2006-2016. All rights reserved.

Contact:
     SYSTAP, LLC DBA Blazegraph
     2501 Calvert ST NW #106
     Washington, DC 20008
     licenses@blazegraph.com

This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; version 2 of the License.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
*/
/*
 * Created on Apr 16, 2009
 */

package com.bigdata.service.ndx.pipeline;

import java.util.Arrays;
import java.util.Iterator;
import java.util.LinkedList;
import java.util.NoSuchElementException;
import java.util.concurrent.Callable;
import java.util.concurrent.TimeUnit;

import org.apache.log4j.Logger;

import com.bigdata.relation.accesspath.BlockingBuffer;
import com.bigdata.relation.accesspath.ChunkMergeSortHelper;
import com.bigdata.relation.accesspath.IAsynchronousIterator;

/**
 * Abstract implementation of a subtask for the {@link AbstractMasterTask}
 * which handles the protocol for startup and termination of the subtask. A
 * concrete implementation must handle the chunks of elements being drained
 * from the subtask's {@link #buffer} via {@link #handleChunk(Object[])}.
 * 
 * @param <HS>
 *            The generic type of the value returned by {@link Callable#call()}
 *            for the subtask.
 * @param <M>
 *            The generic type of the master task implementation class.
 * @param <E>
 *            The generic type of the elements in the chunks stored in the
 *            {@link BlockingBuffer}.
 * @param <L>
 *            The generic type of the key used to lookup a subtask in the
 *            internal map (must be unique and must implement hashCode() and
 *            equals() per their contracts).
 * 
 * @author <a href="mailto:thompsonbry@users.sourceforge.net">Bryan Thompson</a>
 * @version $Id$
 */
public abstract class AbstractSubtask<//
        HS extends AbstractSubtaskStats, //
        M extends AbstractMasterTask<? extends AbstractMasterStats<L, HS>, E, ? extends AbstractSubtask, L>, //
        E, //
        L>//
        implements Callable<HS> {
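
    /*
     * For illustration only: a minimal concrete subtask might look roughly
     * like the sketch below. The names (MyStats, MyMaster, writeOnTarget) are
     * hypothetical and not part of this codebase; real sinks are considerably
     * more involved.
     *
     *   class MySubtask extends AbstractSubtask<MyStats, MyMaster, String, Integer> {
     *
     *       MySubtask(MyMaster master, Integer locator, BlockingBuffer<String[]> buffer) {
     *           super(master, locator, buffer);
     *       }
     *
     *       @Override
     *       protected boolean handleChunk(String[] chunk) throws Exception {
     *           writeOnTarget(locator, chunk); // hypothetical helper
     *           return false; // false => keep draining the buffer.
     *       }
     *
     *       @Override
     *       protected void notifyClientOfRedirect(Integer locator, Throwable cause) {
     *           // refresh the client's view of the locators.
     *       }
     *   }
     */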

    protected static transient final Logger log = Logger
            .getLogger(AbstractSubtask.class);

    /**
     * The master.
     */
    protected final M master;

    /**
     * The unique key for the subtask.
     */
    protected final L locator;

    /**
     * The buffer on which the {@link #master} is writing.
     */
    protected final BlockingBuffer<E[]> buffer;

    /**
     * The iterator draining the {@link #buffer}.
     * <p>
     * Note: DO NOT close this iterator from within {@link #call()} as that
     * would cause this task to interrupt itself!
     */
    protected final IAsynchronousIterator<E[]> src;

    /**
     * The statistics used by this task.
     */
    protected final HS stats;

    /**
     * The timestamp at which a chunk was last written on the buffer for this
     * sink by the master. This is used to help determine whether or not a
     * sink has become idle. A sink on which a master has recently written a
     * chunk is not idle even if the sink has not read any chunks from its
     * buffer.
     */
    protected volatile long lastChunkNanos = System.nanoTime();

    /**
     * The timestamp at which
     * {@link IAsynchronousIterator#hasNext(long, TimeUnit)} last returned
     * <code>true</code> when queried with a timeout of
     * {@link AbstractMasterTask#sinkPollTimeoutNanos} nanoseconds. This tests
     * whether or not a chunk is available and is used to help decide if the
     * sink has become idle. (A sink with an available chunk is never idle.)
     */
    protected volatile long lastChunkAvailableNanos = lastChunkNanos;

    public String toString() {

        return getClass().getName() + "{locator=" + locator + ", open="
                + buffer.isOpen() + "}";

    }

    @SuppressWarnings("unchecked")
    public AbstractSubtask(final M master, final L locator,
            final BlockingBuffer<E[]> buffer) {

        if (master == null)
            throw new IllegalArgumentException();

        if (locator == null)
            throw new IllegalArgumentException();

        if (buffer == null)
            throw new IllegalArgumentException();

        this.master = master;

        this.locator = locator;

        this.buffer = buffer;

        this.src = buffer.iterator();

        this.stats = (HS) master.stats.getSubtaskStats(locator);

    }

    public HS call() throws Exception {

        try {

            final NonBlockingChunkedIterator itr = new NonBlockingChunkedIterator(
                    src);

            /*
             * Timestamp of the last chunk handled (written out on the index
             * partition). This is used to compute the average time between
             * chunks written on the index partition by this sink and across
             * all sinks.
             */
            long lastHandledChunkNanos = System.nanoTime();

            while (itr.hasNext()) {

                final E[] chunk = itr.next();

                // how long we waited for this chunk.
                final long elapsedChunkWaitNanos = System.nanoTime()
                        - lastHandledChunkNanos;

                synchronized (master.stats) {
                    master.stats.elapsedSinkChunkWaitingNanos += elapsedChunkWaitNanos;
                }

                synchronized (stats) {
                    stats.elapsedChunkWaitingNanos += elapsedChunkWaitNanos;
                }

                if (handleChunk(chunk)) {

                    if (log.isInfoEnabled())
                        log.info("Eager termination.");

                    // Done (eager termination).
                    break;

                }

                // reset the timestamp now that we will wait again.
                lastHandledChunkNanos = System.nanoTime();

            }

            if (buffer.isOpen())
                throw new AssertionError(toString());

            if (log.isInfoEnabled())
                log.info("Done: " + locator);

            /*
             * Wait until any asynchronous processing for the subtask is done
             * (extension hook).
             */
            awaitPending();

            // done.
            return stats;

        } catch (Throwable t) {

            if (log.isInfoEnabled()) {
                // show stack trace @ log.isInfoEnabled()
                log.warn(this, t);
            } else {
                // else only abbreviated warning.
                log.warn(this + " : " + t);
            }

            // make sure the buffer is closed.
            buffer.abort(t);

            // clear the backing queue.
            buffer.clear();

            // interrupt the remote task (extension hook).
            cancelRemoteTask(true/* mayInterruptIfRunning */);

            /*
             * Halt processing.
             * 
             * Note: This is responsible for propagating any errors such that
             * the master halts in a timely manner. This is necessary since no
             * one is checking the Future for the sink tasks (except when we
             * wait for them to complete before we reopen an output buffer).
             */
            throw master.halt(new RuntimeException(toString(), t));

        } finally {

            /*
             * Signal the master that the subtask is done.
             */
            master.notifySubtaskDone(this);

        }

    }

    /**
     * Wait until any asynchronous processing for the subtask is done. This is
     * an extension hook which is used if the remote task accepts chunks for
     * processing and uses an asynchronous notification mechanism to indicate
     * the success or failure of elements. The default implementation is a NOP.
     */
    protected void awaitPending() throws InterruptedException {

        // NOP - overridden by a subclass which supports pending sets.

    }

    /**
     * Cancel the remote task. This is an extension hook which is used if the
     * remote task accepts chunks for processing and uses an asynchronous
     * notification mechanism to indicate the success or failure of elements.
     * The default implementation is a NOP.
     * 
     * @throws InterruptedException
     */
    protected void cancelRemoteTask(boolean mayInterruptIfRunning)
            throws InterruptedException {

        // NOP - overridden by a subclass which supports pending sets.

    }
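
    /*
     * For illustration only: a subclass which supports pending sets might
     * override the two extension hooks above roughly as follows. The
     * pendingLatch and remoteFuture fields are hypothetical; this is a sketch
     * of the intended protocol, not the actual implementation.
     *
     *   @Override
     *   protected void awaitPending() throws InterruptedException {
     *       // Block until every outstanding chunk has been acknowledged (or
     *       // failed) by the remote task.
     *       pendingLatch.await();
     *   }
     *
     *   @Override
     *   protected void cancelRemoteTask(boolean mayInterruptIfRunning)
     *           throws InterruptedException {
     *       // Cancel the remote task so that it stops processing chunks.
     *       remoteFuture.cancel(mayInterruptIfRunning);
     *   }
     */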

    /**
     * This inner class is responsible for combining chunks as they become
     * available from the {@link IAsynchronousIterator} while maintaining
     * liveness. It works with the {@link IAsynchronousIterator} API internally
     * and polls the {@link AbstractSubtask#src}. If a chunk is available, then
     * it is added to an ordered list of chunks which is maintained internally
     * by this class. {@link #next()} combines those chunks, using a merge sort
     * to maintain their order, and returns their data in a single chunk.
     * <p>
     * Note: This does not implement {@link Iterator} since its methods throw
     * {@link InterruptedException}.
     * 
     * @author <a href="mailto:thompsonbry@users.sourceforge.net">Bryan
     *         Thompson</a>
     * @version $Id$
     */
    private class NonBlockingChunkedIterator {

        /**
         * The source iterator that is being drained.
         */
        private final IAsynchronousIterator<E[]> src;

        /** #of elements across the set of {@link #chunks}. */
        private int chunkSize;

        /**
         * The set of chunks that have been buffered so far.
         */
        private LinkedList<E[]> chunks = new LinkedList<E[]>();

        /**
         * Clear the internal state after returning a chunk to the caller.
         */
        private void clear() {

            chunkSize = 0;

            chunks = new LinkedList<E[]>();

        }

        public String toString() {

            // Note: toString() on the outer class.
            return AbstractSubtask.this.toString() + "{chunkSize=" + chunkSize
                    + "}";

        }

        public NonBlockingChunkedIterator(final IAsynchronousIterator<E[]> src) {

            if (src == null)
                throw new IllegalArgumentException();

            this.src = src;

        }

        public boolean hasNext() throws InterruptedException {

//            // The thread in which this method runs.
//            final Thread t = Thread.currentThread();

            // when we start looking for a chunk.
            final long begin = System.nanoTime();

            while (true) {

                // halt?
                master.halted();

                // interrupted?
                if (Thread.interrupted()) {

                    throw master.halt(new InterruptedException(toString()));

                }

                // current time.
                final long now = System.nanoTime();

                // elapsed since we entered hasNext.
                final long elapsedNanos = now - begin;

                // elapsed since the master last wrote a chunk on this sink.
                final long elapsedSinceLastChunk = now - lastChunkNanos;

                // elapsed since src.hasNext(0L,NANOS) last returned true.
                final long elapsedSinceLastChunkAvailable = now
                        - lastChunkAvailableNanos;

                // true iff the sink has become idle.
//                final boolean idle = elapsedSinceLastChunk > master.sinkIdleTimeoutNanos;
                final boolean idle = elapsedSinceLastChunk > master.sinkIdleTimeoutNanos
                        && elapsedSinceLastChunkAvailable > master.sinkIdleTimeoutNanos;
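
                /*
                 * For illustration only (assuming a hypothetical 10s idle
                 * timeout): if the master last wrote a chunk 15s ago but a
                 * chunk was observed to be available 2s ago, the sink is NOT
                 * idle, since a sink with an available chunk is never idle.
                 * The sink only becomes idle once BOTH elapsed times exceed
                 * the timeout, e.g., last write 15s ago AND last available
                 * chunk 12s ago.
                 */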

                if ((idle || master.src.isExhausted()) && buffer.isOpen()) {

                    if (buffer.isEmpty()) {

                        /*
                         * Close out buffer. Since the buffer is empty the
                         * iterator will quickly be exhausted (it is possible
                         * there is one chunk waiting in the iterator) and the
                         * subtask will quit the next time through the loop.
                         * 
                         * Note: This can happen either if the master is closed
                         * or if idle too long.
                         */

                        if (log.isInfoEnabled())
                            log.info("Closing buffer: idle=" + idle + " : "
                                    + this);

                        if (idle) {

                            /*
                             * An idle timeout is a conditional close and the
                             * sink MAY be reopened.
                             */
                            buffer.abort(new IdleTimeoutException());

                            master.stats.subtaskIdleTimeoutCount
                                    .incrementAndGet();

                        } else {

                            /*
                             * Since redirects of outstanding writes can cause
                             * the master to (re-)process redirected chunks,
                             * this is treated as a conditional close and the
                             * sink MAY be reopened.
                             */
                            buffer.abort(new MasterExhaustedException());

                        }

                        if (chunkSize == 0 && !src.hasNext()) {

                            /*
                             * The iterator is already exhausted so we break
                             * out of the loop now.
                             */

                            if (log.isInfoEnabled())
                                log.info("No more data: " + this);

                            return false;

                        }

                    }

                }

                if (chunkSize >= buffer.getMinimumChunkSize()) {

                    /*
                     * We have a full chunk worth of data, so do not wait any
                     * longer.
                     */

                    if (log.isInfoEnabled())
                        log.info("Full chunk: " + chunkSize + ", elapsed="
                                + TimeUnit.NANOSECONDS.toMillis(elapsedNanos)
                                + " : " + this);

                    return true;

                }

                if (chunkSize > 0
                        && ((elapsedNanos > buffer.getChunkTimeout())//
                        || (!buffer.isOpen() && !src.hasNext())//
                        )) {

                    /*
                     * We have SOME data and either (a) the chunk timeout has
                     * expired -or- (b) the buffer is closed and there is
                     * nothing more to be read from the iterator. Note that the
                     * sink was closed above if the master's buffer was closed.
                     * The master's buffer is closed as a precondition to
                     * master.awaitAll(), so the sink WILL NOT block once the
                     * master enters awaitAll().
                     */

                    if (log.isInfoEnabled())
                        log.info("Partial chunk: " + chunkSize + ", elapsed="
                                + TimeUnit.NANOSECONDS.toMillis(elapsedNanos)
                                + " : " + this);

                    // Done.
                    return true;

                }

                /*
                 * Poll the source iterator for another chunk.
                 * 
                 * @todo I need to review the logic for choosing a short poll
                 * duration here. I believe that this choice is leading to high
                 * CPU utilization when there are a lot of index partitions and
                 * hence a large #of threads running on the clients. In fact, I
                 * am not certain that the rationale for the specialized
                 * non-blocking iterator class in AbstractSubtask is still
                 * valid now that we are not holding onto the master's lock.
                 * Perhaps we can just get by now with the BlockingBuffer's
                 * asynchronous iterator and a timeout equal to
                 * Min(chunkTimeout,idleTimeout). The problem may be noticing
                 * when the master is exhausted, in which case we can flush
                 * this sink without waiting up to the chunk/idle timeout.
                 * Since the lock in the BlockingQueue is not visible, we can
                 * not signal it if it is waiting. A blocking take combined
                 * with an interrupt of the sink by the master when it is
                 * exhausted while halted() still returns false might be the
                 * way to go.
                 * 
                 * However, on reflection, I think that the correct route is to
                 * have the BlockingBuffer recognize a distinguished value,
                 * such as an empty array, as closing the queue. That way the
                 * master can invoke close(), which drops an empty array, and a
                 * blocking take will notice it. That works for normal
                 * termination. For abort, I can do what I already do - set the
                 * Throwable and interrupt the thread draining the queue. The
                 * only catch is that this will not work with scalar elements.
                 */
                if (src.hasNext(master.sinkPollTimeoutNanos,
                        TimeUnit.NANOSECONDS)) {

                    /*
                     * Take whatever is already buffered but do not allow the
                     * source iterator to combine chunks since that would
                     * increase our blocking time by whatever the chunkTimeout
                     * is.
                     */
                    final E[] a = src.next(1L, TimeUnit.NANOSECONDS);

                    assert a != null;
                    assert a.length != 0;
                    assert a[0] != null : "chunk with nulls: chunkSize="
                            + a.length + ", chunk=" + Arrays.toString(a);

                    // add to the list of chunks which are already available.
                    chunks.add(a);

                    // track the #of elements available across those chunks.
                    chunkSize += a.length;

                    master.stats.elementsOnSinkQueues.addAndGet(-a.length);

                    // reset the available aspect of the idle timeout.
                    lastChunkAvailableNanos = System.nanoTime();

                    if (log.isDebugEnabled())
                        log.debug("Combining chunks: chunkSize=" + a.length
                                + ", ncombined=" + chunks.size()
                                + ", elapsed="
                                + TimeUnit.NANOSECONDS.toMillis(System
                                        .nanoTime() - begin));

                    continue;

                }

                if (chunkSize == 0 && !buffer.isOpen() && !src.hasNext()) {

                    // We are done.

                    if (log.isInfoEnabled())
                        log.info("No more data: " + this);

                    return false;

                }

                // poll the itr again.

            } // while(true)

        }
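
        /*
         * For illustration only: if hasNext() has buffered the two ordered
         * chunks {1,4} and {2,3}, then next() copies them into the single
         * array {1,4,2,3} and, when the buffer is ordered, applies a merge
         * sort to yield {1,2,3,4}. (Integer elements are illustrative only.)
         */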

        /**
         * Return the buffered chunk(s) as a single combined chunk. If more
         * than one chunk is combined to produce the returned chunk and
         * {@link BlockingBuffer#isOrdered()}, then a merge sort is applied to
         * the elements of the chunk before it is returned to the caller in
         * order to keep the data in the chunk fully ordered.
         */
        public E[] next() {

            if (chunkSize == 0) {

                // nothing buffered.
                throw new NoSuchElementException();

            }

            final E[] firstChunk = chunks.getFirst();

            assert firstChunk != null;
            assert firstChunk.length != 0;
            assert firstChunk[0] != null;

            // Dynamic instantiation of array of the same component type.
            @SuppressWarnings("unchecked")
            final E[] a = (E[]) java.lang.reflect.Array.newInstance(
//                    firstChunk[0].getClass(),
                    firstChunk.getClass().getComponentType(), chunkSize);

            // Combine the chunk(s) into a single chunk.
            int dstpos = 0;
            int ncombined = 0;

            for (E[] t : chunks) {

                final int len = t.length;

                System.arraycopy(t, 0, a, dstpos, len);

                dstpos += len;

                ncombined++;

            }

            if (ncombined > 0 && buffer.isOrdered()) {

                ChunkMergeSortHelper.mergeSort(a);

            }

            // clear internal state.
            clear();

            return a;

        }

    }

    /**
     * This method MUST be invoked if a sink receives a
     * "stale locator exception" within {@link #handleChunk(Object[])}.
     * <p>
     * This method asynchronously closes the <i>sink</i>, so that no further
     * data may be written on it, by setting the <i>cause</i> on
     * {@link BlockingBuffer#abort(Throwable)}. Next, the current chunk is
     * placed onto the master's redirectQueue and the sink's {@link #buffer}
     * is drained, transferring all chunks which can be read from that buffer
     * onto the master's redirectQueue.
     * 
     * @param chunk
     *            The chunk which the sink was processing when it discovered
     *            that it needs to redirect its outputs to a different sink
     *            (that is, a chunk which it had already read from its buffer
     *            and hence which needs to be redirected now).
     * @param cause
     *            The stale locator exception.
     * 
     * @throws InterruptedException
     */
    protected void handleRedirect(final E[] chunk, final Throwable cause)
            throws InterruptedException {

        if (chunk == null)
            throw new IllegalArgumentException();

        if (cause == null)
            throw new IllegalArgumentException();

        final long begin = System.nanoTime();

        /*
         * Notify the client so it can refresh the information for this
         * locator.
         */
        notifyClientOfRedirect(locator, cause);

        /*
         * Close the output buffer for this sink - nothing more may be written
         * onto it now that we have seen the StaleLocatorException.
         */
        buffer.abort(cause);

        /*
         * Handle the chunk for which we got the stale locator exception by
         * placing it onto the master's redirect queue.
         */
        master.redirectChunk(chunk);

        /*
         * Drain the rest of the buffered chunks from the closed sink, feeding
         * them onto the master's redirect queue.
         */
        while (src.hasNext()) {

            master.redirectChunk(src.next());

        }

        synchronized (master.stats) {

            master.stats.elapsedRedirectNanos += System.nanoTime() - begin;

            master.stats.redirectCount.incrementAndGet();

        }

    }
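
    /*
     * For illustration only: a handleChunk() implementation which writes on a
     * remote index partition might use handleRedirect() roughly as follows.
     * The writeOnIndexPartition() helper is a hypothetical stand-in; this is
     * a sketch of the protocol, not the actual implementation.
     *
     *   @Override
     *   protected boolean handleChunk(E[] chunk) throws Exception {
     *       try {
     *           writeOnIndexPartition(locator, chunk);
     *       } catch (StaleLocatorException ex) {
     *           // The locator is stale - redirect this chunk and everything
     *           // still buffered on this sink, then exit immediately.
     *           handleRedirect(chunk, ex);
     *           return true;
     *       }
     *       return false; // keep draining the buffer.
     *   }
     */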

    /**
     * Process a chunk from the buffer.
     * 
     * @return <code>true</code> iff the task should exit immediately.
     */
    abstract protected boolean handleChunk(E[] chunk) throws Exception;

    /**
     * Notify the client that the locator is stale.
     * 
     * @param locator
     *            The locator.
     * @param cause
     *            The cause.
     */
    abstract protected void notifyClientOfRedirect(L locator, Throwable cause);

}