MutableBucketData.java example

Explorer
blazegraph-master
- database-master
/*

Copyright (C) SYSTAP, LLC DBA Blazegraph 2006-2016.  All rights reserved.

Contact:
     SYSTAP, LLC DBA Blazegraph
     2501 Calvert ST NW #106
     Washington, DC 20008
     licenses@blazegraph.com

This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; version 2 of the License.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
*/
/*
 * Created on Aug 25, 2009
 */

package com.bigdata.htree;

import com.bigdata.btree.AbstractBTree;
import com.bigdata.btree.ITuple;
import com.bigdata.btree.IndexSegment;
import com.bigdata.btree.MutableLeafData;
import com.bigdata.btree.data.ILeafData;
import com.bigdata.btree.raba.IRaba;
import com.bigdata.htree.raba.MutableKeyBuffer;
import com.bigdata.htree.raba.MutableValueBuffer;
import com.bigdata.io.AbstractFixedByteArrayBuffer;
import com.bigdata.io.IDataRecord;
import com.bigdata.rawstore.IRawStore;

/**
 * Implementation maintains Java objects corresponding to the persistent data
 * and defines methods for a variety of mutations on the {@link ILeafData}
 * record which operate by direct manipulation of the Java objects. The bucket
 * page is logically divided into buddy hash buckets. Unlike a B+Tree, the
 * tuples are neither ordered nor dense and the same key MAY appear multiple
 * times within a given buddy bucket.
 * <p>
 * Note: Overflow pages must be provided for when the #of duplicates in a bucket
 * exceeds the capacity of the bucket (this can be done by conversion of the
 * bucket to a blob record or by chaining the bucket).
 * <p>
 * Note: package private fields are used so that they may be directly accessed
 * by the {@link HashBucket} class.
 * 
 * @author <a href="mailto:thompsonbry@users.sourceforge.net">Bryan Thompson</a>
 * @version $Id: MutableLeafData.java 2265 2009-10-26 12:51:06Z thompsonbry $
 * 
 *          TODO Consider mutable implementation based on a compacting record
 *          ala GOM. This is especially attractive for the hash tree. The
 *          implementation would have to be wholly different from the
 *          {@link MutableLeafData} class. Instead of managing the {@link IRaba}
 *          for the keys and values separately, each {@link ITuple} would be
 *          appended into a byte[] (or {@link IDataRecord}). There would be a
 *          budget for that backing buffer which is the maximum in-memory size
 *          of the bucket. An index would provide random access into the buffer
 *          for only those entries which are "live" and a counter is maintain of
 *          the #of entries in the buffer which are no longer in use. When the
 *          buffer capacity is reached, the buffer is compacted by copying all
 *          of the entries accessible from the index into a new buffer and the
 *          old buffer is released.
 *          <p>
 *          Records which are too large for the buffer should be moved out of
 *          line.
 *          <p>
 *          This can be used in combination with a dynamically maintained trie
 *          for fast hash lookup, or we could just scan the entries.
 *          <p>
 *          Lexicon key search can scan the entries using the index. Scanning
 *          can have a side-effect in which the position of the entry offsets in
 *          the index is swapped if the keys are out of order. This would give
 *          us MonetDB style "cracking". The keys would have to be put into full
 *          order no later than when the record is made persistent.
 *          <p>
 *          Even though mutation is not thread safe, compacting the data record
 *          must not cause the assignment of indices to tuples to change when
 *          the caller is iterating through the entries by index.
 * 
 *          TODO Consider disallowing delete markers and version timestamps for
 *          the {@link HTree} if it is to be used only with in unisolated
 *          contexts in which case we can drop support for that stuff from this
 *          class.
 */
public class MutableBucketData implements ILeafData {

    /**
     * A keys associated with each tuple in the bucket page. Each key is a
     * variable length unsigned byte[]. The keys are neither ordered nor dense.
     */
    final MutableKeyBuffer keys;

    /**
     * The values associated with each tuple in the bucket page. Each value is a
     * variable length byte[].The indices into the values are correlated with
     * the indices into the {@link #keys}.
     */
    final MutableValueBuffer vals;

    /**
     * The deletion markers IFF isolation is supported by the index. The indices
     * into the delete markers are correlated with the indices into the
     * {@link #keys}.
     */
    final boolean[] deleteMarkers;

    /**
     * The version timestamps IFF isolation is supported by the index. The
     * indices into the version timestamps are correlated with the indices into
     * the {@link #keys} .
     */
    final long[] versionTimestamps;

    /**
     * The minimum version timestamp.
     * 
     * @todo these fields at 16 bytes to each {@link MutableBucketData} object
     *       even when we do not use them. It would be better to use a subclass
     *       or tack them onto the end of the {@link #versionTimestamps} array.
     */
    long minimumVersionTimestamp;
    long maximumVersionTimestamp;

    /**
     * Bit markers indicating whether the value associated with the tuple is a
     * raw record or an inline byte[] stored within {@link #getValues() values
     * raba}.
     */
    final boolean[] rawRecords;

    /**
     * Create an empty data record with internal arrays dimensioned for the
     * specified branching factor.
     * 
     * @param branchingFactor
     *            The branching factor for the owning B+Tree.
     * @param hasVersionTimestamps
     *            <code>true</code> iff version timestamps will be maintained.
     * @param hasDeleteMarkers
     *            <code>true</code> iff delete markers will be maintained.
     * @param hasRawRecords
     *            <code>true</code> iff raw record markers will be maintained.
     */
    public MutableBucketData(final int branchingFactor,
            final boolean hasVersionTimestamps, final boolean hasDeleteMarkers,
            final boolean hasRawRecords) {

        keys = new MutableKeyBuffer(branchingFactor /*+ 1*/);

        vals = new MutableValueBuffer(branchingFactor /*+ 1*/);

        versionTimestamps = (hasVersionTimestamps ? new long[branchingFactor /*+ 1*/]
                : null);

        // init per API specification.
        minimumVersionTimestamp = Long.MAX_VALUE;
        maximumVersionTimestamp = Long.MIN_VALUE;
        
        deleteMarkers = (hasDeleteMarkers ? new boolean[branchingFactor /*+ 1*/]
                : null);
        
        rawRecords = (hasRawRecords ? new boolean[branchingFactor /*+ 1*/] : null);

    }

    /**
     * Copy ctor.
     * 
     * @param branchingFactor
     *            The branching factor for the owning B+Tree.
     * @param src
     *            The source leaf.
     */
    public MutableBucketData(final int branchingFactor, final ILeafData src) {

        keys = new MutableKeyBuffer(branchingFactor /*+ 1*/, src.getKeys());

        vals = new MutableValueBuffer(branchingFactor /*+ 1*/, src.getValues());

        versionTimestamps = (src.hasVersionTimestamps() ? new long[branchingFactor /*+ 1*/]
                : null);

        deleteMarkers = (src.hasDeleteMarkers() ? new boolean[branchingFactor /*+ 1*/]
                                                              : null);

        rawRecords = (src.hasRawRecords() ? new boolean[branchingFactor /*+ 1*/]
                : null);

//        final int nkeys = keys.size();
        
        /**
         * Only initialize values for number of key/values stored
         */
        final int dataslots = keys.nkeys;
        
        if (versionTimestamps != null) {

            for (int i = 0; i < dataslots; i++) {

                versionTimestamps[i] = src.getVersionTimestamp(i);
                
            }

            minimumVersionTimestamp = src.getMinimumVersionTimestamp();

            maximumVersionTimestamp = src.getMaximumVersionTimestamp();

        } else {

            minimumVersionTimestamp = Long.MAX_VALUE;

            maximumVersionTimestamp = Long.MIN_VALUE;

        }
        
        if (deleteMarkers != null) {

            for (int i = 0; i < dataslots; i++) {

                deleteMarkers[i] = src.getDeleteMarker(i);
                
            }
            
        }

        if (rawRecords != null) {

            for (int i = 0; i < dataslots; i++) {

                rawRecords[i] = src.getRawRecord(i) != IRawStore.NULL;
                
            }
            
        }

    }

    /**
     * Ctor based on just "data" -- used by unit tests.
     * 
     * @param keys
     *            A representation of the defined keys in the leaf.
     * @param values
     *            An array containing the values found in the leaf.
     * @param versionTimestamps
     *            An array of the version timestamps (iff the version metadata
     *            is being maintained).
     * @param deleteMarkers
     *            An array of the delete markers (iff the version metadata is
     *            being maintained).
     */
    MutableBucketData(final MutableKeyBuffer keys,
            final MutableValueBuffer values, final long[] versionTimestamps,
            final boolean[] deleteMarkers, final boolean[] rawRecords) {
        
        assert keys != null;
        assert values != null;
        assert keys.capacity() == values.capacity();
        if (versionTimestamps != null) {
            assert versionTimestamps.length == keys.capacity();
        }
        if (deleteMarkers != null) {
            assert deleteMarkers.length == keys.capacity();
        }
        if (rawRecords != null) {
            assert rawRecords.length == keys.capacity();
        }

        this.keys = keys;
        this.vals = values;
        this.versionTimestamps = versionTimestamps;
        this.deleteMarkers = deleteMarkers;
        this.rawRecords = rawRecords;

        if (versionTimestamps != null)
            recalcMinMaxVersionTimestamp();

    }
    
    /**
     * The capacity of the bucket page (<code>2^addressBits</code>).
     */
    final public int capacity() {

        return keys.capacity();
        
    }

    /**
     * Range check a tuple index.
     * 
     * @param index
     *            The index of a tuple in [0:#capacity()-1].
     * @return <code>true</code>
     * 
     * @throws IndexOutOfBoundsException
     *             if the index is not in the legal range.
     */
    final protected boolean rangeCheckTupleIndex(final int index) {

        if (index < 0 || index > keys.capacity())
            throw new IndexOutOfBoundsException();

        return true;

    }
    
    /**
     * No - this is a mutable data record.
     */
    final public boolean isReadOnly() {
        
        return false;
        
    }

    /**
     * No.
     */
    final public boolean isCoded() {
        
        return false;
        
    }
    
    final public AbstractFixedByteArrayBuffer data() {
        
        throw new UnsupportedOperationException();
        
    }

    public final long getVersionTimestamp(final int index) {

        if (versionTimestamps == null)
            throw new UnsupportedOperationException();

        assert rangeCheckTupleIndex(index);
        
        return versionTimestamps[index];

    }
    
    final public long getMinimumVersionTimestamp() {

        if (versionTimestamps == null)
            throw new UnsupportedOperationException();

        return minimumVersionTimestamp;

    }
    
    final public long getMaximumVersionTimestamp() {

        if (versionTimestamps == null)
            throw new UnsupportedOperationException();

        return maximumVersionTimestamp;

    }

    public final boolean getDeleteMarker(final int index) {

        if (deleteMarkers == null)
            throw new UnsupportedOperationException();

        assert rangeCheckTupleIndex(index);

        return deleteMarkers[index];

    }

    public final long getRawRecord(final int index) {

        if (rawRecords == null)
            throw new UnsupportedOperationException();

        assert rangeCheckTupleIndex(index);

        if (!rawRecords[index])
            return IRawStore.NULL;

        final byte[] val = vals.get(index);
        
        final long addr = AbstractBTree.decodeRecordAddr(val);
        
        return addr;
        
    }

    final public IRaba getValues() {
        
        return vals;
        
    }
    
    final public IRaba getKeys() {
        
        return keys;
        
    }
    
    /**
     * Always returns <code>true</code>.
     */
    final public boolean isLeaf() {

        return true;

    }

//    /**
//     * For a leaf the #of entries is always the #of keys.
//     */
//    final public int getSpannedTupleCount() {
//        
//        return getKeys().size();
//        
//    }
    
    final public int getValueCount() {
        
        return vals.size();
        
    }
    
    final public boolean hasRawRecords() {
        
        return rawRecords != null; 
        
    }
    
    final public boolean hasDeleteMarkers() {
        
        return deleteMarkers != null; 
        
    }
    
    final public boolean hasVersionTimestamps() {
        
        return versionTimestamps != null; 
        
    }

    final public int getKeyCount() {
        
        return keys.size();
        
    }

    /**
     * No - this class does not support double-linked leaves (only the
     * {@link IndexSegment} actually uses double-linked leaves).
     */
    final public boolean isDoubleLinked() {
     
        return false;

    }

    final public long getNextAddr() {
    
        throw new UnsupportedOperationException();
        
    }

    final public long getPriorAddr() {
        
        throw new UnsupportedOperationException();
        
    }

    /**
     * Recalculate the min/max version timestamp on the leaf. The caller is
     * responsible for propagating the new min/max to the ancestors of the leaf.
     * 
     * @throws UnsupportedOperationException
     *             if the leaf is not maintaining per-tuple version timestamps.
     */
    void recalcMinMaxVersionTimestamp() {

        // must be maintaining version timestamps.
        if (versionTimestamps == null)
            throw new UnsupportedOperationException();

        final int nkeys = keys.nkeys;

        long min = Long.MAX_VALUE;
        long max = Long.MIN_VALUE;

        for (int i = 0; i < nkeys; i++) {

            final long t = versionTimestamps[i];

            if (t < min)
                min = t;

            if (t > max)
                max = t;

        }

        minimumVersionTimestamp = min;
        maximumVersionTimestamp = max;

    }

    /**
     * Inserts a new index/value, maintaining version timestamps and delete markers
     * when necessary
     * 
     * @param insIndex
     * @param key
     * @param val
     * @param rawRecord
     */
	public void insert(final int insIndex, final byte[] key, final byte[] val, final boolean rawRecord) {
		keys.insert(insIndex, key);
		vals.insert(insIndex, val);
		
		if (hasRawRecords()) {
			System.arraycopy(rawRecords, insIndex, rawRecords, insIndex+1, vals.nvalues-insIndex-1);
			rawRecords[insIndex] = rawRecord;
		} else {
			assert !rawRecord;
		}
		if (hasDeleteMarkers()) {
			System.arraycopy(deleteMarkers, insIndex, deleteMarkers, insIndex+1, vals.nvalues-insIndex-1);
			deleteMarkers[insIndex] = false;
		}
		if (hasVersionTimestamps()) {
			System.arraycopy(versionTimestamps, insIndex, versionTimestamps, insIndex+1, vals.nvalues-insIndex-1);
			versionTimestamps[insIndex] = 0; // current version
		}
	}
	
	/**
	 * 
	 * @param index - slot to be removed
	 */
	public void remove(final int index) {
		if (hasDeleteMarkers()) {
			deleteMarkers[index] = true;
		} else {
			keys.remove(index);
			vals.remove(index);

			if (hasRawRecords()) {
				System.arraycopy(rawRecords, index+1, rawRecords, index, vals.nvalues-index);
				rawRecords[vals.nvalues] = false;
			}
			if (hasVersionTimestamps()) {
				System.arraycopy(versionTimestamps, index+1, versionTimestamps, index, vals.nvalues-index);
				versionTimestamps[vals.nvalues] = 0; // current version
			}
		}
	}

}