SharedFieldCache.java example

Explorer
jackrabbit-master
- jackrabbit-trunk
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.jackrabbit.core.query.lucene;

import java.io.IOException;
import java.util.Arrays;
import java.util.HashMap;
import java.util.Map;
import java.util.WeakHashMap;

import javax.jcr.PropertyType;

import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.Term;
import org.apache.lucene.index.TermDocs;
import org.apache.lucene.index.TermEnum;
import org.apache.lucene.index.TermPositions;

/**
 * Implements a variant of the lucene class <code>org.apache.lucene.search.FieldCacheImpl</code>.
 * The lucene FieldCache class has some sort of support for custom comparators
 * but it only works on the basis of a field name. There is no further control
 * over the terms to iterate, that's why we use our own implementation.
 */
public class SharedFieldCache {

    /**
     * Expert: Stores term text values and document ordering data.
     */
    public static class ValueIndex {

        /**
         * Some heuristic factor that determines whether the array is sparse. Note that if less then
         * 1% is set, we already count the array as sparse. This is because it will become memory consuming
         * quickly by keeping the (sparse) arrays 
         */
        private static final int SPARSE_FACTOR = 100;

        /**
         * Values indexed by document id.
         */
        private final Comparable<?>[] values;

        /**
         * Values (Comparable) map indexed by document id.
         */
        public final Map<Integer, Comparable<?>> valuesMap;

        /**
         * Boolean indicating whether the {@link #valuesMap} impl has to be used
         */
        public final boolean sparse;

        /**
         * Creates one of these objects
         */
        public ValueIndex(Comparable<?>[] values, int setValues) {
            if (isSparse(values, setValues)) {
                this.sparse = true;
                this.values = null;
                if (setValues == 0) {
                    this.valuesMap = null;
                } else {
                    this.valuesMap = getValuesMap(values, setValues);
                }
            } else {
                this.sparse = false;
                this.values = values;
                this.valuesMap = null;
            }
        }

        public Comparable<?> getValue(int i) {
            if (sparse) {
                return valuesMap == null ? null : valuesMap.get(i);
            } else {
                return values[i];
            }
        }

        private static Map<Integer, Comparable<?>> getValuesMap(Comparable<?>[] values, int setValues) {
            Map<Integer, Comparable<?>> map = new HashMap<Integer, Comparable<?>>(setValues);
            for (int i = 0; i < values.length && setValues > 0; i++) {
                if (values[i] != null) {
                    map.put(i, values[i]);
                    setValues--;
                }
            }
            return map;
        }

        private static boolean isSparse(Comparable<?>[] values, int setValues) {
            // some really simple test to test whether the array is sparse. Currently, when less then 1% is set, the array is already sparse 
            // for this typical cache to avoid memory issues
            if (setValues * SPARSE_FACTOR < values.length) {
                return true;
            }
            return false;
        }
    }

    static class ComparableArray implements Comparable<ComparableArray> {

        private int offset = 0;

        private Comparable<?>[] c = new Comparable[0];

        public ComparableArray(Comparable<?> item, int index) {
            insert(item, index);
        }

        public int compareTo(ComparableArray o) {
            return Util.compare(c, o.c);
        }

        /**
         * testing purpose only.
         * 
         * @return the offset
         */
        int getOffset() {
            return offset;
        }

        public ComparableArray insert(Comparable<?> item, int index) {
            // optimize for most common scenario
            if (c.length == 0) {
                offset = index;
                c = new Comparable<?>[] { item };
                return this;
            }

            // inside
            if (index >= offset && index < offset + c.length) {
                c[index - offset] = item;
                return this;
            }

            // before
            if (index < offset) {
                int relativeOffset = offset - index;
                Comparable<?>[] newC = new Comparable[relativeOffset + c.length];
                newC[0] = item;
                System.arraycopy(c, 0, newC, relativeOffset, c.length);
                c = newC;
                offset = index;
                return this;
            }

            // after
            if (index >= offset + c.length) {
                Comparable<?>[] newC = new Comparable[index - offset + 1];
                System.arraycopy(c, 0, newC, 0, c.length);
                newC[index - offset] = item;
                c = newC;
                return this;
            }
            return this;
        }

        /*
         * This is needed by {@link UpperCaseSortComparator} and {@link LowerCaseSortComparator}
         */
        @Override
        public String toString() {
            if (c == null) {
                return null;
            }
            if (c.length == 1) {
                return c[0].toString();
            }
            return Arrays.toString(c);
        }
    }

    /**
     * Reference to the single instance of <code>SharedFieldCache</code>.
     */
    public static final SharedFieldCache INSTANCE = new SharedFieldCache();

    /**
     * The internal cache. Maps Entry to array of interpreted term values.
     */
    private final Map<IndexReader, Map<Key, ValueIndex>> cache = new WeakHashMap<IndexReader, Map<Key, ValueIndex>>();

    /**
     * Private constructor.
     */
    private SharedFieldCache() {
    }

    /**
     * Creates a <code>ValueIndex</code> for a <code>field</code> and a term
     * <code>prefix</code>. The term prefix acts as the property name for the
     * shared <code>field</code>.
     * <p>
     * This method is an adapted version of: <code>FieldCacheImpl.getStringIndex()</code>
     *
     * @param reader     the <code>IndexReader</code>.
     * @param field      name of the shared field.
     * @param prefix     the property name, will be used as term prefix.
     * @return a ValueIndex that contains the field values and order
     *         information.
     * @throws IOException if an error occurs while reading from the index.
     */
    public ValueIndex getValueIndex(IndexReader reader, String field,
            String prefix) throws IOException {

        if (reader instanceof ReadOnlyIndexReader) {
            reader = ((ReadOnlyIndexReader) reader).getBase();
        }

        field = field.intern();
        ValueIndex ret = lookup(reader, field, prefix);
        if (ret == null) {
            final int maxDocs = reader.maxDoc();
            Comparable<?>[] retArray = new Comparable<?>[maxDocs];
            Map<Integer, Integer> positions = new HashMap<Integer, Integer>();
            boolean usingSimpleComparable = true;
            int setValues = 0;
            if (maxDocs > 0) {
                IndexFormatVersion version = IndexFormatVersion.getVersion(reader);
                boolean hasPayloads = version.isAtLeast(IndexFormatVersion.V3);
                TermDocs termDocs;
                byte[] payload = null;
                int type;
                if (hasPayloads) {
                    termDocs = reader.termPositions();
                    payload = new byte[1];
                } else {
                    termDocs = reader.termDocs();
                }
                TermEnum termEnum = reader.terms(new Term(field, prefix));
                try {
                    if (termEnum.term() == null) {
                        throw new RuntimeException("no terms in field " + field);
                    }
                    do {
                        Term term = termEnum.term();
                        if (term.field() != field || !term.text().startsWith(prefix)) {
                            break;
                        }
                        final String value = termValueAsString(term, prefix);
                        termDocs.seek(term);
                        while (termDocs.next()) {
                            int termPosition = 0;
                            type = PropertyType.UNDEFINED;
                            if (hasPayloads) {
                                TermPositions termPos = (TermPositions) termDocs;
                                termPosition = termPos.nextPosition();
                                if (termPos.isPayloadAvailable()) {
                                    payload = termPos.getPayload(payload, 0);
                                    type = PropertyMetaData.fromByteArray(payload).getPropertyType();
                                }
                            }
                            setValues++;
                            Comparable<?> v = getValue(value, type);
                            int doc = termDocs.doc();
                            Comparable<?> ca = retArray[doc];
                            if (ca == null) {
                                if (usingSimpleComparable) {
                                    // put simple value on the queue
                                    positions.put(doc, termPosition);
                                    retArray[doc] = v;
                                } else {
                                    retArray[doc] = new ComparableArray(v,
                                            termPosition);
                                }
                            } else {
                                if (ca instanceof ComparableArray) {
                                    ((ComparableArray) ca).insert(v,
                                            termPosition);
                                } else {
                                    // transform all of the existing values from
                                    // Comparable to ComparableArray
                                    for (int pos : positions.keySet()) {
                                        retArray[pos] = new ComparableArray(
                                                retArray[pos],
                                                positions.get(pos));
                                    }
                                    positions = null;
                                    usingSimpleComparable = false;
                                    ComparableArray caNew = (ComparableArray) retArray[doc];
                                    retArray[doc] = caNew.insert(v,
                                            termPosition);
                                }
                            }
                        }
                    } while (termEnum.next());
                } finally {
                    termDocs.close();
                    termEnum.close();
                }
            }
            ValueIndex value = new ValueIndex(retArray, setValues);
            store(reader, field, prefix, value);
            return value;
        }
        return ret;
    }

    /**
     * Extracts the value from a given Term as a String
     * 
     * @param term
     * @param prefix
     * @return string value contained in the term
     */
    private static String termValueAsString(Term term, String prefix) {
        // make sure term is compacted
        String text = term.text();
        int length = text.length() - prefix.length();
        char[] tmp = new char[length];
        text.getChars(prefix.length(), text.length(), tmp, 0);
        return new String(tmp, 0, length);
    }

    /**
     * See if a <code>ValueIndex</code> object is in the cache.
     */
    ValueIndex lookup(IndexReader reader, String field, String prefix) {
        synchronized (cache) {
            Map<Key, ValueIndex> readerCache = cache.get(reader);
            if (readerCache == null) {
                return null;
            }
            return readerCache.get(new Key(field, prefix));
        }
    }

    /**
     * Put a <code>ValueIndex</code> <code>value</code> to cache.
     */
    void store(IndexReader reader, String field, String prefix, ValueIndex value) {
        synchronized (cache) {
            Map<Key, ValueIndex> readerCache = cache.get(reader);
            if (readerCache == null) {
                readerCache = new HashMap<Key, ValueIndex>();
                cache.put(reader, readerCache);
            }
            readerCache.put(new Key(field, prefix), value);
        }
    }

    /**
     * Returns a comparable for the given <code>value</code> that is read from
     * the index.
     *
     * @param value the value as read from the index.
     * @param type the property type.
     * @return a comparable for the <code>value</code>.
     */
    private Comparable<?> getValue(String value, int type) {
        switch (type) {
            case PropertyType.BOOLEAN:
                return Boolean.valueOf(value);
            case PropertyType.DATE:
                return DateField.stringToTime(value);
            case PropertyType.LONG:
                return LongField.stringToLong(value);
            case PropertyType.DOUBLE:
                return DoubleField.stringToDouble(value);
            case PropertyType.DECIMAL:
                return DecimalField.stringToDecimal(value);
            default:
                return value;
        }
    }

    /**
     * A compound <code>Key</code> that consist of <code>field</code>
     * and <code>prefix</code>.
     */
    static class Key {

        private final String field;
        private final String prefix;

        /**
         * Creates <code>Key</code> for ValueIndex lookup.
         */
        Key(String field, String prefix) { 
            this.field = field.intern();
            this.prefix = prefix.intern();
        }

        /**
         * Returns <code>true</code> if <code>o</code> is a <code>Key</code>
         * instance and refers to the same field and prefix.
         */
        public boolean equals(Object o) {
            if (o instanceof Key) {
                Key other = (Key) o;
                return other.field == field
                        && other.prefix == prefix;
            }
            return false;
        }

        /**
         * Composes a hashcode based on the field and prefix.
         */
        public int hashCode() {
            return field.hashCode() ^ prefix.hashCode();
        }
    }

}