/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.lucene.util.packed; import static org.apache.lucene.util.BitUtil.zigZagDecode; import static org.apache.lucene.util.packed.AbstractBlockPackedWriter.BPV_SHIFT; import static org.apache.lucene.util.packed.AbstractBlockPackedWriter.MAX_BLOCK_SIZE; import static org.apache.lucene.util.packed.AbstractBlockPackedWriter.MIN_BLOCK_SIZE; import static org.apache.lucene.util.packed.AbstractBlockPackedWriter.MIN_VALUE_EQUALS_0; import static org.apache.lucene.util.packed.BlockPackedReaderIterator.readVLong; import static org.apache.lucene.util.packed.PackedInts.checkBlockSize; import static org.apache.lucene.util.packed.PackedInts.numBlocks; import java.io.IOException; import org.apache.lucene.index.CorruptIndexException; import org.apache.lucene.store.IndexInput; import org.apache.lucene.util.Accountable; import org.apache.lucene.util.LongValues; /** * Provides random access to a stream written with {@link BlockPackedWriter}. * @lucene.internal */ public final class BlockPackedReader extends LongValues implements Accountable { private final int blockShift, blockMask; private final long valueCount; private final long[] minValues; private final PackedInts.Reader[] subReaders; private final long sumBPV; /** Sole constructor. */ public BlockPackedReader(IndexInput in, int packedIntsVersion, int blockSize, long valueCount, boolean direct) throws IOException { this.valueCount = valueCount; blockShift = checkBlockSize(blockSize, MIN_BLOCK_SIZE, MAX_BLOCK_SIZE); blockMask = blockSize - 1; final int numBlocks = numBlocks(valueCount, blockSize); long[] minValues = null; subReaders = new PackedInts.Reader[numBlocks]; long sumBPV = 0; for (int i = 0; i < numBlocks; ++i) { final int token = in.readByte() & 0xFF; final int bitsPerValue = token >>> BPV_SHIFT; sumBPV += bitsPerValue; if (bitsPerValue > 64) { throw new CorruptIndexException("Corrupted Block#" + i, in); } if ((token & MIN_VALUE_EQUALS_0) == 0) { if (minValues == null) { minValues = new long[numBlocks]; } minValues[i] = zigZagDecode(1L + readVLong(in)); } if (bitsPerValue == 0) { subReaders[i] = new PackedInts.NullReader(blockSize); } else { final int size = (int) Math.min(blockSize, valueCount - (long) i * blockSize); if (direct) { final long pointer = in.getFilePointer(); subReaders[i] = PackedInts.getDirectReaderNoHeader(in, PackedInts.Format.PACKED, packedIntsVersion, size, bitsPerValue); in.seek(pointer + PackedInts.Format.PACKED.byteCount(packedIntsVersion, size, bitsPerValue)); } else { subReaders[i] = PackedInts.getReaderNoHeader(in, PackedInts.Format.PACKED, packedIntsVersion, size, bitsPerValue); } } } this.minValues = minValues; this.sumBPV = sumBPV; } @Override public long get(long index) { assert index >= 0 && index < valueCount; final int block = (int) (index >>> blockShift); final int idx = (int) (index & blockMask); return (minValues == null ? 0 : minValues[block]) + subReaders[block].get(idx); } @Override public long ramBytesUsed() { long size = 0; for (PackedInts.Reader reader : subReaders) { size += reader.ramBytesUsed(); } return size; } @Override public String toString() { long avgBPV = subReaders.length == 0 ? 0 : sumBPV / subReaders.length; return getClass().getSimpleName() + "(blocksize=" + (1<<blockShift) + ",size=" + valueCount + ",avgBPV=" + avgBPV + ")"; } }