/** * Copyright (C) 2014-2016 LinkedIn Corp. (pinot-core@linkedin.com) * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.linkedin.pinot.index.writer; import java.io.DataInputStream; import java.io.File; import java.io.FileInputStream; import java.io.RandomAccessFile; import java.util.Random; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import org.testng.Assert; import org.testng.annotations.Test; import com.linkedin.pinot.core.io.writer.impl.FixedBitSingleColumnMultiValueWriter; import com.linkedin.pinot.core.util.CustomBitSet; public class FixedBitWidthSingleColumnMultiValueWriterTest { private static final Logger LOGGER = LoggerFactory.getLogger(FixedBitWidthSingleColumnMultiValueWriterTest.class); @Test public void testSingleColMultiValue() throws Exception { int maxBits = 2; while (maxBits < 32) { LOGGER.trace("START test maxBit:" + maxBits); File file = new File("test_single_col_multi_value_writer.dat"); file.delete(); int rows = 100; int[][] data = new int[rows][]; int maxValue = (int) Math.pow(2, maxBits); Random r = new Random(); int totalNumValues = 0; for (int i = 0; i < rows; i++) { int numValues = r.nextInt(100) + 1; data[i] = new int[numValues]; for (int j = 0; j < numValues; j++) { data[i][j] = r.nextInt(maxValue); } totalNumValues += numValues; } FixedBitSingleColumnMultiValueWriter writer = new FixedBitSingleColumnMultiValueWriter( file, rows, totalNumValues, maxBits); CustomBitSet bitSet = CustomBitSet .withBitLength(totalNumValues * maxBits); int index = 0; for (int i = 0; i < rows; i++) { writer.setIntArray(i, data[i]); for (int j = 0; j < data[i].length; j++) { int value = data[i][j]; for (int bitPos = maxBits - 1; bitPos >= 0; bitPos--) { if ((value & (1 << bitPos)) != 0) { bitSet.setBit(index * maxBits + (maxBits - bitPos - 1)); } } index = index + 1; } } writer.close(); // verify header DataInputStream dis = new DataInputStream(new FileInputStream(file)); int totalLength = 0; for (int i = 0; i < rows; i++) { Assert.assertEquals(dis.readInt(), totalLength); Assert.assertEquals(dis.readInt(), data[i].length); totalLength += data[i].length; } dis.close(); // verify data byte[] byteArray = bitSet.toByteArray(); RandomAccessFile raf = new RandomAccessFile(file, "r"); // Header contains 1 row for each doc and each row contains 2 ints int headerSize = rows * 2 * 4; int dataLength = (int) raf.length() - headerSize; byte[] b = new byte[dataLength]; // read the data segment that starts after the header. raf.seek(headerSize); raf.read(b, 0, dataLength); Assert.assertEquals(byteArray.length, b.length); Assert.assertEquals(byteArray, b); raf.close(); file.delete(); LOGGER.trace("END test maxBit:" + maxBits); maxBits = maxBits + 1; bitSet.close(); } } }