/**
 * Copyright (C) 2014-2016 LinkedIn Corp. (pinot-core@linkedin.com)
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *         http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.linkedin.pinot.core.operator.query;

import com.linkedin.pinot.common.request.Selection;
import com.linkedin.pinot.common.utils.DataSchema;
import com.linkedin.pinot.core.common.Block;
import com.linkedin.pinot.core.common.BlockId;
import com.linkedin.pinot.core.common.Operator;
import com.linkedin.pinot.core.indexsegment.IndexSegment;
import com.linkedin.pinot.core.operator.BaseOperator;
import com.linkedin.pinot.core.operator.ExecutionStatistics;
import com.linkedin.pinot.core.operator.MProjectionOperator;
import com.linkedin.pinot.core.operator.blocks.DocIdSetBlock;
import com.linkedin.pinot.core.operator.blocks.IntermediateResultsBlock;
import com.linkedin.pinot.core.operator.blocks.ProjectionBlock;
import com.linkedin.pinot.core.query.selection.SelectionFetcher;
import com.linkedin.pinot.core.query.selection.SelectionOperatorUtils;
import java.io.Serializable;
import java.util.ArrayList;
import java.util.Collection;
import java.util.List;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;


/**
 * Applies a selection query to a single {@link IndexSegment}.
 *
 * <p>{@link #getNextBlock()} pulls projection blocks from the wrapped {@link MProjectionOperator},
 * fetches one row per document id, and stops once {@code selection.getSize()} rows have been
 * collected or the projection operator returns {@code null}. The collected rows are returned
 * wrapped in an {@link IntermediateResultsBlock}.
 */
public class MSelectionOnlyOperator extends BaseOperator {
  private static final Logger LOGGER = LoggerFactory.getLogger(MSelectionOnlyOperator.class);
  private static final String OPERATOR_NAME = "MSelectionOnlyOperator";

  private final IndexSegment _indexSegment;
  private final MProjectionOperator _projectionOperator;
  private final DataSchema _dataSchema;
  // Scratch array reused for every projection block; slot i holds the block of schema column i.
  private final Block[] _blocks;
  // Maximum number of rows to collect, taken from Selection.getSize().
  private final int _limitDocs;
  // Rows collected so far; the same collection instance is handed to the result block.
  private final Collection<Serializable[]> _rowEvents;

  // Assigned by getNextBlock(); stays null until that method has run.
  private ExecutionStatistics _executionStatistics;

  /**
   * Builds the operator for one segment.
   *
   * @param indexSegment segment the selection runs against; also used to resolve the selection
   *     columns and the data schema
   * @param selection selection request supplying the selected columns and the row limit
   * @param projectionOperator source of projection blocks; must be an {@link MProjectionOperator}
   * @throws ClassCastException if {@code projectionOperator} is not an {@link MProjectionOperator}
   */
  public MSelectionOnlyOperator(IndexSegment indexSegment, Selection selection, Operator projectionOperator) {
    _indexSegment = indexSegment;
    _limitDocs = selection.getSize();
    _projectionOperator = (MProjectionOperator) projectionOperator;

    List<String> selectionColumns =
        SelectionOperatorUtils.getSelectionColumns(selection.getSelectionColumns(), indexSegment);
    _dataSchema = SelectionOperatorUtils.extractDataSchema(null, selectionColumns, indexSegment);
    _blocks = new Block[selectionColumns.size()];
    _rowEvents = new ArrayList<>();
  }

  /**
   * Opens the underlying projection operator.
   *
   * @return always {@code true}
   */
  @Override
  public boolean open() {
    _projectionOperator.open();
    return true;
  }

  /**
   * Collects up to the configured limit of rows from the projection operator and records the
   * execution statistics for this run.
   *
   * @return an {@link IntermediateResultsBlock} holding the data schema and the collected rows
   */
  @Override
  public Block getNextBlock() {
    int numDocsScanned = 0;

    ProjectionBlock projectionBlock;
    while ((projectionBlock = (ProjectionBlock) _projectionOperator.nextBlock()) != null) {
      // Refresh the per-column blocks for the current projection block.
      for (int i = 0; i < _dataSchema.size(); i++) {
        _blocks[i] = projectionBlock.getBlock(_dataSchema.getColumnName(i));
      }
      SelectionFetcher selectionFetcher = new SelectionFetcher(_blocks, _dataSchema);

      // Never fetch more documents than are still needed to reach the limit.
      DocIdSetBlock docIdSetBlock = projectionBlock.getDocIdSetBlock();
      int numDocsToFetch = Math.min(docIdSetBlock.getSearchableLength(), _limitDocs - _rowEvents.size());
      numDocsScanned += numDocsToFetch;

      int[] docIdSet = docIdSetBlock.getDocIdSet();
      for (int i = 0; i < numDocsToFetch; i++) {
        _rowEvents.add(selectionFetcher.getRow(docIdSet[i]));
      }

      // Limit reached: stop pulling further projection blocks.
      if (_rowEvents.size() == _limitDocs) {
        break;
      }
    }

    // Create execution statistics.
    long numEntriesScannedInFilter = _projectionOperator.getExecutionStatistics().getNumEntriesScannedInFilter();
    // Widen before multiplying so the product is computed in 64-bit arithmetic; multiplying first
    // and widening afterwards can overflow for a large limit combined with many projected columns.
    long numEntriesScannedPostFilter = (long) numDocsScanned * _projectionOperator.getNumProjectionColumns();
    long numTotalRawDocs = _indexSegment.getSegmentMetadata().getTotalRawDocs();
    _executionStatistics =
        new ExecutionStatistics(numDocsScanned, numEntriesScannedInFilter, numEntriesScannedPostFilter,
            numTotalRawDocs);

    return new IntermediateResultsBlock(_dataSchema, _rowEvents);
  }

  /**
   * Not supported by this operator.
   *
   * @throws UnsupportedOperationException always
   */
  @Override
  public Block getNextBlock(BlockId blockId) {
    throw new UnsupportedOperationException();
  }

  /**
   * @return the constant operator name {@code "MSelectionOnlyOperator"}
   */
  @Override
  public String getOperatorName() {
    return OPERATOR_NAME;
  }

  /**
   * Closes the underlying projection operator.
   *
   * @return always {@code true}
   */
  @Override
  public boolean close() {
    _projectionOperator.close();
    return true;
  }

  /**
   * @return the statistics recorded by the most recent {@link #getNextBlock()} call, or
   *     {@code null} if {@link #getNextBlock()} has not been called yet
   */
  @Override
  public ExecutionStatistics getExecutionStatistics() {
    return _executionStatistics;
  }
}