/* * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.facebook.presto.operator; import com.facebook.presto.operator.SetBuilderOperator.SetSupplier; import com.facebook.presto.spi.Page; import com.facebook.presto.spi.PrestoException; import com.facebook.presto.spi.block.Block; import com.facebook.presto.spi.block.BlockBuilder; import com.facebook.presto.spi.type.Type; import com.facebook.presto.sql.planner.plan.PlanNodeId; import com.google.common.collect.ImmutableList; import com.google.common.util.concurrent.ListenableFuture; import java.util.List; import static com.facebook.presto.spi.StandardErrorCode.NOT_SUPPORTED; import static com.facebook.presto.spi.type.BooleanType.BOOLEAN; import static com.google.common.base.Preconditions.checkArgument; import static com.google.common.base.Preconditions.checkState; import static io.airlift.concurrent.MoreFutures.tryGetFutureValue; import static java.util.Objects.requireNonNull; public class HashSemiJoinOperator implements Operator { private final OperatorContext operatorContext; public static class HashSemiJoinOperatorFactory implements OperatorFactory { private final int operatorId; private final PlanNodeId planNodeId; private final SetSupplier setSupplier; private final List<Type> probeTypes; private final int probeJoinChannel; private final List<Type> types; private boolean closed; public HashSemiJoinOperatorFactory(int operatorId, PlanNodeId planNodeId, SetSupplier setSupplier, List<? extends Type> probeTypes, int probeJoinChannel) { this.operatorId = operatorId; this.planNodeId = requireNonNull(planNodeId, "planNodeId is null"); this.setSupplier = setSupplier; this.probeTypes = ImmutableList.copyOf(probeTypes); checkArgument(probeJoinChannel >= 0, "probeJoinChannel is negative"); this.probeJoinChannel = probeJoinChannel; this.types = ImmutableList.<Type>builder() .addAll(probeTypes) .add(BOOLEAN) .build(); } @Override public List<Type> getTypes() { return types; } @Override public Operator createOperator(DriverContext driverContext) { checkState(!closed, "Factory is already closed"); OperatorContext operatorContext = driverContext.addOperatorContext(operatorId, planNodeId, HashSemiJoinOperator.class.getSimpleName()); return new HashSemiJoinOperator(operatorContext, setSupplier, probeTypes, probeJoinChannel); } @Override public void close() { closed = true; } @Override public OperatorFactory duplicate() { return new HashSemiJoinOperatorFactory(operatorId, planNodeId, setSupplier, probeTypes, probeJoinChannel); } } private final int probeJoinChannel; private final List<Type> types; private final ListenableFuture<ChannelSet> channelSetFuture; private ChannelSet channelSet; private Page outputPage; private boolean finishing; public HashSemiJoinOperator(OperatorContext operatorContext, SetSupplier channelSetFuture, List<Type> probeTypes, int probeJoinChannel) { this.operatorContext = requireNonNull(operatorContext, "operatorContext is null"); // todo pass in desired projection requireNonNull(channelSetFuture, "hashProvider is null"); requireNonNull(probeTypes, "probeTypes is null"); checkArgument(probeJoinChannel >= 0, "probeJoinChannel is negative"); this.channelSetFuture = channelSetFuture.getChannelSet(); this.probeJoinChannel = probeJoinChannel; this.types = ImmutableList.<Type>builder() .addAll(probeTypes) .add(BOOLEAN) .build(); } @Override public OperatorContext getOperatorContext() { return operatorContext; } @Override public List<Type> getTypes() { return types; } @Override public void finish() { finishing = true; } @Override public boolean isFinished() { return finishing && outputPage == null; } @Override public ListenableFuture<?> isBlocked() { return channelSetFuture; } @Override public boolean needsInput() { if (finishing || outputPage != null) { return false; } if (channelSet == null) { channelSet = tryGetFutureValue(channelSetFuture).orElse(null); } return channelSet != null; } @Override public void addInput(Page page) { requireNonNull(page, "page is null"); checkState(!finishing, "Operator is finishing"); checkState(channelSet != null, "Set has not been built yet"); checkState(outputPage == null, "Operator still has pending output"); // create the block builder for the new boolean column // we know the exact size required for the block BlockBuilder blockBuilder = BOOLEAN.createFixedSizeBlockBuilder(page.getPositionCount()); Page probeJoinPage = new Page(page.getBlock(probeJoinChannel)); // update hashing strategy to use probe cursor for (int position = 0; position < page.getPositionCount(); position++) { if (probeJoinPage.getBlock(0).isNull(position)) { throw new PrestoException( NOT_SUPPORTED, "NULL values are not allowed on the probe side of SemiJoin operator. See the query plan for details."); } else { boolean contains = channelSet.contains(position, probeJoinPage); if (!contains && channelSet.containsNull()) { blockBuilder.appendNull(); } else { BOOLEAN.writeBoolean(blockBuilder, contains); } } } // add the new boolean column to the page Block[] sourceBlocks = page.getBlocks(); Block[] outputBlocks = new Block[sourceBlocks.length + 1]; // +1 for the single boolean output channel System.arraycopy(sourceBlocks, 0, outputBlocks, 0, sourceBlocks.length); outputBlocks[sourceBlocks.length] = blockBuilder.build(); outputPage = new Page(outputBlocks); } @Override public Page getOutput() { Page result = outputPage; outputPage = null; return result; } }