/*
* Licensed to CRATE Technology GmbH ("Crate") under one or more contributor
* license agreements. See the NOTICE file distributed with this work for
* additional information regarding copyright ownership. Crate licenses
* this file to you under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License. You may
* obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations
* under the License.
*
* However, if you have executed another commercial license agreement
* with Crate these terms will supersede the license and you may use the
* software solely pursuant to the terms of the relevant commercial agreement.
*/
package io.crate.operation.aggregation.impl;
import com.google.common.collect.ImmutableList;
import io.crate.breaker.RamAccountingContext;
import io.crate.breaker.SizeEstimator;
import io.crate.breaker.SizeEstimatorFactory;
import io.crate.metadata.FunctionIdent;
import io.crate.metadata.FunctionInfo;
import io.crate.data.Input;
import io.crate.operation.aggregation.AggregationFunction;
import io.crate.types.DataType;
import io.crate.types.DataTypes;
import io.crate.types.SetType;
import org.elasticsearch.common.breaker.CircuitBreakingException;
import java.util.HashSet;
import java.util.Set;
public class CollectSetAggregation extends AggregationFunction<Set<Object>, Set<Object>> {
public static final String NAME = "collect_set";
private final SizeEstimator<Object> innerTypeEstimator;
private FunctionInfo info;
public static void register(AggregationImplModule mod) {
for (final DataType dataType : DataTypes.PRIMITIVE_TYPES) {
mod.register(new CollectSetAggregation(new FunctionInfo(new FunctionIdent(NAME,
ImmutableList.of(dataType)),
new SetType(dataType), FunctionInfo.Type.AGGREGATE)));
}
}
CollectSetAggregation(FunctionInfo info) {
this.innerTypeEstimator = SizeEstimatorFactory.create(((SetType) info.returnType()).innerType());
this.info = info;
}
@Override
public FunctionInfo info() {
return info;
}
@Override
public Set<Object> iterate(RamAccountingContext ramAccountingContext, Set<Object> state, Input... args) throws CircuitBreakingException {
Object value = args[0].value();
if (value == null) {
return state;
}
if (state.add(value)) {
ramAccountingContext.addBytes(
RamAccountingContext.roundUp(innerTypeEstimator.estimateSize(value) + 36L) // values size + 32 bytes for entry, 4 bytes for increased capacity
);
}
return state;
}
@Override
public Set<Object> newState(RamAccountingContext ramAccountingContext) {
ramAccountingContext.addBytes(RamAccountingContext.roundUp(64L)); // overhead for HashSet: 32 * 0 + 16 * 4 bytes
return new HashSet<>();
}
@Override
public DataType partialType() {
return info.returnType();
}
@Override
public Set<Object> reduce(RamAccountingContext ramAccountingContext, Set<Object> state1, Set<Object> state2) {
for (Object newValue : state2) {
if (state1.add(newValue)) {
ramAccountingContext.addBytes(
RamAccountingContext.roundUp(innerTypeEstimator.estimateSize(newValue) + 36L) // value size + 32 bytes for entry + 4 bytes for increased capacity
);
}
}
return state1;
}
@Override
public Set<Object> terminatePartial(RamAccountingContext ramAccountingContext, Set<Object> state) {
return state;
}
}