/** * diqube: Distributed Query Base. * * Copyright (C) 2015 Bastian Gloeckle * * This file is part of diqube. * * diqube is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License as * published by the Free Software Foundation, either version 3 of the * License, or (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Affero General Public License for more details. * * You should have received a copy of the GNU Affero General Public License * along with this program. If not, see <http://www.gnu.org/licenses/>. */ package org.diqube.function.aggregate; import java.math.BigDecimal; import org.diqube.data.column.ColumnType; import org.diqube.function.AggregationFunction; import org.diqube.function.Function; import org.diqube.function.FunctionException; import org.diqube.function.aggregate.result.IntermediaryResultValueIterator; import org.diqube.function.aggregate.result.IntermediaryResultValueSink; import org.diqube.function.aggregate.util.BigDecimalHelper; /** * Calculates the population variance. * * <p> * 1/N * sum(x_i^2) - avg(x_i)^2. * * @author Bastian Gloeckle */ @Function(name = VarDoubleFunction.NAME) public class VarDoubleFunction implements AggregationFunction<Double, Double> { public static final String NAME = "var"; private AvgDoubleFunction avgFn; private long count = 0l; private BigDecimal squaredSum = BigDecimalHelper.zeroCreate(); public VarDoubleFunction() { avgFn = new AvgDoubleFunction(); } @Override public String getNameLowerCase() { return NAME; } @Override public void provideConstantParameter(int idx, Object value) throws FunctionException { // noop } @Override public void addValues(ValueProvider<Double> valueProvider) { Double[] values = valueProvider.getValues(); for (Double value : values) { squaredSum = squaredSum.add(BigDecimal.valueOf(value).pow(2)); count++; } avgFn.addValues(new ValueProvider<Double>() { @Override public long size() { return values.length; } @Override public Double[] getValues() { return values; } @Override public boolean isFinalSetOfValues() { return valueProvider.isFinalSetOfValues(); } }); } @Override public void addIntermediary(IntermediaryResultValueIterator intermediary) { long otherCount = (Long) intermediary.next(); BigDecimal otherSquaredSum = (BigDecimal) intermediary.next(); avgFn.addIntermediary(intermediary); count += otherCount; squaredSum = squaredSum.add(otherSquaredSum); } @Override public void removeIntermediary(IntermediaryResultValueIterator intermediary) { long otherCount = (Long) intermediary.next(); BigDecimal otherSquaredSum = (BigDecimal) intermediary.next(); avgFn.removeIntermediary(intermediary); if (otherCount == count) { count = 0; squaredSum = BigDecimalHelper.zeroCreate(); return; } count -= otherCount; squaredSum = squaredSum.subtract(otherSquaredSum); } @Override public void populateIntermediary(IntermediaryResultValueSink res) throws FunctionException { res.pushValue(count); res.pushValue(squaredSum); avgFn.populateIntermediary(res); } @Override public Double calculate() throws FunctionException { double avg = avgFn.calculate(); BigDecimal res = squaredSum.divide(BigDecimal.valueOf(count), BigDecimalHelper.defaultMathContext()); res = res.subtract(BigDecimal.valueOf(avg).pow(2)); return res.doubleValue(); } @Override public ColumnType getOutputType() { return ColumnType.DOUBLE; } @Override public ColumnType getInputType() { return ColumnType.DOUBLE; } @Override public boolean needsActualValues() { return true; } }