/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.api.java.summarize.aggregation;
import org.apache.flink.api.java.summarize.StringColumnSummary;
import org.junit.Assert;
import org.junit.Test;
/**
 * Tests for {@link StringSummaryAggregator}: checks the counts and string-length
 * statistics exposed by the resulting {@link StringColumnSummary}.
 */
public class StringSummaryAggregatorTest {

    /** Mix of null, empty, whitespace-only and regular strings. */
    @Test
    public void testMixedGroup() {
        // Non-null lengths: 3, 0, 2, 6, 3, 0, 1 -> sum 15 over 7 values (mean = 15/7 ~= 2.142857).
        // The first whitespace-only value must be two characters long for the expected mean to hold.
        StringColumnSummary summary =
            summarize("abc", "", null, "  ", "defghi", "foo", null, null, "", " ");

        Assert.assertEquals(10, summary.getTotalCount());
        Assert.assertEquals(3, summary.getNullCount());
        Assert.assertEquals(7, summary.getNonNullCount());
        Assert.assertEquals(2, summary.getEmptyCount());
        Assert.assertEquals(0, summary.getMinLength().intValue());
        Assert.assertEquals(6, summary.getMaxLength().intValue());
        Assert.assertEquals(2.142857, summary.getMeanLength().doubleValue(), 0.001);
    }

    /** With only null inputs, the length statistics are expected to be null. */
    @Test
    public void testAllNullStrings() {
        StringColumnSummary summary = summarize(null, null, null, null);

        Assert.assertEquals(4, summary.getTotalCount());
        Assert.assertEquals(4, summary.getNullCount());
        Assert.assertEquals(0, summary.getNonNullCount());
        Assert.assertEquals(0, summary.getEmptyCount());
        Assert.assertNull(summary.getMinLength());
        Assert.assertNull(summary.getMaxLength());
        Assert.assertNull(summary.getMeanLength());
    }

    /** Only non-null, non-empty inputs. */
    @Test
    public void testAllWithValues() {
        StringColumnSummary summary = summarize("cat", "hat", "dog", "frog");

        Assert.assertEquals(4, summary.getTotalCount());
        Assert.assertEquals(0, summary.getNullCount());
        Assert.assertEquals(4, summary.getNonNullCount());
        Assert.assertEquals(0, summary.getEmptyCount());
        Assert.assertEquals(3, summary.getMinLength().intValue());
        Assert.assertEquals(4, summary.getMaxLength().intValue());
        // (3 + 3 + 3 + 4) / 4 = 3.25 is exactly representable as a double, hence the zero delta.
        Assert.assertEquals(3.25, summary.getMeanLength().doubleValue(), 0.0);
    }

    /**
     * Helper method for summarizing a list of values.
     *
     * <p>This method deliberately breaks the rule of "testing only one thing": it delegates to
     * an {@link AggregateCombineHarness}, which aggregates and combines the values in several
     * different ways and uses {@code compareResults} to check that the resulting summaries agree.
     *
     * @param values the strings to summarize; individual elements may be {@code null}
     * @return the summary produced by the harness for the given values
     */
    protected StringColumnSummary summarize(String... values) {
        return new AggregateCombineHarness<String, StringColumnSummary, StringSummaryAggregator>() {

            @Override
            protected void compareResults(StringColumnSummary result1, StringColumnSummary result2) {
                Assert.assertEquals(result1.getEmptyCount(), result2.getEmptyCount());
                Assert.assertEquals(result1.getMaxLength(), result2.getMaxLength());
                Assert.assertEquals(result1.getMinLength(), result2.getMinLength());

                if (result1.getMeanLength() == null || result2.getMeanLength() == null) {
                    // If either mean is absent, both must be. Comparing the references directly
                    // produces a readable assertion failure rather than a NullPointerException
                    // when only one side is null.
                    Assert.assertEquals(result1.getMeanLength(), result2.getMeanLength());
                } else {
                    // Means are compared with a small tolerance rather than exactly.
                    Assert.assertEquals(
                        result1.getMeanLength().doubleValue(),
                        result2.getMeanLength().doubleValue(),
                        1e-5d);
                }

                Assert.assertEquals(result1.getNullCount(), result2.getNullCount());
                Assert.assertEquals(result1.getNonNullCount(), result2.getNonNullCount());
            }
        }.summarize(values);
    }
}