/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.mahout.common.iterator;
import java.util.Collections;
import java.util.Iterator;
import java.util.Arrays;
import java.util.List;
import org.apache.mahout.common.MahoutTestCase;
import org.junit.Test;
public abstract class SamplerCase extends MahoutTestCase {
// these provide access to the underlying implementation
protected abstract Iterator<Integer> createSampler(int n, Iterator<Integer> source);
protected abstract boolean isSorted();
@Test
public void testEmptyCase() {
assertFalse(createSampler(100, new CountingIterator(0)).hasNext());
}
@Test
public void testSmallInput() {
Iterator<Integer> t = createSampler(10, new CountingIterator(1));
assertTrue(t.hasNext());
assertEquals(0, t.next().intValue());
assertFalse(t.hasNext());
t = createSampler(10, new CountingIterator(1));
assertTrue(t.hasNext());
assertEquals(0, t.next().intValue());
assertFalse(t.hasNext());
}
@Test
public void testAbsurdSize() {
Iterator<Integer> t = createSampler(0, new CountingIterator(2));
assertFalse(t.hasNext());
}
@Test
public void testExactSizeMatch() {
Iterator<Integer> t = createSampler(10, new CountingIterator(10));
for (int i = 0; i < 10; i++) {
assertTrue(t.hasNext());
assertEquals(i, t.next().intValue());
}
assertFalse(t.hasNext());
}
@Test
public void testSample() {
Iterator<Integer> source = new CountingIterator(100);
Iterator<Integer> t = createSampler(15, source);
// this is just a regression test, not a real test
List<Integer> expectedValues = Arrays.asList(83, 56, 69, 96, 4, 59, 70, 7, 93, 52, 39, 11, 16, 67, 26);
if (isSorted()) {
Collections.sort(expectedValues);
}
Iterator<Integer> expected = expectedValues.iterator();
int last = Integer.MIN_VALUE;
for (int i = 0; i < 15; i++) {
assertTrue(t.hasNext());
int actual = t.next();
if (isSorted()) {
assertTrue(actual >= last);
last = actual;
} else {
// any of the first few values should be in the original places
if (actual < 15) {
assertEquals(i, actual);
}
}
assertTrue(actual >= 0 && actual < 100);
// this is just a regression test, but still of some value
assertEquals(expected.next().intValue(), actual);
assertFalse(source.hasNext());
}
assertFalse(t.hasNext());
}
}