/*
* ARX: Powerful Data Anonymization
* Copyright 2012 - 2017 Fabian Prasser, Florian Kohlmayer and contributors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.deidentifier.arx.framework.check.distribution;
import java.util.Iterator;
import java.util.NoSuchElementException;
import org.deidentifier.arx.DataType.DataTypeWithRatioScale;
/**
 * An iterator over the values of a distribution. The distribution is read from an
 * array of buckets laid out as consecutive pairs: the entry at an even index is an
 * index into the dictionary (or <code>-1</code> if the bucket is empty) and the
 * entry directly after it is the frequency of that value. Each value is returned
 * as many times as its frequency indicates.
 *
 * @author Florian Kohlmayer
 * @author Fabian Prasser
 */
public abstract class DistributionIterator<T> implements Iterator<T> {

    /**
     * Double iterator for distributions. Dictionary entries are parsed with the
     * given data type and then converted to doubles.
     *
     * @author Florian Kohlmayer
     * @author Fabian Prasser
     */
    private static class DistributionIteratorDouble extends DistributionIterator<Double> {

        /** The data type used for parsing and conversion */
        @SuppressWarnings("rawtypes")
        private final DataTypeWithRatioScale type;

        /**
         * Constructor
         *
         * @param distribution the distribution providing the buckets
         * @param dictionary the dictionary mapping bucket entries to strings
         * @param type the data type used to parse and convert the strings
         */
        DistributionIteratorDouble(Distribution distribution, String[] dictionary, DataTypeWithRatioScale<?> type) {
            super(distribution, dictionary);
            this.type = type;
        }

        @SuppressWarnings("unchecked")
        @Override
        protected Double parse(String value) {
            return type.toDouble(type.parse(value));
        }
    }

    /**
     * String iterator for distributions. Dictionary entries are returned unchanged.
     *
     * @author Florian Kohlmayer
     * @author Fabian Prasser
     */
    private static class DistributionIteratorString extends DistributionIterator<String> {

        /**
         * Constructor
         *
         * @param distribution the distribution providing the buckets
         * @param dictionary the dictionary mapping bucket entries to strings
         */
        DistributionIteratorString(Distribution distribution, String[] dictionary) {
            super(distribution, dictionary);
        }

        @Override
        protected String parse(String value) {
            return value;
        }
    }

    /**
     * Returns a double iterator
     *
     * @param distribution the distribution providing the buckets
     * @param dictionary the dictionary mapping bucket entries to strings
     * @param type the data type used to parse and convert the strings
     * @return an iterator over the values of the distribution as doubles
     */
    static Iterator<Double> createIteratorDouble(Distribution distribution, String[] dictionary, DataTypeWithRatioScale<?> type) {
        return new DistributionIteratorDouble(distribution, dictionary, type);
    }

    /**
     * Returns a string iterator
     *
     * @param distribution the distribution providing the buckets
     * @param dictionary the dictionary mapping bucket entries to strings
     * @return an iterator over the values of the distribution as strings
     */
    static Iterator<String> createIteratorString(Distribution distribution, String[] dictionary) {
        return new DistributionIteratorString(distribution, dictionary);
    }

    /** The distribution as (dictionary index, frequency) pairs. */
    private final int[]    buckets;

    /** The dictionary. */
    private final String[] dictionary;

    /** The index of the next bucket. */
    private int            nextBucket   = 0;

    /** The number of times the current value still has to be returned. */
    private int            currentFrequency;

    /** The value of the current bucket. */
    private T              currentValue;

    /** Is the current bucket valid. */
    private boolean        currentValid = false;

    /**
     * Instantiates the iterator.
     *
     * @param distribution the values
     * @param dictionary the dictionary
     */
    DistributionIterator(Distribution distribution, String[] dictionary) {
        this.buckets = distribution.getBuckets();
        this.dictionary = dictionary;
    }

    @Override
    public boolean hasNext() {
        if (!currentValid) {
            pull();
        }
        return currentValid;
    }

    /**
     * Returns the next value of the distribution.
     *
     * @return the next value
     * @throws NoSuchElementException if the distribution has no more values
     */
    @Override
    public T next() {
        // Honor the Iterator contract instead of silently returning null at the end
        if (!hasNext()) {
            throw new NoSuchElementException("No more values in distribution");
        }
        T result = currentValue;
        currentFrequency--;
        // "<=" rather than "==": a non-positive stored frequency must not keep
        // the current bucket alive indefinitely
        if (currentFrequency <= 0) {
            currentValid = false;
        }
        return result;
    }

    @Override
    public void remove() {
        throw new UnsupportedOperationException();
    }

    /**
     * Pulls the next element from the distribution. Afterwards, either the current
     * value and frequency describe the next non-empty bucket, or the iterator is
     * marked as invalid because no further non-empty bucket exists.
     */
    private void pull() {

        // Advance pair-wise until a non-empty bucket is found; -1 marks an empty bucket
        int value = -1;
        while (nextBucket < buckets.length && value == -1) {
            value = buckets[nextBucket];
            nextBucket += 2;
        }

        // End of stream
        if (value == -1) {
            currentValue = null;
            currentFrequency = 0;
            currentValid = false;
            return;
        }

        // Store: nextBucket already points past the pair, so the frequency sits right before it
        currentValue = parse(dictionary[value]);
        currentFrequency = buckets[nextBucket - 1];
        currentValid = true;
    }

    /**
     * Parses the given value
     *
     * @param value the dictionary entry to convert
     * @return the entry converted to the element type of this iterator
     */
    protected abstract T parse(String value);
}