/*
* Copyright (c) 2012 Data Harmonisation Panel
*
* All rights reserved. This program and the accompanying materials are made
* available under the terms of the GNU Lesser General Public License as
* published by the Free Software Foundation, either version 3 of the License,
* or (at your option) any later version.
*
* You should have received a copy of the GNU Lesser General Public License
* along with this distribution. If not, see <http://www.gnu.org/licenses/>.
*
* Contributors:
* HUMBOLDT EU Integrated Project #030962
* Data Harmonisation Panel <http://www.dhpanel.eu>
*/
package eu.esdihumboldt.cst.functions.core.merge;
import java.util.Collection;
import java.util.Map;
import com.google.common.collect.HashMultimap;
import com.google.common.collect.ListMultimap;
import com.google.common.collect.Multimap;
import eu.esdihumboldt.hale.common.align.model.ParameterValue;
import eu.esdihumboldt.hale.common.align.transformation.engine.TransformationEngine;
import eu.esdihumboldt.hale.common.align.transformation.function.InstanceHandler;
import eu.esdihumboldt.hale.common.align.transformation.function.TransformationException;
import eu.esdihumboldt.hale.common.align.transformation.function.impl.FamilyInstanceImpl;
import eu.esdihumboldt.hale.common.align.transformation.report.TransformationLog;
import eu.esdihumboldt.hale.common.core.HalePlatform;
import eu.esdihumboldt.hale.common.instance.model.FamilyInstance;
import eu.esdihumboldt.hale.common.instance.model.Instance;
import eu.esdihumboldt.hale.common.instance.model.InstanceCollection;
import eu.esdihumboldt.hale.common.instance.model.InstanceFactory;
import eu.esdihumboldt.hale.common.instance.model.InstanceReference;
import eu.esdihumboldt.hale.common.instance.model.ResourceIterator;
import eu.esdihumboldt.hale.common.instance.model.impl.GenericResourceIteratorAdapter;
import eu.esdihumboldt.hale.common.schema.model.TypeDefinition;
/**
 * Abstract merge handler implementation based on a merge index of instance
 * references.
 * <p>
 * {@link #partitionInstances(InstanceCollection, String, TransformationEngine, ListMultimap, Map, TransformationLog)}
 * iterates once over the source instances and records, per merge key, the
 * references of the instances that share that key. The returned
 * {@link MergedIterator} then produces one merged instance per key.
 * Subclasses supply the merge configuration, the key computation and the
 * actual merge.
 *
 * @param <T> the merge configuration type
 * @param <K> the merge key type
 * @author Simon Templer
 */
public abstract class AbstractMergeHandler<T, K> implements InstanceHandler<TransformationEngine> {

    /**
     * Key instance that stands for merging of all instances.
     */
    public static final DeepIterableKey KEY_ALL = new DeepIterableKey(Long.valueOf(1));

    /**
     * Resource iterator over the merged instances. It walks the key set of the
     * merge index and converts every merge key into a single merged
     * {@link FamilyInstance}.
     */
    public class MergedIterator extends GenericResourceIteratorAdapter<K, FamilyInstance> {

        private final Multimap<K, InstanceReference> index;

        private final InstanceCollection originalInstances;

        private final T mergeConfig;

        /**
         * Create a collection of merged instances.
         *
         * @param index the merge index
         * @param instances the original instance collection
         * @param mergeConfig the merge configuration
         */
        public MergedIterator(Multimap<K, InstanceReference> index, InstanceCollection instances,
                T mergeConfig) {
            super(index.keySet().iterator());
            this.index = index;
            this.originalInstances = instances;
            this.mergeConfig = mergeConfig;
        }

        /**
         * Merge all instances associated with the given merge key.
         *
         * @param next the merge key
         * @return the merged instance wrapped as family instance
         */
        @Override
        protected FamilyInstance convert(K next) {
            // next is the merge key

            // get the instances to merge
            InstanceCollection instances;
            // identity comparison on purpose: only the shared KEY_ALL object
            // itself selects the merge-all path
            if (next == KEY_ALL) {
                // special case: merge all
                instances = originalInstances;
            }
            else {
                Collection<InstanceReference> references = index.get(next);
                instances = originalInstances.getInstances(references);
            }

            // determine type based on sample instance type; stays null if
            // there is no instance to sample
            TypeDefinition type = null;
            try (ResourceIterator<Instance> it = instances.iterator()) {
                if (it.hasNext()) {
                    type = it.next().getDefinition();
                }
            }

            return new FamilyInstanceImpl(merge(instances, type, next, mergeConfig));
        }

        /**
         * Removal is not supported.
         *
         * @throws UnsupportedOperationException always
         */
        @Override
        public void remove() {
            // prohibit remove
            throw new UnsupportedOperationException();
        }
    }

    /**
     * Build the merge index for the given instances and return an iterator
     * that yields one merged instance per merge key.
     *
     * @param instances the instances to partition
     * @param transformationIdentifier the transformation identifier
     * @param engine the transformation engine (not used by this
     *            implementation)
     * @param transformationParameters the transformation parameters
     * @param executionParameters the execution parameters
     * @param log the transformation log
     * @return the iterator over the merged instances
     * @throws TransformationException if the merge configuration cannot be
     *             created
     * @see InstanceHandler#partitionInstances(InstanceCollection, String,
     *      TransformationEngine, ListMultimap, Map, TransformationLog)
     */
    @Override
    public ResourceIterator<FamilyInstance> partitionInstances(InstanceCollection instances,
            String transformationIdentifier, TransformationEngine engine,
            ListMultimap<String, ParameterValue> transformationParameters,
            Map<String, String> executionParameters, TransformationLog log)
            throws TransformationException {
        T mergeConfig = createMergeConfiguration(transformationIdentifier, transformationParameters,
                executionParameters, log);

        // create merge index over all instances (references)
        Multimap<K, InstanceReference> index = HashMultimap.create();

        // try-with-resources: the iterator is always closed, and a failure
        // while indexing stays the primary exception even if close() fails
        // as well (the close failure is attached as suppressed)
        try (ResourceIterator<Instance> it = instances.iterator()) {
            while (it.hasNext()) {
                Instance instance = it.next();
                K key = getMergeKey(instance, mergeConfig);
                index.put(key, instances.getReference(instance));
            }
        }

        return new MergedIterator(index, instances, mergeConfig);
    }

    /**
     * Get the instance factory, looked up as a service through
     * {@link HalePlatform}.
     *
     * @return the instance factory
     */
    protected InstanceFactory getInstanceFactory() {
        return HalePlatform.getService(InstanceFactory.class);
    }

    /**
     * Create the merge configuration from the transformation configuration. The
     * merge configuration may be then used in
     * {@link #getMergeKey(Instance, Object)} and
     * {@link #merge(InstanceCollection, TypeDefinition, Object, Object)}
     *
     * @param transformationIdentifier the transformation identifier
     * @param transformationParameters the transformation parameters
     * @param executionParameters the execution parameters
     * @param log the transformation log
     * @return the merge configuration
     * @throws TransformationException if the merge configuration cannot be
     *             created
     */
    protected abstract T createMergeConfiguration(String transformationIdentifier,
            ListMultimap<String, ParameterValue> transformationParameters,
            Map<String, String> executionParameters, TransformationLog log)
            throws TransformationException;

    /**
     * Get the merge key for a given instance. Instances with an equal merge key
     * will be merged.
     *
     * @param instance the instance
     * @param mergeConfig the merge configuration
     * @return the instance merge key
     * @see #merge(InstanceCollection, TypeDefinition, Object, Object)
     */
    protected abstract K getMergeKey(Instance instance, T mergeConfig);

    /**
     * Merge multiple instances into one.
     *
     * @param instances the instances to merge
     * @param type the type definition of the instances to merge, taken from
     *            the first instance; <code>null</code> if the collection
     *            yields no instance
     * @param mergeKey the merge key associated to the instances
     * @param mergeConfig the merge configuration
     * @return the merged instance
     */
    protected abstract Instance merge(InstanceCollection instances, TypeDefinition type, K mergeKey,
            T mergeConfig);
}