/* * RapidMiner * * Copyright (C) 2001-2011 by Rapid-I and the contributors * * Complete list of developers available at our web site: * * http://rapid-i.com * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Affero General Public License for more details. * * You should have received a copy of the GNU Affero General Public License * along with this program. If not, see http://www.gnu.org/licenses/. */ package com.rapidminer.operator.clustering.clusterer; import java.util.Collection; import java.util.LinkedList; import com.rapidminer.example.Attributes; import com.rapidminer.example.ExampleSet; import com.rapidminer.gui.ExampleVisualizer; import com.rapidminer.operator.Operator; import com.rapidminer.operator.OperatorDescription; import com.rapidminer.operator.OperatorException; import com.rapidminer.operator.clustering.ClusterModel; import com.rapidminer.operator.ports.InputPort; import com.rapidminer.operator.ports.OutputPort; import com.rapidminer.operator.ports.metadata.AttributeMetaData; import com.rapidminer.operator.ports.metadata.ExampleSetMetaData; import com.rapidminer.operator.ports.metadata.ExampleSetPassThroughRule; import com.rapidminer.operator.ports.metadata.GenerateNewMDRule; import com.rapidminer.operator.ports.metadata.MetaData; import com.rapidminer.operator.ports.metadata.SetRelation; import com.rapidminer.operator.ports.metadata.SimplePrecondition; import com.rapidminer.tools.ObjectVisualizerService; import com.rapidminer.tools.Ontology; import com.rapidminer.tools.metadata.MetaDataTools; /** * Abstract superclass of clusterers which defines the I/O behavior. * * @author Simon Fischer */ public abstract class AbstractClusterer extends Operator { private InputPort exampleSetInput = getInputPorts().createPort("example set"); private OutputPort modelOutput = getOutputPorts().createPort("cluster model"); private OutputPort exampleSetOutput = getOutputPorts().createPort("clustered set"); public AbstractClusterer(OperatorDescription description) { super(description); exampleSetInput.addPrecondition(new SimplePrecondition(exampleSetInput, new ExampleSetMetaData())); getTransformer().addRule(new GenerateNewMDRule(modelOutput, new MetaData(getClusterModelClass()))); getTransformer().addRule(new ExampleSetPassThroughRule(exampleSetInput, exampleSetOutput, SetRelation.EQUAL) { @Override public ExampleSetMetaData modifyExampleSet(ExampleSetMetaData metaData) { if (addsClusterAttribute()) { if (addsClusterAttribute()) metaData.addAttribute(new AttributeMetaData(Attributes.CLUSTER_NAME, Ontology.NOMINAL, Attributes.CLUSTER_NAME)); if (addsIdAttribute()) MetaDataTools.checkAndCreateIds(metaData); metaData.addAllAttributes(getAdditionalAttributes()); } return metaData; } }); } /** Generates a cluster model from an example set. Called by {@link #apply()}. */ public abstract ClusterModel generateClusterModel(ExampleSet exampleSet) throws OperatorException; /** Indicates whether {@link #doWork()} will add a cluster attribute to the example set. */ protected abstract boolean addsClusterAttribute(); /** Indicates whether {@link #doWork()} will add an id attribute to the example set. */ protected abstract boolean addsIdAttribute(); /** Subclasses might override this method in order to add additional attributes to the metaDataSet */ protected Collection<AttributeMetaData> getAdditionalAttributes() { return new LinkedList<AttributeMetaData>(); } @Override public void doWork() throws OperatorException { ExampleSet input = exampleSetInput.getData(ExampleSet.class); ClusterModel clusterModel = generateClusterModel(input); // registering visualizer ObjectVisualizerService.addObjectVisualizer(clusterModel, new ExampleVisualizer((ExampleSet) input.clone())); modelOutput.deliver(clusterModel); exampleSetOutput.deliver(input); // generateClusterModel() may have added cluster attribute } /** * Subclasses might overwrite this method in order to return the appropriate class of their model if postprocessing * is needed. */ public Class<? extends ClusterModel> getClusterModelClass() { return ClusterModel.class; } @Override public boolean shouldAutoConnect(OutputPort outputPort) { if (outputPort == exampleSetOutput) { // TODO: Remove in later versions return addsClusterAttribute(); } else { return super.shouldAutoConnect(outputPort); } } public InputPort getExampleSetInputPort() { return exampleSetInput; } }