/* * RapidMiner * * Copyright (C) 2001-2011 by Rapid-I and the contributors * * Complete list of developers available at our web site: * * http://rapid-i.com * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Affero General Public License for more details. * * You should have received a copy of the GNU Affero General Public License * along with this program. If not, see http://www.gnu.org/licenses/. */ package com.rapidminer.operator.features.construction; import java.util.LinkedList; import java.util.List; import com.rapidminer.example.Attribute; import com.rapidminer.example.Example; import com.rapidminer.example.ExampleSet; import com.rapidminer.example.table.AttributeFactory; import com.rapidminer.operator.OperatorDescription; import com.rapidminer.operator.OperatorException; import com.rapidminer.operator.ports.metadata.AttributeMetaData; import com.rapidminer.operator.ports.metadata.ExampleSetMetaData; import com.rapidminer.operator.ports.metadata.MDInteger; import com.rapidminer.operator.ports.metadata.MetaData; import com.rapidminer.operator.ports.metadata.SetRelation; import com.rapidminer.parameter.ParameterType; import com.rapidminer.parameter.ParameterTypeAttributes; import com.rapidminer.parameter.UndefinedParameterError; import com.rapidminer.tools.Ontology; import com.rapidminer.tools.math.VectorMath; import com.rapidminer.tools.math.container.Range; /** * This operator creates all products of the specified attributes. The attribute names can be specified by regular * expressions. * * @author Ingo Mierswa */ public class ProductGenerationOperator extends AbstractFeatureConstruction { public static final String PARAMETER_FIRST_ATTRIBUTE_NAME = "first_attribute_name"; public static final String PARAMETER_SECOND_ATTRIBUTE_NAME = "second_attribute_name"; public ProductGenerationOperator(OperatorDescription description) { super(description); } @Override protected MetaData modifyMetaData(ExampleSetMetaData metaData) throws UndefinedParameterError { List<AttributeMetaData> newAttributes = new LinkedList<AttributeMetaData>(); String firstAttributeName = getParameterAsString(PARAMETER_FIRST_ATTRIBUTE_NAME); String secondAttributeName = getParameterAsString(PARAMETER_SECOND_ATTRIBUTE_NAME); for (AttributeMetaData attribute : metaData.getAllAttributes()) { if (attribute.isNumerical()) { if (attribute.getName().matches(firstAttributeName)) { for (AttributeMetaData attribute2 : metaData.getAllAttributes()) { if (attribute2.isNumerical()) { if (attribute2.getName().matches(secondAttributeName)) { AttributeMetaData newAMD = new AttributeMetaData("(" + attribute.getName() + ") * (" + attribute2.getName() + ")", Ontology.REAL); // range if (attribute.getValueSetRelation() == SetRelation.EQUAL && attribute2.getValueSetRelation() == SetRelation.EQUAL) { Range range1 = attribute.getValueRange(); Range range2 = attribute2.getValueRange(); double[] values = {range1.getLower() * range2.getLower(), range1.getLower() * range2.getUpper(),range1.getUpper() * range2.getLower(),range1.getUpper() * range2.getUpper()}; newAMD.setValueRange(new Range(VectorMath.minimalElement(values), VectorMath.maximalElement(values)), SetRelation.SUBSET); } else { newAMD.setValueRange(new Range(), SetRelation.UNKNOWN); } // unknown values if (attribute2.getNumberOfMissingValues().isKnown() && attribute.getNumberOfMissingValues().isKnown()) { newAMD.setNumberOfMissingValues(new MDInteger(attribute.getNumberOfMissingValues().getValue() + attribute2.getNumberOfMissingValues().getValue())); } newAttributes.add(newAMD); } } } } } } metaData.addAllAttributes(newAttributes); return metaData; } @Override public ExampleSet apply(ExampleSet exampleSet) throws OperatorException { List<Attribute> newAttributes = new LinkedList<Attribute>(); String firstAttributeName = getParameterAsString(PARAMETER_FIRST_ATTRIBUTE_NAME); String secondAttributeName = getParameterAsString(PARAMETER_SECOND_ATTRIBUTE_NAME); for (Attribute attribute : exampleSet.getAttributes()) { if (attribute.isNumerical()) { if (attribute.getName().matches(firstAttributeName)) { for (Attribute attribute2 : exampleSet.getAttributes()) { if (attribute2.isNumerical()) { if (attribute2.getName().matches(secondAttributeName)) { newAttributes.add(createAttribute(exampleSet, attribute, attribute2)); } } } } } } for (Attribute attribute : newAttributes) { exampleSet.getAttributes().addRegular(attribute); } return exampleSet; } private Attribute createAttribute(ExampleSet exampleSet, Attribute attribute1, Attribute attribute2) { Attribute result = AttributeFactory.createAttribute("(" + attribute1.getName() + ") * (" + attribute2.getName() + ")", Ontology.REAL); exampleSet.getExampleTable().addAttribute(result); for (Example example : exampleSet) { double value1 = example.getValue(attribute1); double value2 = example.getValue(attribute2); double resultValue = value1 * value2; example.setValue(result, resultValue); } return result; } @Override public List<ParameterType> getParameterTypes() { List<ParameterType> types = super.getParameterTypes(); types.add(new ParameterTypeAttributes(PARAMETER_FIRST_ATTRIBUTE_NAME, "The name(s) of the first attribute to be multiplied.", getExampleSetInputPort(), false, Ontology.NUMERICAL)); types.add(new ParameterTypeAttributes(PARAMETER_SECOND_ATTRIBUTE_NAME, "The name(s) of the second attribute to be multiplied.", getExampleSetInputPort(), false, Ontology.NUMERICAL)); return types; } }