/* * RapidMiner * * Copyright (C) 2001-2011 by Rapid-I and the contributors * * Complete list of developers available at our web site: * * http://rapid-i.com * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Affero General Public License for more details. * * You should have received a copy of the GNU Affero General Public License * along with this program. If not, see http://www.gnu.org/licenses/. */ package com.rapidminer.operator.performance.cost; import java.util.List; import com.rapidminer.example.Attribute; import com.rapidminer.example.Attributes; import com.rapidminer.example.Example; import com.rapidminer.example.ExampleSet; import com.rapidminer.operator.Operator; import com.rapidminer.operator.OperatorDescription; import com.rapidminer.operator.OperatorException; import com.rapidminer.operator.UserError; import com.rapidminer.operator.ValueDouble; import com.rapidminer.operator.performance.MeasuredPerformance; import com.rapidminer.operator.performance.PerformanceCriterion; import com.rapidminer.operator.performance.PerformanceVector; import com.rapidminer.operator.ports.InputPort; import com.rapidminer.operator.ports.OutputPort; import com.rapidminer.operator.ports.metadata.ExampleSetPrecondition; import com.rapidminer.parameter.ParameterType; import com.rapidminer.parameter.ParameterTypeDouble; import com.rapidminer.parameter.ParameterTypeInt; import com.rapidminer.parameter.ParameterTypeList; import com.rapidminer.tools.Ontology; /** * This operator provides the ability to evaluate classification costs. * Therefore a cost matrix might be specified, denoting the costs for every * possible classification outcome: predicted label x real label. * Costs will be minimized during optimization. * * @author Sebastian Land */ public class RankingEvaluator extends Operator { private static final String PARAMETER_RANKING_COSTS = "ranking_costs"; private static final String PARAMETER_RANK_START = "rank_interval_start"; private static final String PARAMETER_RANK_COST = "costs"; private InputPort exampleSetInput = getInputPorts().createPort("example set"); private OutputPort exampleSetOutput = getOutputPorts().createPort("example set"); private OutputPort performanceOutput = getOutputPorts().createPort("performance"); private PerformanceVector performance = null; public RankingEvaluator(OperatorDescription description) { super(description); exampleSetInput.addPrecondition(new ExampleSetPrecondition(exampleSetInput, Ontology.ATTRIBUTE_VALUE, Attributes.LABEL_NAME)); getTransformer().addGenerationRule(performanceOutput, PerformanceVector.class); getTransformer().addPassThroughRule(exampleSetInput, exampleSetOutput); addValue(new ValueDouble("ranking_cost", "blubb") { @Override public double getDoubleValue() { if (performance == null) return Double.NaN; PerformanceCriterion c = performance.getCriterion("RankingCosts"); if (c != null) { return c.getAverage(); } else { return Double.NaN; } } }); } @Override public void doWork() throws OperatorException { ExampleSet exampleSet = exampleSetInput.getData(); Attribute label = exampleSet.getAttributes().getLabel(); if (label != null) { if (label.isNominal()) { List<String[]> rankings = getParameterList(PARAMETER_RANKING_COSTS); int i = 0; double[] costs = new double[rankings.size()]; int[] indices = new int[rankings.size()]; for (String[] pair: rankings) { indices[i] = Integer.valueOf(pair[0]); costs[i] = Double.valueOf(pair[1]); //TODO: Check if correctly sorted or sort automatically i++; } MeasuredPerformance criterion = new RankingCriterion(indices, costs, exampleSet); performance = new PerformanceVector(); performance.addCriterion(criterion); // now measuring costs criterion.startCounting(exampleSet, false); for (Example example: exampleSet) { criterion.countExample(example); } exampleSetOutput.deliver(exampleSet); performanceOutput.deliver(performance); } else { throw new UserError(this, 101, "CostEvaluator", label.getName()); } } else { throw new UserError(this, 105); } } @Override public List<ParameterType> getParameterTypes() { List<ParameterType> types = super.getParameterTypes(); types.add(new ParameterTypeList(PARAMETER_RANKING_COSTS, "This parameter defines the costs when the real call isn't the one with the highest confidence.", new ParameterTypeInt(PARAMETER_RANK_START, "This is the first rank of the interval between this and the nearest greater defined rank. Each of these ranks get assigned this value. Rank counting starts with 0.", 0, Integer.MAX_VALUE), new ParameterTypeDouble(PARAMETER_RANK_COST, "This is the cost of all ranks within this range.", Double.NEGATIVE_INFINITY, Double.POSITIVE_INFINITY), false)); return types; } }