/* * RapidMiner * * Copyright (C) 2001-2011 by Rapid-I and the contributors * * Complete list of developers available at our web site: * * http://rapid-i.com * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Affero General Public License for more details. * * You should have received a copy of the GNU Affero General Public License * along with this program. If not, see http://www.gnu.org/licenses/. */ package com.rapidminer.operator.learner.tree; import java.util.Iterator; import java.util.List; import com.rapidminer.example.Attribute; import com.rapidminer.example.AttributeWeights; import com.rapidminer.example.Example; import com.rapidminer.example.ExampleSet; import com.rapidminer.operator.OperatorCapability; import com.rapidminer.operator.OperatorCreationException; import com.rapidminer.operator.OperatorDescription; import com.rapidminer.operator.OperatorException; import com.rapidminer.operator.features.weighting.ChiSquaredWeighting; import com.rapidminer.operator.learner.tree.criterions.Criterion; import com.rapidminer.parameter.ParameterType; import com.rapidminer.tools.OperatorService; /** * The CHAID decision tree learner works like the * {@link com.rapidminer.operator.learner.tree.DecisionTreeLearner} * with one exception: it used a chi squared based criterion * instead of the information gain or gain ratio criteria. * * @author Ingo Mierswa */ public class CHAIDLearner extends DecisionTreeLearner { public CHAIDLearner(OperatorDescription description) { super(description); } @Override protected Criterion createCriterion(double minimalGain) throws OperatorException { return new Criterion() { @Override public double getIncrementalBenefit() { throw new UnsupportedOperationException("Incremental calculation not supported."); } @Override public double getNominalBenefit(ExampleSet exampleSet, Attribute attribute) throws OperatorException { exampleSet = (ExampleSet) exampleSet.clone(); exampleSet.getAttributes().clearRegular(); exampleSet.getAttributes().addRegular(attribute); ChiSquaredWeighting weightOp = null; try { weightOp = OperatorService.createOperator(ChiSquaredWeighting.class); } catch (OperatorCreationException e) { throw new OperatorException("Cannot create chi squared calculation operator.", e); } AttributeWeights weights = weightOp.doWork(exampleSet); return weights.getWeight(attribute.getName()); } @Override public double getNumericalBenefit(ExampleSet exampleSet, Attribute attribute, double splitValue) { throw new UnsupportedOperationException("Numerical attributes not supported."); } @Override public void startIncrementalCalculation(ExampleSet exampleSet) { throw new UnsupportedOperationException("Incremental calculation not supported."); } @Override public boolean supportsIncrementalCalculation() { return false; } @Override public void swapExample(Example example) { throw new UnsupportedOperationException("Incremental calculation not supported."); } @Override public double getBenefit(double[][] weightCounts) { throw new UnsupportedOperationException("Method not supported."); } }; } /** This method calculates the benefit of the given attribute. This implementation * utilizes the defined {@link Criterion}. Subclasses might want to override this * method in order to calculate the benefit in other ways. */ protected Benefit calculateBenefit(ExampleSet trainingSet, Attribute attribute) throws OperatorException { ChiSquaredWeighting weightOp = null; try { weightOp = OperatorService.createOperator(ChiSquaredWeighting.class); } catch (OperatorCreationException e) { getLogger().warning("Cannot create chi squared calculation operator."); return null; } double weight = Double.NaN; if (weightOp != null) { AttributeWeights weights = weightOp.doWork(trainingSet); weight = weights.getWeight(attribute.getName()); } if (!Double.isNaN(weight)) { return new Benefit(weight, attribute); } else { return null; } } @Override public List<ParameterType> getParameterTypes() { List<ParameterType> types = super.getParameterTypes(); // remove criterion selection Iterator<ParameterType> i = types.iterator(); while (i.hasNext()) { if (i.next().getKey().equals(PARAMETER_CRITERION)) i.remove(); } return types; } @Override public boolean supportsCapability(OperatorCapability capability) { if (capability == OperatorCapability.NUMERICAL_ATTRIBUTES) return false; return super.supportsCapability(capability); } }