BestRuleInduction.java example

Explorer
ComplexRapidMiner-master
- operator
- src
/*
 *  RapidMiner
 *
 *  Copyright (C) 2001-2007 by Rapid-I and the contributors
 *
 *  Complete list of developers available at our web site:
 *
 *       http://rapid-i.com
 *
 *  This program is free software; you can redistribute it and/or
 *  modify it under the terms of the GNU General Public License as 
 *  published by the Free Software Foundation; either version 2 of the
 *  License, or (at your option) any later version. 
 *
 *  This program is distributed in the hope that it will be useful, but
 *  WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 *  General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, write to the Free Software
 *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
 *  USA.
 */
package com.rapidminer.operator.learner;

import java.util.Arrays;
import java.util.Collection;
import java.util.Iterator;
import java.util.List;
import java.util.Vector;

import com.rapidminer.example.Attribute;
import com.rapidminer.example.Example;
import com.rapidminer.example.ExampleSet;
import com.rapidminer.operator.Model;
import com.rapidminer.operator.OperatorDescription;
import com.rapidminer.operator.OperatorException;
import com.rapidminer.operator.learner.rules.ConjunctiveRuleModel;
import com.rapidminer.parameter.ParameterType;
import com.rapidminer.parameter.ParameterTypeBoolean;
import com.rapidminer.parameter.ParameterTypeCategory;
import com.rapidminer.parameter.ParameterTypeInt;
import com.rapidminer.parameter.UndefinedParameterError;


/**
 * This operator returns the best rule regarding WRAcc using exhaustive search.
 * Features like the incorporation of other metrics and the search for more than
 * a single rule are prepared.
 * 
 * The search strategy is BFS, with save pruning whenever applicable. This
 * operator can easily be extended to support other search strategies.
 * 
 * @author Martin Scholz
 * @version $Id: BestRuleInduction.java,v 1.6 2006/04/11 22:43:29 martin_scholz
 *          Exp $
 */
public class BestRuleInduction extends AbstractLearner {

	public static class RuleWithScoreUpperBound implements Comparable {

		private final ConjunctiveRuleModel rule;

		private final double scoreUpperBound;

		public RuleWithScoreUpperBound(ConjunctiveRuleModel rule, double scoreUpperBound) {
			this.rule = rule;
			this.scoreUpperBound = scoreUpperBound;
		}

		public ConjunctiveRuleModel getRule() {
			return this.rule;
		}

		public double getScoreBound() {
			return this.scoreUpperBound;
		}

		public int compareTo(Object obj) {
			if (obj instanceof RuleWithScoreUpperBound) {
				double otherScore = ((RuleWithScoreUpperBound) obj).getScoreBound();
				if (this.getScoreBound() < otherScore)
					return -1;
				else if (this.getScoreBound() > otherScore)
					return 1;
				else
					return 0;
			} else
				return this.getClass().getName().compareTo(obj.getClass().getName());
		}
		
		public boolean equals(Object o) {
			if (!(o instanceof RuleWithScoreUpperBound)) {
				return false;
			} else {
				return this.rule.equals(((RuleWithScoreUpperBound)o).rule);
			}
		}
		
		public int hashCode() {
			return this.rule.hashCode();
		}
	}

	private static final String PARAMETER_MAX_DEPTH = "max_depth";

	private static final String PARAMETER_UTILITY_FUNCTION = "utility_function";

	private static final String PARAMETER_MAX_CACHE = "max_cache";

	private static final String PARAMETER_RELATIVE_TO_PREDICTIONS = "relative_to_predictions";

	private static final String WRACC = "weighted relative accuracy";

	private static final String BINOMIAL = "binomial test function";

	private static final String[] UTILITY_FUNCTION_LIST = new String[] { WRACC, BINOMIAL };

	private double globalP;

	private double globalN;

	protected ConjunctiveRuleModel bestRule;

	private double bestScore;

	// nodes under consideration
	private final Vector<RuleWithScoreUpperBound> openNodes = new Vector<RuleWithScoreUpperBound>();

	// keep track of rules that have been pruned, to avoid
	// evaluations for any kind of refinements
	private final Vector<ConjunctiveRuleModel> prunedNodes = new Vector<ConjunctiveRuleModel>();

	public BestRuleInduction(OperatorDescription description) {
		super(description);
	}

	public boolean supportsCapability(LearnerCapability lc) {
		if (lc == com.rapidminer.operator.learner.LearnerCapability.POLYNOMINAL_ATTRIBUTES)
			return true;
		if (lc == com.rapidminer.operator.learner.LearnerCapability.BINOMINAL_ATTRIBUTES)
			return true;

		if (lc == com.rapidminer.operator.learner.LearnerCapability.BINOMINAL_CLASS)
			return true;
		
		if (lc == com.rapidminer.operator.learner.LearnerCapability.WEIGHTED_EXAMPLES)
			return true;
		
		return false;
	}

	protected void initHighscore() {
		this.bestRule = null;
		this.bestScore = Double.NEGATIVE_INFINITY;
	}

	/**
	 * Adds a rule to the set of best rules if its score is high enough.
	 * Currently just a single rule is stored. Additionally it is checked
	 * whether the rule is bad enough to be pruned.
	 * 
	 * @return true iff the rule can be pruned
	 */
	protected boolean communicateToHighscore(ConjunctiveRuleModel rule, double[] counts) throws UndefinedParameterError {
		double optimisticScore = this.getOptimisticScore(counts);
		if (optimisticScore <= this.getPruningScore())
			return true; // indicates pruning
		else {
			double posScore = this.getScore(counts, true);
			double negScore = this.getScore(counts, false);
			if (posScore > this.bestScore) {
				this.bestRule = rule;
				this.bestScore = posScore;
			}
			if (negScore > this.bestScore) {
				ConjunctiveRuleModel negRule = new ConjunctiveRuleModel(rule, rule.getLabel().getMapping().getNegativeIndex());
				this.bestRule = negRule;
				this.bestScore = negScore;
			}

			return false; // no pruning
		}
	}

	/** @return the best rule found */
	protected ConjunctiveRuleModel getBestRule() {
		return this.bestRule;
	}

	/** @return the lowest score of the stored best rules for pruning */
	protected double getPruningScore() {
		return this.bestScore;
	}

	public Model learn(ExampleSet exampleSet) throws OperatorException {
		this.initHighscore();

		int positiveLabel = exampleSet.getAttributes().getLabel().getMapping().getPositiveIndex();
		// int negativeLabel = exampleSet.getLabel().getNegativeIndex();

		ConjunctiveRuleModel defaultRule = new ConjunctiveRuleModel(exampleSet, positiveLabel);
		// ConjunctiveRuleModel negRule = new
		// ConjunctiveRuleModel(exampleSet.getLabel(), negativeLabel);

		double[] globalCounts = this.getCounts(defaultRule, exampleSet);
		this.globalP = globalCounts[0];
		this.globalN = globalCounts[1];
		this.communicateToHighscore(defaultRule, globalCounts);

		double optimisticScore = this.getOptimisticScore(globalCounts);
		this.openNodes.clear();
		this.prunedNodes.clear();
		this.addRulesToOpenNodes(defaultRule.getAllRefinedRules(exampleSet), optimisticScore);

		int length = 1;

		while (!this.openNodes.isEmpty() && length <= this.getParameterAsInt(PARAMETER_MAX_DEPTH)) {
			int ignored = 0;

			log("Evaluating " + this.openNodes.size() + " rules of length " + length);
			if (this.openNodes.size() > this.getParameterAsInt(PARAMETER_MAX_CACHE)) {
				log("Ignoring all but the " + this.getParameterAsInt(PARAMETER_MAX_CACHE) + " rules with highest support.");
			}

			RuleWithScoreUpperBound[] ruleArray = new RuleWithScoreUpperBound[this.openNodes.size()];
			this.openNodes.toArray(ruleArray);
			Arrays.sort(ruleArray);
			int stopAtIndex = Math.max(0, ruleArray.length - this.getParameterAsInt(PARAMETER_MAX_CACHE));

			this.openNodes.clear();
			for (int i = ruleArray.length - 1; i >= stopAtIndex; i--) {
				RuleWithScoreUpperBound rulePlusScore = ruleArray[i];
				ConjunctiveRuleModel rule = rulePlusScore.getRule();

				if (this.isRefinementOfPrunedRule(rule)) {
					ignored++;
				} else if (rulePlusScore.getScoreBound() <= this.getPruningScore()) {
					ignored++;
					// This pruning could not be derived from prunedNodes and
					// may be useful
					// later on for refined rules with a less precise optimistic
					// estimate.
					this.prunedNodes.add(rulePlusScore.getRule());
				} else
					this.expandNode(rule, exampleSet);
				checkForStop();
			}

			log("Could ignore " + ignored + " rules as refinements of pruned rules or by optimistic estimates.");
            log("Number of pruned rules in cache: " + this.prunedNodes.size());
            log("Best rule is " + this.getBestRule().toString());
            log("Score is " + this.getPruningScore());

			length++;
		}

		this.openNodes.clear();
		this.prunedNodes.clear();
		return this.getBestRule();
	}

	/**
	 * Annotates the collection of ConjunctiveRuleModels with an optimistic
	 * score they may achieve in the best case and adds them to the collection
	 * of open nodes.
	 */
	private void addRulesToOpenNodes(Collection rules, double scoreUpperBound) {
		if (scoreUpperBound <= this.getPruningScore())
			return;

		Iterator it = rules.iterator();
		while (it.hasNext()) {
			this.openNodes.add(new RuleWithScoreUpperBound((ConjunctiveRuleModel) it.next(), scoreUpperBound));
		}
	}

	/**
	 * Evaluates a single rule by computing its score, and the best possible
	 * score after refining this rule. If this cannot improve over the currently
	 * best rules, then the refinements are pruned. Otherwise all refinements
	 * plus optimistic estimates are added to the collection of open nodes.
	 * 
	 * If the evaluated rule is good enough, then it is stored toghether with
	 * its score.
	 */
	private void expandNode(ConjunctiveRuleModel rule, ExampleSet exampleSet) throws OperatorException {
		// Compute counts:
		double[] counts = this.getCounts(rule, exampleSet);

		// Store in highscore if necessary and check whether it may be pruned.
		boolean pruning = this.communicateToHighscore(rule, counts);
		if (pruning == true) {
			this.prunedNodes.add(rule);
			// Nothing to add to the collection of open nodes ..
		} else if (rule.getRuleLength() < this.getParameterAsInt(PARAMETER_MAX_DEPTH)) {
			// Store all the refinements for later investigation:
			this.addRulesToOpenNodes(rule.getAllRefinedRules(exampleSet), this.getOptimisticScore(counts));
		}
	}

	/**
	 * @param rule
	 *            a ConjuctiveRuleModel for which it is checked whether a more
	 *            general rule has already been pruned.
	 * @return true, if this rule is a refinement of a pruned rule. The rules
	 *         are compared using the method
	 *         <code>ConjunctiveRuleModel.isRefinementOf(ConjunctiveRuleModel model)</code>
	 */
	public boolean isRefinementOfPrunedRule(ConjunctiveRuleModel rule) {
		Iterator it = this.prunedNodes.iterator();
		while (it.hasNext()) {
			ConjunctiveRuleModel prunedRule = (ConjunctiveRuleModel) it.next();
			// In this collection all rules predict positive, but the scores are
			// computed for the best label. For this reason the following
			// refinement test is valid.
			if (rule.isRefinementOf(prunedRule)) {
				return true;
			}
		}
		return false;
	}

	/**
	 * Computes the WRAcc or BINOMIAL TEST FUNCTION based on p, n, and the
	 * global values P and N stored in this object. First two entries of counts
	 * are p and n, optionally estimates for p and n can be supplied as further
	 * parameters.
	 */
	protected double getScore(double[] counts, boolean predictPositives) throws UndefinedParameterError {
		double p = counts[0];
		double n = counts[1];
		double cov = (p + n) / (globalP + globalN);
		double pnRel = (predictPositives ? p : n);

		String function = UTILITY_FUNCTION_LIST[this.getParameterAsInt(PARAMETER_UTILITY_FUNCTION)];
		UndefinedParameterError upe = new UndefinedParameterError("Missing parameter '" + PARAMETER_UTILITY_FUNCTION + "'!");

		double score;
		if (this.getParameterAsBoolean(PARAMETER_RELATIVE_TO_PREDICTIONS) == false || counts.length != 4) {
			double pnAbs = (predictPositives ? globalP : globalN);

			if (function.equals(WRACC)) {
				score = cov * (pnRel / (p + n) - pnAbs / (globalP + globalN));
			} else if (function.equals(BINOMIAL)) {
				score = Math.sqrt(cov) * (pnRel / (p + n) - pnAbs / (globalP + globalN));
			} else
				throw upe;
		} else {
			double estP = counts[2];
			double estN = counts[3];
			double pnEst = (predictPositives ? estP : estN);

			if (function.equals(WRACC)) {
				score = cov * (pnRel / (p + n) - pnEst / (estP + estN));
			} else if (function.equals(BINOMIAL)) {
				score = Math.sqrt(cov) * (pnRel / (p + n) - pnEst / (estP + estN));
			} else
				throw upe;
		}
		return score;
	}

	/**
	 * Computes the best possible score that might be achieved by refining the
	 * rule. During learning the conclusion is normalized to "positive", so the
	 * better of the estimates of the better conclusion is returned.
	 */
	protected double getOptimisticScore(double[] counts) throws UndefinedParameterError {
		double p = counts[0];
		double n = counts[1];

		if (this.getParameterAsBoolean(PARAMETER_RELATIVE_TO_PREDICTIONS) == false || counts.length != 4) {
			// For reasonable utility functions adding just negatives decreases
			// the score.
			return Math.max(this.getScore(new double[] { p, 0 }, true), this.getScore(new double[] { 0, n }, false));
		} else {
			// Improvement for positive rules: discard all negatives, which are
			// at the same time considered to be positives with confidence of 1
			// by the given prediction. As a complex second step discarding
			// further
			// positives might help to improve the score, since this allows to
			// lower the estimated precision term.
			// To keep things simple a non-tight optimistic score is computed:
			// 1. Keep all positives, discard all negatives: p'=p, n'=0
			// 2. Lower the estimated confidence to 0, simply estP' = 0, estN' =
			// 0.
			// Analogously for the negatively predicting rule.
			double estP = counts[2];
			double estN = counts[3];

			return Math.max(this.getScore(new double[] { p, 0, 0, estN }, true), this.getScore(new double[] { 0, n, 0, estP }, false));
		}

	}

	/**
	 * @param rule
	 *            the rule to evaluate
	 * @param exampleSet
	 *            the exampleSet to get the counts for
	 * @return a double[2] object, first parameter is p, second is n. If rule
	 *         discovery relative to a predicted label is activated, then a
	 *         double[4] is returned, which contains the estimated positives and
	 *         negatives in the covered part as fields 3 and 4.
	 * @throws OperatorException
	 */
	protected double[] getCounts(ConjunctiveRuleModel rule, ExampleSet exampleSet) throws OperatorException {
		Attribute weightAttr = exampleSet.getAttributes().getWeight();
		Attribute predictedLabel = exampleSet.getAttributes().getPredictedLabel();
		boolean relToPred = (predictedLabel != null) && this.getParameterAsBoolean(PARAMETER_RELATIVE_TO_PREDICTIONS);

		int coveredPart = rule.getConclusion();
		int posIndex = exampleSet.getAttributes().getLabel().getMapping().getPositiveIndex();
		int negIndex = exampleSet.getAttributes().getLabel().getMapping().getNegativeIndex();
		String posS = null;
		String negS = null;
		if (relToPred) {
			posS = predictedLabel.getMapping().mapIndex(posIndex);
			negS = predictedLabel.getMapping().mapIndex(negIndex);
		}

		double p = 0;
		double n = 0;
		double estP = 0;
		double estN = 0;

		Iterator<Example> reader = exampleSet.iterator();
		while (reader.hasNext()) {
			Example example = reader.next();
			double weight = (weightAttr == null) ? 1 : example.getValue(weightAttr);
			if (rule.predict(example) == coveredPart) {
				if (example.getValue(example.getAttributes().getLabel()) == posIndex) {
					p += weight;
				} else
					n += weight;

				if (relToPred) {
					double sum = example.getConfidence(posS) + example.getConfidence(negS);
					estP += weight * example.getConfidence(posS) / sum;
					estN += weight * example.getConfidence(negS) / sum;
				}
			}
		}

		return (relToPred ? new double[] { p, n, estP, estN } : new double[] { p, n });
	}

	/**
	 * Adds the parameters "number of iterations" and "model
	 * file".
	 */
	public List<ParameterType> getParameterTypes() {
		List<ParameterType> types = super.getParameterTypes();
		types.add(new ParameterTypeInt(PARAMETER_MAX_DEPTH, "An upper bound for the number of literals.", 1, Integer.MAX_VALUE, 2)); 
		types.add(new ParameterTypeCategory(PARAMETER_UTILITY_FUNCTION, "The function to be optimized by the rule.", UTILITY_FUNCTION_LIST, 0)); 
		types.add(new ParameterTypeInt(PARAMETER_MAX_CACHE, "Bounds the number of rules considered per depth to avoid high memory consumption, but leads to incomplete search.", 1, Integer.MAX_VALUE, 10000)); 
		types.add(new ParameterTypeBoolean(PARAMETER_RELATIVE_TO_PREDICTIONS, "Searches for rules with a maximum difference to the predited label.", false)); 
		return types;
	}
}