LogisticRegressionOptimization.java example

Explorer
ComplexRapidMiner-master
- operator
- src
/*
 *  RapidMiner
 *
 *  Copyright (C) 2001-2008 by Rapid-I and the contributors
 *
 *  Complete list of developers available at our web site:
 *
 *       http://rapid-i.com
 *
 *  This program is free software: you can redistribute it and/or modify
 *  it under the terms of the GNU Affero General Public License as published by
 *  the Free Software Foundation, either version 3 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU Affero General Public License for more details.
 *
 *  You should have received a copy of the GNU Affero General Public License
 *  along with this program.  If not, see http://www.gnu.org/licenses/.
 */
package com.rapidminer.operator.learner.functions;

import com.rapidminer.example.Attribute;
import com.rapidminer.example.Example;
import com.rapidminer.example.ExampleSet;
import com.rapidminer.operator.OperatorException;
import com.rapidminer.operator.performance.EstimatedPerformance;
import com.rapidminer.operator.performance.PerformanceVector;
import com.rapidminer.tools.LoggingHandler;
import com.rapidminer.tools.RandomGenerator;
import com.rapidminer.tools.math.optimization.ec.es.ESOptimization;
import com.rapidminer.tools.math.optimization.ec.es.Individual;

import Jama.Matrix;


/**
 * Evolutionary Strategy approach for optimization of the logistic regression problem.
 * <p>
 * Every individual of the evolutionary search carries one coefficient vector <code>beta</code>
 * with one entry per attribute iterated from an example plus, if an intercept was requested,
 * one trailing entry for the intercept. The fitness of an individual is the (optionally
 * example-weighted) log-likelihood of the training data under the logistic model
 * <code>pi = 1 / (1 + exp(-eta))</code> with <code>eta = beta * x</code>.
 * <p>
 * All likelihood related quantities are evaluated in a numerically stable way so that large
 * absolute values of <code>eta</code> do not turn the fitness into <code>NaN</code>.
 * 
 * @author Ingo Mierswa, Tobias Malbrecht
 * @version $Id: LogisticRegressionOptimization.java,v 1.8 2008/05/09 19:22:55 ingomierswa Exp $
 */
public class LogisticRegressionOptimization extends ESOptimization {

    /** The training data. */
    private final ExampleSet exampleSet;

    /** The label attribute of the training data; its value is used as the class value (0 or 1 in the likelihood). */
    private final Attribute label;

    /** The example weight attribute, or <code>null</code> if all examples count with weight 1. */
    private final Attribute weight;

    /** Indicates if the last coefficient is an intercept instead of an attribute slope. */
    private final boolean addIntercept;

    /** Receives the warnings and log messages of this optimization. */
    LoggingHandler logging;

    /**
     * Creates a new evolutionary optimization.
     * 
     * @param exampleSet the training data
     * @param addIntercept if true, one additional coefficient (the last one) is used as intercept
     * @param initType start population creation type
     * @param maxIterations maximum number of iterations of the evolutionary search
     * @param generationsWithoutImprovement number of generations without improvement (passed to the super class)
     * @param popSize population size
     * @param selectionType selection type
     * @param tournamentFraction tournament fraction used by the selection
     * @param keepBest whether the best individual is kept
     * @param mutationType type of mutation
     * @param crossoverProb crossover probability
     * @param showConvergencePlot whether a convergence plot is shown
     * @param random the random generator
     * @param logging the handler used for log messages and warnings
     */
    public LogisticRegressionOptimization(
            ExampleSet exampleSet, // training data
            boolean addIntercept, // add intercept
            int initType, // start population creation type para
            int maxIterations, int generationsWithoutImprovement, int popSize, // GA paras
            int selectionType, double tournamentFraction, boolean keepBest, // selection paras
            int mutationType, // type of mutation
            double crossoverProb,
            boolean showConvergencePlot,
            RandomGenerator random,
            LoggingHandler logging) {

        // one coefficient per attribute, plus one for the intercept if requested;
        // -1 and 1 are presumably the initial search bounds (they are widened in nextIteration())
        super(-1.0d, 1.0d, popSize, addIntercept ? exampleSet.getAttributes().size() + 1 : exampleSet.getAttributes().size(), 
              initType, maxIterations, generationsWithoutImprovement, selectionType, tournamentFraction, keepBest,
              mutationType, crossoverProb, showConvergencePlot, random, logging);

        this.logging = logging;

        this.exampleSet = exampleSet;
        this.label  = exampleSet.getAttributes().getLabel();
        this.weight = exampleSet.getAttributes().getWeight();

        this.addIntercept = addIntercept;
    }

    /**
     * Calculates the fitness of the given individual, i.e. the weighted log-likelihood of the
     * training data for the coefficients stored in the individual.
     * 
     * @param individual the individual providing the coefficient vector
     * @return a performance vector with the single criterion <code>log_reg_fitness</code>
     */
    public PerformanceVector evaluateIndividual(Individual individual) {
        double[] beta = individual.getValues();

        double fitness = 0.0d;
        for (Example example : exampleSet) {
            double eta = computeEta(example, beta);
            double classValue = example.getValue(label);
            // log(pi) = -softplus(-eta) and log(1 - pi) = -softplus(eta); computing the
            // logarithms directly from eta avoids 0 * log(0) = NaN for saturated probabilities
            double currentFitness = -classValue * softplus(-eta) - (1 - classValue) * softplus(eta);
            fitness += getExampleWeight(example) * currentFitness;
        }

        PerformanceVector performanceVector = new PerformanceVector();
        performanceVector.addCriterion(new EstimatedPerformance("log_reg_fitness", fitness, exampleSet.size(), false));
        return performanceVector;
    }

    /**
     * Runs the optimization and creates the model from the best coefficients found.
     * 
     * @return the logistic regression model built from the best coefficients and their estimated variances
     * @throws OperatorException if the optimization fails
     */
    public LogisticRegressionModel train() throws OperatorException {
        optimize();
        return new LogisticRegressionModel(this.exampleSet, getBestValuesEver(), estimateVariance(), addIntercept);
    }

    /**
     * Estimates the variances of the best coefficients as the absolute diagonal elements of
     * the inverse of the hessian matrix of the log-likelihood function.
     * 
     * @return one variance per coefficient; all entries are <code>NaN</code> if the hessian
     *         could not be inverted
     */
    private double[] estimateVariance() {
        double[] beta = getBestValuesEver();

        Matrix hessian = new Matrix(beta.length, beta.length);
        for (Example example : exampleSet) {
            // collect the attribute values of this example (plus a constant 1 for the intercept)
            double[] values = new double[beta.length];
            double eta = 0.0d;
            int j = 0;
            for (Attribute attribute : example.getAttributes()) {
                double value = example.getValue(attribute);
                values[j] = value;
                eta += beta[j] * value;
                j++;
            }
            if (addIntercept) {
                values[beta.length - 1] = 1.0d;
                eta += beta[beta.length - 1];
            }
            double pi = logisticFunction(eta);

            // factor shared by all entries of this example's contribution
            double curvature = getExampleWeight(example) * pi * (1 - pi);
            for (int x = 0; x < beta.length; x++) {
                for (int y = 0; y < beta.length; y++) {
                    // sum is second derivative of log likelihood function
                    double h = hessian.get(x, y) - values[x] * values[y] * curvature;
                    hessian.set(x, y, h);
                }
            }
        }

        double[] variance = new double[beta.length];
        Matrix varianceCovarianceMatrix = null;
        try {
            // asymptotic variance-covariance matrix is inverse of hessian matrix
            varianceCovarianceMatrix = hessian.inverse();
        } catch (RuntimeException e) {
            logging.logWarning("could not determine variance-covariance matrix, hessian is singular");
            for (int j = 0; j < beta.length; j++) {
                variance[j] = Double.NaN;
            }
            return variance;
        }
        for (int j = 0; j < beta.length; j++) {
            // get diagonal elements
            variance[j] = Math.abs(varianceCovarianceMatrix.get(j, j));
        }

        return variance;
    }

    /**
     * Widens the search interval of every coefficient whose best value lies exactly on one of
     * its current bounds: the lower bound is decreased by 1 and the upper bound is increased by 1.
     */
    public void nextIteration() {
        double[] beta = getBestValuesEver();
        for (int i = 0; i < beta.length; i++) {
            double minBound = getMin(i);
            double maxBound = getMax(i);
            // exact comparison is intended: only values sitting directly on a bound trigger the widening
            if (beta[i] == minBound) {
                minBound -= 1;
                setMin(i, minBound);
                logging.log("decrease lower bound for beta(" + i + ") to " + minBound);
            }
            if (beta[i] == maxBound) {
                maxBound += 1;
                setMax(i, maxBound);
                logging.log("increase upper bound for beta(" + i + ") to " + maxBound);
            }
        }
    }

    /**
     * Calculates several goodness-of-fit statistics for the best coefficients found so far.
     * <p>
     * The returned vector contains the criteria <code>log_likelihood</code>,
     * <code>restricted_log_likelihood</code>, <code>-2_log_likelihood</code>,
     * <code>model_chi_squared</code>, <code>goodness_of_fit</code>, <code>cox_snell_r_squared</code>,
     * <code>nagelkerke_r_squared</code>, <code>mcfadden_r_squared</code>, <code>AIC</code> and
     * <code>BIC</code>. The main criterion is <code>AIC</code>.
     * 
     * @return the performance vector holding the statistics
     */
    public PerformanceVector getPerformance() {
        double[] beta = getBestValuesEver();
        // every entry of beta (slopes and, if present, the intercept) is an estimated parameter
        int numberOfParameters = beta.length;
        double logLikelihood = getBestFitnessEver();

        double goodnessOfFit = 0.0d;
        double weightSum = 0.0d;
        double positiveSum = 0.0d;
        for (Example example : exampleSet) {
            double pi = logisticFunction(computeEta(example, beta));

            double classValue = example.getValue(label);
            // squared residual scaled by the binomial variance pi * (1 - pi)
            double currentFit = (classValue - pi) * (classValue - pi) / (pi * (1 - pi));
            double weightValue = getExampleWeight(example);
            weightSum += weightValue;
            positiveSum += weightValue * classValue;
            goodnessOfFit += weightValue * currentFit;
        }

        // log-likelihood of the model without slopes: constant probability pi0 if an intercept
        // is available, probability 0.5 otherwise
        double pi0 = positiveSum / weightSum;
        double restrictedLogLikelihood;
        if (addIntercept) {
            restrictedLogLikelihood = weightSum * (xLogX(pi0) + xLogX(1 - pi0));
        } else {
            restrictedLogLikelihood = weightSum * Math.log(0.5);
        }

        double minusTwoLogLikelihood = -2 * logLikelihood;
        double modelChiSquared = 2 * (logLikelihood - restrictedLogLikelihood);
        // (L0 / L1)^(2/n) and L0^(2/n) are evaluated in log space: exponentiating the raw
        // log-likelihoods first underflows to 0 and leads to 0 / 0 = NaN
        double coxSnellRSquared = 1 - Math.exp((2 / weightSum) * (restrictedLogLikelihood - logLikelihood));
        double nagelkerkeRSquared = coxSnellRSquared / (1 - Math.exp((2 / weightSum) * restrictedLogLikelihood));
        double mcfaddenRSquared = 1 - logLikelihood / restrictedLogLikelihood;
        double AIC = -2 * logLikelihood + 2 * numberOfParameters;
        double BIC = -2 * logLikelihood + Math.log(weightSum) * numberOfParameters;

        PerformanceVector estimatedPerformance = new PerformanceVector();
        estimatedPerformance.addCriterion(new EstimatedPerformance("log_likelihood", logLikelihood, exampleSet.size(), false));
        estimatedPerformance.addCriterion(new EstimatedPerformance("restricted_log_likelihood", restrictedLogLikelihood, exampleSet.size(), false));
        estimatedPerformance.addCriterion(new EstimatedPerformance("-2_log_likelihood", minusTwoLogLikelihood, exampleSet.size(), true));
        estimatedPerformance.addCriterion(new EstimatedPerformance("model_chi_squared", modelChiSquared, exampleSet.size(), false));
        estimatedPerformance.addCriterion(new EstimatedPerformance("goodness_of_fit", goodnessOfFit, exampleSet.size(), false));
        estimatedPerformance.addCriterion(new EstimatedPerformance("cox_snell_r_squared", coxSnellRSquared, exampleSet.size(), false));
        estimatedPerformance.addCriterion(new EstimatedPerformance("nagelkerke_r_squared", nagelkerkeRSquared, exampleSet.size(), false));
        estimatedPerformance.addCriterion(new EstimatedPerformance("mcfadden_r_squared", mcfaddenRSquared, exampleSet.size(), false));
        estimatedPerformance.addCriterion(new EstimatedPerformance("AIC", AIC, exampleSet.size(), true));
        estimatedPerformance.addCriterion(new EstimatedPerformance("BIC", BIC, exampleSet.size(), true));
        estimatedPerformance.setMainCriterionName("AIC");
        return estimatedPerformance;
    }

    /**
     * Calculates the linear predictor of the given example: the sum of the products of the
     * attribute values with their coefficients plus, if requested, the intercept stored in
     * the last coefficient.
     */
    private double computeEta(Example example, double[] beta) {
        double eta = 0.0d;
        int i = 0;
        for (Attribute attribute : example.getAttributes()) {
            eta += beta[i] * example.getValue(attribute);
            i++;
        }
        if (addIntercept) {
            eta += beta[beta.length - 1];
        }
        return eta;
    }

    /** Delivers the weight of the given example, or 1 if the data has no weight attribute. */
    private double getExampleWeight(Example example) {
        return weight != null ? example.getValue(weight) : 1.0d;
    }

    /**
     * Calculates <code>exp(eta) / (1 + exp(eta))</code> without ever exponentiating a positive
     * number, so that the result stays inside [0, 1] instead of becoming infinity / infinity.
     */
    private static double logisticFunction(double eta) {
        if (eta >= 0.0d) {
            return 1.0d / (1.0d + Math.exp(-eta));
        }
        double expEta = Math.exp(eta);
        return expEta / (1.0d + expEta);
    }

    /** Calculates <code>log(1 + exp(x))</code> without overflow for large positive x. */
    private static double softplus(double x) {
        return Math.max(x, 0.0d) + Math.log1p(Math.exp(-Math.abs(x)));
    }

    /** Calculates <code>x * log(x)</code> using the limit value 0 for x = 0. */
    private static double xLogX(double x) {
        return x == 0.0d ? 0.0d : x * Math.log(x);
    }
}