/*
 *  RapidMiner
 *
 *  Copyright (C) 2001-2008 by Rapid-I and the contributors
 *
 *  Complete list of developers available at our web site:
 *
 *       http://rapid-i.com
 *
 *  This program is free software: you can redistribute it and/or modify
 *  it under the terms of the GNU Affero General Public License as published by
 *  the Free Software Foundation, either version 3 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 *  GNU Affero General Public License for more details.
 *
 *  You should have received a copy of the GNU Affero General Public License
 *  along with this program. If not, see http://www.gnu.org/licenses/.
 */
package com.rapidminer.operator.learner.functions.kernel.gaussianprocess;

import java.io.Serializable;

import com.rapidminer.operator.learner.functions.kernel.rvm.kernel.Kernel;

import Jama.Matrix;

/**
 * The learned model.
 *
 * @author Piotr Kasprzak, Ingo Mierswa
 * @version $Id: Model.java,v 1.4 2008/05/09 19:23:17 ingomierswa Exp $
 */
public class Model implements Serializable {

    private static final long serialVersionUID = 1695426983570182267L;

    /* Kernel used */
    private Kernel kernel;

    /* The basis vectors used */
    private double[][] basisVectors;

    /* Parameterisation of the approximate GP */
    //private Matrix C;     // GP-covariance parameterisation
    private Matrix alpha;   // GP-mean parameterisation
    //private Matrix Q;     // Inverse kernel Gram matrix, could be useful later

    private boolean regression; // Regression or classification model

    /*
     * Other variables (can be derived from the variables above)
     */

    /*
     * The vector k_t+1 = [K(x_1, x_t+1), K(x_2, x_t+1), ..., K(x_t, x_t+1)], holding the results of applying the
     * kernel to the new input x_t+1 and each of the old inputs
     */
    private Matrix k;

    private int d;        // Number of basis vectors (= dimension of all vectors / matrices)
    private int inputDim; // Dimension of the input vectors

    /**
     * Constructor. The matrices C (GP-covariance parameterisation) and Q (inverse kernel Gram matrix) are currently
     * unused and only kept in the signature for compatibility.
     */
    public Model(Kernel kernel, double[][] basisVectors, Matrix alpha, Matrix C, Matrix Q, int d, boolean regression) {
        this.kernel = kernel;
        this.basisVectors = basisVectors;
        this.alpha = alpha;
        //this.C = C;
        //this.Q = Q;
        this.regression = regression;
        this.d = d;

        inputDim = basisVectors[0].length; // Dimension of the input vectors

        k = new Matrix(d, 1);
    }

    public int getNumberOfBasisVectors() {
        return basisVectors.length;
    }

    public int getInputDim() {
        return inputDim;
    }

    public double[] getBasisVector(int i) {
        return this.basisVectors[i];
    }

    public double getBasisVectorValue(int i, int j) {
        return this.basisVectors[i][j];
    }

    /**
     * Compute the (canonical) scalar product between x and y, using only the first d components of the vectors.
     * The lengths of x and y must both be >= d.
     */
    private double scalarProduct(double[][] x, double[][] y, int d) {
        double result = 0;
        for (int i = 0; i < d; i++) {
            result += x[i][0] * y[i][0];
        }
        return result;
    }

    /**
     * Apply the model to a (new) input vector x_t+1 in order to get a prediction, which - as a GP marginal at
     * x_t+1 - is a one-dimensional Gaussian distribution with mean m and variance sigma^2 (2.22, the
     * parameterisation lemma). Returns only the function value; the mapping to a classification must be done by
     * the invoking method.
     */
    public double applyToVector(double[] x_new) {

        /*
         * Compute k_t+1 = [K(x_1, x_t+1), K(x_2, x_t+1), ..., K(x_t, x_t+1)]
         */
        for (int j = 0; j < d; j++) {
            k.getArray()[j][0] = kernel.eval(basisVectors[j], x_new);
        }

        /*
         * Compute m_t+1, the mean of the marginal of the GP at x_t+1, which is Gaussian:
         *
         *     m_t+1 = {k_t+1}^T * alpha_t
         */
        double m = scalarProduct(k.getArray(), alpha.getArray(), d);

        /*
         * The predictive variance of the marginal at x_t+1,
         *
         *     {sigma_t+1}^2 = K(x_t+1, x_t+1) + {k_t+1}^T * C_t * k_t+1
         *
         * (see end of chapter 2.4 and chapter 5.1), could be computed here as
         * kernel.eval(x_new, x_new) + scalarProduct(k.getArray(), C.times(k).getArray(), d),
         * but it is not needed for the point prediction and is therefore omitted.
         */

        return m;
    }

    /**
     * Apply the model to all input vectors.
     */
    public double[] apply(double[][] inputVectors) throws Exception {
        double[] prediction = new double[inputVectors.length];
        for (int i = 0; i < inputVectors.length; i++) {
            prediction[i] = applyToVector(inputVectors[i]);
            if (!regression) {
                if (prediction[i] > 0.0)
                    prediction[i] = 1.0;
                else
                    prediction[i] = 0.0;
            }
        }
        return prediction;
    }
}
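/*
 * Usage sketch (not part of the original source; all names below are illustrative
 * assumptions). It shows how the prediction in applyToVector() comes about: with a
 * linear kernel K(x, y) = x^T y, the model predicts m = sum_i alpha_i * K(x_i, x_new)
 * over the d basis vectors. The anonymous subclass assumes Kernel only requires
 * eval(double[], double[]) to be overridden, as used above.
 *
 *     // Hypothetical linear kernel for illustration.
 *     Kernel linear = new Kernel() {
 *         public double eval(double[] x, double[] y) {
 *             double s = 0;
 *             for (int i = 0; i < x.length; i++)
 *                 s += x[i] * y[i];
 *             return s;
 *         }
 *     };
 *
 *     double[][] basisVectors = { { 1.0, 0.0 }, { 0.0, 1.0 } };        // two 2-d basis vectors
 *     Matrix alpha = new Matrix(new double[][] { { 0.5 }, { -0.5 } }); // GP-mean coefficients
 *
 *     // C and Q are ignored by the constructor and may be passed as null here.
 *     Model model = new Model(linear, basisVectors, alpha, null, null, 2, true);
 *
 *     // m = 0.5 * K(b1, x) - 0.5 * K(b2, x) = 0.5 * 2.0 - 0.5 * 1.0 = 0.5
 *     double prediction = model.applyToVector(new double[] { 2.0, 1.0 });
 */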