RuleRegressionNode.java example

Explorer

samoa-master
- samoa-api
  - src
    - main
      - java
        com
        yahoo
        labs
        samoa
        core
        ContentEvent.java
        DoubleVector.java
        EntranceProcessor.java
        Globals.java
        Processor.java
        SerializableInstance.java
        evaluation
        BasicClassificationPerformanceEvaluator.java
        BasicRegressionPerformanceEvaluator.java
        ClassificationPerformanceEvaluator.java
        ClusteringEvaluationContentEvent.java
        ClusteringEvaluatorProcessor.java
        ClusteringResultContentEvent.java
        EvaluatorProcessor.java
        PerformanceEvaluator.java
        RegressionPerformanceEvaluator.java
        WindowClassificationPerformanceEvaluator.java
        measures
        CMM.java
        CMM_GTAnalysis.java
        EntropyCollection.java
        F1.java
        General.java
        SSQ.java
        Separation.java
        SilhouetteCoefficient.java
        StatisticalCollection.java
        examples
        HelloWorldContentEvent.java
        HelloWorldDestinationProcessor.java
        HelloWorldSourceProcessor.java
        HelloWorldTask.java
        learners
        AdaptiveLearner.java
        ClassificationLearner.java
        InstanceContentEvent.java
        InstancesContentEvent.java
        Learner.java
        RegressionLearner.java
        ResultContentEvent.java
        classifiers
        LocalLearner.java
        LocalLearnerProcessor.java
        NaiveBayes.java
        SimpleClassifierAdapter.java
        SingleClassifier.java
        ensemble
        AdaptiveBagging.java
        Bagging.java
        BaggingDistributorProcessor.java
        Boosting.java
        BoostingDistributorProcessor.java
        BoostingPredictionCombinerProcessor.java
        PredictionCombinerProcessor.java
        rules
        AMRulesRegressor.java
        HorizontalAMRulesRegressor.java
        VerticalAMRulesRegressor.java
        centralized
        AMRulesRegressorProcessor.java
        common
        ActiveRule.java
        LearningRule.java
        NonLearningRule.java
        PassiveRule.java
        Perceptron.java
        Rule.java
        RuleActiveLearningNode.java
        RuleActiveRegressionNode.java
        RulePassiveLearningNode.java
        RulePassiveRegressionNode.java
        RuleRegressionNode.java
        RuleSplitNode.java
        TargetMean.java
        distributed
        AMRDefaultRuleProcessor.java
        AMRLearnerProcessor.java
        AMRRuleSetProcessor.java
        AMRulesAggregatorProcessor.java
        AMRulesStatisticsProcessor.java
        AssignmentContentEvent.java
        PredicateContentEvent.java
        RuleContentEvent.java
        trees
        ActiveLearningNode.java
        AttributeBatchContentEvent.java
        AttributeContentEvent.java
        ComputeContentEvent.java
        ControlContentEvent.java
        DeleteContentEvent.java
        FilterProcessor.java
        FoundNode.java
        InactiveLearningNode.java
        LearningNode.java
        LocalResultContentEvent.java
        LocalStatisticsProcessor.java
        ModelAggregatorProcessor.java
        Node.java
        SplitNode.java
        VerticalHoeffdingTree.java
        clusterers
        ClusteringContentEvent.java
        ClustreamClustererAdapter.java
        LocalClustererAdapter.java
        LocalClustererProcessor.java
        SingleLearner.java
        simple
        ClusteringDistributorProcessor.java
        DistributedClusterer.java
        moa
        AbstractMOAObject.java
        MOAObject.java
        classifiers
        AbstractClassifier.java
        Classifier.java
        Regressor.java
        core
        AttributeSplitSuggestion.java
        attributeclassobservers
        AttributeClassObserver.java
        BinaryTreeNumericAttributeClassObserver.java
        BinaryTreeNumericAttributeClassObserverRegression.java
        DiscreteAttributeClassObserver.java
        FIMTDDNumericAttributeClassObserver.java
        GaussianNumericAttributeClassObserver.java
        GreenwaldKhannaNumericAttributeClassObserver.java
        NominalAttributeClassObserver.java
        NullAttributeClassObserver.java
        NumericAttributeClassObserver.java
        VFMLNumericAttributeClassObserver.java
        conditionaltests
        InstanceConditionalBinaryTest.java
        InstanceConditionalTest.java
        NominalAttributeBinaryTest.java
        NominalAttributeMultiwayTest.java
        NumericAttributeBinaryTest.java
        driftdetection
        ADWIN.java
        ADWINChangeDetector.java
        AbstractChangeDetector.java
        ChangeDetector.java
        CusumDM.java
        DDM.java
        EDDM.java
        EWMAChartDM.java
        GeometricMovingAverageDM.java
        PageHinkleyDM.java
        splitcriteria
        GiniSplitCriterion.java
        InfoGainSplitCriterion.java
        InfoGainSplitCriterionMultilabel.java
        SDRSplitCriterion.java
        SplitCriterion.java
        VarianceReductionSplitCriterion.java
        functions
        MajorityClass.java
        rules
        core
        Predicate.java
        attributeclassobservers
        FIMTDDNumericAttributeClassLimitObserver.java
        conditionaltests
        NumericAttributeBinaryRulePredicate.java
        splitcriteria
        SDRSplitCriterionAMRules.java
        voting
        AbstractErrorWeightedVote.java
        ErrorWeightedVote.java
        InverseErrorWeightedVote.java
        UniformWeightedVote.java
        driftdetection
        PageHinkleyFading.java
        PageHinkleyTest.java
        cluster
        CFCluster.java
        Cluster.java
        Clustering.java
        Miniball.java
        SphereCluster.java
        clusterers
        AbstractClusterer.java
        ClusterGenerator.java
        Clusterer.java
        KMeans.java
        clustream
        Clustream.java
        ClustreamKernel.java
        WithKmeans.java
        core
        AutoClassDiscovery.java
        AutoExpandVector.java
        DataPoint.java
        DoubleVector.java
        Example.java
        FastVector.java
        GaussianEstimator.java
        GreenwaldKhannaQuantileSummary.java
        InputStreamProgressMonitor.java
        InstanceExample.java
        Measurement.java
        MiscUtils.java
        ObjectRepository.java
        SerializeUtils.java
        Statistics.java
        StringUtils.java
        Utils.java
        evaluation
        LearningCurve.java
        LearningEvaluation.java
        LearningPerformanceEvaluator.java
        MeasureCollection.java
        MembershipMatrix.java
        learners
        Learner.java
        options
        AbstractClassOption.java
        AbstractOptionHandler.java
        ClassOption.java
        OptionHandler.java
        OptionsHandler.java
        streams
        ArffFileStream.java
        ExampleStream.java
        InstanceStream.java
        clustering
        ClusterEvent.java
        ClusterEventListener.java
        ClusteringStream.java
        RandomRBFGeneratorEvents.java
        generators
        HyperplaneGenerator.java
        RandomTreeGenerator.java
        tasks
        NullMonitor.java
        ResultPreviewListener.java
        Task.java
        TaskMonitor.java
        streams
        ArffFileStream.java
        ClusteringEntranceProcessor.java
        FileStream.java
        PrequentialSourceProcessor.java
        StreamSource.java
        StreamSourceProcessor.java
        fs
        FileStreamSource.java
        HDFSFileStreamSource.java
        LocalFileStreamSource.java
        tasks
        ClusteringEvaluation.java
        PrequentialEvaluation.java
        Task.java
        topology
        AbstractEntranceProcessingItem.java
        AbstractProcessingItem.java
        AbstractStream.java
        AbstractTopology.java
        ComponentFactory.java
        EntranceProcessingItem.java
        IProcessingItem.java
        ISubmitter.java
        LocalEntranceProcessingItem.java
        ProcessingItem.java
        Stream.java
        Topology.java
        TopologyBuilder.java
        utils
        PartitioningScheme.java
        StreamDestination.java
        Utils.java
    - test
      - java
        com
        yahoo
        labs
        samoa
        core
        DoubleVectorTest.java
        streams
        fs
        HDFSFileStreamSourceTest.java
        LocalFileStreamSourceTest.java
- samoa-instances
  - src
    - main
      - java
        com
        yahoo
        labs
        samoa
        instances
        ArffLoader.java
        Attribute.java
        DenseInstance.java
        DenseInstanceData.java
        Instance.java
        InstanceData.java
        InstanceInformation.java
        Instances.java
        InstancesHeader.java
        SingleClassInstanceData.java
        SingleLabelInstance.java
        SparseInstance.java
        SparseInstanceData.java
        Utils.java
- samoa-local
  - src
    - main
      - java
        com
        yahoo
        labs
        samoa
        LocalDoTask.java
        topology
        impl
        SimpleComponentFactory.java
        SimpleEngine.java
        SimpleEntranceProcessingItem.java
        SimpleProcessingItem.java
        SimpleStream.java
        SimpleTopology.java
    - test
      - java
        com
        yahoo
        labs
        samoa
        AlgosTest.java
        topology
        impl
        SimpleComponentFactoryTest.java
        SimpleEngineTest.java
        SimpleEntranceProcessingItemTest.java
        SimpleProcessingItemTest.java
        SimpleStreamTest.java
        SimpleTopologyTest.java
- samoa-s4
  - samoa-s4-adapter
    - src
      - main
        java
        samoa
        topology
        adapter
        S4AdapterApp.java
        S4EntranceProcessingItem.java
        package-info.java
  - src
    - main
      - java
        com
        yahoo
        labs
        samoa
        topology
        impl
        S4ComponentFactory.java
        S4DoTask.java
        S4EntranceProcessingItem.java
        S4Event.java
        S4ProcessingItem.java
        S4Stream.java
        S4Submitter.java
        S4Topology.java
        SamoaSerializer.java
        SamoaSerializerModule.java
- samoa-samza
  - src
    - main
      - java
        com
        yahoo
        labs
        samoa
        SamzaDoTask.java
        topology
        impl
        SamoaSystemFactory.java
        SamzaComponentFactory.java
        SamzaEngine.java
        SamzaEntranceProcessingItem.java
        SamzaProcessingItem.java
        SamzaProcessingNode.java
        SamzaStream.java
        SamzaTopology.java
        utils
        SamzaConfigFactory.java
        SamzaKryoSerdeFactory.java
        SerializableSerializer.java
        SystemsUtils.java
- samoa-storm
  - src
    - main
      - java
        com
        yahoo
        labs
        samoa
        LocalStormDoTask.java
        topology
        impl
        StormBoltStream.java
        StormComponentFactory.java
        StormDoTask.java
        StormEntranceProcessingItem.java
        StormJarSubmitter.java
        StormProcessingItem.java
        StormSamoaUtils.java
        StormSpoutStream.java
        StormStream.java
        StormTopology.java
        StormTopologyNode.java
        StormTopologySubmitter.java
    - test
      - java
        com
        yahoo
        labs
        samoa
        AlgosTest.java
        topology
        impl
        StormProcessingItemTest.java
- samoa-test
  - src
    - test
      - java
        com
        yahoo
        labs
        samoa
        TestParams.java
        TestUtils.java
- samoa-threads
  - src
    - main
      - java
        com
        yahoo
        labs
        samoa
        LocalThreadsDoTask.java
        topology
        impl
        ThreadsComponentFactory.java
        ThreadsEngine.java
        ThreadsEntranceProcessingItem.java
        ThreadsEventRunnable.java
        ThreadsProcessingItem.java
        ThreadsProcessingItemInstance.java
        ThreadsStream.java
        ThreadsTopology.java
    - test
      - java
        com
        yahoo
        labs
        samoa
        AlgosTest.java
        topology
        impl
        ThreadsComponentFactoryTest.java
        ThreadsEngineTest.java
        ThreadsEntranceProcessingItemTest.java
        ThreadsEventRunnableTest.java
        ThreadsProcessingItemInstanceTest.java
        ThreadsProcessingItemTest.java
        ThreadsStreamTest.java
        ThreadsTopologyTest.java
        utils
        StreamDestinationTest.java

package com.yahoo.labs.samoa.learners.classifiers.rules.common;

/*
 * #%L
 * SAMOA
 * %%
 * Copyright (C) 2013 - 2014 Yahoo! Inc.
 * %%
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 * 
 *      http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 * #L%
 */

import java.io.Serializable;

import com.yahoo.labs.samoa.instances.Instance;
import com.yahoo.labs.samoa.moa.core.DoubleVector;

/**
 * Base class for the learning nodes of regression rules.
 * <p>
 * A node keeps the target statistics of the instances that reached it
 * ({@link #nodeStatistics}) together with two predictors, a {@link Perceptron}
 * and a {@link TargetMean}. Which predictor answers a query is selected by
 * {@link #predictionFunction}: {@code 0} = adaptive (whichever predictor
 * currently has the lower error), {@code 1} = perceptron, {@code 2} = target mean.
 *
 * @author Anh Thu Vu
 *
 */
public abstract class RuleRegressionNode implements Serializable {

	private static final long serialVersionUID = 9129659494380381126L;

	// Values understood by predictionFunction / predictionMode.
	private static final int MODE_ADAPTIVE = 0;
	private static final int MODE_PERCEPTRON = 1;
	private static final int MODE_TARGET_MEAN = 2;

	// Prediction function selector: 0 = adaptive, 1 = perceptron, 2 = target mean.
	protected int predictionFunction;
	// Not read or written by this class; presumably maintained by subclasses.
	protected int ruleNumberID;
	// The statistics for this node:
	// [0] Number of instances that have reached it
	// [1] Sum of y values
	// [2] Sum of squared y values
	protected DoubleVector nodeStatistics;

	protected Perceptron perceptron;
	protected TargetMean targetMean;
	// Not read or written by this class; presumably maintained by subclasses.
	protected double learningRatio;

	/*
	 * Simple setters & getters
	 */

	/**
	 * @return the perceptron predictor of this node (may be {@code null})
	 */
	public Perceptron getPerceptron() {
		return perceptron;
	}

	/**
	 * @param perceptron the perceptron predictor to use from now on
	 */
	public void setPerceptron(Perceptron perceptron) {
		this.perceptron = perceptron;
	}

	/**
	 * @return the target-mean predictor of this node (may be {@code null})
	 */
	public TargetMean getTargetMean() {
		return targetMean;
	}

	/**
	 * @param targetMean the target-mean predictor to use from now on
	 */
	public void setTargetMean(TargetMean targetMean) {
		this.targetMean = targetMean;
	}

	/**
	 * Creates a new node whose statistics are initialised from the given values.
	 *
	 * @param initialClassObservations initial content of the node statistics
	 *        (count, sum of y, sum of squared y)
	 */
	public RuleRegressionNode(double[] initialClassObservations) {
		this.nodeStatistics = new DoubleVector(initialClassObservations);
	}

	/**
	 * Creates a new node with empty statistics.
	 */
	public RuleRegressionNode() {
		this(new double[0]);
	}

	/**
	 * Updates the statistics of this node with the given instance.
	 *
	 * @param instance the instance that reached this node
	 */
	public abstract void updateStatistics(Instance instance);

	/*
	 * Predictions
	 */

	/**
	 * Predicts the target of an instance with the predictor selected by
	 * {@link #predictionFunction} (resolved through {@link #getLearnerToUse(int)}).
	 *
	 * @param instance the instance to predict
	 * @return the votes returned by the selected predictor
	 */
	public double[] getPrediction(Instance instance) {
		int predictionMode = this.getLearnerToUse(this.predictionFunction);
		return getPrediction(instance, predictionMode);
	}

	/**
	 * Returns the prediction of the target mean without looking at any instance.
	 *
	 * @return the target-mean votes, or {@code {0}} when no target mean is set
	 */
	public double[] getSimplePrediction() {
		if (this.targetMean == null) {
			return new double[]{0};
		}
		return this.targetMean.getVotesForInstance();
	}

	/**
	 * Predicts the target of an instance with an explicitly chosen predictor.
	 *
	 * @param instance the instance to predict
	 * @param predictionMode {@code 1} to use the perceptron; any other value
	 *        uses the target mean
	 * @return the votes returned by the chosen predictor
	 */
	public double[] getPrediction(Instance instance, int predictionMode) {
		if (predictionMode == MODE_PERCEPTRON) {
			return this.perceptron.getVotesForInstance(instance);
		}
		return this.targetMean.getVotesForInstance(instance);
	}

	/**
	 * Returns the prediction for an instance expressed in normalized target
	 * units. Perceptron predictions come from
	 * {@code Perceptron.normalizedPrediction}; target-mean predictions are
	 * normalized with the mean and standard deviation of the node statistics.
	 *
	 * @param instance the instance to predict
	 * @return the normalized prediction
	 * @throws UnsupportedOperationException if {@link #predictionFunction} is
	 *         not 0, 1 or 2
	 */
	public double getNormalizedPrediction(Instance instance) {
		double res;
		double[] aux;
		switch (this.predictionFunction) {
		case MODE_PERCEPTRON:
			res = this.perceptron.normalizedPrediction(instance);
			break;
		case MODE_TARGET_MEAN:
			aux = this.targetMean.getVotesForInstance();
			res = normalize(aux[0]);
			break;
		case MODE_ADAPTIVE:
			// Adaptive: delegate to whichever predictor currently has the lower error.
			int predictionMode = this.getLearnerToUse(MODE_ADAPTIVE);
			if (predictionMode == MODE_PERCEPTRON) {
				res = this.perceptron.normalizedPrediction(instance);
			} else {
				aux = this.targetMean.getVotesForInstance(instance);
				res = normalize(aux[0]);
			}
			break;
		default:
			throw new UnsupportedOperationException("Prediction mode not in range.");
		}
		return res;
	}

	/**
	 * Resolves the adaptive prediction mode to a concrete predictor.
	 *
	 * @param predMode the requested mode; {@code 0} means adaptive
	 * @return {@code predMode} unchanged when it is not 0; otherwise {@code 1}
	 *         (perceptron) if the perceptron's current error is strictly lower
	 *         than the target mean's, else {@code 2} (target mean)
	 */
	public int getLearnerToUse(int predMode) {
		if (predMode != MODE_ADAPTIVE) {
			return predMode;
		}
		double perceptronError = this.perceptron.getCurrentError();
		double meanTargetError = this.targetMean.getCurrentError();
		return (perceptronError < meanTargetError) ? MODE_PERCEPTRON : MODE_TARGET_MEAN;
	}

	/*
	 * Error and change detection
	 */

	/**
	 * Computes the absolute difference between the normalized class value of
	 * the instance and the normalized prediction for it.
	 *
	 * @param instance the labelled instance
	 * @return the absolute normalized error
	 */
	public double computeError(Instance instance) {
		double normalizedPrediction = getNormalizedPrediction(instance);
		double normalizedClassValue = normalize(instance.classValue());
		return Math.abs(normalizedClassValue - normalizedPrediction);
	}

	/**
	 * Returns the current error of this node.
	 *
	 * @return {@link Double#MAX_VALUE} when there is no perceptron; the
	 *         perceptron's error when there is no target mean; otherwise the
	 *         lower of the two predictors' current errors
	 */
	public double getCurrentError() {
		if (this.perceptron == null) {
			return Double.MAX_VALUE;
		}
		double errorP = perceptron.getCurrentError();
		if (targetMean == null) {
			return errorP;
		}
		double errorTM = targetMean.getCurrentError();
		return (errorP < errorTM) ? errorP : errorTM;
	}

	/**
	 * Returns the number of instances seen by this node.
	 *
	 * @return the first entry of the node statistics truncated to a
	 *         {@code long}, or 0 when there are no statistics
	 */
	public long getInstancesSeen() {
		if (nodeStatistics == null) {
			return 0;
		}
		return (long) this.nodeStatistics.getValue(0);
	}

	/**
	 * @return the node statistics vector (count, sum of y, sum of squared y)
	 */
	public DoubleVector getNodeStatistics() {
		return this.nodeStatistics;
	}

	/**
	 * Anomaly detection. For every model attribute the probability bound of
	 * the observed value is computed from the perceptron's per-attribute sums
	 * (see {@link #computeProbability(double, double, double)}). The anomaly
	 * score is the share of {@code |log p|} contributed by attributes whose
	 * probability is below the univariate threshold.
	 *
	 * @param instance the instance to test
	 * @param uniVariateAnomalyProbabilityThreshold attributes with a
	 *        probability below this value count as anomalous
	 * @param multiVariateAnomalyProbabilityThreshold the instance is an
	 *        anomaly when its score is at least this value
	 * @param numberOfInstanceesForAnomaly minimum number of instances the
	 *        perceptron must have seen before anomalies are reported
	 * @return {@code true} if the instance is considered an anomaly;
	 *         {@code false} otherwise, including while the perceptron has
	 *         seen too few instances
	 */
	public boolean isAnomaly(Instance instance,
			double uniVariateAnomalyProbabilityThreshold,
			double multiVariateAnomalyProbabilityThreshold,
			int numberOfInstanceesForAnomaly) {
		// AMRules is equipped with anomaly detection. If on, compute the anomaly value.
		long perceptronInstancesSeen = this.perceptron.getInstancesSeen();
		if (perceptronInstancesSeen < numberOfInstanceesForAnomaly) {
			return false;
		}

		double D = 0.0; // sum of |log p| over all attributes with p > 0
		double N = 0.0; // same sum restricted to attributes below the univariate threshold

		for (int x = 0; x < instance.numAttributes() - 1; x++) {
			// Perceptron is initialized each rule.
			// this is a local anomaly.
			int instAttIndex = modelAttIndexToInstanceAttIndex(x, instance);
			double attribSum = this.perceptron.perceptronattributeStatistics.getValue(x);
			double attribSquaredSum = this.perceptron.squaredperceptronattributeStatistics.getValue(x);
			double mean = attribSum / perceptronInstancesSeen;
			double sd = computeSD(attribSquaredSum, attribSum, perceptronInstancesSeen);
			double probability = computeProbability(mean, sd, instance.value(instAttIndex));

			if (probability > 0.0) {
				double absLogProbability = Math.abs(Math.log(probability));
				D = D + absLogProbability;
				if (probability < uniVariateAnomalyProbabilityThreshold) {//0.10
					N = N + absLogProbability;
				}
			}
		}

		double anomaly = 0.0;
		if (D != 0.0) {
			anomaly = N / D;
		}
		return anomaly >= multiVariateAnomalyProbabilityThreshold;
	}

	/*
	 * Helpers
	 */

	/**
	 * Bounds the probability of observing {@code value} with the one-tailed
	 * variant of Chebyshev's inequality: {@code 1 / (1 + k^2)} where
	 * {@code k = |value - mean| / sd}.
	 *
	 * @param mean the attribute mean
	 * @param sd the attribute standard deviation
	 * @param value the observed value
	 * @return the probability bound, or 0 when {@code sd} is not positive
	 */
	public static double computeProbability(double mean, double sd, double value) {
		if (sd > 0.0) {
			double k = Math.abs(value - mean) / sd; // One tailed variant of Chebyshev's inequality
			return 1.0 / (1 + k * k);
		}
		return 0.0;
	}

	/**
	 * Computes the Hoeffding bound
	 * {@code sqrt(range^2 * ln(1 / confidence) / (2 * n))}.
	 *
	 * @param range the range of the observed variable
	 * @param confidence the confidence parameter (probability of error)
	 * @param n the number of observations
	 * @return the Hoeffding bound
	 */
	public static double computeHoeffdingBound(double range, double confidence, double n) {
		return Math.sqrt(((range * range) * Math.log(1.0 / confidence)) / (2.0 * n));
	}

	/**
	 * Normalizes a target value with the mean and standard deviation derived
	 * from the node statistics.
	 *
	 * @param value the raw target value
	 * @return {@code (value - mean) / sd}, or 0 when the standard deviation is
	 *         not above 1e-7
	 */
	private double normalize(double value) {
		double count = this.nodeStatistics.getValue(0);
		double sumY = this.nodeStatistics.getValue(1);
		double sumSquaredY = this.nodeStatistics.getValue(2);
		double meanY = sumY / count;
		double sdY = computeSD(sumSquaredY, sumY, (long) count);
		if (sdY > 0.0000001) {
			return (value - meanY) / sdY;
		}
		return 0.0;
	}

	/**
	 * Computes the sample standard deviation from running sums.
	 *
	 * @param squaredVal the sum of the squared values
	 * @param val the sum of the values
	 * @param size the number of values
	 * @return {@code sqrt((squaredVal - val^2 / size) / (size - 1))}, or 0
	 *         when {@code size} is at most 1
	 */
	public double computeSD(double squaredVal, double val, long size) {
		if (size > 1) {
			return Math.sqrt((squaredVal - ((val * val) / size)) / (size - 1.0));
		}
		return 0.0;
	}

	/**
	 * Gets the index of the attribute in the instance,
	 * given the index of the attribute in the learner.
	 *
	 * @param index the index of the attribute in the learner
	 * @param inst the instance
	 * @return the index in the instance
	 */
	protected static int modelAttIndexToInstanceAttIndex(int index, Instance inst) {
		// The learner's attribute list excludes the class attribute, so every
		// model index at or after the class position is shifted by one. Using
		// "<=" here would map the model index equal to classIndex() onto the
		// class attribute itself.
		return index < inst.classIndex() ? index : index + 1;
	}
}