/*
* Encog(tm) Core v3.4 - Java Version
* http://www.heatonresearch.com/encog/
* https://github.com/encog/encog-java-core
* Copyright 2008-2016 Heaton Research, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* For more information on Heaton Research copyrights, licenses
* and trademarks visit:
* http://www.heatonresearch.com/copyright
*/
package org.encog.ml.hmm.alog;
import org.encog.ml.data.MLDataSet;
import org.encog.ml.hmm.HiddenMarkovModel;
/**
* This class produces a Kullback-Leibler estimation of the distance between two
* HMMs. This allows the similarity of two different HMMs to be evaluated.
*
* Reference: Kullback, S.; Leibler, R.A. (1951). "On Information and Sufficiency".
* Annals of Mathematical Statistics 22 (1): 79-86. doi:10.1214/aoms/1177729694.
* MR39968.
*/
public class KullbackLeiblerDistanceCalculator {

    /** Number of observations requested for each generated sequence. */
    private int len = 1000;

    /** Number of sequences generated and averaged over per estimate. */
    private int sequenceCount = 10;

    /**
     * Estimates the distance from {@code hmm1} to {@code hmm2} by sampling.
     * <p>
     * For each of {@link #getSequenceCount()} rounds, an observation sequence
     * of {@link #getLen()} observations is generated from {@code hmm1}. The
     * difference between the {@code lnProbability()} of that sequence under
     * {@code hmm1} and under {@code hmm2} is divided by the sequence length,
     * and the per-sequence values are averaged.
     * <p>
     * Sequences are always generated from {@code hmm1}, so swapping the
     * arguments may produce a different value.
     *
     * @param hmm1
     *            The model the observation sequences are generated from.
     * @param hmm2
     *            The model the generated sequences are compared against.
     * @return The averaged, length-normalized difference described above.
     */
    public double distance(final HiddenMarkovModel hmm1,
            final HiddenMarkovModel hmm2) {
        double distance = 0.;

        for (int i = 0; i < this.sequenceCount; i++) {
            // A fresh generator is created for every sampled sequence.
            final MLDataSet oseq = new MarkovGenerator(hmm1)
                    .observationSequence(this.len);

            // Per-observation difference between the two models' scores
            // for the same generated sequence.
            distance += (new ForwardBackwardScaledCalculator(oseq, hmm1)
                    .lnProbability() - new ForwardBackwardScaledCalculator(
                    oseq, hmm2).lnProbability())
                    / this.len;
        }

        return distance / this.sequenceCount;
    }

    /**
     * @return The number of observations in each generated sequence.
     */
    public int getLen() {
        return this.len;
    }

    /**
     * @return The number of sequences generated per distance estimate.
     */
    public int getSequenceCount() {
        return this.sequenceCount;
    }

    /**
     * Sets the number of observations in each generated sequence.
     *
     * @param len
     *            The sequence length; must be positive, because the distance
     *            is divided by it.
     * @throws IllegalArgumentException
     *             If {@code len} is zero or negative.
     */
    public void setLen(final int len) {
        if (len <= 0) {
            throw new IllegalArgumentException(
                    "len must be positive, got: " + len);
        }
        this.len = len;
    }

    /**
     * Sets the number of sequences generated per distance estimate.
     *
     * @param sequenceCount
     *            The number of sequences; must be positive, because the
     *            accumulated distance is divided by it.
     * @throws IllegalArgumentException
     *             If {@code sequenceCount} is zero or negative.
     */
    public void setSequenceCount(final int sequenceCount) {
        if (sequenceCount <= 0) {
            throw new IllegalArgumentException(
                    "sequenceCount must be positive, got: " + sequenceCount);
        }
        this.sequenceCount = sequenceCount;
    }
}