/*
* Encog(tm) Core v2.5 - Java Version
* http://www.heatonresearch.com/encog/
* http://code.google.com/p/encog-java/
* Copyright 2008-2010 Heaton Research, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* For more information on Heaton Research copyrights, licenses
* and trademarks visit:
* http://www.heatonresearch.com/copyright
*/
package org.encog.mathutil.randomize;

import org.encog.EncogError;
import org.encog.neural.networks.BasicNetwork;
import org.encog.neural.networks.layers.Layer;
import org.encog.neural.networks.structure.FlatUpdateNeeded;
import org.encog.neural.networks.synapse.Synapse;

/**
* Implementation of <i>Nguyen-Widrow</i> weight initialization. This is the
* default weight initialization used by Encog, as it generally provides the
* most trainable neural network.
*
*
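 * <p>
 * A minimal usage sketch (the {@code network} variable is assumed to be a
 * previously constructed {@link BasicNetwork}; it is not created here):
 * </p>
 * <pre>
 * // Assumption: network is an existing BasicNetwork built elsewhere.
 * // Randomize weights into the range [-1, 1], then apply the
 * // Nguyen-Widrow adjustment to every synapse.
 * NguyenWidrowRandomizer randomizer = new NguyenWidrowRandomizer(-1, 1);
 * randomizer.randomize(network);
 * </pre>
 *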
 * @author Stéphan Corriveau
*
*/
public class NguyenWidrowRandomizer extends RangeRandomizer implements
Randomizer {
/**
* Construct a Nguyen-Widrow randomizer.
*
* @param min
* The min of the range.
* @param max
* The max of the range.
*/
public NguyenWidrowRandomizer(final double min, final double max) {
super(min, max);
}

	/**
	 * The <i>Nguyen-Widrow</i> initialization algorithm is as follows:
	 * <br>
	 * 1. Initialize all weights of the hidden layers with (ranged) random
	 * values.<br>
	 * 2. For each hidden layer:<br>
	 * 2.1 Calculate the beta value: 0.7 times the Nth root of the number of
	 * hidden neurons, where N is the number of neurons in the input layer.<br>
	 * 2.2 For each synapse:<br>
	 * 2.2.1 For each weight:<br>
	 * 2.2.2 Adjust the weight by dividing it by the Euclidean norm of the
	 * weights for its target neuron and multiplying it by the beta value.
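	 * <br>
	 * As a worked example (illustrative sizes, not from the original source):
	 * with 2 input neurons and 4 hidden neurons, beta = 0.7 * 4^(1/2) = 1.4.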
* @param network The network to randomize.
*/
@Override
public final void randomize(final BasicNetwork network) {
super.randomize(network);
int neuronCount = 0;
for (final Layer layer : network.getStructure().getLayers()) {
neuronCount += layer.getNeuronCount();
}
final Layer inputLayer = network.getLayer(BasicNetwork.TAG_INPUT);
final Layer outputLayer = network.getLayer(BasicNetwork.TAG_OUTPUT);
if (inputLayer == null) {
throw new EncogError("Must have an input layer for Nguyen-Widrow.");
}
if (outputLayer == null) {
throw new EncogError("Must have an output layer for Nguyen-Widrow.");
}
final int hiddenNeurons = neuronCount - inputLayer.getNeuronCount()
- outputLayer.getNeuronCount();
		// No hidden neurons: nothing to adjust, so keep the plain range
		// randomization performed above.
if (hiddenNeurons < 1) {
return;
}
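
		// Nguyen-Widrow scaling factor:
		// beta = 0.7 * (hidden neuron count) ^ (1 / input neuron count).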
final double beta = 0.7 * Math.pow(hiddenNeurons, 1.0 / inputLayer
.getNeuronCount());
for (final Synapse synapse : network.getStructure().getSynapses()) {
randomize(beta, synapse);
}
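
		// The object-model weights changed, so flag and rebuild the flat
		// (vectorized) copy of the network to keep the two in sync.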
network.getStructure().setFlatUpdate(FlatUpdateNeeded.Flatten);
network.getStructure().flattenWeights();
}
/**
* Randomize the specified synapse.
*
* @param beta
* The beta value.
* @param synapse
* The synapse to modify.
*/
private void randomize(final double beta, final Synapse synapse) {
if (synapse.getMatrix() == null) {
return;
}
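
		// Work one target neuron (one matrix column) at a time.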
for (int j = 0; j < synapse.getToNeuronCount(); j++) {
double norm = 0.0;
// Calculate the Euclidean Norm for the weights
for (int k = 0; k < synapse.getFromNeuronCount(); k++) {
final double value = synapse.getMatrix().get(k, j);
norm += value * value;
}
			if (synapse.getToLayer().hasBias()) {
				final double value = synapse.getToLayer().getBiasWeight(j);
				norm += value * value;
			}
			// Take the square root outside the bias check; otherwise the
			// norm would be left as a sum of squares for bias-less layers.
			norm = Math.sqrt(norm);
// Rescale the weights using beta and the norm
for (int k = 0; k < synapse.getFromNeuronCount(); k++) {
final double value = synapse.getMatrix().get(k, j);
synapse.getMatrix().set(k, j, beta * value / norm);
}
if (synapse.getToLayer().hasBias()) {
final double value = synapse.getToLayer().getBiasWeight(j);
synapse.getToLayer().setBiasWeight(j, beta * value / norm);
}
}
}
}