DeepLearningMnist.java example

Explorer
h2o-2-master
package samples.expert;

//import static samples.expert.DeepLearningVisualization.visualize;
import static water.util.MRUtils.sampleFrame;
import hex.deeplearning.DeepLearning;
import hex.deeplearning.DeepLearningModel;
import water.Job;
import water.TestUtil;
import water.UKV;
import water.fvec.Frame;
import water.util.Log;

import java.util.Random;

/**
 * Runs a neural network on the MNIST dataset.
 */
public class DeepLearningMnist extends Job {
  public static void main(String[] args) throws Exception {
    Class job = DeepLearningMnist.class;
    samples.launchers.CloudLocal.launch(job, 1);
//    samples.launchers.CloudProcess.launch(job, 4);
    //samples.launchers.CloudConnect.launch(job, "localhost:54321");
//    samples.launchers.CloudRemote.launchIPs(job, "192.168.1.171", "192.168.1.172", "192.168.1.173", "192.168.1.174", "192.168.1.175");
//    samples.launchers.CloudRemote.launchIPs(job, "192.168.1.162", "192.168.1.161", "192.168.1.163", "192.168.1.164");
//    samples.launchers.CloudRemote.launchIPs(job, "192.168.1.161", "192.168.1.162", "192.168.1.164");
//    samples.launchers.CloudRemote.launchIPs(job, "192.168.1.162", "192.168.1.164");
//    samples.launchers.CloudRemote.launchIPs(job, "192.168.1.164");
//    samples.launchers.CloudRemote.launchEC2(job, 4);
  }

  @Override protected void execImpl() {
    Log.info("Parsing data.");
    //long seed = 0xC0FFEE;
    long seed = new Random().nextLong();
    double fraction = 1.0;
//    Frame trainf = sampleFrame(TestUtil.parseFromH2OFolder("smalldata/mnist/train10x.csv"), (long)(600000*fraction), seed);
    Frame trainf = sampleFrame(TestUtil.parseFromH2OFolder("smalldata/mnist/train.csv.gz"), (long)(60000*fraction), seed);
    Frame testf = sampleFrame(TestUtil.parseFromH2OFolder("smalldata/mnist/test.csv.gz"), (long)(10000*fraction), seed+1);
    Log.info("Done.");

    DeepLearning p = new DeepLearning();
    // Hinton parameters -> should lead to ~1 % test error after a few dozen million samples
    p.seed = seed;
//    p.hidden = new int[]{1024,1024,2048};
    p.hidden = new int[]{128,128,256};
    p.activation = DeepLearning.Activation.RectifierWithDropout;
    p.loss = DeepLearning.Loss.CrossEntropy;
    p.input_dropout_ratio = 0.2;
    p.epochs = 10;
    p.l1 = 1e-5;
    p.l2 = 0;

    if (true) {
      // automatic learning rate
      p.adaptive_rate = true;
      p.rho = 0.99;
      p.epsilon = 1e-8;
//      p.max_w2 = 15;
      p.max_w2 = Float.POSITIVE_INFINITY;
    } else {
      // manual learning rate
      p.adaptive_rate = false;
      p.rate = 0.01;
      p.rate_annealing = 1e-6;
      p.momentum_start = 0.5;
      p.momentum_ramp = 1800000;
      p.momentum_stable = 0.99;
//      p.max_w2 = 15;
      p.max_w2 = Float.POSITIVE_INFINITY;
    }


    p.initial_weight_distribution = DeepLearning.InitialWeightDistribution.UniformAdaptive;
//    p.initial_weight_scale = 0.01
    p.classification = true;
    p.diagnostics = true;
    p.expert_mode = true;
    p.score_training_samples = 1000;
    p.score_validation_samples = 10000;
    p.validation = testf;
    p.source = trainf;
    p.response = trainf.lastVec();
    p.ignored_cols = null;
    p.classification_stop = -1;
    p.train_samples_per_iteration = -1;
    p.score_interval = 30;
    p.variable_importances = false;
    p.fast_mode = true; //to match old NeuralNet behavior
//    p.ignore_const_cols = true;
    p.ignore_const_cols = false; //to match old NeuralNet behavior and to have images look straight
    p.shuffle_training_data = false;
    p.force_load_balance = true;
    p.replicate_training_data = true;
    p.quiet_mode = false;
    p.invoke();

//    visualize((DeepLearningModel) UKV.get(p.dest()));
  }

}