/* * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */ /* * OutputClusterDistribution.java * Copyright (C) 2009 University of Waikato, Hamilton, New Zealand */ package wekaexamples.clusterers; import weka.clusterers.EM; import weka.core.Instances; import weka.core.Utils; import weka.core.converters.ConverterUtils.DataSource; /** * This example class builds an EM clusterer on a dataset and outputs for * a second dataset the predicted cluster, as well as the cluster membership. * * @author FracPete (fracpete at waikato dot ac dot nz) * @version $Revision$ */ public class OutputClusterDistribution { /** * Expects two parameters: training file and test file. * * @param args the commandline arguments * @throws Exception if something goes wrong */ public static void main(String[] args) throws Exception { // load data Instances train = DataSource.read(args[0]); Instances test = DataSource.read(args[1]); if (!train.equalHeaders(test)) throw new IllegalArgumentException( "Train and test set are not compatible: " + train.equalHeadersMsg(test)); // build clusterer EM clusterer = new EM(); clusterer.buildClusterer(train); // output predictions System.out.println("# - cluster - distribution"); for (int i = 0; i < test.numInstances(); i++) { int cluster = clusterer.clusterInstance(test.instance(i)); double[] dist = clusterer.distributionForInstance(test.instance(i)); System.out.print((i+1)); System.out.print(" - "); System.out.print(cluster); System.out.print(" - "); System.out.print(Utils.arrayToString(dist)); System.out.println(); } } }