/* * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */ /* * Copyright (C) 2009 Amri Napolitano */ package weka.filters.unsupervised.attribute; import weka.core.Attribute; import weka.core.AttributeStats; import weka.core.Instances; import weka.core.TestInstances; import weka.filters.AbstractFilterTest; import weka.filters.Filter; import weka.filters.unsupervised.attribute.StringToNominal; import weka.filters.unsupervised.attribute.NominalToBinary; import weka.filters.unsupervised.attribute.Remove; import junit.framework.Test; import junit.framework.TestSuite; /** * Tests EMImputation. Run from the command line with:<p> * java weka.filters.unsupervised.attribute.EMImputationTest * * @author Amri Napolitano * @version $Revision$ */ public class EMImputationTest extends AbstractFilterTest { public EMImputationTest(String name) { super(name); } /** Creates a default EMImputation */ public Filter getFilter() { return new EMImputation(); } protected void setUp() throws Exception { super.setUp(); Instances temp = new Instances(m_Instances); for (int j = 0; j < 2; j++) { for (int i = 0; i < temp.numInstances(); i++) { m_Instances.add(temp.instance(i)); } } // now just filter the instances to convert String attributes // and binarize nominal attributes StringToNominal stn = new StringToNominal(); stn.setAttributeRange("first-last"); stn.setInputFormat(m_Instances); m_Instances = Filter.useFilter(m_Instances, stn); NominalToBinary ntb = new NominalToBinary(); ntb.setInputFormat(m_Instances); m_Instances = Filter.useFilter(m_Instances, ntb); // remove the last column (date attribute) Remove r = new Remove(); r.setAttributeIndices("last"); r.setInputFormat(m_Instances); m_Instances = Filter.useFilter(m_Instances, r); } protected Instances getFilteredClassifierData() throws Exception { TestInstances test; Instances result; test = TestInstances.forCapabilities(getFilter().getCapabilities()); test.setClassIndex(TestInstances.CLASS_IS_LAST); test.setNumNumeric(3); result = test.generate(); return result; } public void testTypical() { Instances result = useFilter(); // Number of attributes shouldn't change assertEquals(m_Instances.numAttributes(), result.numAttributes()); // Number of instances may change (if an instance has all missing values) // assertEquals(m_Instances.numInstances(), result.numInstances()); for (int j = 0; j < result.numAttributes(); j++) { if (j == m_Instances.classIndex() && m_Instances.attribute(j).isNumeric() == false) { continue; } AttributeStats currentStats = m_Instances.attributeStats(j); if (currentStats.distinctCount < 2) { continue; } assertTrue("All missing values except for those in nonnumeric class " + "attributes should be replaced.", result.attributeStats(j).missingCount == 0); } } public static Test suite() { return new TestSuite(EMImputationTest.class); } public static void main(String[] args){ junit.textui.TestRunner.run(suite()); } }