/** * Global Sensor Networks (GSN) Source Code * Copyright (c) 2006-2016, Ecole Polytechnique Federale de Lausanne (EPFL) * * This file is part of GSN. * * GSN is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * GSN is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with GSN. If not, see <http://www.gnu.org/licenses/>. * * File: src/weka/filters/unsupervised/instance/RandomSample.java * * @author Julien Eberle * @author Sofiane Sarni * */ package weka.filters.unsupervised.instance; import java.util.Random; import weka.core.Instances; import weka.core.OptionHandler; import weka.filters.UnsupervisedFilter; /** * A filter that resample the instances randomly, given a certain ratio. * @author jeberle * */ public class RandomSample extends weka.filters.SimpleBatchFilter implements UnsupervisedFilter, OptionHandler{ private static final long serialVersionUID = -6080185146245135909L; private int m_ratio = 1; @Override public String globalInfo() { return "A filter that resample the instances randomly, given a certain ratio."; } @Override protected Instances determineOutputFormat(Instances inputFormat) throws Exception { return inputFormat; } @Override protected Instances process(Instances instances) throws Exception { Instances output = new Instances(instances); if(instances.numInstances() <= 2*m_ratio){return output;} Random r = new Random(); for(int i=output.numInstances()-1;i>=0;i--){ if(output.numInstances()>2 && r.nextInt(m_ratio) != 0){output.delete(i);} } return output; } public int getM_ratio() { return m_ratio; } public void setM_ratio(int m_ratio) { this.m_ratio = m_ratio; } }