/*********************************************************************** This file is part of KEEL-software, the Data Mining tool for regression, classification, clustering, pattern mining and so on. Copyright (C) 2004-2010 F. Herrera (herrera@decsai.ugr.es) L. S�nchez (luciano@uniovi.es) J. Alcal�-Fdez (jalcala@decsai.ugr.es) S. Garc�a (sglopez@ujaen.es) A. Fern�ndez (alberto.fernandez@ujaen.es) J. Luengo (julianlm@decsai.ugr.es) This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see http://www.gnu.org/licenses/ **********************************************************************/ package keel.Algorithms.UnsupervisedLearning.AssociationRules.IntervalRuleLearning.ARMMGA; /** * <p> * @author Written by Diana Mart�n (dmartin@ceis.cujae.edu.cu) * @version 1.1 * @since JDK1.6 * </p> */ import java.io.FileNotFoundException; import java.io.IOException; import java.io.PrintWriter; import java.util.ArrayList; import org.core.*; import keel.Dataset.*; public class ARMMGA { /** * <p> * It gathers all the parameters, launches the algorithm, and prints out the results * </p> */ myDataset trans; String assoc_rules_fname; String sup_rules_fname; String valuesOrderFilename; ARMMGAProcess ap; DataB dataBase; ArrayList<AssociationRule> assoc_rules; private String fileTime, fileHora, namedataset; //We may declare here the algorithm's parameters private int popsize; private int nTrials; private double alpha; private int nIntervals; private int kItemsets; private double ps; private double pc; private double pm; long startTime, totalTime; private boolean somethingWrong = false; //to check if everything is correct. /** * Default constructor */ public ARMMGA() { } /** * It reads the data from the input files and parse all the parameters * from the parameters array. * @param parameters parseParameters It contains the input files, output files and parameters */ public ARMMGA(parseParameters parameters) { this.startTime = System.currentTimeMillis(); this.trans = new myDataset(); try { this.namedataset = parameters.getTransactionsInputFile(); System.out.println("\nReading the transaction set: " + parameters.getTransactionsInputFile()); trans.readDataSet( parameters.getTransactionsInputFile() ); } catch (IOException e) { System.err.println("There was a problem while reading the input transaction set: " + e); somethingWrong = true; } //We may check if there are some numerical attributes, because our algorithm may not handle them: //somethingWrong = somethingWrong || train.hasNumericalAttributes(); this.somethingWrong = this.somethingWrong || this.trans.hasMissingAttributes(); this.assoc_rules_fname = parameters.getAssociationRulesFile(); this.sup_rules_fname = parameters.getOutputFile(0); this.valuesOrderFilename = parameters.getOutputFile(1); this.fileTime = (parameters.getOutputFile(0)).substring(0,(parameters.getOutputFile(0)).lastIndexOf('/')) + "/time.txt"; this.fileHora = (parameters.getOutputFile(0)).substring(0,(parameters.getOutputFile(0)).lastIndexOf('/')) + "/hora.txt"; long seed = Long.parseLong(parameters.getParameter(0)); this.kItemsets = Integer.parseInt( parameters.getParameter(1) ); this.popsize = Integer.parseInt( parameters.getParameter(2) ); this.nTrials = Integer.parseInt( parameters.getParameter(3) ); this.alpha = Double.parseDouble( parameters.getParameter(4) ); this.ps = Double.parseDouble( parameters.getParameter(5) ); this.pc = Double.parseDouble( parameters.getParameter(6) ); this.pm = Double.parseDouble( parameters.getParameter(7) ); this.nIntervals = Integer.parseInt( parameters.getParameter(8)); if (this.kItemsets > this.trans.getnVars()) this.kItemsets = this.trans.getnVars(); Randomize.setSeed(seed); } /** * It launches the algorithm */ public void execute() { if (somethingWrong) { //We do not execute the program System.err.println("An error was found"); System.err.println("Aborting the program"); //We should not use the statement: System.exit(-1); } else { this.dataBase = new DataB(this.nIntervals, this.trans); this.ap = new ARMMGAProcess(this.trans, this.dataBase, this.nTrials, this.popsize, this.kItemsets, this.ps, this.pc, this.pm, this.alpha); this.ap.run(); this.assoc_rules = this.ap.getRules(); try { PrintWriter rule_writer = new PrintWriter(assoc_rules_fname); PrintWriter sup_writer = new PrintWriter(sup_rules_fname); PrintWriter valueOrder_writer = new PrintWriter(this.valuesOrderFilename); rule_writer.println("<?xml version=\"1.0\" encoding=\"UTF-8\"?>"); rule_writer.println("<association_rules>"); sup_writer.println("<?xml version=\"1.0\" encoding=\"UTF-8\"?>"); sup_writer.println("<values>"); valueOrder_writer.print("<?xml version=\"1.0\" encoding=\"UTF-8\"?>\n"); valueOrder_writer.println("<values>"); for (int i=0; i < assoc_rules.size(); i++) { AssociationRule a_r = assoc_rules.get(i); ArrayList<Gene> ant = a_r.getAntecedent(); ArrayList<Gene> cons = a_r.getConsequent(); rule_writer.println("<rule id=\"" + i + "\">"); sup_writer.println("<rule id=\"" + i + "\" rule_support=\"" + ARMMGAProcess.roundDouble(a_r.getAll_support(),2) + "\" antecedent_support=\"" + ARMMGAProcess.roundDouble(a_r.getSupport(),2) + "\" consequent_support=\"" + ARMMGAProcess.roundDouble(a_r.getSupport_consq(),2) + "\" confidence=\"" + ARMMGAProcess.roundDouble(a_r.getConfidence(),2) +"\" lift=\"" + ARMMGAProcess.roundDouble(a_r.getLift(),2) + "\" conviction=\"" + ARMMGAProcess.roundDouble(a_r.getConv(),2) + "\" certainFactor=\"" + ARMMGAProcess.roundDouble(a_r.getCF(),2) + "\" netConf=\"" + ARMMGAProcess.roundDouble(a_r.getNetConf(),2) + "\" yulesQ=\"" + ARMMGAProcess.roundDouble(a_r.getYulesQ(),2) + "\" nAttributes=\"" + (a_r.getAntecedent().size()+ a_r.getConsequent().size()) + "\"/>"); rule_writer.println("<antecedents>"); for (int j=0; j < ant.size(); j++) { Gene g_ant = ant.get(j); createRule(g_ant, rule_writer); } rule_writer.println("</antecedents>"); rule_writer.println("<consequents>"); for (int j=0; j < cons.size(); j++) { Gene g_cons = cons.get(j); createRule(g_cons, rule_writer); } rule_writer.println("</consequents>"); rule_writer.println("</rule>"); } rule_writer.println("</association_rules>"); sup_writer.println("</values>"); ap.saveReport(this.assoc_rules, sup_writer); rule_writer.close(); sup_writer.close(); valueOrder_writer.print(this.ap.printRules(this.assoc_rules)); valueOrder_writer.println("</values>"); valueOrder_writer.close(); totalTime = System.currentTimeMillis() - startTime; this.writeTime(); System.out.println("Algorithm Finished"); } catch (FileNotFoundException e) { e.printStackTrace(); } } } public void writeTime() { long seg, min, hor; String stringOut = new String(""); stringOut = "" + totalTime / 1000 + " " + this.namedataset + assoc_rules_fname + "\n"; Files.addToFile(this.fileTime, stringOut); totalTime /= 1000; seg = totalTime % 60; totalTime /= 60; min = totalTime % 60; hor = totalTime / 60; stringOut = ""; if (hor < 10) stringOut = stringOut + "0"+ hor + ":"; else stringOut = stringOut + hor + ":"; if (min < 10) stringOut = stringOut + "0"+ min + ":"; else stringOut = stringOut + min + ":"; if (seg < 10) stringOut = stringOut + "0"+ seg; else stringOut = stringOut + seg; stringOut = stringOut + " " + assoc_rules_fname + "\n"; Files.addToFile(this.fileHora, stringOut); } private void createRule(Gene g, PrintWriter w) { int i; int attr = g.getAttr(); Intervals inter; ArrayList<Integer> value = g.getValue(); w.print("<attribute name=\"" + Attributes.getAttribute(attr).getName() + "\" value=\""); if ( g.getType() == myDataset.NOMINAL ) { for (i=0; i < value.size()-1; i++) { w.print(Attributes.getAttribute(attr).getNominalValue(value.get(i).intValue())); } w.print(Attributes.getAttribute(attr).getNominalValue(value.get(value.size()-1).intValue())); } else { for (i=0; i < value.size()-1; i++) { inter = this.dataBase.getInterval(attr, value.get(i).intValue()); w.print("[" + inter.getLeft() + ", " + inter.getRight() + "]"); } inter = this.dataBase.getInterval(attr, value.get(value.size()-1).intValue()); w.print("[" + inter.getLeft() + ", " + inter.getRight() + "]"); } w.println("\" />"); } }