/***********************************************************************
This file is part of KEEL-software, the Data Mining tool for regression,
classification, clustering, pattern mining and so on.
Copyright (C) 2004-2010
F. Herrera (herrera@decsai.ugr.es)
L. S�nchez (luciano@uniovi.es)
J. Alcal�-Fdez (jalcala@decsai.ugr.es)
S. Garc�a (sglopez@ujaen.es)
A. Fern�ndez (alberto.fernandez@ujaen.es)
J. Luengo (julianlm@decsai.ugr.es)
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see http://www.gnu.org/licenses/
**********************************************************************/
package keel.Algorithms.Genetic_Rule_Learning.M5Rules;
/**
* Stores split information.
*/
public final class SplitInfo {
int number; // number of total instances
int first; // first instance index
int last; // last instance index
int position; // position of maximum impurity reduction
double maxImpurity; // maximum impurity reduction
double leftAve; // left average class value
double rightAve; // right average class value
int splitAttr; // spliting attribute
double splitValue; // splitting value
/**
* Constructs an object which contains the split information
* @param low the index of the first instance
* @param high the index of the last instance
* @param attr an attribute
*/
public SplitInfo(int low, int high, int attr) {
number = high - low + 1;
first = low;
last = high;
position = -1;
maxImpurity = -1.e20;
splitAttr = attr; // attr < 0 is an empty object
splitValue = 0.0;
}
/**
* Makes a copy of this SplitInfo object
* @return the copy of this SplitInfo
*/
public final SplitInfo copy() {
SplitInfo s = new SplitInfo(first, last, -1);
s.number = number;
s.first = first;
s.last = last;
s.position = position;
s.maxImpurity = maxImpurity;
s.leftAve = leftAve;
s.rightAve = rightAve;
s.splitAttr = splitAttr;
s.splitValue = splitValue;
return s;
}
/**
* Resets the object of split information
* @param low the index of the first instance
* @param high the index of the last instance
* @param attr the attribute
*/
public final void initialize(int low, int high, int attr) {
number = high - low + 1;
first = low;
last = high;
position = -1;
maxImpurity = -1.e20;
splitAttr = attr;
splitValue = 0.0;
}
/**
* Converts the spliting information to string
* @param inst the instances
* @return the spliting information to string
*/
public final String toString(MyDataset inst) {
StringBuffer text = new StringBuffer();
text.append("Print SplitInfo:\n");
text.append(" Instances:\t\t" + number + " (" + first + "-" +
position + "," + (position + 1) + "-" + last + ")\n");
text.append(" Maximum Impurity Reduction:\t" +
M5.doubleToStringG(maxImpurity, 1, 4) + "\n");
text.append(" Left average:\t" + leftAve + "\n");
text.append(" Right average:\t" + rightAve + "\n");
if (maxImpurity > 0.0) {
text.append(" Splitting function:\t" +
inst.getAttribute(splitAttr).name() + " = " + splitValue +
"\n");
} else {
text.append(" Splitting function:\tnull\n");
}
return text.toString();
}
/**
* Finds the best splitting point for an attribute in the instances
* @param attr the splitting attribute
* @param inst the instances
* @exception Exception if something goes wrong
*/
public final void attrSplit(int attr, MyDataset inst) throws Exception {
int i, len, count, part;
Impurity imp;
int low = 0;
int high = inst.numItemsets() - 1;
this.initialize(low, high, attr);
if (number < 4) {
return;
}
len = ((high - low + 1) < 5) ? 1 : (high - low + 1) / 5;
/* if(len>25)len=25; */
// len=1;
position = low;
part = low + len - 1;
imp = new Impurity(part, attr, inst, 5);
count = 0;
for (i = low + len; i <= high - len - 1; i++) {
imp.incremental(inst.itemset(i).getClassValue(), 1);
if (M5.eqDouble(inst.itemset(i + 1).getValue(attr),
inst.itemset(i).getValue(attr)) == false) {
count = i;
if (imp.impurity > maxImpurity) {
maxImpurity = imp.impurity;
splitValue = (inst.itemset(i).getValue(attr) +
inst.itemset(i + 1).getValue(attr)) * 0.5;
leftAve = imp.sl / imp.nl;
rightAve = imp.sr / imp.nr;
position = i;
}
}
}
}
}