package water.parser;
import java.io.File;
import java.io.IOException;
import java.util.Arrays;
import org.junit.*;
import water.Job;
import water.Key;
import water.TestUtil;
import water.fvec.Frame;
import water.fvec.NFSFileVec;
import water.fvec.Vec;
import water.util.FileUtils;
/**
 * Parser tests that read large data files from local {@code datasets/} and
 * {@code bigdata/} directories.
 *
 * <p>Every test here is marked {@code @Ignore}; the inline comments note that
 * the required data directories are not usually available.
 */
public class ParseFolderTestBig extends TestUtil {
  /** Waits until the cloud has at least one node before any test runs. */
  @BeforeClass static public void setup() { stall_till_cloudsize(1); }

  /**
   * Parses a folder and a single covtype file and asserts that the two
   * resulting frames are bit-identical.
   *
   * <p>Ignored: the dataset directory is not usually available.
   */
  @Test @Ignore
  public void testCovtype() {
    Frame k1 = null, k2 = null;
    try {
      // presumably the folder holds the same covtype data split into parts -- TODO confirm
      k2 = parse_test_folder("datasets/parse_folder_test");
      k1 = parse_test_file ("datasets/UCI/UCI-large/covtype/covtype.data");
      Assert.assertTrue("parsed values do not match!", TestUtil.isBitIdentical(k1,k2));
    } finally {
      // Delete whichever frames were created, even when parsing or the assert fails.
      if( k1 != null ) k1.delete();
      if( k2 != null ) k2.delete();
    }
  }

  /**
   * Parses the two KDD Cup 98 files and prints summary information for one
   * column of each (RDATE_5 and SOLIH). Makes no assertions; it only fails if
   * parsing or the column lookup throws.
   *
   * <p>Ignored: the bigdata directory is not usually available.
   */
  @Test @Ignore
  public void testKDDCup() {
    Frame k1 = null, k2 = null;
    try {
      k1 = parse_test_file("bigdata/laptop/usecases/cup98LRN_z.csv");
      Vec v1 = k1.vec("RDATE_5");
      System.out.println(v1.toString());
      // NOTE(review): isCategorical() is printed twice; the second %b was
      // possibly meant to show a different property -- confirm before changing.
      System.out.printf("%b %e %d %b %s\n", v1.isCategorical(), v1.min(), v1.naCnt(), v1.isCategorical(), Arrays.toString(v1.domain()));
      k2 = parse_test_file("bigdata/laptop/usecases/cup98VAL_z.csv");
      Vec v2 = k2.vec("SOLIH");
      System.out.println(v2.toString());
      System.out.printf("%b %e %d %b %s\n",v2.isCategorical(),v2.min(),v2.naCnt(),v2.isCategorical(),Arrays.toString(v2.domain()));
    } finally {
      if( k1 != null ) k1.delete();
      if( k2 != null ) k2.delete();
    }
  }

  /**
   * Parses a large SVM file through a parse job, printing the job's progress
   * about once per second, then prints the resulting frame.
   *
   * <p>Fails the test if the input file cannot be opened.
   */
  @Test @Ignore
  public void testBIGSVM() {
    String fname = "bigdata/cust_K/1m.svm";
    Frame k1 = null;
    try {
      File f = FileUtils.getFile(fname);
      NFSFileVec nfs = NFSFileVec.make(f);
      // The trailing 'false' presumably requests a non-blocking parse, which
      // is why progress is polled below -- TODO confirm against ParseDataset.parse.
      Job<Frame> job = ParseDataset.parse(
          Key.make("BIGSVM.hex"),
          new Key[]{nfs._key},
          true,
          ParseSetup.guessSetup(new Key[]{nfs._key}, false, ParseSetup.GUESS_HEADER),
          false)._job;
      // Poll only while the job is still running: a job that crashes or is
      // cancelled may never report progress 1.0, and polling on progress alone
      // would then spin forever instead of surfacing the failure via get().
      while (job.isRunning() && job.progress() < 1.0) {
        System.out.print(((int) (job.progress() * 1000.0)) / 10.0 + "% ");
        try {
          Thread.sleep(1000);
        } catch (InterruptedException ie) {
          // Keep the interrupt visible to callers and stop polling; with the
          // flag set, further sleeps would throw immediately.
          Thread.currentThread().interrupt();
          break;
        }
      }
      System.out.println();
      k1 = job.get();
      System.out.println(k1.toString());
    } catch (IOException ioe) {
      Assert.fail("File not found: " + fname + " - " + ioe.getMessage());
    } finally {
      if( k1 != null ) k1.delete();
    }
  }
}