/*
* This file is part of ELKI:
* Environment for Developing KDD-Applications Supported by Index-Structures
*
* Copyright (C) 2017
* ELKI Development Team
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
package de.lmu.ifi.dbs.elki.datasource;
import java.io.BufferedInputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.List;
import de.lmu.ifi.dbs.elki.datasource.filter.ObjectFilter;
import de.lmu.ifi.dbs.elki.datasource.parser.ArffParser;
import de.lmu.ifi.dbs.elki.datasource.parser.NumberVectorLabelParser;
import de.lmu.ifi.dbs.elki.datasource.parser.Parser;
import de.lmu.ifi.dbs.elki.utilities.Alias;
import de.lmu.ifi.dbs.elki.utilities.exceptions.AbortException;
import de.lmu.ifi.dbs.elki.utilities.io.FileUtil;
import de.lmu.ifi.dbs.elki.utilities.optionhandling.OptionID;
import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameterization.Parameterization;
import de.lmu.ifi.dbs.elki.utilities.optionhandling.parameters.FileParameter;
/**
* File based database connection based on the parser to be set.
*
* @author Arthur Zimek
* @since 0.2
*
* @apiviz.landmark
*/
@Alias("de.lmu.ifi.dbs.elki.database.connection.FileBasedDatabaseConnection")
public class FileBasedDatabaseConnection extends InputStreamDatabaseConnection {
/**
* Constructor.
*
* @param filters Filters, can be null
* @param parser the parser to provide a database
* @param infile File to load the data from
*/
public FileBasedDatabaseConnection(List<ObjectFilter> filters, Parser parser, File infile) {
super(null, filters, parser);
try {
this.in = new BufferedInputStream(FileUtil.tryGzipInput(new FileInputStream(infile)));
}
catch(IOException e) {
throw new AbortException("Could not load input file: " + infile, e);
}
}
/**
* Constructor.
*
* @param filters Filters, can be null
* @param parser the parser to provide a database
* @param infile File to load the data from
*/
public FileBasedDatabaseConnection(List<ObjectFilter> filters, Parser parser, String infile) {
super(null, filters, parser);
try {
this.in = new BufferedInputStream(FileUtil.tryGzipInput(new FileInputStream(infile)));
}
catch(IOException e) {
throw new AbortException("Could not load input file: " + infile, e);
}
}
/**
* Constructor.
*
* @param filters Filters, can be null
* @param parser the parser to provide a database
* @param in Input stream
*/
public FileBasedDatabaseConnection(List<ObjectFilter> filters, Parser parser, InputStream in) {
super(in, filters, parser);
}
/**
* Parameterization class.
*
* @author Erich Schubert
*
* @apiviz.exclude
*/
public static class Parameterizer extends InputStreamDatabaseConnection.Parameterizer {
/**
* Parameter that specifies the name of the input file to be parsed.
* <p>
* Key: {@code -dbc.in}
* </p>
*/
public static final OptionID INPUT_ID = new OptionID("dbc.in", "The name of the input file to be parsed.");
/**
* Input stream to process.
*/
protected File infile;
@Override
protected void makeOptions(Parameterization config) {
Class<? extends Parser> defaultParser = NumberVectorLabelParser.class;
// Add the input file first, for usability reasons.
final FileParameter inputParam = new FileParameter(INPUT_ID, FileParameter.FileType.INPUT_FILE);
if(config.grab(inputParam)) {
infile = inputParam.getValue();
String nam = infile.getName();
if(nam != null && (nam.endsWith(".arff") || nam.endsWith(".arff.gz"))) {
defaultParser = ArffParser.class;
}
}
configParser(config, Parser.class, defaultParser);
configFilters(config);
}
@Override
protected FileBasedDatabaseConnection makeInstance() {
return new FileBasedDatabaseConnection(filters, parser, infile);
}
}
}