/*
* This file is part of ALOE.
*
* ALOE is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
* ALOE is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
* You should have received a copy of the GNU General Public License
* along with ALOE. If not, see <http://www.gnu.org/licenses/>.
*
* Copyright (c) 2012 SCCL, University of Washington (http://depts.washington.edu/sccl)
*/
package etc.aloe.options;
import etc.aloe.FileNames;
import java.io.File;
import org.kohsuke.args4j.Argument;
import org.kohsuke.args4j.Option;
/**
* Defines options for all training runs, regardless of pipeline implementation.
*
* @author Michael Brooks <mjbrooks@uw.edu>
*/
public class TrainOptions extends ModeOptions {
@Argument(index = 0, usage = "input CSV file containing messages", required = true, metaVar = "INPUT_CSV")
public File inputCSVFile;
@Argument(index = 1, usage = "output directory (contents may be overwritten)", required = true, metaVar = "OUTPUT_DIR")
private void setOutputDir(File dir) {
this.outputDir = dir;
dir.mkdirs();
outputROCDir = new File(dir, FileNames.OUTPUT_ROC_DIR_NAME);
outputTestsDir = new File(dir, FileNames.OUTPUT_TESTS_DIR_NAME);
outputEvaluationReportFile = new File(dir, FileNames.OUTPUT_EVALUTION_REPORT_NAME);
outputFeatureSpecFile = new File(dir, FileNames.OUTPUT_FEATURE_SPEC_NAME);
outputModelFile = new File(dir, FileNames.OUTPUT_MODEL_NAME);
outputTopFeaturesFile = new File(dir, FileNames.OUTPUT_TOP_FEATURES_NAME);
outputFeatureWeightsFile = new File(dir, FileNames.OUTPUT_FEATURE_WEIGHTS_NAME);
outputFeatureValuesFile = new File(dir, FileNames.OUTPUT_FEATURE_VALUES_NAME);
outputCommandFile = new File(dir, FileNames.OUTPUT_COMMAND_FILE_NAME);
}
public File outputDir;
public File outputROCDir;
public File outputTestsDir;
public File outputEvaluationReportFile;
public File outputFeatureSpecFile;
public File outputModelFile;
public File outputTopFeaturesFile;
public File outputFeatureWeightsFile;
public File outputFeatureValuesFile;
public File outputCommandFile;
@Option(name="--roc", usage="Export data for ROC curves")
public boolean makeROC;
@Option(name="--test-sets", usage="Dump each labeled test set to files")
public boolean outputTests;
@Option(name="--feature-values", usage="output a csv file with feature values for each entity")
public boolean outputFeatureValues = false;
@Override
public void printUsage() {
System.err.println("java -jar aloe.jar PIPELINE_CLASS train INPUT_CSV OUTPUT_DIR [options...]");
}
}