// Copyright (C) 2011-2012 CRS4.
//
// This file is part of Seal.
//
// Seal is free software: you can redistribute it and/or modify it
// under the terms of the GNU General Public License as published by the Free
// Software Foundation, either version 3 of the License, or (at your option)
// any later version.
//
// Seal is distributed in the hope that it will be useful, but
// WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
// or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
// for more details.
//
// You should have received a copy of the GNU General Public License along
// with Seal. If not, see <http://www.gnu.org/licenses/>.
package it.crs4.seal.tsv_sort;
import it.crs4.seal.common.ClusterUtils;
import it.crs4.seal.common.SealToolParser;
import java.util.ArrayList;
import java.io.IOException;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.commons.cli.*;
public class TsvSortOptionParser extends SealToolParser {
public static final String ConfigSection = "TsvSort";
private Option keyOption;
private Option delimiterOption;
@SuppressWarnings("static") // for OptionBuilder
public TsvSortOptionParser()
{
super(ConfigSection, "seal tsvsort");
// define custom options
keyOption = OptionBuilder
.withDescription("sort key list. Comma-separated numbers, ranges specified with '-' [default: whole line]")
.hasArg()
.withArgName("index[-last_index]")
.withLongOpt("key")
.create("k");
options.addOption(keyOption);
delimiterOption = OptionBuilder
.withDescription("character string that delimits fields [default: <TAB>]")
.hasArg()
.withArgName("DELIM")
.withLongOpt("field-separator")
.create("t");
options.addOption(delimiterOption);
this.setMinReduceTasks(1);
}
@Override
protected CommandLine parseOptions(Configuration conf, String[] args)
throws IOException, ParseException
{
CommandLine line = super.parseOptions(conf, args);
if (line.hasOption(keyOption.getOpt()))
conf.set(TsvInputFormat.COLUMN_KEYS_CONF, line.getOptionValue(keyOption.getOpt()));
if (line.hasOption(delimiterOption.getOpt()))
{
String delim = line.getOptionValue(delimiterOption.getOpt());
conf.set(TsvInputFormat.DELIM_CONF, delim);
}
// set number of reduce tasks to use
conf.set(ClusterUtils.NUM_RED_TASKS_PROPERTY, String.valueOf(getNReduceTasks()));
return line;
}
}