// Copyright (C) 2011-2012 CRS4. // // This file is part of Seal. // // Seal is free software: you can redistribute it and/or modify it // under the terms of the GNU General Public License as published by the Free // Software Foundation, either version 3 of the License, or (at your option) // any later version. // // Seal is distributed in the hope that it will be useful, but // WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY // or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License // for more details. // // You should have received a copy of the GNU General Public License along // with Seal. If not, see <http://www.gnu.org/licenses/>. package it.crs4.seal.recab; import it.crs4.seal.common.SealToolParser; import it.crs4.seal.common.ClusterUtils; import java.util.ArrayList; import java.io.IOException; import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.fs.Path; import org.apache.commons.cli.*; public class RecabTableOptionParser extends SealToolParser { public static final String ConfigSection = "RecabTable"; private Option vcfFileOpt; private Path vcfFilePath; private Option rodFileOpt; private Path rodFilePath; private Configuration conf; @SuppressWarnings("static") // for OptionBuilder public RecabTableOptionParser() { super(ConfigSection, "seal recab_table"); // define the options vcfFileOpt = OptionBuilder .withDescription("VCF file with known variation sites") .hasArg() .withArgName("FILE") .withLongOpt("vcf-file") .create("vcf"); options.addOption(vcfFileOpt); rodFileOpt = OptionBuilder .withDescription("ROD file with known variation sites") .hasArg() .withArgName("FILE") .withLongOpt("rod-file") .create("rod"); options.addOption(rodFileOpt); this.setMinReduceTasks(1); this.setAcceptedInputFormats(new String[] { "bam", "sam" }); conf = null; } @Override protected CommandLine parseOptions(Configuration conf, String[] args) throws IOException, ParseException { if (conf == null) throw new NullPointerException("null conf provided"); this.conf = conf; CommandLine line = super.parseOptions(conf, args); if (line.hasOption(vcfFileOpt.getOpt()) && line.hasOption(rodFileOpt.getOpt())) throw new ParseException("You can't specify both VCF (" + vcfFileOpt.getLongOpt() + ") and ROD (" + rodFileOpt.getLongOpt() + ") files. Please specify one or the other."); if (line.hasOption(vcfFileOpt.getOpt())) { vcfFilePath = new Path( line.getOptionValue(vcfFileOpt.getOpt()) ); if (!vcfFilePath.getFileSystem(conf).exists(vcfFilePath)) throw new ParseException("File " + vcfFilePath + " doesn't exist"); } else if (line.hasOption(rodFileOpt.getOpt())) { rodFilePath = new Path( line.getOptionValue(rodFileOpt.getOpt()) ); if (!rodFilePath.getFileSystem(conf).exists(rodFilePath)) throw new ParseException("File " + rodFilePath + " doesn't exist"); } else throw new ParseException("You must specify a file with known genetic variation sites (either VCF or ROD)."); // set number of reduce tasks to use conf.set(ClusterUtils.NUM_RED_TASKS_PROPERTY, String.valueOf(getNReduceTasks())); return line; } public Path getVcfFile() { return vcfFilePath; } public Path getRodFile() { return rodFilePath; } }