// Copyright (C) 2011-2012 CRS4.
//
// This file is part of Seal.
//
// Seal is free software: you can redistribute it and/or modify it
// under the terms of the GNU General Public License as published by the Free
// Software Foundation, either version 3 of the License, or (at your option)
// any later version.
//
// Seal is distributed in the hope that it will be useful, but
// WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
// or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
// for more details.
//
// You should have received a copy of the GNU General Public License along
// with Seal. If not, see <http://www.gnu.org/licenses/>.
package it.crs4.seal.common;
import java.util.ArrayList;
public class CutString
{
public static class FormatException extends Exception {
private static final long serialVersionUID = 1L;
public FormatException(String msg, String record)
{
super(msg + "Record: " + record.toString());
}
}
private final String delim;
private ArrayList<Integer> columns;
private String[] extractedFields;
/**
* @param delim: delimiter string that separates fields within the records to be scanned.
* @param cols: the sorted, zero-based indices of the columns to be extracted from the records.
*/
public CutString(String delimiter, int... cols)
{
if (delimiter.length() == 0)
throw new IllegalArgumentException("empty string is an invalid delimiter");
delim = delimiter;
columns = new ArrayList<Integer>(cols.length);
for (int c: cols)
columns.add(c);
if (columns.size() == 0)
throw new IllegalArgumentException("no columns specified");
// ensure the columns are in sorted order
for (int i = 1; i < columns.size(); ++i)
{
if ( columns.get(i-1) >= columns.get(i) )
throw new IllegalArgumentException("specified columns must be in sorted order and must not contain duplicates");
}
// initialize index
extractedFields = new String[columns.size()];
// initialize so that trying to access the fields before
// calling loadRecord results in obviously bad stuff
for (int i = 0; i < extractedFields.length; ++i)
extractedFields[i] = null;
}
public void loadRecord(String record) throws FormatException
{
int pos = 0; // the byte position within the record
int fieldno = 0; // the field index within the record
int colno = 0; // the index within the list of requested fields (columns)
while (pos < record.length() && colno < columns.size()) // iterate over each field
{
int endpos = record.indexOf(delim, pos); // the field's end position
if (endpos < 0)
endpos = record.length();
if (columns.get(colno) == fieldno) // if we're at a requested field
{
extractedFields[colno] = record.substring(pos, endpos);
colno += 1; // advance column
}
pos = endpos + 1; // the next starting position is the current end + 1
fieldno += 1;
}
if (colno < columns.size())
throw new FormatException("Missing field(s) in record. Field " + colno + " (zero-based) not found.", record);
}
public String getField(int i)
{
return extractedFields[i];
}
}