/**
* Copyright (c) 2009, Regents of the University of Colorado All rights
* reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are met:
*
* Redistributions of source code must retain the above copyright notice, this
* list of conditions and the following disclaimer. Redistributions in binary
* form must reproduce the above copyright notice, this list of conditions and
* the following disclaimer in the documentation and/or other materials provided
* with the distribution. Neither the name of the University of Colorado at
* Boulder nor the names of its contributors may be used to endorse or promote
* products derived from this software without specific prior written
* permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/
package clear.reader;
import clear.dep.DepFeat;
import clear.dep.DepLib;
import clear.dep.DepNode;
import clear.dep.DepTree;
import java.io.IOException;
/**
 * CoNLL dependency reader.
 *
 * <p>Converts delimited lines into {@link DepNode}s and groups them into
 * {@link DepTree}s. Only the columns listed in the {@code COL_*} constants
 * are read; head and dependency-label columns are read only when the reader
 * was created for training.
 *
 * @author Jinho D. Choi <b>Last update:</b> 6/26/2010
 */
public class CoNLLXReader extends AbstractReader<DepNode, DepTree> {
    /** Zero-based column holding the token id. */
    private static final int COL_ID = 0;
    /** Zero-based column holding the word form. */
    private static final int COL_FORM = 1;
    /** Zero-based column holding the lemma. */
    private static final int COL_LEMMA = 2;
    /** Zero-based column holding the part-of-speech tag (column 3 is not read). */
    private static final int COL_POS = 4;
    /** Zero-based column holding the feature string. */
    private static final int COL_FEATS = 5;
    /** Zero-based column holding the head id (training only). */
    private static final int COL_HEAD = 6;
    /** Zero-based column holding the dependency label (training only). */
    private static final int COL_DEPREL = 7;

    /** True if head ids and dependency labels are to be read from each line. */
    private final boolean b_train;

    /**
     * Initializes the dependency reader for <code>filename</code>.
     *
     * @param filename name of the file containing dependency trees
     * @param isTrain true if the reader is for training, in which case the
     *        head id and dependency label of each token are also read
     */
    public CoNLLXReader(String filename, boolean isTrain) {
        super(filename);
        b_train = isTrain;
    }

    /**
     * Returns the next dependency tree.
     *
     * @return the next tree, or {@code null} if there is no more tree. Note
     *         that {@code null} is also returned when an {@link IOException}
     *         occurs while reading; in that case the stack trace is printed
     *         to standard error.
     */
    @Override
    public DepTree nextTree() {
        DepTree tree = new DepTree();
        boolean isNext = false;

        try {
            isNext = appendNextTree(tree);
        } catch (IOException e) {
            // Best-effort: report the failure and fall through with
            // isNext == false, so the caller sees the same null it would
            // see at end of input.
            e.printStackTrace();
        }

        return isNext ? tree : null;
    }

    /**
     * Converts one delimited line into a dependency node.
     *
     * <p>The node id is taken from the first column of the line; the
     * {@code id} argument is not used by this implementation.
     *
     * @param line a single token line whose columns are separated by
     *        {@code FIELD_DELIM}
     * @param id unused; the id is parsed from the line itself
     * @return the node populated with id, form, lemma, pos, optional feats
     *         and, when training, head id and dependency label
     * @throws IllegalArgumentException if the line has fewer columns than
     *         this reader needs (6, or 8 when training)
     * @throws NumberFormatException if the id or head id column is not an
     *         integer
     */
    @Override
    protected DepNode toNode(String line, int id) {
        String[] fields = line.split(FIELD_DELIM);

        // Fail early with a message that identifies the bad line instead of
        // letting an index lookup below throw without any context.
        int required = (b_train ? COL_DEPREL : COL_FEATS) + 1;
        if (fields.length < required) {
            throw new IllegalArgumentException(
                    "Expected at least " + required + " fields but found "
                    + fields.length + " in line: \"" + line + "\"");
        }

        DepNode node = new DepNode();
        node.id = Integer.parseInt(fields[COL_ID]);
        node.form = fields[COL_FORM];
        node.lemma = fields[COL_LEMMA];
        node.pos = fields[COL_POS];

        // A blank marker means the token has no features; feats is left unset.
        if (!fields[COL_FEATS].equals(DepLib.FIELD_BLANK)) {
            node.feats = new DepFeat(fields[COL_FEATS]);
        }

        // Gold head and label are only read when training.
        if (b_train) {
            node.headId = Integer.parseInt(fields[COL_HEAD]);
            node.deprel = fields[COL_DEPREL];
        }

        return node;
    }
}