/**
* Copyright (c) 2010, Regents of the University of Colorado All rights
* reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are met:
*
* Redistributions of source code must retain the above copyright notice, this
* list of conditions and the following disclaimer. Redistributions in binary
* form must reproduce the above copyright notice, this list of conditions and
* the following disclaimer in the documentation and/or other materials provided
* with the distribution. Neither the name of the University of Colorado at
* Boulder nor the names of its contributors may be used to endorse or promote
* products derived from this software without specific prior written
* permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/
package clear.ftr.xml;
import java.io.InputStream;
import java.util.regex.Pattern;
import org.w3c.dom.Document;
/**
* Dependency feature template.
*
* @author Jinho D. Choi <b>Last update:</b> 4/12/2011
*/
public class DepFtrXml extends AbstractFtrXml {
static public final char LAMBDA = 'l';
static public final char BETA = 'b';
static public final String R_HD = "hd"; // head
static public final String R_LM = "lm"; // leftmost dependent
static public final String R_RM = "rm"; // rightmost dependent
static public final String R_LS = "ls"; // left sibling
static public final String R_RS = "rs"; // right sibling
static public final String R_VC = "vc"; // highest verb chain
static public final String F_FORM = "f";
static public final String F_LEMMA = "m";
static public final String F_POS = "p";
static public final String F_DEPREL = "d";
static public final Pattern P_REL = Pattern.compile(R_HD + "|" + R_LM + "|" + R_RM + "|" + R_LS + "|" + R_RS + "|" + R_VC);
static public final Pattern P_FIELD = Pattern.compile(F_FORM + "|" + F_LEMMA + "|" + F_POS + "|" + F_DEPREL);
static public final Pattern P_FEAT = Pattern.compile("^ft=(.+)$");
static public final Pattern P_TRANS = Pattern.compile("^tr(\\d+)$"); // transition
static public final Pattern P_KR = Pattern.compile("^kr(.)(\\d*)$");
public DepFtrXml(String featureXml) {
super(featureXml);
}
public DepFtrXml(InputStream fin) {
super(fin);
}
@Override
protected void initFeatures(Document doc) throws Exception {
}
@Override
protected boolean validSource(char token) {
return token == LAMBDA || token == BETA;
}
@Override
protected boolean validRelation(String relation) {
return P_REL.matcher(relation).matches();
}
@Override
protected boolean validField(String field) {
return P_FIELD.matcher(field).matches()
|| P_FEAT.matcher(field).matches()
|| P_TRANS.matcher(field).matches()
|| P_KR.matcher(field).matches();
}
}