/** * */ package vn.hus.nlp.tagger; /** * @author LE HONG Phuong, phuonglh@gmail.com * <p> * Jun 16, 2009, 12:01:30 PM * <p> * Some predefined constants for use in the tagger. */ public interface IConstants { /** * The default maxent model file of the Vietnamese tagger. */ public static String DEFAULT_MODEL_FILE = "resources/models/vtb.tagger"; // the experiment 1 (reported in the article) // public static String DEFAULT_MODEL_FILE = "experiments/fold1/left5words-vtb-1.tagger"; /** * The default properties file for training the tagger. */ // public static String DEFAULT_TRAINING_PROPERTIES = "data/conf/left3words-vtb-0.tagger.props"; // public static String DEFAULT_TRAINING_PROPERTIES = "data/conf/left3words-vtb-1.tagger.props"; // public static String DEFAULT_TRAINING_PROPERTIES = "data/conf/left5words-vtb-1.tagger.props"; // public static String DEFAULT_TRAINING_PROPERTIES = "data/conf/bidirectional5-vtb-1.tagger.props"; // public static String DEFAULT_TRAINING_PROPERTIES = "experiments/fold1/left5words-vtb-1.tagger.props"; // the experiment done with Stanford Maxent Tagger 2.0 public static String DEFAULT_TRAINING_PROPERTIES = "data/conf2/vnTagger.props"; /** * The delimiter between words and tags. */ public static final String DELIM = "/"; /** * The Vietnamese treebank file. */ public static String TREEBANK = "data/vtb-20091030.txt"; /** * The whole tagged corpus extracted from the Vietnamese treebank. */ public static String CORPUS = "data/vtb-20091030.tagged.txt"; /** * The training corpus. */ // public static String CORPUS_TRAINING = CORPUS; public static String CORPUS_TRAINING = "data/vtb-train.txt"; /** * The test corpus. */ public static String CORPUS_TEST = "data/vtb-test.txt"; }