package joshua.discriminative.training.risk_annealer.hypergraph;

import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry;
import java.util.logging.Logger;

import joshua.corpus.vocab.BuildinSymbol;
import joshua.corpus.vocab.SymbolTable;
import joshua.decoder.BLEU;
import joshua.decoder.JoshuaDecoder;
import joshua.decoder.ff.FeatureFunction;
import joshua.decoder.hypergraph.DiskHyperGraph;
import joshua.decoder.hypergraph.KBestExtractor;
import joshua.discriminative.FileUtilityOld;
import joshua.discriminative.feature_related.feature_function.FeatureTemplateBasedFF;
import joshua.discriminative.feature_related.feature_template.BaselineFT;
import joshua.discriminative.feature_related.feature_template.FeatureTemplate;
import joshua.discriminative.feature_related.feature_template.IndividualBaselineFT;
import joshua.discriminative.feature_related.feature_template.MicroRuleFT;
import joshua.discriminative.feature_related.feature_template.NgramFT;
import joshua.discriminative.feature_related.feature_template.TMFT;
import joshua.discriminative.feature_related.feature_template.TargetTMFT;
import joshua.discriminative.ranker.HGRanker;
import joshua.discriminative.training.NbestMerger;
import joshua.discriminative.training.risk_annealer.AbstractMinRiskMERT;
import joshua.discriminative.training.risk_annealer.DeterministicAnnealer;
import joshua.discriminative.training.risk_annealer.GradientComputer;
import joshua.discriminative.training.risk_annealer.nbest.NbestMinRiskDAMert;
import joshua.util.FileUtility;
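/**
 * Hypergraph-based minimum-risk training with deterministic annealing.
 *
 * <p>Each iteration of {@link #mainLoop()}: (i) saves the current weights (optionally normalized
 * by the first feature) into per-iteration config/feature files, (ii) re-decodes the training set
 * into hypergraphs (unless oneTimeHGRerank is set), (iii) optionally merges the new hypergraphs or
 * n-best lists with those of earlier iterations and stops once the fraction of new hypotheses
 * falls below stop_hyp_ratio, and (iv) re-estimates the weights by running the
 * {@link DeterministicAnnealer} over risk gradients computed on the (merged) hypergraphs.
 */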
public class HGMinRiskDAMert extends AbstractMinRiskMERT {

  JoshuaDecoder joshuaDecoder;
  String sourceTrainingFile;

  SymbolTable symbolTbl;

  List<FeatureTemplate> featTemplates;
  HashMap<String, Integer> featureStringToIntegerMap;

  MicroRuleFT microRuleFeatureTemplate = null;

  String hypFilePrefix; //training hypothesis file prefix
  String curConfigFile;
  String curFeatureFile;
  String curHypFilePrefix;

  boolean useIntegerString = false; //TODO
  boolean haveRefereces = true;

  int oldTotalNumHyp = 0;

  //== for loss-augmented pruning
  double curLossScale = 0;
  int oralceFeatureID = 0;

  static private Logger logger = Logger.getLogger(HGMinRiskDAMert.class.getSimpleName());

  public HGMinRiskDAMert(String configFile, int numSentInDevSet, String[] devRefs,
      String hypFilePrefix, SymbolTable symbolTbl, String sourceTrainingFile) {
    super(configFile, numSentInDevSet, devRefs);
    this.symbolTbl = symbolTbl;

    if (devRefs != null) {
      haveRefereces = true;
      for (String refFile : devRefs) {
        logger.info("add symbols for file " + refFile);
        addAllWordsIntoSymbolTbl(refFile, symbolTbl);
      }
    } else {
      haveRefereces = false;
    }

    this.initialize();

    this.hypFilePrefix = hypFilePrefix;
    this.sourceTrainingFile = sourceTrainingFile;

    if (MRConfig.oneTimeHGRerank == false) {
      joshuaDecoder = JoshuaDecoder.getUninitalizedDecoder();
      joshuaDecoder.initialize(configFile);
    }

    //oracle id-related
    Integer id = inferOracleFeatureID(this.configFile);
    if (id != null && MRConfig.lossAugmentedPrune == false) {
      logger.severe("lossAugmentedPrune=false, but an oracle model is specified");
      System.exit(1);
    }

    if (MRConfig.lossAugmentedPrune == true) {
      if (id == null) {
        logger.severe("no oracle model while doing loss-augmented pruning, must be wrong");
        System.exit(1);
      } else {
        this.oralceFeatureID = id;
      }
      this.curLossScale = MRConfig.startLossScale;
      logger.info("startLossScale=" + MRConfig.startLossScale + "; oracleFeatureID=" + this.oralceFeatureID);
    }

    if (haveRefereces == false) { //minimize conditional entropy
      MRConfig.temperatureAtNoAnnealing = 1; //TODO
    } else {
      if (MRConfig.useModelDivergenceRegula) {
        System.out.println("supervised training, we should not use model divergence regularization");
        System.exit(0);
      }
    }
  }
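  // Per-iteration artifacts are named by appending the iteration number to the template files;
  // with a config "joshua.config", feature file "features", and hyp prefix "hyp" (illustrative
  // names only), iteration 1 would produce:
  //   joshua.config.1, features.1      -- model saved by saveLastModel()
  //   hyp.1.hg.items, hyp.1.hg.rules   -- hypergraphs written by the re-decoding step
  //   hyp.merged.1                     -- hypergraphs/n-best merged across iterations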
  public void mainLoop() {
    /** Here, we need multiple iterations as we do pruning when generating the hypergraphs.
     * Note that the DeterministicAnnealer itself may need to solve an optimization problem at
     * each temperature, and each optimization is solved by LBFGS, which itself involves many
     * iterations (of computing gradients).
     */
    for (int iter = 1; iter <= MRConfig.maxNumIter; iter++) {

      //==== re-normalize weights, and save config files
      this.curConfigFile = configFile + "." + iter;
      this.curFeatureFile = MRConfig.featureFile + "." + iter;
      if (MRConfig.normalizeByFirstFeature)
        normalizeWeightsByFirstFeature(lastWeightVector, 0);
      saveLastModel(configFile, curConfigFile, MRConfig.featureFile, curFeatureFile);
      //writeConfigFile(lastWeightVector, configFile, configFile+"." + iter);

      //==== re-decode based on the new weights
      if (MRConfig.oneTimeHGRerank) {
        this.curHypFilePrefix = hypFilePrefix;
      } else {
        this.curHypFilePrefix = hypFilePrefix + "." + iter;
        decodingTestSet(null, curHypFilePrefix);
      }

      //==== merge hypergraphs and check convergence
      if (MRConfig.hyp_merge_mode > 0) {
        try {
          String oldMergedFile = hypFilePrefix + ".merged." + (iter - 1);
          String newMergedFile = hypFilePrefix + ".merged." + (iter);
          int newTotalNumHyp = 0;

          if (MRConfig.use_kbest_hg == false && MRConfig.hyp_merge_mode == 2) {
            System.out.println("use_kbest_hg==false && hyp_merge_mode==2; we will look at the nbest");
            if (iter == 1) {
              FileUtility.copyFile(curHypFilePrefix, newMergedFile);
              newTotalNumHyp = FileUtilityOld.numberLinesInFile(newMergedFile);
            } else {
              newTotalNumHyp = NbestMerger.mergeNbest(oldMergedFile, curHypFilePrefix, newMergedFile);
            }
          } else {
            if (iter == 1) {
              FileUtility.copyFile(curHypFilePrefix + ".hg.items", newMergedFile + ".hg.items");
              FileUtility.copyFile(curHypFilePrefix + ".hg.rules", newMergedFile + ".hg.rules");
            } else {
              boolean saveModelCosts = true;
              /** TODO: this assumes that the feature values for the same hypothesis do not change,
               * though the weights for these features can change. In particular, this means we
               * cannot tune the weight of the aggregate discriminative model while we are tuning
               * the individual discriminative features. This is also true for the bestHyperEdge pointer.
               */
              newTotalNumHyp = DiskHyperGraph.mergeDiskHyperGraphs(MRConfig.ngramStateID, saveModelCosts,
                  this.numTrainingSentence, MRConfig.use_unique_nbest, MRConfig.use_tree_nbest,
                  oldMergedFile, curHypFilePrefix, newMergedFile, (MRConfig.hyp_merge_mode == 2));
            }
            this.curHypFilePrefix = newMergedFile;
          }

          //check convergence
          double newRatio = (newTotalNumHyp - oldTotalNumHyp) * 1.0 / oldTotalNumHyp;
          if (iter <= 2 || newRatio > MRConfig.stop_hyp_ratio) {
            System.out.println("oldTotalNumHyp=" + oldTotalNumHyp + "; newTotalNumHyp=" + newTotalNumHyp
                + "; newRatio=" + newRatio + "; at iteration " + iter);
            oldTotalNumHyp = newTotalNumHyp;
          } else {
            System.out.println("No new hypotheses generated at iteration " + iter
                + " for stop_hyp_ratio=" + MRConfig.stop_hyp_ratio);
            break;
          }
        } catch (IOException e) {
          e.printStackTrace();
        }
      }

      Map<String, Integer> ruleStringToIDTable = DiskHyperGraph.obtainRuleStringToIDTable(curHypFilePrefix + ".hg.rules");

      //try to abbreviate the features if possible
      addAbbreviatedNames(ruleStringToIDTable);

      //micro rule features
      if (MRConfig.useSparseFeature && MRConfig.useMicroTMFeat) {
        this.microRuleFeatureTemplate.setupTbl(ruleStringToIDTable, featureStringToIntegerMap.keySet());
      }

      //===== compute onebest BLEU
      computeOneBestBLEU(curHypFilePrefix);

      //==== run the DA annealer to obtain the optimal weight vector, using the hypergraphs as training data
      HyperGraphFactory hgFactory = new HyperGraphFactory(curHypFilePrefix, referenceFiles,
          MRConfig.ngramStateID, symbolTbl, this.haveRefereces);
      GradientComputer gradientComputer = new HGRiskGradientComputer(MRConfig.useSemiringV2,
          numTrainingSentence, numPara, MRConfig.gainFactor, 1.0, 0.0, true,
          MRConfig.fixFirstFeature, hgFactory,
          MRConfig.maxNumHGInQueue, MRConfig.numThreads,
          MRConfig.ngramStateID, MRConfig.baselineLMOrder, symbolTbl,
          featureStringToIntegerMap, featTemplates,
          MRConfig.linearCorpusGainThetas, this.haveRefereces);

      annealer = new DeterministicAnnealer(numPara, lastWeightVector, MRConfig.isMinimizer, gradientComputer,
          MRConfig.useL2Regula, MRConfig.varianceForL2,
          MRConfig.useModelDivergenceRegula, MRConfig.lambda, MRConfig.printFirstN);

      if (MRConfig.annealingMode == 0) //do not anneal
        lastWeightVector = annealer.runWithoutAnnealing(MRConfig.isScalingFactorTunable,
            MRConfig.startScaleAtNoAnnealing, MRConfig.temperatureAtNoAnnealing);
      else if (MRConfig.annealingMode == 1)
        lastWeightVector = annealer.runQuenching(1.0);
      else if (MRConfig.annealingMode == 2)
        lastWeightVector = annealer.runDAAndQuenching();
      else {
        logger.severe("unsupported annealing mode, " + MRConfig.annealingMode);
        System.exit(0);
      }

      //===== re-compute onebest BLEU
      if (MRConfig.normalizeByFirstFeature)
        normalizeWeightsByFirstFeature(lastWeightVector, 0);
      computeOneBestBLEU(curHypFilePrefix);

      //@todo: check convergence

      //@todo: delete files
      if (false) {
        FileUtility.deleteFile(this.curHypFilePrefix + ".hg.items");
        FileUtility.deleteFile(this.curHypFilePrefix + ".hg.rules");
      }

      if (MRConfig.lossAugmentedPrune) {
        this.curLossScale -= MRConfig.lossDecreaseConstant;
        if (this.curLossScale <= 0)
          this.curLossScale = 0;
      }
    }

    //final output
    if (MRConfig.normalizeByFirstFeature)
      normalizeWeightsByFirstFeature(lastWeightVector, 0);
    saveLastModel(configFile, configFile + ".final", MRConfig.featureFile, MRConfig.featureFile + ".final");
    //writeConfigFile(lastWeightVector, configFile, configFile+".final");

    //System.out.println("#### Final weights are: ");
    //annealer.getLBFGSRunner().printStatistics(-1, -1, null, lastWeightVector);
  }

  public void decodingTestSet(double[] weights, String hypFilePrefix) {
    /** three scenarios:
     * (1) individual baseline features
     * (2) baselineCombo + sparse features
     * (3) individual baseline features + sparse features
     */
    if (MRConfig.useSparseFeature)
      joshuaDecoder.changeFeatureWeightVector(getIndividualBaselineWeights(), this.curFeatureFile);
    else
      joshuaDecoder.changeFeatureWeightVector(getIndividualBaselineWeights(), null);

    //call the Joshua decoder to produce a hypergraph using the new weight vector
    joshuaDecoder.decodeTestSet(sourceTrainingFile, hypFilePrefix);
  }
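  /**
   * Reranks each training hypergraph with the current weight vector and prints the average
   * one-best model score, sentence-level BLEU, and linear corpus (Google) gain, so progress can
   * be monitored before and after each optimization round. Does nothing when no references are
   * available.
   */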
  private void computeOneBestBLEU(String curHypFilePrefix) {
    if (this.haveRefereces == false)
      return;

    double bleuSum = 0;
    double googleGainSum = 0;
    double modelSum = 0;

    //==== feature function based on the feature templates
    int featID = 999;
    double weight = 1.0;
    HashSet<String> restrictedFeatureSet = null;
    HashMap<String, Double> modelTbl = obtainModelTable(this.featureStringToIntegerMap, this.lastWeightVector);
    //System.out.println("modelTable: " + modelTbl);
    FeatureFunction ff = new FeatureTemplateBasedFF(featID, weight, modelTbl, this.featTemplates, restrictedFeatureSet);

    //==== reranker
    List<FeatureFunction> features = new ArrayList<FeatureFunction>();
    features.add(ff);
    HGRanker reranker = new HGRanker(features);

    //==== kbest
    boolean addCombinedCost = false;
    KBestExtractor kbestExtractor = new KBestExtractor(symbolTbl, MRConfig.use_unique_nbest,
        MRConfig.use_tree_nbest, false, addCombinedCost, false, true);

    //==== loop
    HyperGraphFactory hgFactory = new HyperGraphFactory(curHypFilePrefix, referenceFiles,
        MRConfig.ngramStateID, symbolTbl, true);
    hgFactory.startLoop();
    for (int sentID = 0; sentID < this.numTrainingSentence; sentID++) {
      HGAndReferences res = hgFactory.nextHG();
      reranker.rankHG(res.hg); //reset the best pointer and the transition prob

      String hypSent = kbestExtractor.getKthHyp(res.hg.goalNode, 1, -1, null, null);
      double bleu = BLEU.computeSentenceBleu(res.referenceSentences, hypSent);
      bleuSum += bleu;

      double googleGain = BLEU.computeLinearCorpusGain(MRConfig.linearCorpusGainThetas, res.referenceSentences, hypSent);
      googleGainSum += googleGain;

      modelSum += res.hg.bestLogP();
      //System.out.println("logP=" + res.hg.bestLogP() + "; Bleu=" + bleu + "; googleGain=" + googleGain);
    }
    hgFactory.endLoop();

    System.out.println("AvgLogP=" + modelSum / this.numTrainingSentence
        + "; AvgBleu=" + bleuSum / this.numTrainingSentence
        + "; AvgGoogleGain=" + googleGainSum / this.numTrainingSentence
        + "; SumGoogleGain=" + googleGainSum);
  }

  public void saveLastModel(String configTemplate, String configOutput,
      String sparseFeaturesTemplate, String sparseFeaturesOutput) {
    if (MRConfig.useSparseFeature) {
      JoshuaDecoder.writeConfigFile(getIndividualBaselineWeights(), configTemplate, configOutput, sparseFeaturesOutput);
      saveSparseFeatureFile(sparseFeaturesTemplate, sparseFeaturesOutput);
    } else {
      JoshuaDecoder.writeConfigFile(getIndividualBaselineWeights(), configTemplate, configOutput, null);
    }
  }

  private void initialize() {
    //===== read configurations
    MRConfig.readConfigFile(this.configFile);

    //===== initialize googleCorpusBLEU
    if (MRConfig.useGoogleLinearCorpusGain == true) {
      //do nothing
    } else {
      logger.severe("For hypergraph-based training, we must use the linear corpus gain.");
      System.exit(1);
    }

    //===== initialize the featureTemplates
    setupFeatureTemplates();

    //====== initialize featureStringToIntegerMap and weights
    initFeatureMapAndWeights(MRConfig.featureFile);
  }

  //TODO: should merge with setupFeatureTemplates in HGMinRiskDAMert
  private void setupFeatureTemplates() {

    this.featTemplates = new ArrayList<FeatureTemplate>();

    if (MRConfig.useBaseline) {
      FeatureTemplate ft = new BaselineFT(MRConfig.baselineFeatureName, true);
      featTemplates.add(ft);
    }

    if (MRConfig.useIndividualBaselines) {
      for (int id : MRConfig.baselineFeatIDsToTune) {
        String featName = MRConfig.individualBSFeatNamePrefix + id;
        FeatureTemplate ft = new IndividualBaselineFT(featName, id, true);
        featTemplates.add(ft);
      }
    }

    if (MRConfig.useSparseFeature) {
      if (MRConfig.useMicroTMFeat) {
        //FeatureTemplate ft = new TMFT(symbolTbl, useIntegerString, MRConfig.useRuleIDName);
        this.microRuleFeatureTemplate = new MicroRuleFT(MRConfig.useRuleIDName,
            MRConfig.startTargetNgramOrder, MRConfig.endTargetNgramOrder, MRConfig.wordMapFile);
        featTemplates.add(microRuleFeatureTemplate);
      }

      if (MRConfig.useTMFeat) {
        FeatureTemplate ft = new TMFT(symbolTbl, useIntegerString, MRConfig.useRuleIDName);
        featTemplates.add(ft);
      }

      if (MRConfig.useTMTargetFeat) {
        FeatureTemplate ft = new TargetTMFT(symbolTbl, useIntegerString);
        featTemplates.add(ft);
      }

      if (MRConfig.useLMFeat) {
        FeatureTemplate ft = new NgramFT(symbolTbl, useIntegerString, MRConfig.ngramStateID,
            MRConfig.baselineLMOrder, MRConfig.startNgramOrder, MRConfig.endNgramOrder);
        featTemplates.add(ft);
      }
    }

    System.out.println("feature templates are " + featTemplates.toString());
  }
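  // The sparse feature file has one feature per line in the form "feature_key ||| initial_weight",
  // where the key itself may contain "|||". A purely hypothetical example:
  //   glue_rule ||| 0.5
  //   target_ngram ||| the cat ||| -0.2
  // Feature IDs are assigned in reading order, continuing after the baseline feature entries.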
  //read the feature map into featureStringToIntegerMap
  //TODO: we assume the featureID is the line ID (starting from zero)
  private void initFeatureMapAndWeights(String featureFile) {

    featureStringToIntegerMap = new HashMap<String, Integer>();
    List<Double> temInitWeights = new ArrayList<Double>();
    int featID = 0;

    //==== baseline feature
    if (MRConfig.useBaseline) {
      featureStringToIntegerMap.put(MRConfig.baselineFeatureName, featID++);
      temInitWeights.add(MRConfig.baselineFeatureWeight);
    }

    //==== individual baseline features
    if (MRConfig.useIndividualBaselines) {
      List<Double> weights = readBaselineFeatureWeights(this.configFile);
      for (int id : MRConfig.baselineFeatIDsToTune) {
        String featName = MRConfig.individualBSFeatNamePrefix + id;
        featureStringToIntegerMap.put(featName, featID++);
        double weight = weights.get(id);
        temInitWeights.add(weight);
      }
    }

    //==== features in the file
    if (MRConfig.useSparseFeature) {
      BufferedReader reader = FileUtilityOld.getReadFileStream(featureFile, "UTF-8");
      String line;
      while ((line = FileUtilityOld.readLineLzf(reader)) != null) {
        //feature_key ||| feature value; the feature_key itself may contain "|||"
        String[] fds = line.split("\\s+\\|{3}\\s+");
        StringBuffer featKey = new StringBuffer();
        for (int i = 0; i < fds.length - 1; i++) {
          featKey.append(fds[i]);
          if (i < fds.length - 2)
            featKey.append(" ||| ");
        }
        double initWeight = new Double(fds[fds.length - 1]); //initial weight
        temInitWeights.add(initWeight);
        featureStringToIntegerMap.put(featKey.toString(), featID++);
      }
      FileUtilityOld.closeReadFile(reader);
    }

    //==== initialize lastWeightVector
    numPara = temInitWeights.size();
    lastWeightVector = new double[numPara];
    for (int i = 0; i < numPara; i++)
      lastWeightVector[i] = temInitWeights.get(i);
  }
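  /**
   * Maps the tuned weights back onto the decoder's dense baseline weight vector: each baseline
   * feature listed in baselineFeatIDsToTune receives its tuned weight (scaled by the aggregate
   * baseline weight when useBaseline is on), and under loss-augmented pruning the oracle feature
   * is set to the current loss scale.
   */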
  private double[] getIndividualBaselineWeights() {

    double baselineWeight = 1.0;
    if (MRConfig.useBaseline)
      baselineWeight = getBaselineWeight();

    List<Double> weights = readBaselineFeatureWeights(this.configFile);

    //change the weights we are tuning
    if (MRConfig.useIndividualBaselines) {
      for (int id : MRConfig.baselineFeatIDsToTune) {
        String featName = MRConfig.individualBSFeatNamePrefix + id;
        int featID = featureStringToIntegerMap.get(featName);
        weights.set(id, baselineWeight * lastWeightVector[featID]);
      }
    }

    if (MRConfig.lossAugmentedPrune) {
      String featName = MRConfig.individualBSFeatNamePrefix + this.oralceFeatureID;
      if (featureStringToIntegerMap.containsKey(featName)) {
        logger.severe("we are tuning the oracle model, must be wrong in specifying baselineFeatIDsToTune");
        System.exit(1);
      }
      weights.set(this.oralceFeatureID, this.curLossScale);
      System.out.println("curLossScale=" + this.curLossScale + "; oracleFeatureID=" + this.oralceFeatureID);
    }

    double[] res = new double[weights.size()];
    for (int i = 0; i < res.length; i++)
      res[i] = weights.get(i);
    return res;
  }

  private double getBaselineWeight() {
    String featName = MRConfig.baselineFeatureName;
    int featID = featureStringToIntegerMap.get(featName);
    double weight = lastWeightVector[featID];
    System.out.println("baseline weight is " + weight);
    return weight;
  }

  private void saveSparseFeatureFile(String fileTemplate, String outputFile) {
    BufferedReader template = FileUtilityOld.getReadFileStream(fileTemplate, "UTF-8");
    BufferedWriter writer = FileUtilityOld.getWriteFileStream(outputFile);
    String line;
    while ((line = FileUtilityOld.readLineLzf(template)) != null) {

      //== construct the feature name
      //feature_key ||| feature value; the feature_key itself may contain "|||"
      String[] fds = line.split("\\s+\\|{3}\\s+");
      StringBuffer featKey = new StringBuffer();
      for (int i = 0; i < fds.length - 1; i++) {
        featKey.append(fds[i]);
        if (i < fds.length - 2)
          featKey.append(" ||| ");
      }

      //== write the learnt weight
      //double oldWeight = new Double(fds[fds.length-1]); //initial weight
      int featID = featureStringToIntegerMap.get(featKey.toString());
      double newWeight = lastWeightVector[featID]; //last model
      //System.out.println(featKey + "; old=" + oldWeight + "; new=" + newWeight);
      FileUtilityOld.writeLzf(writer, featKey.toString() + " ||| " + newWeight + "\n");

      featID++;
    }
    FileUtilityOld.closeReadFile(template);
    FileUtilityOld.closeWriteFile(writer);
  }

  private HashMap<String, Double> obtainModelTable(HashMap<String, Integer> featureStringToIntegerMap, double[] weightVector) {
    HashMap<String, Double> modelTbl = new HashMap<String, Double>();
    for (Map.Entry<String, Integer> entry : featureStringToIntegerMap.entrySet()) {
      int featID = entry.getValue();
      double weight = lastWeightVector[featID]; //last model
      modelTbl.put(entry.getKey(), weight);
    }
    return modelTbl;
  }

  private void addAbbreviatedNames(Map<String, Integer> rulesIDTable) {
    //try to abbreviate the features if possible
    if (MRConfig.useRuleIDName) {
      //add the abbreviated feature name into featureStringToIntegerMap
      //System.out.println("size1=" + featureStringToIntegerMap.size());
      for (Entry<String, Integer> entry : rulesIDTable.entrySet()) {
        Integer featureID = featureStringToIntegerMap.get(entry.getKey());
        if (featureID != null) {
          String abbrFeatName = "r" + entry.getValue(); //TODO??????
          featureStringToIntegerMap.put(abbrFeatName, featureID);
          //System.out.println("full=" + entry.getKey() + "; abbrFeatName=" + abbrFeatName + "; id=" + featureID);
        }
      }
      //System.out.println("size2=" + featureStringToIntegerMap);
      //System.exit(0);
    }
  }

  static public void addAllWordsIntoSymbolTbl(String file, SymbolTable symbolTbl) {
    BufferedReader reader = FileUtilityOld.getReadFileStream(file, "UTF-8");
    String line;
    while ((line = FileUtilityOld.readLineLzf(reader)) != null) {
      symbolTbl.addTerminals(line);
    }
    FileUtilityOld.closeReadFile(reader);
  }
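  /**
   * Command line (a sketch; the file names are placeholders):
   * <pre>
   *   java joshua.discriminative.training.risk_annealer.hypergraph.HGMinRiskDAMert \
   *       joshua.config dev.src hyp.prefix [dev.ref.0 dev.ref.1 ...]
   * </pre>
   * If no reference files are given, training runs in the unsupervised (conditional-entropy)
   * setting.
   */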
  public static void main(String[] args) {

    /*String f_joshua_config="C:/data_disk/java_work_space/discriminative_at_clsp/edu/jhu/joshua/discriminative_training/lbfgs/example.config.javalm";
    String f_dev_src="C:/data_disk/java_work_space/sf_trunk/example/example.test.in";
    String f_nbest_prefix="C:/data_disk/java_work_space/discriminative_at_clsp/edu/jhu/joshua/discriminative_training/lbfgs/example.nbest.javalm.out";
    String f_dev_ref="C:/data_disk/java_work_space/sf_trunk/example/example.test.ref.0";
    */

    if (args.length < 3) {
      System.out.println("Wrong number of parameters!");
      System.exit(1);
    }

    //long start_time = System.currentTimeMillis();
    String joshuaConfigFile = args[0].trim();
    String sourceTrainingFile = args[1].trim();
    String hypFilePrefix = args[2].trim();

    String[] devRefs = null;
    if (args.length > 3) {
      devRefs = new String[args.length - 3];
      for (int i = 3; i < args.length; i++) {
        devRefs[i - 3] = args[i].trim();
        System.out.println("Use ref file " + devRefs[i - 3]);
      }
    }

    SymbolTable symbolTbl = new BuildinSymbol(null);

    int numSentInDevSet = FileUtilityOld.numberLinesInFile(sourceTrainingFile);

    HGMinRiskDAMert trainer = new HGMinRiskDAMert(joshuaConfigFile, numSentInDevSet, devRefs,
        hypFilePrefix, symbolTbl, sourceTrainingFile);

    trainer.mainLoop();
  }
}