package joshua.discriminative.training.risk_annealer.hypergraph;

import java.io.BufferedReader;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
import java.util.logging.Level;
import java.util.logging.Logger;

import joshua.discriminative.FileUtilityOld;
import joshua.util.Regex;
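/**
 * Static configuration for hypergraph-based risk/annealing training.
 * All options are public static fields with defaults; {@link #readConfigFile(String)}
 * overrides them from a config file of key=value lines and performs basic sanity checks.
 */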
public class MRConfig {

  //=== general
  public static boolean oneTimeHGRerank = false;
  public static int maxNumIter = 5;
  public static boolean useSemiringV2 = true;
  public static int maxNumHGInQueue = 100;
  public static int numThreads = 4;
  public static boolean saveHGInMemory;

  //== disk hypergraph related
  public static int baselineLMOrder;
  public static int ngramStateID;

  //== first feature options
  public static boolean fixFirstFeature = true;
  public static boolean normalizeByFirstFeature = false;

  //=== options for not using annealing at all
  public static int annealingMode = 0; //0: no annealing; 1: quenching; 2: DA + quenching
  public static double temperatureAtNoAnnealing = 0;
  public static double startScaleAtNoAnnealing = 1;
  public static double gainFactor = 1.0; //argmax gainFactor*gain + T*Entropy
  public static boolean isMinimizer = false;

  public static boolean useL2Regula = false;
  public static double varianceForL2 = 1;
  public static boolean useModelDivergenceRegula = false;
  public static double lambda = -1;

  /*when we do not anneal, is the scaling factor a parameter in the tuning?*/
  public static boolean isScalingFactorTunable = false;

  //=== use Google linear corpus gain?
  public static boolean useGoogleLinearCorpusGain = false;
  public static double[] linearCorpusGainThetas = null;

  //======= feature related
  //public static boolean doFeatureFiltering;

  //== dense features
  public static boolean useBaseline;
  public static String baselineFeatureName;
  public static double baselineFeatureWeight = 1.0;

  public static boolean useIndividualBaselines;
  public static String individualBSFeatNamePrefix = "bs";
  public static List<Integer> baselineFeatIDsToTune;

  //== sparse features
  public static String featureFile;
  public static boolean useSparseFeature = false;

  public static boolean useTMFeat = false;
  public static boolean useRuleIDName = true;

  public static boolean useMicroTMFeat = true;
  public static String wordMapFile = null; /*table for mapping rule words*/

  public static int startTargetNgramOrder = 2;//TODO
  public static int endTargetNgramOrder = 2;//TODO

  public static boolean useTMTargetFeat = false;

  public static boolean useLMFeat;
  public static int startNgramOrder = 1;
  public static int endNgramOrder = 2;

  public static int printFirstN = 2;

  //== loss-augmented inference
  public static boolean lossAugmentedPrune = false;
  public static double startLossScale = 10;
  public static double lossDecreaseConstant = 1;

  //== nbest-based training
  public static boolean use_unique_nbest = false;
  public static boolean use_tree_nbest = false;
  public static int topN = 500;
  public static boolean use_kbest_hg = false;
  public static double stop_hyp_ratio = 1e-2; //stop when the ratio of newly generated hypotheses drops below this value
  public static int hyp_merge_mode = 2; //0: no merge; 1: merge without de-duplication; 2: merge with de-duplication

  private static final Logger logger =
      Logger.getLogger(MRConfig.class.getName());
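  /**
   * Reads training options from a config file. Each non-comment line is either a
   * "key=value" parameter or a model line of the form "discriminative weight modelFile"
   * (which sets {@link #featureFile}). Unknown keys are silently ignored.
   *
   * A hypothetical config fragment (the key names are those parsed below; the values
   * are illustrative only):
   * <pre>
   *   maxNumIter=10
   *   numThreads=4
   *   useSparseFeature=true
   *   useGoogleLinearCorpusGain=true
   *   googleBLEUWeights=-1;0.4;0.3;0.2;0.1
   * </pre>
   */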
  public static void readConfigFile(String configFile) {
    BufferedReader reader = FileUtilityOld.getReadFileStream(configFile);
    String line;
    while ((line = FileUtilityOld.readLineLzf(reader)) != null) {
      line = line.trim();
      // skip comments and empty lines
      if (line.matches("^\\s*\\#.*$") || line.matches("^\\s*$")) {
        continue;
      }

      if (line.indexOf("=") != -1) { // parameter lines: key=value
        String[] fds = Regex.equalsWithSpaces.split(line);
        if (fds.length != 2) {
          logger.severe("Wrong config line: " + line);
          System.exit(1);
        }

        if ("useGoogleLinearCorpusGain".equals(fds[0])) {
          useGoogleLinearCorpusGain = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useGoogleLinearCorpusGain: %s", useGoogleLinearCorpusGain));
        } else if ("googleBLEUWeights".equals(fds[0])) {
          String[] googleWeights = fds[1].trim().split(";");
          if (googleWeights.length != 5) {
            logger.severe("wrong line=" + line);
            System.exit(1);
          }
          linearCorpusGainThetas = new double[5];
          for (int i = 0; i < 5; i++)
            linearCorpusGainThetas[i] = Double.parseDouble(googleWeights[i]);
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("googleBLEUWeights: %s", Arrays.toString(linearCorpusGainThetas)));
        } else if ("lossAugmentedPrune".equals(fds[0])) {
          lossAugmentedPrune = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("lossAugmentedPrune: %s", lossAugmentedPrune));
        } else if ("startLossScale".equals(fds[0])) {
          startLossScale = Double.parseDouble(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("startLossScale: %s", startLossScale));
        } else if ("lossDecreaseConstant".equals(fds[0])) {
          lossDecreaseConstant = Double.parseDouble(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("lossDecreaseConstant: %s", lossDecreaseConstant));
        } else if ("oneTimeHGRerank".equals(fds[0])) {
          oneTimeHGRerank = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("oneTimeHGRerank: %s", oneTimeHGRerank));
        } else if ("annealingMode".equals(fds[0])) {
          annealingMode = Integer.parseInt(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("annealingMode: %s", annealingMode));
        } else if ("useL2Regula".equals(fds[0])) {
          useL2Regula = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useL2Regula: %s", useL2Regula));
        } else if ("varianceForL2".equals(fds[0])) {
          varianceForL2 = Double.parseDouble(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("varianceForL2: %s", varianceForL2));
        } else if ("useModelDivergenceRegula".equals(fds[0])) {
          useModelDivergenceRegula = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useModelDivergenceRegula: %s", useModelDivergenceRegula));
        } else if ("lambda".equals(fds[0])) {
          lambda = Double.parseDouble(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("lambda: %s", lambda));
        } else if ("isScalingFactorTunable".equals(fds[0])) {
          isScalingFactorTunable = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("isScalingFactorTunable: %s", isScalingFactorTunable));
        } else if ("maxNumIter".equals(fds[0])) {
          maxNumIter = Integer.parseInt(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("maxNumIter: %s", maxNumIter));
        } else if ("baselineLMOrder".equals(fds[0]) || "order".equals(fds[0])) {
          baselineLMOrder = Integer.parseInt(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("baselineLMOrder: %s", baselineLMOrder));
        } else if ("ngramStateID".equals(fds[0])) {
          ngramStateID = Integer.parseInt(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("ngramStateID: %s", ngramStateID));
        } /*else if ("doFeatureFiltering".equals(fds[0])) {
          doFeatureFiltering = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("doFeatureFiltering: %s", doFeatureFiltering));
        }*/ else if ("useBaseline".equals(fds[0])) {
          useBaseline = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useBaseline: %s", useBaseline));
        } else if ("baselineFeatureName".equals(fds[0])) {
          baselineFeatureName = fds[1].trim();
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("baselineFeatureName: %s", baselineFeatureName));
        } else if ("baselineFeatureWeight".equals(fds[0])) {
          baselineFeatureWeight = Double.parseDouble(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("baselineFeatureWeight: %s", baselineFeatureWeight));
        } else if ("useIndividualBaselines".equals(fds[0])) {
          useIndividualBaselines = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useIndividualBaselines: %s", useIndividualBaselines));
        } else if ("baselineFeatIDsToTune".equals(fds[0])) {
          String[] ids = fds[1].trim().split(";");
          baselineFeatIDsToTune = new ArrayList<Integer>();
          for (String id : ids) {
            baselineFeatIDsToTune.add(Integer.parseInt(id.trim()));
          }
          System.out.println(String.format("baselineFeatIDsToTune: %s", baselineFeatIDsToTune));
        } else if ("useSparseFeature".equals(fds[0])) {
          useSparseFeature = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useSparseFeature: %s", useSparseFeature));
        } else if ("wordMapFile".equals(fds[0])) {
          wordMapFile = fds[1].trim();
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("wordMapFile: %s", wordMapFile));
        } else if ("useTMFeat".equals(fds[0])) {
          useTMFeat = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useTMFeat: %s", useTMFeat));
        } else if ("useMicroTMFeat".equals(fds[0])) {
          useMicroTMFeat = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useMicroTMFeat: %s", useMicroTMFeat));
        } else if ("useRuleIDName".equals(fds[0])) {
          useRuleIDName = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useRuleIDName: %s", useRuleIDName));
        } else if ("useTMTargetFeat".equals(fds[0])) {
          useTMTargetFeat = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useTMTargetFeat: %s", useTMTargetFeat));
        } else if ("useLMFeat".equals(fds[0])) {
          useLMFeat = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useLMFeat: %s", useLMFeat));
        } else if ("startNgramOrder".equals(fds[0])) {
          startNgramOrder = Integer.parseInt(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("startNgramOrder: %s", startNgramOrder));
        } else if ("endNgramOrder".equals(fds[0])) {
          endNgramOrder = Integer.parseInt(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("endNgramOrder: %s", endNgramOrder));
        } else if ("saveHGInMemory".equals(fds[0])) {
          saveHGInMemory = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("saveHGInMemory: %s", saveHGInMemory));
        } else if ("fixFirstFeature".equals(fds[0])) {
          fixFirstFeature = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("fixFirstFeature: %s", fixFirstFeature));
        } else if ("useSemiringV2".equals(fds[0])) {
          useSemiringV2 = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("useSemiringV2: %s", useSemiringV2));
        } else if ("maxNumHGInQueue".equals(fds[0])) {
          maxNumHGInQueue = Integer.parseInt(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("maxNumHGInQueue: %s", maxNumHGInQueue));
        } else if ("numThreads".equals(fds[0])) {
          numThreads = Integer.parseInt(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("numThreads: %s", numThreads));
        } else if ("normalizeByFirstFeature".equals(fds[0])) {
          normalizeByFirstFeature = Boolean.parseBoolean(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("normalizeByFirstFeature: %s", normalizeByFirstFeature));
        } else if ("printFirstN".equals(fds[0])) {
          printFirstN = Integer.parseInt(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("printFirstN: %s", printFirstN));
        } else if ("use_unique_nbest".equals(fds[0])) {
          use_unique_nbest = Boolean.valueOf(fds[1]);
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("use_unique_nbest: %s", use_unique_nbest));
        } else if ("use_tree_nbest".equals(fds[0])) {
          use_tree_nbest = Boolean.valueOf(fds[1]);
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("use_tree_nbest: %s", use_tree_nbest));
        } else if ("top_n".equals(fds[0])) {
          topN = Integer.parseInt(fds[1]);
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("topN: %s", topN));
        } else if ("use_kbest_hg".equals(fds[0])) {
          use_kbest_hg = Boolean.valueOf(fds[1]);
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("use_kbest_hg: %s", use_kbest_hg));
        } else if ("hyp_merge_mode".equals(fds[0])) {
          hyp_merge_mode = Integer.parseInt(fds[1]);
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("hyp_merge_mode: %s", hyp_merge_mode));
        } else if ("stop_hyp_ratio".equals(fds[0])) {
          stop_hyp_ratio = Double.parseDouble(fds[1].trim());
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("stop_hyp_ratio: %s", stop_hyp_ratio));
        }
      } else { // model lines
        String[] fds = Regex.spaces.split(line);
        if ("discriminative".equals(fds[0]) && fds.length == 3) { // discriminative weight modelFile
          featureFile = fds[1].trim();
          if (logger.isLoggable(Level.FINEST))
            logger.finest(String.format("featureFile: %s", featureFile));
        }
      }
    }
    FileUtilityOld.closeReadFile(reader);

    /* Three supported training scenarios:
     * (1) individual baseline features only
     * (2) baseline combination feature + sparse features
     * (3) individual baseline features + sparse features
     */
    if (useIndividualBaselines && !useBaseline && !useSparseFeature) {
      logger.info("========== regular MERT scenario: tune only baseline features");
    } else if (!useIndividualBaselines && useBaseline && useSparseFeature) {
      logger.info("========== scenario: baselineCombo + sparseFeature");
    } else if (useIndividualBaselines && !useBaseline && useSparseFeature) {
      logger.info("========== scenario: individualBaselines + sparseFeature");
    } else {
      logger.info("==== wrong training scenario: unsupported combination of useIndividualBaselines, useBaseline, and useSparseFeature ====");
      System.exit(1);
    }

    if (useGoogleLinearCorpusGain) {
      if (linearCorpusGainThetas == null) {
        logger.info("linearCorpusGainThetas is null, did you set googleBLEUWeights properly?");
        System.exit(1);
      } else if (linearCorpusGainThetas.length != 5) {
        logger.info("linearCorpusGainThetas does not have five values, did you set googleBLEUWeights properly?");
        System.exit(1);
      }
    }

    if (oneTimeHGRerank && maxNumIter != 1) {
      logger.info("oneTimeHGRerank=true, but maxNumIter!=1");
      System.exit(1);
    }

    if (!use_kbest_hg && hyp_merge_mode == 2) {
      logger.warning("use_kbest_hg==false && hyp_merge_mode==2: cannot do dedup-merge for true hypergraph-based training; falling back to nbest merge, while still training on the hypergraph");
      //System.exit(1);
    }
  }
}