src/joshua/decoder/ff/tm/Rule.java - joshua - Git at Google

 package joshua.decoder.ff.tm;

 import java.util.Arrays;
 import java.util.Comparator;
 import java.util.List;
 import java.util.StringTokenizer;
 import java.util.regex.Pattern;

 import joshua.corpus.Vocabulary;
 import joshua.decoder.Decoder;
 import joshua.decoder.ff.FeatureFunction;
 import joshua.decoder.ff.FeatureVector;
 import joshua.decoder.segment_file.Sentence;

 /**
  * This class define the interface for Rule.
  *
  * All feature scores are interpreted as negative log probabilities, and are therefore negated.
  * Note that not all features need to be negative log probs, but you should be aware that they
  * will be negated, so if you want a positive count, it should come in as negative.
  *
  * @author Zhifei Li, <zhifei.work@gmail.com>
  */


 /**
  * Normally, the feature score in the rule should be *cost* (i.e., -LogP), so that the feature
  * weight should be positive
  *
  * @author Zhifei Li, <zhifei.work@gmail.com>
  * @author Matt Post <post@cs.jhu.edu>
  */
 public class Rule implements Comparator<Rule>, Comparable<Rule> {

   private int lhs; // tag of this rule
   private int[] pFrench; // pointer to the RuleCollection, as all the rules under it share the same
                          // Source side
   protected int arity;

   // And a string containing the sparse ones
   protected FeatureVector features = null;
   protected String sparseFeatureString;

   /*
    * a feature function will be fired for this rule only if the owner of the rule matches the owner
    * of the feature function
    */
   private int owner = -1;

   /**
    * This is the cost computed only from the features present with the grammar rule. This cost is
    * needed to sort the rules in the grammar for cube pruning, but isn't the full cost of applying
    * the rule (which will include contextual features that can't be computed until the rule is
    * applied).
    */
   private float estimatedCost = Float.NEGATIVE_INFINITY;

   private float precomputableCost = Float.NEGATIVE_INFINITY;

   private int[] english;

   // The alignment string, e.g., 0-0 0-1 1-1 2-1
   private String alignmentString;
   protected byte[] alignment = null;

   /**
    * Constructs a new rule using the provided parameters. The owner and rule id for this rule are
    * undefined. Note that some of the sparse features may be unlabeled, but they cannot be mapped to
    * their default names ("tm_OWNER_INDEX") until later, when we know the owner of the rule. This is
    * not known until the rule is actually added to a grammar in Grammar::addRule().
    *
    * @param lhs Left-hand side of the rule.
    * @param sourceRhs Source language right-hand side of the rule.
    * @param targetRhs Target language right-hand side of the rule.
    * @param sparseFeatures Feature value scores for the rule.
    * @param arity Number of nonterminals in the source language right-hand side.
    * @param owner
    */
   public Rule(int lhs, int[] sourceRhs, int[] targetRhs, String sparseFeatures, int arity,
       int owner) {
     this.lhs = lhs;
     this.pFrench = sourceRhs;
     this.sparseFeatureString = sparseFeatures;
     this.arity = arity;
     this.owner = owner;
     this.english = targetRhs;
   }

   // Sparse feature version
   public Rule(int lhs, int[] sourceRhs, int[] targetRhs, String sparseFeatures, int arity) {
     this.lhs = lhs;
     this.pFrench = sourceRhs;
     this.sparseFeatureString = sparseFeatures;
     this.arity = arity;
     this.owner = -1;
     this.english = targetRhs;
   }

   public Rule(int lhs, int[] sourceRhs, int[] targetRhs, String sparseFeatures, int arity, String alignment) {
     this(lhs, sourceRhs, targetRhs, sparseFeatures, arity);
     this.alignmentString = alignment;
   }

   public Rule() {
     this.lhs = -1;
   }

   // ===============================================================
   // Attributes
   // ===============================================================

   public void setEnglish(int[] eng) {
     this.english = eng;
   }

   public int[] getEnglish() {
     return this.english;
   }

   /**
    * Two Rules are equal of they have the same LHS, the same source RHS and the same target
    * RHS.
    *
    * @param o the object to check for equality
    * @return true if o is the same Rule as this rule, false otherwise
    */
   public boolean equals(Object o) {
     if (!(o instanceof Rule)) {
       return false;
     }
     Rule other = (Rule) o;
     if (getLHS() != other.getLHS()) {
       return false;
     }
     if (!Arrays.equals(getFrench(), other.getFrench())) {
       return false;
     }
     if (!Arrays.equals(english, other.getEnglish())) {
       return false;
     }
     return true;
   }

   public int hashCode() {
     // I just made this up. If two rules are equal they'll have the
     // same hashcode. Maybe someone else can do a better job though?
     int frHash = Arrays.hashCode(getFrench());
     int enHash = Arrays.hashCode(english);
     return frHash ^ enHash ^ getLHS();
   }

   // ===============================================================
   // Attributes
   // ===============================================================

   public void setArity(int arity) {
     this.arity = arity;
   }

   public int getArity() {
     return this.arity;
   }

   public void setOwner(int owner) {
     this.owner = owner;
   }

   public int getOwner() {
     return this.owner;
   }

   public void setLHS(int lhs) {
     this.lhs = lhs;
   }

   public int getLHS() {
     return this.lhs;
   }

   public void setFrench(int[] french) {
     this.pFrench = french;
   }

   public int[] getFrench() {
     return this.pFrench;
   }

   /**
    * This function does the work of turning the string version of the sparse features (passed in
    * when the rule was created) into an actual set of features. This is a bit complicated because we
    * support intermingled labeled and unlabeled features, where the unlabeled features are mapped to
    * a default name template of the form "tm_OWNER_INDEX".
    *
    * This function returns the dense (phrasal) features discovered when the rule was loaded. Dense
    * features are the list of unlabeled features that preceded labeled ones. They can also be
    * specified as labeled features of the form "tm_OWNER_INDEX", but the former format is preferred.
    */
   public FeatureVector getFeatureVector() {
     /*
      * Now read the feature scores, which can be any number of dense features and sparse features.
      * Any unlabeled feature becomes a dense feature. By convention, dense features should precede
      * sparse (labeled) ones, but it's not required.
      */

     if (features == null)
       features = (owner != -1)
         ? new FeatureVector(getFeatureString(), "tm_" + Vocabulary.word(owner) + "_")
         : new FeatureVector();

     return features;
   }

   /**
    * This function returns the estimated cost of a rule, which should have been computed when the
    * grammar was first sorted via a call to Rule::estimateRuleCost(). This function is a getter
    * only; it will not compute the value if it has not already been set. It is necessary in addition
    * to estimateRuleCost(models) because sometimes the value needs to be retrieved from contexts
    * that do not have access to the feature functions.
    *
    * This function is called by the rule comparator when sorting the grammar. As such it may be
    * called many times and any implementation of it should be a cached implementation.
    *
    * @return the estimated cost of the rule (a lower bound on the true cost)
    */
   public float getEstimatedCost() {
     return estimatedCost;
   }

   /**
    * Precomputable costs is the inner product of the weights found on each grammar rule and the
    * weight vector. This is slightly different from the estimated rule cost, which can include other
    * features (such as a language model estimate). This getter and setter should also be cached, and
    * is basically provided to allow the PhraseModel feature to cache its (expensive) computation for
    * each rule.
    *
    * @return the precomputable cost of each rule
    */
   public float getPrecomputableCost() {
     return precomputableCost;
   }

   public float getDenseFeature(int k) {
     return getFeatureVector().getDense(k);
   }

   public void setPrecomputableCost(float[] phrase_weights, FeatureVector weights) {
     float cost = 0.0f;

 //    System.err.println(String.format("// Setting precomputable cost for for %s/%s", getEnglishWords(), getFrenchWords()));
     FeatureVector features = getFeatureVector();
     for (int i = 0; i < features.getDenseFeatures().size() && i < phrase_weights.length; i++) {
 //      System.err.println(String.format("    %d -> %.5f", i, features.get(i)));
       cost += phrase_weights[i] * features.getDense(i);
     }

     for (String key: features.getSparseFeatures().keySet()) {
 //      System.err.println(String.format("    %s -> %.5f", key, features.get(key)));
       cost += weights.getSparse(key) * features.getSparse(key);
     }

 //    System.err.println(String.format("-> %f", cost));

     this.precomputableCost = cost;
   }

   /**
    * This function estimates the cost of a rule, which is used for sorting the rules for cube
    * pruning. The estimated cost is basically the set of precomputable features (features listed
    * along with the rule in the grammar file) along with any other estimates that other features
    * would like to contribute (e.g., a language model estimate). This cost will be a lower bound on
    * the rule's actual cost.
    *
    * The value of this function is used only for sorting the rules. When the rule is later applied
    * in context to particular hypernodes, the rule's actual cost is computed.
    *
    * @param models the list of models available to the decoder
    * @return estimated cost of the rule
    */
   public float estimateRuleCost(List<FeatureFunction> models) {
     if (null == models)
       return 0.0f;

     if (this.estimatedCost <= Float.NEGATIVE_INFINITY) {
       this.estimatedCost = 0.0f; // weights.innerProduct(computeFeatures());

       if (Decoder.VERBOSE >= 4)
         System.err.println(String.format("estimateCost(%s ;; %s)", getFrenchWords(), getEnglishWords()));
       for (FeatureFunction ff : models) {
         float val = ff.estimateCost(this, null);
         if (Decoder.VERBOSE >= 4)
           System.err.println(String.format("  FEATURE %s -> %.3f", ff.getName(), val));
         this.estimatedCost += val;
       }
     }

     return estimatedCost;
   }

   // ===============================================================
   // Methods
   // ===============================================================

   public String toString() {
     StringBuffer sb = new StringBuffer();
     sb.append(Vocabulary.word(this.getLHS()));
     sb.append(" ||| ");
     sb.append(getFrenchWords());
     sb.append(" ||| ");
     sb.append(getEnglishWords());
     sb.append(" |||");
     sb.append(" " + getFeatureVector());
     sb.append(String.format(" ||| est=%.3f", getEstimatedCost()));
     sb.append(String.format(" pre=%.3f", getPrecomputableCost()));
     return sb.toString();
   }

   /**
    * Returns a version of the rule suitable for reading in from a text file.
    *
    * @return
    */
   public String textFormat() {
     StringBuffer sb = new StringBuffer();
     sb.append(Vocabulary.word(this.getLHS()));
     sb.append(" |||");

     int nt = 1;
     for (int i = 0; i < getFrench().length; i++) {
       if (getFrench()[i] < 0)
         sb.append(" " + Vocabulary.word(getFrench()[i]).replaceFirst("\\]", String.format(",%d]", nt++)));
       else
         sb.append(" " + Vocabulary.word(getFrench()[i]));
     }
     sb.append(" |||");
     nt = 1;
     for (int i = 0; i < getEnglish().length; i++) {
       if (getEnglish()[i] < 0)
         sb.append(" " + Vocabulary.word(getEnglish()[i]).replaceFirst("\\]", String.format(",%d]", nt++)));
       else
         sb.append(" " + Vocabulary.word(getEnglish()[i]));
     }
     sb.append(" |||");
     sb.append(" " + getFeatureString());
     if (getAlignmentString() != null)
       sb.append(" ||| " + getAlignmentString());
     return sb.toString();
   }

   public String getFeatureString() {
     return sparseFeatureString;
   }

   /**
    * Returns an alignment as a sequence of integers. The integers at positions i and i+1 are paired,
    * with position i indexing the source and i+1 the target.
    */
   public byte[] getAlignment() {
     if (alignment == null && getAlignmentString() != null) {
       String[] tokens = getAlignmentString().split("[-\\s]+");
       alignment = new byte[tokens.length];
       for (int i = 0; i < tokens.length; i++)
         alignment[i] = (byte) Short.parseShort(tokens[i]);
     }
     return alignment;
   }

   public String getAlignmentString() {
     return alignmentString;
   }

   /**
    * The nonterminals on the English side are pointers to the source side nonterminals (-1 and -2),
    * rather than being directly encoded. These number indicate the correspondence between the
    * nonterminals on each side, introducing a level of indirection however when we want to resolve
    * them. So to get the ID, we need to look up the corresponding source side ID.
    *
    * @return The string of English words
    */
   public String getEnglishWords() {
     int[] foreignNTs = getForeignNonTerminals();

     StringBuilder sb = new StringBuilder();
     for (Integer index : getEnglish()) {
       if (index >= 0)
         sb.append(Vocabulary.word(index) + " ");
       else
         sb.append(Vocabulary.word(foreignNTs[-index - 1]).replace("]",
             String.format(",%d] ", Math.abs(index))));
     }

     return sb.toString().trim();
   }

   public boolean isTerminal() {
     for (int i = 0; i < getEnglish().length; i++)
       if (getEnglish()[i] < 0)
         return false;

     return true;
   }

   /**
    * Return the French (source) nonterminals as list of Strings
    *
    * @return
    */
   public int[] getForeignNonTerminals() {
     int[] nts = new int[getArity()];
     int index = 0;
     for (int id : getFrench())
       if (id < 0)
         nts[index++] = -id;
     return nts;
   }

   /**
    * Return the English (target) nonterminals as list of Strings
    *
    * @return
    */
   public int[] getEnglishNonTerminals() {
     int[] nts = new int[getArity()];
     int[] foreignNTs = getForeignNonTerminals();
     int index = 0;

     for (int i : getEnglish()) {
       if (i < 0)
         nts[index++] = foreignNTs[Math.abs(getEnglish()[i]) - 1];
     }

     return nts;
   }

   private int[] getNormalizedEnglishNonterminalIndices() {
     int[] result = new int[getArity()];

     int ntIndex = 0;
     for (Integer index : getEnglish()) {
       if (index < 0)
         result[ntIndex++] = -index - 1;
     }

     return result;
   }

   public boolean isInverting() {
     int[] normalizedEnglishNonTerminalIndices = getNormalizedEnglishNonterminalIndices();
     if (normalizedEnglishNonTerminalIndices.length == 2) {
       if (normalizedEnglishNonTerminalIndices[0] == 1) {
         return true;
       }
     }
     return false;
   }

   public String getFrenchWords() {
     return Vocabulary.getWords(getFrench());
   }

   public static final String NT_REGEX = "\\[[^\\]]+?\\]";

   private Pattern getPattern() {
     String source = getFrenchWords();
     String pattern = Pattern.quote(source);
     pattern = pattern.replaceAll(NT_REGEX, "\\\\E.+\\\\Q");
     pattern = pattern.replaceAll("\\\\Q\\\\E", "");
     pattern = "(?:^|\\s)" + pattern + "(?:$|\\s)";
     return Pattern.compile(pattern);
   }

   /**
    * Matches the string representation of the rule's source side against a sentence
    *
    * @param sentence
    * @return
    */
   public boolean matches(Sentence sentence) {
     boolean match = getPattern().matcher(sentence.fullSource()).find();
     // System.err.println(String.format("match(%s,%s) = %s", Pattern.quote(getFrenchWords()),
     // sentence.annotatedSource(), match));
     return match;
   }

   /**
    * This comparator is used for sorting the rules during cube pruning. An estimate of the cost
    * of each rule is computed and used to sort.
    */
   public static Comparator<Rule> EstimatedCostComparator = new Comparator<Rule>() {
     public int compare(Rule rule1, Rule rule2) {
       float cost1 = rule1.getEstimatedCost();
       float cost2 = rule2.getEstimatedCost();
       return Float.compare(cost2,  cost1);
     }
   };

   public int compare(Rule rule1, Rule rule2) {
     return EstimatedCostComparator.compare(rule1, rule2);
   }

   public int compareTo(Rule other) {
     return EstimatedCostComparator.compare(this, other);
   }

   public String getRuleString() {
     return String.format("%s -> %s ||| %s", Vocabulary.word(getLHS()), getFrenchWords(), getEnglishWords());
   }
 }
	package joshua.decoder.ff.tm;

	import java.util.Arrays;
	import java.util.Comparator;
	import java.util.List;
	import java.util.StringTokenizer;
	import java.util.regex.Pattern;

	import joshua.corpus.Vocabulary;
	import joshua.decoder.Decoder;
	import joshua.decoder.ff.FeatureFunction;
	import joshua.decoder.ff.FeatureVector;
	import joshua.decoder.segment_file.Sentence;

	/**
	* This class define the interface for Rule.
	*
	* All feature scores are interpreted as negative log probabilities, and are therefore negated.
	* Note that not all features need to be negative log probs, but you should be aware that they
	* will be negated, so if you want a positive count, it should come in as negative.
	*
	* @author Zhifei Li, <zhifei.work@gmail.com>
	*/


	/**
	* Normally, the feature score in the rule should be cost (i.e., -LogP), so that the feature
	* weight should be positive
	*
	* @author Zhifei Li, <zhifei.work@gmail.com>
	* @author Matt Post <post@cs.jhu.edu>
	*/
	public class Rule implements Comparator<Rule>, Comparable<Rule> {

	private int lhs; // tag of this rule
	private int[] pFrench; // pointer to the RuleCollection, as all the rules under it share the same
	// Source side
	protected int arity;

	// And a string containing the sparse ones
	protected FeatureVector features = null;
	protected String sparseFeatureString;

	/*
	* a feature function will be fired for this rule only if the owner of the rule matches the owner
	* of the feature function
	*/
	private int owner = -1;

	/**
	* This is the cost computed only from the features present with the grammar rule. This cost is
	* needed to sort the rules in the grammar for cube pruning, but isn't the full cost of applying
	* the rule (which will include contextual features that can't be computed until the rule is
	* applied).
	*/
	private float estimatedCost = Float.NEGATIVE_INFINITY;

	private float precomputableCost = Float.NEGATIVE_INFINITY;

	private int[] english;

	// The alignment string, e.g., 0-0 0-1 1-1 2-1
	private String alignmentString;
	protected byte[] alignment = null;

	/**
	* Constructs a new rule using the provided parameters. The owner and rule id for this rule are
	* undefined. Note that some of the sparse features may be unlabeled, but they cannot be mapped to
	* their default names ("tm_OWNER_INDEX") until later, when we know the owner of the rule. This is
	* not known until the rule is actually added to a grammar in Grammar::addRule().
	*
	* @param lhs Left-hand side of the rule.
	* @param sourceRhs Source language right-hand side of the rule.
	* @param targetRhs Target language right-hand side of the rule.
	* @param sparseFeatures Feature value scores for the rule.
	* @param arity Number of nonterminals in the source language right-hand side.
	* @param owner
	*/
	public Rule(int lhs, int[] sourceRhs, int[] targetRhs, String sparseFeatures, int arity,
	int owner) {
	this.lhs = lhs;
	this.pFrench = sourceRhs;
	this.sparseFeatureString = sparseFeatures;
	this.arity = arity;
	this.owner = owner;
	this.english = targetRhs;
	}

	// Sparse feature version
	public Rule(int lhs, int[] sourceRhs, int[] targetRhs, String sparseFeatures, int arity) {
	this.lhs = lhs;
	this.pFrench = sourceRhs;
	this.sparseFeatureString = sparseFeatures;
	this.arity = arity;
	this.owner = -1;
	this.english = targetRhs;
	}

	public Rule(int lhs, int[] sourceRhs, int[] targetRhs, String sparseFeatures, int arity, String alignment) {
	this(lhs, sourceRhs, targetRhs, sparseFeatures, arity);
	this.alignmentString = alignment;
	}

	public Rule() {
	this.lhs = -1;
	}

	// ===============================================================
	// Attributes
	// ===============================================================

	public void setEnglish(int[] eng) {
	this.english = eng;
	}

	public int[] getEnglish() {
	return this.english;
	}

	/**
	* Two Rules are equal of they have the same LHS, the same source RHS and the same target
	* RHS.
	*
	* @param o the object to check for equality
	* @return true if o is the same Rule as this rule, false otherwise
	*/
	public boolean equals(Object o) {
	if (!(o instanceof Rule)) {
	return false;
	}
	Rule other = (Rule) o;
	if (getLHS() != other.getLHS()) {
	return false;
	}
	if (!Arrays.equals(getFrench(), other.getFrench())) {
	return false;
	}
	if (!Arrays.equals(english, other.getEnglish())) {
	return false;
	}
	return true;
	}

	public int hashCode() {
	// I just made this up. If two rules are equal they'll have the
	// same hashcode. Maybe someone else can do a better job though?
	int frHash = Arrays.hashCode(getFrench());
	int enHash = Arrays.hashCode(english);
	return frHash ^ enHash ^ getLHS();
	}

	// ===============================================================
	// Attributes
	// ===============================================================

	public void setArity(int arity) {
	this.arity = arity;
	}

	public int getArity() {
	return this.arity;
	}

	public void setOwner(int owner) {
	this.owner = owner;
	}

	public int getOwner() {
	return this.owner;
	}

	public void setLHS(int lhs) {
	this.lhs = lhs;
	}

	public int getLHS() {
	return this.lhs;
	}

	public void setFrench(int[] french) {
	this.pFrench = french;
	}

	public int[] getFrench() {
	return this.pFrench;
	}

	/**
	* This function does the work of turning the string version of the sparse features (passed in
	* when the rule was created) into an actual set of features. This is a bit complicated because we
	* support intermingled labeled and unlabeled features, where the unlabeled features are mapped to
	* a default name template of the form "tm_OWNER_INDEX".
	*
	* This function returns the dense (phrasal) features discovered when the rule was loaded. Dense
	* features are the list of unlabeled features that preceded labeled ones. They can also be
	* specified as labeled features of the form "tm_OWNER_INDEX", but the former format is preferred.
	*/
	public FeatureVector getFeatureVector() {
	/*
	* Now read the feature scores, which can be any number of dense features and sparse features.
	* Any unlabeled feature becomes a dense feature. By convention, dense features should precede
	* sparse (labeled) ones, but it's not required.
	*/

	if (features == null)
	features = (owner != -1)
	? new FeatureVector(getFeatureString(), "tm_" + Vocabulary.word(owner) + "_")
	: new FeatureVector();

	return features;
	}

	/**
	* This function returns the estimated cost of a rule, which should have been computed when the
	* grammar was first sorted via a call to Rule::estimateRuleCost(). This function is a getter
	* only; it will not compute the value if it has not already been set. It is necessary in addition
	* to estimateRuleCost(models) because sometimes the value needs to be retrieved from contexts
	* that do not have access to the feature functions.
	*
	* This function is called by the rule comparator when sorting the grammar. As such it may be
	* called many times and any implementation of it should be a cached implementation.
	*
	* @return the estimated cost of the rule (a lower bound on the true cost)
	*/
	public float getEstimatedCost() {
	return estimatedCost;
	}

	/**
	* Precomputable costs is the inner product of the weights found on each grammar rule and the
	* weight vector. This is slightly different from the estimated rule cost, which can include other
	* features (such as a language model estimate). This getter and setter should also be cached, and
	* is basically provided to allow the PhraseModel feature to cache its (expensive) computation for
	* each rule.
	*
	* @return the precomputable cost of each rule
	*/
	public float getPrecomputableCost() {
	return precomputableCost;
	}

	public float getDenseFeature(int k) {
	return getFeatureVector().getDense(k);
	}

	public void setPrecomputableCost(float[] phrase_weights, FeatureVector weights) {
	float cost = 0.0f;

	// System.err.println(String.format("// Setting precomputable cost for for %s/%s", getEnglishWords(), getFrenchWords()));
	FeatureVector features = getFeatureVector();
	for (int i = 0; i < features.getDenseFeatures().size() && i < phrase_weights.length; i++) {
	// System.err.println(String.format(" %d -> %.5f", i, features.get(i)));
	cost += phrase_weights[i] * features.getDense(i);
	}

	for (String key: features.getSparseFeatures().keySet()) {
	// System.err.println(String.format(" %s -> %.5f", key, features.get(key)));
	cost += weights.getSparse(key) * features.getSparse(key);
	}

	// System.err.println(String.format("-> %f", cost));

	this.precomputableCost = cost;
	}

	/**
	* This function estimates the cost of a rule, which is used for sorting the rules for cube
	* pruning. The estimated cost is basically the set of precomputable features (features listed
	* along with the rule in the grammar file) along with any other estimates that other features
	* would like to contribute (e.g., a language model estimate). This cost will be a lower bound on
	* the rule's actual cost.
	*
	* The value of this function is used only for sorting the rules. When the rule is later applied
	* in context to particular hypernodes, the rule's actual cost is computed.
	*
	* @param models the list of models available to the decoder
	* @return estimated cost of the rule
	*/
	public float estimateRuleCost(List<FeatureFunction> models) {
	if (null == models)
	return 0.0f;

	if (this.estimatedCost <= Float.NEGATIVE_INFINITY) {
	this.estimatedCost = 0.0f; // weights.innerProduct(computeFeatures());

	if (Decoder.VERBOSE >= 4)
	System.err.println(String.format("estimateCost(%s ;; %s)", getFrenchWords(), getEnglishWords()));
	for (FeatureFunction ff : models) {
	float val = ff.estimateCost(this, null);
	if (Decoder.VERBOSE >= 4)
	System.err.println(String.format(" FEATURE %s -> %.3f", ff.getName(), val));
	this.estimatedCost += val;
	}
	}

	return estimatedCost;
	}

	// ===============================================================
	// Methods
	// ===============================================================

	public String toString() {
	StringBuffer sb = new StringBuffer();
	sb.append(Vocabulary.word(this.getLHS()));
	sb.append(" \|\|\| ");
	sb.append(getFrenchWords());
	sb.append(" \|\|\| ");
	sb.append(getEnglishWords());
	sb.append(" \|\|\|");
	sb.append(" " + getFeatureVector());
	sb.append(String.format(" \|\|\| est=%.3f", getEstimatedCost()));
	sb.append(String.format(" pre=%.3f", getPrecomputableCost()));
	return sb.toString();
	}

	/**
	* Returns a version of the rule suitable for reading in from a text file.
	*
	* @return
	*/
	public String textFormat() {
	StringBuffer sb = new StringBuffer();
	sb.append(Vocabulary.word(this.getLHS()));
	sb.append(" \|\|\|");

	int nt = 1;
	for (int i = 0; i < getFrench().length; i++) {
	if (getFrench()[i] < 0)
	sb.append(" " + Vocabulary.word(getFrench()[i]).replaceFirst("\\]", String.format(",%d]", nt++)));
	else
	sb.append(" " + Vocabulary.word(getFrench()[i]));
	}
	sb.append(" \|\|\|");
	nt = 1;
	for (int i = 0; i < getEnglish().length; i++) {
	if (getEnglish()[i] < 0)
	sb.append(" " + Vocabulary.word(getEnglish()[i]).replaceFirst("\\]", String.format(",%d]", nt++)));
	else
	sb.append(" " + Vocabulary.word(getEnglish()[i]));
	}
	sb.append(" \|\|\|");
	sb.append(" " + getFeatureString());
	if (getAlignmentString() != null)
	sb.append(" \|\|\| " + getAlignmentString());
	return sb.toString();
	}

	public String getFeatureString() {
	return sparseFeatureString;
	}

	/**
	* Returns an alignment as a sequence of integers. The integers at positions i and i+1 are paired,
	* with position i indexing the source and i+1 the target.
	*/
	public byte[] getAlignment() {
	if (alignment == null && getAlignmentString() != null) {
	String[] tokens = getAlignmentString().split("[-\\s]+");
	alignment = new byte[tokens.length];
	for (int i = 0; i < tokens.length; i++)
	alignment[i] = (byte) Short.parseShort(tokens[i]);
	}
	return alignment;
	}

	public String getAlignmentString() {
	return alignmentString;
	}

	/**
	* The nonterminals on the English side are pointers to the source side nonterminals (-1 and -2),
	* rather than being directly encoded. These number indicate the correspondence between the
	* nonterminals on each side, introducing a level of indirection however when we want to resolve
	* them. So to get the ID, we need to look up the corresponding source side ID.
	*
	* @return The string of English words
	*/
	public String getEnglishWords() {
	int[] foreignNTs = getForeignNonTerminals();

	StringBuilder sb = new StringBuilder();
	for (Integer index : getEnglish()) {
	if (index >= 0)
	sb.append(Vocabulary.word(index) + " ");
	else
	sb.append(Vocabulary.word(foreignNTs[-index - 1]).replace("]",
	String.format(",%d] ", Math.abs(index))));
	}

	return sb.toString().trim();
	}

	public boolean isTerminal() {
	for (int i = 0; i < getEnglish().length; i++)
	if (getEnglish()[i] < 0)
	return false;

	return true;
	}

	/**
	* Return the French (source) nonterminals as list of Strings
	*
	* @return
	*/
	public int[] getForeignNonTerminals() {
	int[] nts = new int[getArity()];
	int index = 0;
	for (int id : getFrench())
	if (id < 0)
	nts[index++] = -id;
	return nts;
	}

	/**
	* Return the English (target) nonterminals as list of Strings
	*
	* @return
	*/
	public int[] getEnglishNonTerminals() {
	int[] nts = new int[getArity()];
	int[] foreignNTs = getForeignNonTerminals();
	int index = 0;

	for (int i : getEnglish()) {
	if (i < 0)
	nts[index++] = foreignNTs[Math.abs(getEnglish()[i]) - 1];
	}

	return nts;
	}

	private int[] getNormalizedEnglishNonterminalIndices() {
	int[] result = new int[getArity()];

	int ntIndex = 0;
	for (Integer index : getEnglish()) {
	if (index < 0)
	result[ntIndex++] = -index - 1;
	}

	return result;
	}

	public boolean isInverting() {
	int[] normalizedEnglishNonTerminalIndices = getNormalizedEnglishNonterminalIndices();
	if (normalizedEnglishNonTerminalIndices.length == 2) {
	if (normalizedEnglishNonTerminalIndices[0] == 1) {
	return true;
	}
	}
	return false;
	}

	public String getFrenchWords() {
	return Vocabulary.getWords(getFrench());
	}

	public static final String NT_REGEX = "\\[[^\\]]+?\\]";

	private Pattern getPattern() {
	String source = getFrenchWords();
	String pattern = Pattern.quote(source);
	pattern = pattern.replaceAll(NT_REGEX, "\\\\E.+\\\\Q");
	pattern = pattern.replaceAll("\\\\Q\\\\E", "");
	pattern = "(?:^\|\\s)" + pattern + "(?:$\|\\s)";
	return Pattern.compile(pattern);
	}

	/**
	* Matches the string representation of the rule's source side against a sentence
	*
	* @param sentence
	* @return
	*/
	public boolean matches(Sentence sentence) {
	boolean match = getPattern().matcher(sentence.fullSource()).find();
	// System.err.println(String.format("match(%s,%s) = %s", Pattern.quote(getFrenchWords()),
	// sentence.annotatedSource(), match));
	return match;
	}

	/**
	* This comparator is used for sorting the rules during cube pruning. An estimate of the cost
	* of each rule is computed and used to sort.
	*/
	public static Comparator<Rule> EstimatedCostComparator = new Comparator<Rule>() {
	public int compare(Rule rule1, Rule rule2) {
	float cost1 = rule1.getEstimatedCost();
	float cost2 = rule2.getEstimatedCost();
	return Float.compare(cost2, cost1);
	}
	};

	public int compare(Rule rule1, Rule rule2) {
	return EstimatedCostComparator.compare(rule1, rule2);
	}

	public int compareTo(Rule other) {
	return EstimatedCostComparator.compare(this, other);
	}

	public String getRuleString() {
	return String.format("%s -> %s \|\|\| %s", Vocabulary.word(getLHS()), getFrenchWords(), getEnglishWords());
	}
	}