lucene/join/src/java/org/apache/lucene/search/join/TermsWithScoreCollector.java - lucene-solr - Git at Google

 package org.apache.lucene.search.join;

 /*
  * Licensed to the Apache Software Foundation (ASF) under one or more
  * contributor license agreements.  See the NOTICE file distributed with
  * this work for additional information regarding copyright ownership.
  * The ASF licenses this file to You under the Apache License, Version 2.0
  * (the "License"); you may not use this file except in compliance with
  * the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 import java.io.IOException;

 import org.apache.lucene.index.AtomicReaderContext;
 import org.apache.lucene.index.BinaryDocValues;
 import org.apache.lucene.index.DocValues;
 import org.apache.lucene.index.SortedSetDocValues;
 import org.apache.lucene.search.LeafCollector;
 import org.apache.lucene.search.Collector;
 import org.apache.lucene.search.Scorer;
 import org.apache.lucene.search.SimpleCollector;
 import org.apache.lucene.util.ArrayUtil;
 import org.apache.lucene.util.BytesRef;
 import org.apache.lucene.util.BytesRefHash;

 abstract class TermsWithScoreCollector extends SimpleCollector {

   private final static int INITIAL_ARRAY_SIZE = 256;

   final String field;
   final BytesRefHash collectedTerms = new BytesRefHash();
   final ScoreMode scoreMode;

   Scorer scorer;
   float[] scoreSums = new float[INITIAL_ARRAY_SIZE];

   TermsWithScoreCollector(String field, ScoreMode scoreMode) {
     this.field = field;
     this.scoreMode = scoreMode;
   }

   public BytesRefHash getCollectedTerms() {
     return collectedTerms;
   }

   public float[] getScoresPerTerm() {
     return scoreSums;
   }

   @Override
   public void setScorer(Scorer scorer) throws IOException {
     this.scorer = scorer;
   }

   @Override
   public boolean acceptsDocsOutOfOrder() {
     return true;
   }

   /**
    * Chooses the right {@link TermsWithScoreCollector} implementation.
    *
    * @param field                     The field to collect terms for
    * @param multipleValuesPerDocument Whether the field to collect terms for has multiple values per document.
    * @return a {@link TermsWithScoreCollector} instance
    */
   static TermsWithScoreCollector create(String field, boolean multipleValuesPerDocument, ScoreMode scoreMode) {
     if (multipleValuesPerDocument) {
       switch (scoreMode) {
         case Avg:
           return new MV.Avg(field);
         default:
           return new MV(field, scoreMode);
       }
     } else {
       switch (scoreMode) {
         case Avg:
           return new SV.Avg(field);
         default:
           return new SV(field, scoreMode);
       }
     }
   }

   // impl that works with single value per document
   static class SV extends TermsWithScoreCollector {

     final BytesRef spare = new BytesRef();
     BinaryDocValues fromDocTerms;

     SV(String field, ScoreMode scoreMode) {
       super(field, scoreMode);
     }

     @Override
     public void collect(int doc) throws IOException {
       fromDocTerms.get(doc, spare);
       int ord = collectedTerms.add(spare);
       if (ord < 0) {
         ord = -ord - 1;
       } else {
         if (ord >= scoreSums.length) {
           scoreSums = ArrayUtil.grow(scoreSums);
         }
       }

       float current = scorer.score();
       float existing = scoreSums[ord];
       if (Float.compare(existing, 0.0f) == 0) {
         scoreSums[ord] = current;
       } else {
         switch (scoreMode) {
           case Total:
             scoreSums[ord] = scoreSums[ord] + current;
             break;
           case Max:
             if (current > existing) {
               scoreSums[ord] = current;
             }
         }
       }
     }

     @Override
     protected void doSetNextReader(AtomicReaderContext context) throws IOException {
       fromDocTerms = DocValues.getBinary(context.reader(), field);
     }

     static class Avg extends SV {

       int[] scoreCounts = new int[INITIAL_ARRAY_SIZE];

       Avg(String field) {
         super(field, ScoreMode.Avg);
       }

       @Override
       public void collect(int doc) throws IOException {
         fromDocTerms.get(doc, spare);
         int ord = collectedTerms.add(spare);
         if (ord < 0) {
           ord = -ord - 1;
         } else {
           if (ord >= scoreSums.length) {
             scoreSums = ArrayUtil.grow(scoreSums);
             scoreCounts = ArrayUtil.grow(scoreCounts);
           }
         }

         float current = scorer.score();
         float existing = scoreSums[ord];
         if (Float.compare(existing, 0.0f) == 0) {
           scoreSums[ord] = current;
           scoreCounts[ord] = 1;
         } else {
           scoreSums[ord] = scoreSums[ord] + current;
           scoreCounts[ord]++;
         }
       }

       @Override
       public float[] getScoresPerTerm() {
         if (scoreCounts != null) {
           for (int i = 0; i < scoreCounts.length; i++) {
             scoreSums[i] = scoreSums[i] / scoreCounts[i];
           }
           scoreCounts = null;
         }
         return scoreSums;
       }
     }
   }

   // impl that works with multiple values per document
   static class MV extends TermsWithScoreCollector {

     SortedSetDocValues fromDocTermOrds;
     final BytesRef scratch = new BytesRef();

     MV(String field, ScoreMode scoreMode) {
       super(field, scoreMode);
     }

     @Override
     public void collect(int doc) throws IOException {
       fromDocTermOrds.setDocument(doc);
       long ord;
       while ((ord = fromDocTermOrds.nextOrd()) != SortedSetDocValues.NO_MORE_ORDS) {
         fromDocTermOrds.lookupOrd(ord, scratch);

         int termID = collectedTerms.add(scratch);
         if (termID < 0) {
           termID = -termID - 1;
         } else {
           if (termID >= scoreSums.length) {
             scoreSums = ArrayUtil.grow(scoreSums);
           }
         }

         switch (scoreMode) {
           case Total:
             scoreSums[termID] += scorer.score();
             break;
           case Max:
             scoreSums[termID] = Math.max(scoreSums[termID], scorer.score());
         }
       }
     }

     @Override
     protected void doSetNextReader(AtomicReaderContext context) throws IOException {
       fromDocTermOrds = DocValues.getSortedSet(context.reader(), field);
     }

     static class Avg extends MV {

       int[] scoreCounts = new int[INITIAL_ARRAY_SIZE];

       Avg(String field) {
         super(field, ScoreMode.Avg);
       }

       @Override
       public void collect(int doc) throws IOException {
         fromDocTermOrds.setDocument(doc);
         long ord;
         while ((ord = fromDocTermOrds.nextOrd()) != SortedSetDocValues.NO_MORE_ORDS) {
           fromDocTermOrds.lookupOrd(ord, scratch);

           int termID = collectedTerms.add(scratch);
           if (termID < 0) {
             termID = -termID - 1;
           } else {
             if (termID >= scoreSums.length) {
               scoreSums = ArrayUtil.grow(scoreSums);
               scoreCounts = ArrayUtil.grow(scoreCounts);
             }
           }

           scoreSums[termID] += scorer.score();
           scoreCounts[termID]++;
         }
       }

       @Override
       public float[] getScoresPerTerm() {
         if (scoreCounts != null) {
           for (int i = 0; i < scoreCounts.length; i++) {
             scoreSums[i] = scoreSums[i] / scoreCounts[i];
           }
           scoreCounts = null;
         }
         return scoreSums;
       }
     }
   }

 }
	package org.apache.lucene.search.join;

	/*
	* Licensed to the Apache Software Foundation (ASF) under one or more
	* contributor license agreements. See the NOTICE file distributed with
	* this work for additional information regarding copyright ownership.
	* The ASF licenses this file to You under the Apache License, Version 2.0
	* (the "License"); you may not use this file except in compliance with
	* the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	import java.io.IOException;

	import org.apache.lucene.index.AtomicReaderContext;
	import org.apache.lucene.index.BinaryDocValues;
	import org.apache.lucene.index.DocValues;
	import org.apache.lucene.index.SortedSetDocValues;
	import org.apache.lucene.search.LeafCollector;
	import org.apache.lucene.search.Collector;
	import org.apache.lucene.search.Scorer;
	import org.apache.lucene.search.SimpleCollector;
	import org.apache.lucene.util.ArrayUtil;
	import org.apache.lucene.util.BytesRef;
	import org.apache.lucene.util.BytesRefHash;

	abstract class TermsWithScoreCollector extends SimpleCollector {

	private final static int INITIAL_ARRAY_SIZE = 256;

	final String field;
	final BytesRefHash collectedTerms = new BytesRefHash();
	final ScoreMode scoreMode;

	Scorer scorer;
	float[] scoreSums = new float[INITIAL_ARRAY_SIZE];

	TermsWithScoreCollector(String field, ScoreMode scoreMode) {
	this.field = field;
	this.scoreMode = scoreMode;
	}

	public BytesRefHash getCollectedTerms() {
	return collectedTerms;
	}

	public float[] getScoresPerTerm() {
	return scoreSums;
	}

	@Override
	public void setScorer(Scorer scorer) throws IOException {
	this.scorer = scorer;
	}

	@Override
	public boolean acceptsDocsOutOfOrder() {
	return true;
	}

	/**
	* Chooses the right {@link TermsWithScoreCollector} implementation.
	*
	* @param field The field to collect terms for
	* @param multipleValuesPerDocument Whether the field to collect terms for has multiple values per document.
	* @return a {@link TermsWithScoreCollector} instance
	*/
	static TermsWithScoreCollector create(String field, boolean multipleValuesPerDocument, ScoreMode scoreMode) {
	if (multipleValuesPerDocument) {
	switch (scoreMode) {
	case Avg:
	return new MV.Avg(field);
	default:
	return new MV(field, scoreMode);
	}
	} else {
	switch (scoreMode) {
	case Avg:
	return new SV.Avg(field);
	default:
	return new SV(field, scoreMode);
	}
	}
	}

	// impl that works with single value per document
	static class SV extends TermsWithScoreCollector {

	final BytesRef spare = new BytesRef();
	BinaryDocValues fromDocTerms;

	SV(String field, ScoreMode scoreMode) {
	super(field, scoreMode);
	}

	@Override
	public void collect(int doc) throws IOException {
	fromDocTerms.get(doc, spare);
	int ord = collectedTerms.add(spare);
	if (ord < 0) {
	ord = -ord - 1;
	} else {
	if (ord >= scoreSums.length) {
	scoreSums = ArrayUtil.grow(scoreSums);
	}
	}

	float current = scorer.score();
	float existing = scoreSums[ord];
	if (Float.compare(existing, 0.0f) == 0) {
	scoreSums[ord] = current;
	} else {
	switch (scoreMode) {
	case Total:
	scoreSums[ord] = scoreSums[ord] + current;
	break;
	case Max:
	if (current > existing) {
	scoreSums[ord] = current;
	}
	}
	}
	}

	@Override
	protected void doSetNextReader(AtomicReaderContext context) throws IOException {
	fromDocTerms = DocValues.getBinary(context.reader(), field);
	}

	static class Avg extends SV {

	int[] scoreCounts = new int[INITIAL_ARRAY_SIZE];

	Avg(String field) {
	super(field, ScoreMode.Avg);
	}

	@Override
	public void collect(int doc) throws IOException {
	fromDocTerms.get(doc, spare);
	int ord = collectedTerms.add(spare);
	if (ord < 0) {
	ord = -ord - 1;
	} else {
	if (ord >= scoreSums.length) {
	scoreSums = ArrayUtil.grow(scoreSums);
	scoreCounts = ArrayUtil.grow(scoreCounts);
	}
	}

	float current = scorer.score();
	float existing = scoreSums[ord];
	if (Float.compare(existing, 0.0f) == 0) {
	scoreSums[ord] = current;
	scoreCounts[ord] = 1;
	} else {
	scoreSums[ord] = scoreSums[ord] + current;
	scoreCounts[ord]++;
	}
	}

	@Override
	public float[] getScoresPerTerm() {
	if (scoreCounts != null) {
	for (int i = 0; i < scoreCounts.length; i++) {
	scoreSums[i] = scoreSums[i] / scoreCounts[i];
	}
	scoreCounts = null;
	}
	return scoreSums;
	}
	}
	}

	// impl that works with multiple values per document
	static class MV extends TermsWithScoreCollector {

	SortedSetDocValues fromDocTermOrds;
	final BytesRef scratch = new BytesRef();

	MV(String field, ScoreMode scoreMode) {
	super(field, scoreMode);
	}

	@Override
	public void collect(int doc) throws IOException {
	fromDocTermOrds.setDocument(doc);
	long ord;
	while ((ord = fromDocTermOrds.nextOrd()) != SortedSetDocValues.NO_MORE_ORDS) {
	fromDocTermOrds.lookupOrd(ord, scratch);

	int termID = collectedTerms.add(scratch);
	if (termID < 0) {
	termID = -termID - 1;
	} else {
	if (termID >= scoreSums.length) {
	scoreSums = ArrayUtil.grow(scoreSums);
	}
	}

	switch (scoreMode) {
	case Total:
	scoreSums[termID] += scorer.score();
	break;
	case Max:
	scoreSums[termID] = Math.max(scoreSums[termID], scorer.score());
	}
	}
	}

	@Override
	protected void doSetNextReader(AtomicReaderContext context) throws IOException {
	fromDocTermOrds = DocValues.getSortedSet(context.reader(), field);
	}

	static class Avg extends MV {

	int[] scoreCounts = new int[INITIAL_ARRAY_SIZE];

	Avg(String field) {
	super(field, ScoreMode.Avg);
	}

	@Override
	public void collect(int doc) throws IOException {
	fromDocTermOrds.setDocument(doc);
	long ord;
	while ((ord = fromDocTermOrds.nextOrd()) != SortedSetDocValues.NO_MORE_ORDS) {
	fromDocTermOrds.lookupOrd(ord, scratch);

	int termID = collectedTerms.add(scratch);
	if (termID < 0) {
	termID = -termID - 1;
	} else {
	if (termID >= scoreSums.length) {
	scoreSums = ArrayUtil.grow(scoreSums);
	scoreCounts = ArrayUtil.grow(scoreCounts);
	}
	}

	scoreSums[termID] += scorer.score();
	scoreCounts[termID]++;
	}
	}

	@Override
	public float[] getScoresPerTerm() {
	if (scoreCounts != null) {
	for (int i = 0; i < scoreCounts.length; i++) {
	scoreSums[i] = scoreSums[i] / scoreCounts[i];
	}
	scoreCounts = null;
	}
	return scoreSums;
	}
	}
	}

	}