| /* |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package org.apache.lucene.codecs.memory; |
| |
| import java.io.IOException; |
| import java.util.Collection; |
| import java.util.Collections; |
| import java.util.Iterator; |
| import java.util.Map; |
| import java.util.SortedMap; |
| import java.util.TreeMap; |
| |
| import org.apache.lucene.codecs.CodecUtil; |
| import org.apache.lucene.codecs.FieldsConsumer; |
| import org.apache.lucene.codecs.FieldsProducer; |
| import org.apache.lucene.codecs.PostingsFormat; |
| import org.apache.lucene.codecs.TermStats; |
| import org.apache.lucene.index.CorruptIndexException; |
| import org.apache.lucene.index.PostingsEnum; |
| import org.apache.lucene.index.FieldInfo; |
| import org.apache.lucene.index.FieldInfos; |
| import org.apache.lucene.index.Fields; |
| import org.apache.lucene.index.IndexFileNames; |
| import org.apache.lucene.index.IndexOptions; |
| import org.apache.lucene.index.SegmentReadState; |
| import org.apache.lucene.index.SegmentWriteState; |
| import org.apache.lucene.index.Terms; |
| import org.apache.lucene.index.TermsEnum; |
| import org.apache.lucene.store.ByteArrayDataInput; |
| import org.apache.lucene.store.ChecksumIndexInput; |
| import org.apache.lucene.store.IOContext; |
| import org.apache.lucene.store.IndexInput; |
| import org.apache.lucene.store.IndexOutput; |
| import org.apache.lucene.store.RAMOutputStream; |
| import org.apache.lucene.util.Accountable; |
| import org.apache.lucene.util.Accountables; |
| import org.apache.lucene.util.ArrayUtil; |
| import org.apache.lucene.util.BytesRef; |
| import org.apache.lucene.util.FixedBitSet; |
| import org.apache.lucene.util.IOUtils; |
| import org.apache.lucene.util.IntsRefBuilder; |
| import org.apache.lucene.util.fst.Builder; |
| import org.apache.lucene.util.fst.ByteSequenceOutputs; |
| import org.apache.lucene.util.fst.BytesRefFSTEnum; |
| import org.apache.lucene.util.fst.FST; |
| import org.apache.lucene.util.fst.Util; |
| import org.apache.lucene.util.packed.PackedInts; |
| |
| // TODO: would be nice to somehow allow this to act like |
| // InstantiatedIndex, by never writing to disk; ie you write |
| // to this Codec in RAM only and then when you open a reader |
| // it pulls the FST directly from what you wrote w/o going |
| // to disk. |
| |
| /** Stores terms and postings (docs, positions, payloads) in |
| * RAM, using an FST. |
| * |
 * <p>Note that this codec implements advance as a linear
 * scan! This means if you store large fields in here,
 * queries that rely on advance (the AND case of BooleanQuery,
 * PhraseQuery) will be relatively slow!
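 *
 * <p>A minimal usage sketch (given an existing Analyzer; the default codec
 * class name varies by release, so Lucene60Codec below is only a stand-in
 * for whichever codec your Lucene version ships):
 *
 * <pre>
 *   // the format is registered under the SPI name "Memory":
 *   PostingsFormat memory = PostingsFormat.forName("Memory");
 *
 *   // or route selected fields to it through the default codec:
 *   IndexWriterConfig config = new IndexWriterConfig(analyzer);
 *   config.setCodec(new Lucene60Codec() {
 *     public PostingsFormat getPostingsFormatForField(String field) {
 *       return new MemoryPostingsFormat();
 *     }
 *   });
 * </pre>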
| * |
| * @lucene.experimental */ |
| |
| // TODO: Maybe name this 'Cached' or something to reflect |
| // the reality that it is actually written to disk, but |
| // loads itself in ram? |
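
// On-disk layout of the ".ram" file written by MemoryFieldsConsumer and
// read back in fieldsProducer():
//
//   IndexHeader
//   per field with at least one term:
//     VInt  termCount (always > 0)
//     VInt  field number
//     VLong sumTotalTermFreq   (omitted when IndexOptions == DOCS)
//     VLong sumDocFreq
//     VInt  docCount
//     FST<BytesRef> mapping each term to its serialized postings
//   VInt 0   (end-of-fields marker)
//   Footer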
| public final class MemoryPostingsFormat extends PostingsFormat { |
| |
| public MemoryPostingsFormat() { |
| this(false, PackedInts.DEFAULT); |
| } |
| |
| /** |
| * Create MemoryPostingsFormat, specifying advanced FST options. |
| * @param doPackFST true if a packed FST should be built. |
| * NOTE: packed FSTs are limited to ~2.1 GB of postings. |
| * @param acceptableOverheadRatio allowable overhead for packed ints |
| * during FST construction. |
| */ |
| public MemoryPostingsFormat(boolean doPackFST, float acceptableOverheadRatio) { |
| super("Memory"); |
| } |
| |
| @Override |
| public String toString() { |
| return "PostingsFormat(name=" + getName() + ")"; |
| } |
| |
| private final static class TermsWriter { |
| private final IndexOutput out; |
| private final FieldInfo field; |
| private final Builder<BytesRef> builder; |
| private final ByteSequenceOutputs outputs = ByteSequenceOutputs.getSingleton(); |
| private int termCount; |
| |
| public TermsWriter(IndexOutput out, FieldInfo field) { |
| this.out = out; |
| this.field = field; |
| builder = new Builder<>(FST.INPUT_TYPE.BYTE1, 0, 0, true, true, Integer.MAX_VALUE, outputs, true, 15, false); |
| } |
| |
| private class PostingsWriter { |
| private int lastDocID; |
| private int lastPos; |
| private int lastPayloadLen; |
| |
| // NOTE: not private so we don't pay access check at runtime: |
| int docCount; |
| RAMOutputStream buffer = new RAMOutputStream(); |
| |
| int lastOffsetLength; |
| int lastOffset; |
| |
| public void startDoc(int docID, int termDocFreq) throws IOException { |
| //System.out.println(" startDoc docID=" + docID + " freq=" + termDocFreq); |
| final int delta = docID - lastDocID; |
| assert docID == 0 || delta > 0; |
| lastDocID = docID; |
| docCount++; |
| |
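        // Doc encoding: for DOCS-only fields we write the raw docID delta;
        // otherwise the delta is shifted left and the low bit flags the
        // common freq == 1 case, so no separate freq VInt is needed.
        // E.g. delta=3, freq=1 -> one VInt 7 (3<<1 | 1);
        //      delta=3, freq=5 -> VInt 6 (3<<1), then VInt 5.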
| if (field.getIndexOptions() == IndexOptions.DOCS) { |
| buffer.writeVInt(delta); |
| } else if (termDocFreq == 1) { |
| buffer.writeVInt((delta<<1) | 1); |
| } else { |
| buffer.writeVInt(delta<<1); |
| assert termDocFreq > 0; |
| buffer.writeVInt(termDocFreq); |
| } |
| |
| lastPos = 0; |
| lastOffset = 0; |
| } |
| |
| public void addPosition(int pos, BytesRef payload, int startOffset, int endOffset) throws IOException { |
| assert payload == null || field.hasPayloads(); |
| |
| //System.out.println(" addPos pos=" + pos + " payload=" + payload); |
| |
| final int delta = pos - lastPos; |
| assert delta >= 0; |
| lastPos = pos; |
| |
| int payloadLen = 0; |
| |
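        // Position encoding: the position delta is shifted left and the
        // low bit flags a change in payload length, so runs of positions
        // with the same payload length cost no extra bytes.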
| if (field.hasPayloads()) { |
| payloadLen = payload == null ? 0 : payload.length; |
| if (payloadLen != lastPayloadLen) { |
| lastPayloadLen = payloadLen; |
| buffer.writeVInt((delta<<1)|1); |
| buffer.writeVInt(payloadLen); |
| } else { |
| buffer.writeVInt(delta<<1); |
| } |
| } else { |
| buffer.writeVInt(delta); |
| } |
| |
| if (field.getIndexOptions().compareTo(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS_AND_OFFSETS) >= 0) { |
| // don't use startOffset - lastEndOffset, because this creates lots of negative vints for synonyms, |
| // and the numbers aren't that much smaller anyways. |
| int offsetDelta = startOffset - lastOffset; |
| int offsetLength = endOffset - startOffset; |
| if (offsetLength != lastOffsetLength) { |
| buffer.writeVInt(offsetDelta << 1 | 1); |
| buffer.writeVInt(offsetLength); |
| } else { |
| buffer.writeVInt(offsetDelta << 1); |
| } |
| lastOffset = startOffset; |
| lastOffsetLength = offsetLength; |
| } |
| |
| if (payloadLen > 0) { |
| buffer.writeBytes(payload.bytes, payload.offset, payloadLen); |
| } |
| } |
| |
| public PostingsWriter reset() { |
| assert buffer.getFilePointer() == 0; |
| lastDocID = 0; |
| docCount = 0; |
| lastPayloadLen = 0; |
| // force first offset to write its length |
| lastOffsetLength = -1; |
| return this; |
| } |
| } |
| |
| final PostingsWriter postingsWriter = new PostingsWriter(); |
| |
| private final RAMOutputStream buffer2 = new RAMOutputStream(); |
| private final BytesRef spare = new BytesRef(); |
| private byte[] finalBuffer = new byte[128]; |
| |
| private final IntsRefBuilder scratchIntsRef = new IntsRefBuilder(); |
| |
| private void finishTerm(BytesRef text, TermStats stats) throws IOException { |
| |
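      // The FST output for this term is a single byte[]:
      //   VInt docFreq, [VLong totalTermFreq - docFreq,] postings bytes
      // (the VLong is omitted for DOCS-only fields). buffer2 holds the
      // small stats header, postingsWriter.buffer holds the postings, and
      // both are concatenated into finalBuffer before being added to the FST.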
| if (stats.docFreq == 0) { |
| return; |
| } |
| assert postingsWriter.docCount == stats.docFreq; |
| |
| assert buffer2.getFilePointer() == 0; |
| |
| buffer2.writeVInt(stats.docFreq); |
| if (field.getIndexOptions() != IndexOptions.DOCS) { |
| buffer2.writeVLong(stats.totalTermFreq-stats.docFreq); |
| } |
| int pos = (int) buffer2.getFilePointer(); |
| buffer2.writeTo(finalBuffer, 0); |
| buffer2.reset(); |
| |
| final int totalBytes = pos + (int) postingsWriter.buffer.getFilePointer(); |
| if (totalBytes > finalBuffer.length) { |
| finalBuffer = ArrayUtil.grow(finalBuffer, totalBytes); |
| } |
| postingsWriter.buffer.writeTo(finalBuffer, pos); |
| postingsWriter.buffer.reset(); |
| |
| spare.bytes = finalBuffer; |
| spare.length = totalBytes; |
| |
| //System.out.println(" finishTerm term=" + text.utf8ToString() + " " + totalBytes + " bytes totalTF=" + stats.totalTermFreq); |
| //for(int i=0;i<totalBytes;i++) { |
| // System.out.println(" " + Integer.toHexString(finalBuffer[i]&0xFF)); |
| //} |
| |
| builder.add(Util.toIntsRef(text, scratchIntsRef), BytesRef.deepCopyOf(spare)); |
| termCount++; |
| } |
| |
| public void finish(long sumTotalTermFreq, long sumDocFreq, int docCount) throws IOException { |
| if (termCount > 0) { |
| out.writeVInt(termCount); |
| out.writeVInt(field.number); |
| if (field.getIndexOptions() != IndexOptions.DOCS) { |
| out.writeVLong(sumTotalTermFreq); |
| } |
| out.writeVLong(sumDocFreq); |
| out.writeVInt(docCount); |
| FST<BytesRef> fst = builder.finish(); |
| fst.save(out); |
| //System.out.println("finish field=" + field.name + " fp=" + out.getFilePointer()); |
| } |
| } |
| } |
| |
  private static final String EXTENSION = "ram";
| private static final String CODEC_NAME = "MemoryPostings"; |
| private static final int VERSION_START = 1; |
| private static final int VERSION_CURRENT = VERSION_START; |
| |
| private static class MemoryFieldsConsumer extends FieldsConsumer { |
| private final SegmentWriteState state; |
| private final IndexOutput out; |
| |
| private MemoryFieldsConsumer(SegmentWriteState state) throws IOException { |
| final String fileName = IndexFileNames.segmentFileName(state.segmentInfo.name, state.segmentSuffix, EXTENSION); |
| out = state.directory.createOutput(fileName, state.context); |
| boolean success = false; |
| try { |
| CodecUtil.writeIndexHeader(out, CODEC_NAME, VERSION_CURRENT, state.segmentInfo.getId(), state.segmentSuffix); |
| success = true; |
| } finally { |
| if (!success) { |
| IOUtils.closeWhileHandlingException(out); |
| } |
| } |
| this.state = state; |
| } |
| |
| @Override |
| public void write(Fields fields) throws IOException { |
| for(String field : fields) { |
| |
| Terms terms = fields.terms(field); |
| if (terms == null) { |
| continue; |
| } |
| |
| TermsEnum termsEnum = terms.iterator(); |
| |
| FieldInfo fieldInfo = state.fieldInfos.fieldInfo(field); |
| TermsWriter termsWriter = new TermsWriter(out, fieldInfo); |
| |
| FixedBitSet docsSeen = new FixedBitSet(state.segmentInfo.maxDoc()); |
| long sumTotalTermFreq = 0; |
| long sumDocFreq = 0; |
| PostingsEnum postingsEnum = null; |
| PostingsEnum posEnum = null; |
| int enumFlags; |
| |
| IndexOptions indexOptions = fieldInfo.getIndexOptions(); |
| boolean writeFreqs = indexOptions.compareTo(IndexOptions.DOCS_AND_FREQS) >= 0; |
| boolean writePositions = indexOptions.compareTo(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS) >= 0; |
| boolean writeOffsets = indexOptions.compareTo(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS_AND_OFFSETS) >= 0; |
| boolean writePayloads = fieldInfo.hasPayloads(); |
| |
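        // Request from the wrapped TermsEnum only the postings features
        // this field actually indexes (freqs, positions, payloads, offsets),
        // so the source enum does no unnecessary work.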
| if (writeFreqs == false) { |
| enumFlags = 0; |
| } else if (writePositions == false) { |
| enumFlags = PostingsEnum.FREQS; |
| } else if (writeOffsets == false) { |
| if (writePayloads) { |
| enumFlags = PostingsEnum.PAYLOADS; |
| } |
| else { |
| enumFlags = PostingsEnum.POSITIONS; |
| } |
| } else { |
| if (writePayloads) { |
| enumFlags = PostingsEnum.PAYLOADS | PostingsEnum.OFFSETS; |
| } else { |
| enumFlags = PostingsEnum.OFFSETS; |
| } |
| } |
| |
| while (true) { |
| BytesRef term = termsEnum.next(); |
| if (term == null) { |
| break; |
| } |
| termsWriter.postingsWriter.reset(); |
| |
| if (writePositions) { |
| posEnum = termsEnum.postings(posEnum, enumFlags); |
| postingsEnum = posEnum; |
| } else { |
| postingsEnum = termsEnum.postings(postingsEnum, enumFlags); |
| posEnum = null; |
| } |
| |
| int docFreq = 0; |
| long totalTermFreq = 0; |
| while (true) { |
| int docID = postingsEnum.nextDoc(); |
| if (docID == PostingsEnum.NO_MORE_DOCS) { |
| break; |
| } |
| docsSeen.set(docID); |
| docFreq++; |
| |
| int freq; |
| if (writeFreqs) { |
| freq = postingsEnum.freq(); |
| totalTermFreq += freq; |
| } else { |
| freq = -1; |
| } |
| |
| termsWriter.postingsWriter.startDoc(docID, freq); |
| if (writePositions) { |
| for (int i=0;i<freq;i++) { |
| int pos = posEnum.nextPosition(); |
| BytesRef payload = writePayloads ? posEnum.getPayload() : null; |
| int startOffset; |
| int endOffset; |
| if (writeOffsets) { |
| startOffset = posEnum.startOffset(); |
| endOffset = posEnum.endOffset(); |
| } else { |
| startOffset = -1; |
| endOffset = -1; |
| } |
| termsWriter.postingsWriter.addPosition(pos, payload, startOffset, endOffset); |
| } |
| } |
| } |
| termsWriter.finishTerm(term, new TermStats(docFreq, totalTermFreq)); |
| sumDocFreq += docFreq; |
| sumTotalTermFreq += totalTermFreq; |
| } |
| |
| termsWriter.finish(sumTotalTermFreq, sumDocFreq, docsSeen.cardinality()); |
| } |
| } |
| |
| private boolean closed; |
| |
| @Override |
| public void close() throws IOException { |
| if (closed) { |
| return; |
| } |
| closed = true; |
| |
| // EOF marker: |
| try (IndexOutput out = this.out) { |
| out.writeVInt(0); |
| CodecUtil.writeFooter(out); |
| } |
| } |
| } |
| |
| @Override |
| public FieldsConsumer fieldsConsumer(SegmentWriteState state) throws IOException { |
| return new MemoryFieldsConsumer(state); |
| } |
| |
| private final static class FSTDocsEnum extends PostingsEnum { |
| private final IndexOptions indexOptions; |
| private final boolean storePayloads; |
| private byte[] buffer = new byte[16]; |
| private final ByteArrayDataInput in = new ByteArrayDataInput(buffer); |
| |
| private int docUpto; |
| private int docID = -1; |
| private int accum; |
| private int freq; |
| private int payloadLen; |
| private int numDocs; |
| |
| public FSTDocsEnum(IndexOptions indexOptions, boolean storePayloads) { |
| this.indexOptions = indexOptions; |
| this.storePayloads = storePayloads; |
| } |
| |
| public boolean canReuse(IndexOptions indexOptions, boolean storePayloads) { |
| return indexOptions == this.indexOptions && storePayloads == this.storePayloads; |
| } |
| |
| public FSTDocsEnum reset(BytesRef bufferIn, int numDocs) { |
| assert numDocs > 0; |
| if (buffer.length < bufferIn.length) { |
| buffer = ArrayUtil.grow(buffer, bufferIn.length); |
| } |
| in.reset(buffer, 0, bufferIn.length); |
| System.arraycopy(bufferIn.bytes, bufferIn.offset, buffer, 0, bufferIn.length); |
| docID = -1; |
| accum = 0; |
| docUpto = 0; |
| freq = 1; |
| payloadLen = 0; |
| this.numDocs = numDocs; |
| return this; |
| } |
| |
| @Override |
| public int nextDoc() { |
| //System.out.println(" nextDoc cycle docUpto=" + docUpto + " numDocs=" + numDocs + " fp=" + in.getPosition() + " this=" + this); |
| if (docUpto == numDocs) { |
| // System.out.println(" END"); |
| return docID = NO_MORE_DOCS; |
| } |
| docUpto++; |
| if (indexOptions == IndexOptions.DOCS) { |
| accum += in.readVInt(); |
| } else { |
| final int code = in.readVInt(); |
| accum += code >>> 1; |
| //System.out.println(" docID=" + accum + " code=" + code); |
| if ((code & 1) != 0) { |
| freq = 1; |
| } else { |
| freq = in.readVInt(); |
| assert freq > 0; |
| } |
| |
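        // There is no skip structure: if the field indexes positions, they
        // are stored inline after each doc and must be decoded and stepped
        // over here, even though this enum only exposes docs and freqs.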
| if (indexOptions == IndexOptions.DOCS_AND_FREQS_AND_POSITIONS) { |
| // Skip positions/payloads |
| for(int posUpto=0;posUpto<freq;posUpto++) { |
| if (!storePayloads) { |
| in.readVInt(); |
| } else { |
| final int posCode = in.readVInt(); |
| if ((posCode & 1) != 0) { |
| payloadLen = in.readVInt(); |
| } |
| in.skipBytes(payloadLen); |
| } |
| } |
| } else if (indexOptions == IndexOptions.DOCS_AND_FREQS_AND_POSITIONS_AND_OFFSETS) { |
| // Skip positions/offsets/payloads |
| for(int posUpto=0;posUpto<freq;posUpto++) { |
| int posCode = in.readVInt(); |
| if (storePayloads && ((posCode & 1) != 0)) { |
| payloadLen = in.readVInt(); |
| } |
| if ((in.readVInt() & 1) != 0) { |
| // new offset length |
| in.readVInt(); |
| } |
| if (storePayloads) { |
| in.skipBytes(payloadLen); |
| } |
| } |
| } |
| } |
| |
| //System.out.println(" return docID=" + accum + " freq=" + freq); |
| return (docID = accum); |
| } |
| |
| @Override |
| public int docID() { |
| return docID; |
| } |
| |
| @Override |
| public int advance(int target) throws IOException { |
| // TODO: we could make more efficient version, but, it |
| // should be rare that this will matter in practice |
| // since usually apps will not store "big" fields in |
| // this codec! |
| return slowAdvance(target); |
| } |
| |
| @Override |
| public int freq() { |
| return freq; |
| } |
| |
| @Override |
| public long cost() { |
| return numDocs; |
| } |
| |
| @Override |
| public int nextPosition() throws IOException { |
| return -1; |
| } |
| |
| @Override |
| public int startOffset() throws IOException { |
| return -1; |
| } |
| |
| @Override |
| public int endOffset() throws IOException { |
| return -1; |
| } |
| |
| @Override |
| public BytesRef getPayload() throws IOException { |
| return null; |
| } |
| } |
| |
| private final static class FSTPostingsEnum extends PostingsEnum { |
| private final boolean storePayloads; |
| private byte[] buffer = new byte[16]; |
| private final ByteArrayDataInput in = new ByteArrayDataInput(buffer); |
| |
| private int docUpto; |
| private int docID = -1; |
| private int accum; |
| private int freq; |
| private int numDocs; |
| private int posPending; |
| private int payloadLength; |
| final boolean storeOffsets; |
| int offsetLength; |
| int startOffset; |
| |
| private int pos; |
| private final BytesRef payload = new BytesRef(); |
| |
| public FSTPostingsEnum(boolean storePayloads, boolean storeOffsets) { |
| this.storePayloads = storePayloads; |
| this.storeOffsets = storeOffsets; |
| } |
| |
| public boolean canReuse(boolean storePayloads, boolean storeOffsets) { |
| return storePayloads == this.storePayloads && storeOffsets == this.storeOffsets; |
| } |
| |
| public FSTPostingsEnum reset(BytesRef bufferIn, int numDocs) { |
| assert numDocs > 0; |
| |
| // System.out.println("D&P reset bytes this=" + this); |
| // for(int i=bufferIn.offset;i<bufferIn.length;i++) { |
| // System.out.println(" " + Integer.toHexString(bufferIn.bytes[i]&0xFF)); |
| // } |
| |
| if (buffer.length < bufferIn.length) { |
| buffer = ArrayUtil.grow(buffer, bufferIn.length); |
| } |
      in.reset(buffer, 0, bufferIn.length);
| System.arraycopy(bufferIn.bytes, bufferIn.offset, buffer, 0, bufferIn.length); |
| docID = -1; |
| accum = 0; |
| docUpto = 0; |
| payload.bytes = buffer; |
| payloadLength = 0; |
| this.numDocs = numDocs; |
| posPending = 0; |
| startOffset = storeOffsets ? 0 : -1; // always return -1 if no offsets are stored |
| offsetLength = 0; |
| return this; |
| } |
| |
| @Override |
| public int nextDoc() { |
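      // Positions are inlined after each doc's header, so any positions the
      // caller did not consume for the previous doc must be skipped before
      // the next doc delta can be read.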
| while (posPending > 0) { |
| nextPosition(); |
| } |
| while(true) { |
| //System.out.println(" nextDoc cycle docUpto=" + docUpto + " numDocs=" + numDocs + " fp=" + in.getPosition() + " this=" + this); |
| if (docUpto == numDocs) { |
| //System.out.println(" END"); |
| return docID = NO_MORE_DOCS; |
| } |
| docUpto++; |
| |
| final int code = in.readVInt(); |
| accum += code >>> 1; |
| if ((code & 1) != 0) { |
| freq = 1; |
| } else { |
| freq = in.readVInt(); |
| assert freq > 0; |
| } |
| |
| pos = 0; |
| startOffset = storeOffsets ? 0 : -1; |
| posPending = freq; |
| //System.out.println(" return docID=" + accum + " freq=" + freq); |
| return (docID = accum); |
| } |
| } |
| |
| @Override |
| public int nextPosition() { |
| //System.out.println(" nextPos storePayloads=" + storePayloads + " this=" + this); |
| assert posPending > 0; |
| posPending--; |
| if (!storePayloads) { |
| pos += in.readVInt(); |
| } else { |
| final int code = in.readVInt(); |
| pos += code >>> 1; |
| if ((code & 1) != 0) { |
| payloadLength = in.readVInt(); |
| //System.out.println(" new payloadLen=" + payloadLength); |
| //} else { |
| //System.out.println(" same payloadLen=" + payloadLength); |
| } |
| } |
| |
| if (storeOffsets) { |
| int offsetCode = in.readVInt(); |
| if ((offsetCode & 1) != 0) { |
| // new offset length |
| offsetLength = in.readVInt(); |
| } |
| startOffset += offsetCode >>> 1; |
| } |
| |
| if (storePayloads) { |
| payload.offset = in.getPosition(); |
| in.skipBytes(payloadLength); |
| payload.length = payloadLength; |
| } |
| |
| //System.out.println(" pos=" + pos + " payload=" + payload + " fp=" + in.getPosition()); |
| return pos; |
| } |
| |
| @Override |
| public int startOffset() { |
| return startOffset; |
| } |
| |
| @Override |
| public int endOffset() { |
| return startOffset + offsetLength; |
| } |
| |
| @Override |
| public BytesRef getPayload() { |
| return payload.length > 0 ? payload : null; |
| } |
| |
| @Override |
| public int docID() { |
| return docID; |
| } |
| |
| @Override |
| public int advance(int target) throws IOException { |
| // TODO: we could make more efficient version, but, it |
| // should be rare that this will matter in practice |
| // since usually apps will not store "big" fields in |
| // this codec! |
| return slowAdvance(target); |
| } |
| |
| @Override |
| public int freq() { |
| return freq; |
| } |
| |
| @Override |
| public long cost() { |
| return numDocs; |
| } |
| } |
| |
| private final static class FSTTermsEnum extends TermsEnum { |
| private final FieldInfo field; |
| private final BytesRefFSTEnum<BytesRef> fstEnum; |
| private final ByteArrayDataInput buffer = new ByteArrayDataInput(); |
| private boolean didDecode; |
| |
| private int docFreq; |
| private long totalTermFreq; |
| private BytesRefFSTEnum.InputOutput<BytesRef> current; |
| private BytesRef postingsSpare = new BytesRef(); |
| |
| public FSTTermsEnum(FieldInfo field, FST<BytesRef> fst) { |
| this.field = field; |
| fstEnum = new BytesRefFSTEnum<>(fst); |
| } |
| |
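    // Lazily splits the current term's FST output into its stats header
    // (docFreq and, when freqs are indexed, totalTermFreq) and the postings
    // slice handed to the postings enums.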
| private void decodeMetaData() { |
| if (!didDecode) { |
| buffer.reset(current.output.bytes, current.output.offset, current.output.length); |
| docFreq = buffer.readVInt(); |
| if (field.getIndexOptions() != IndexOptions.DOCS) { |
| totalTermFreq = docFreq + buffer.readVLong(); |
| } else { |
| totalTermFreq = -1; |
| } |
| postingsSpare.bytes = current.output.bytes; |
| postingsSpare.offset = buffer.getPosition(); |
| postingsSpare.length = current.output.length - (buffer.getPosition() - current.output.offset); |
| //System.out.println(" df=" + docFreq + " totTF=" + totalTermFreq + " offset=" + buffer.getPosition() + " len=" + current.output.length); |
| didDecode = true; |
| } |
| } |
| |
| @Override |
| public boolean seekExact(BytesRef text) throws IOException { |
| //System.out.println("te.seekExact text=" + field.name + ":" + text.utf8ToString() + " this=" + this); |
| current = fstEnum.seekExact(text); |
| didDecode = false; |
| return current != null; |
| } |
| |
| @Override |
| public SeekStatus seekCeil(BytesRef text) throws IOException { |
| //System.out.println("te.seek text=" + field.name + ":" + text.utf8ToString() + " this=" + this); |
| current = fstEnum.seekCeil(text); |
| if (current == null) { |
| return SeekStatus.END; |
| } else { |
| |
| // System.out.println(" got term=" + current.input.utf8ToString()); |
| // for(int i=0;i<current.output.length;i++) { |
| // System.out.println(" " + Integer.toHexString(current.output.bytes[i]&0xFF)); |
| // } |
| |
| didDecode = false; |
| |
| if (text.equals(current.input)) { |
| //System.out.println(" found!"); |
| return SeekStatus.FOUND; |
| } else { |
| //System.out.println(" not found: " + current.input.utf8ToString()); |
| return SeekStatus.NOT_FOUND; |
| } |
| } |
| } |
| |
| @Override |
| public PostingsEnum postings(PostingsEnum reuse, int flags) { |
| |
| // TODO: the logic of which enum impl to choose should be refactored to be simpler... |
| boolean hasPositions = field.getIndexOptions().compareTo(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS) >= 0; |
| if (hasPositions && PostingsEnum.featureRequested(flags, PostingsEnum.POSITIONS)) { |
| boolean hasOffsets = field.getIndexOptions().compareTo(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS_AND_OFFSETS) >= 0; |
| decodeMetaData(); |
| FSTPostingsEnum docsAndPositionsEnum; |
| if (reuse == null || !(reuse instanceof FSTPostingsEnum)) { |
| docsAndPositionsEnum = new FSTPostingsEnum(field.hasPayloads(), hasOffsets); |
| } else { |
| docsAndPositionsEnum = (FSTPostingsEnum) reuse; |
| if (!docsAndPositionsEnum.canReuse(field.hasPayloads(), hasOffsets)) { |
| docsAndPositionsEnum = new FSTPostingsEnum(field.hasPayloads(), hasOffsets); |
| } |
| } |
| //System.out.println("D&P reset this=" + this); |
| return docsAndPositionsEnum.reset(postingsSpare, docFreq); |
| } |
| |
| decodeMetaData(); |
| FSTDocsEnum docsEnum; |
| |
| if (reuse == null || !(reuse instanceof FSTDocsEnum)) { |
| docsEnum = new FSTDocsEnum(field.getIndexOptions(), field.hasPayloads()); |
| } else { |
| docsEnum = (FSTDocsEnum) reuse; |
| if (!docsEnum.canReuse(field.getIndexOptions(), field.hasPayloads())) { |
| docsEnum = new FSTDocsEnum(field.getIndexOptions(), field.hasPayloads()); |
| } |
| } |
| return docsEnum.reset(this.postingsSpare, docFreq); |
| } |
| |
| @Override |
| public BytesRef term() { |
| return current.input; |
| } |
| |
| @Override |
| public BytesRef next() throws IOException { |
| //System.out.println("te.next"); |
| current = fstEnum.next(); |
| if (current == null) { |
| //System.out.println(" END"); |
| return null; |
| } |
| didDecode = false; |
| //System.out.println(" term=" + field.name + ":" + current.input.utf8ToString()); |
| return current.input; |
| } |
| |
| @Override |
| public int docFreq() { |
| decodeMetaData(); |
| return docFreq; |
| } |
| |
| @Override |
| public long totalTermFreq() { |
| decodeMetaData(); |
| return totalTermFreq; |
| } |
| |
| @Override |
| public void seekExact(long ord) { |
| // NOTE: we could add this... |
| throw new UnsupportedOperationException(); |
| } |
| |
| @Override |
| public long ord() { |
| // NOTE: we could add this... |
| throw new UnsupportedOperationException(); |
| } |
| } |
| |
| private final static class TermsReader extends Terms implements Accountable { |
| |
| private final long sumTotalTermFreq; |
| private final long sumDocFreq; |
| private final int docCount; |
| private final int termCount; |
| private FST<BytesRef> fst; |
| private final ByteSequenceOutputs outputs = ByteSequenceOutputs.getSingleton(); |
| private final FieldInfo field; |
| |
| public TermsReader(FieldInfos fieldInfos, IndexInput in, int termCount) throws IOException { |
| this.termCount = termCount; |
| final int fieldNumber = in.readVInt(); |
| field = fieldInfos.fieldInfo(fieldNumber); |
| if (field == null) { |
| throw new CorruptIndexException("invalid field number: " + fieldNumber, in); |
| } else if (field.getIndexOptions() != IndexOptions.DOCS) { |
| sumTotalTermFreq = in.readVLong(); |
| } else { |
| sumTotalTermFreq = -1; |
| } |
| sumDocFreq = in.readVLong(); |
| docCount = in.readVInt(); |
| |
| fst = new FST<>(in, outputs); |
| } |
| |
| @Override |
| public long getSumTotalTermFreq() { |
| return sumTotalTermFreq; |
| } |
| |
| @Override |
| public long getSumDocFreq() { |
| return sumDocFreq; |
| } |
| |
| @Override |
| public int getDocCount() { |
| return docCount; |
| } |
| |
| @Override |
| public long size() { |
| return termCount; |
| } |
| |
| @Override |
| public TermsEnum iterator() { |
| return new FSTTermsEnum(field, fst); |
| } |
| |
| @Override |
| public boolean hasFreqs() { |
| return field.getIndexOptions().compareTo(IndexOptions.DOCS_AND_FREQS) >= 0; |
| } |
| |
| @Override |
| public boolean hasOffsets() { |
| return field.getIndexOptions().compareTo(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS_AND_OFFSETS) >= 0; |
| } |
| |
| @Override |
| public boolean hasPositions() { |
| return field.getIndexOptions().compareTo(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS) >= 0; |
| } |
| |
| @Override |
| public boolean hasPayloads() { |
| return field.hasPayloads(); |
| } |
| |
| @Override |
| public long ramBytesUsed() { |
| return ((fst!=null) ? fst.ramBytesUsed() : 0); |
| } |
| |
| @Override |
| public Collection<Accountable> getChildResources() { |
| if (fst == null) { |
| return Collections.emptyList(); |
| } else { |
| return Collections.singletonList(Accountables.namedAccountable("terms", fst)); |
| } |
| } |
| |
| @Override |
| public String toString() { |
| return "MemoryTerms(terms=" + termCount + ",postings=" + sumDocFreq + ",positions=" + sumTotalTermFreq + ",docs=" + docCount + ")"; |
| } |
| } |
| |
| @Override |
| public FieldsProducer fieldsProducer(SegmentReadState state) throws IOException { |
| final String fileName = IndexFileNames.segmentFileName(state.segmentInfo.name, state.segmentSuffix, EXTENSION); |
| |
| final SortedMap<String,TermsReader> fields = new TreeMap<>(); |
| |
| try (ChecksumIndexInput in = state.directory.openChecksumInput(fileName, IOContext.READONCE)) { |
| Throwable priorE = null; |
| try { |
| CodecUtil.checkIndexHeader(in, CODEC_NAME, VERSION_START, VERSION_CURRENT, state.segmentInfo.getId(), state.segmentSuffix); |
| while(true) { |
| final int termCount = in.readVInt(); |
| if (termCount == 0) { |
| break; |
| } |
| final TermsReader termsReader = new TermsReader(state.fieldInfos, in, termCount); |
| // System.out.println("load field=" + termsReader.field.name); |
| fields.put(termsReader.field.name, termsReader); |
| } |
| } catch (Throwable exception) { |
| priorE = exception; |
| } finally { |
| CodecUtil.checkFooter(in, priorE); |
| } |
| } |
| |
| return new FieldsProducer() { |
| @Override |
| public Iterator<String> iterator() { |
| return Collections.unmodifiableSet(fields.keySet()).iterator(); |
| } |
| |
| @Override |
| public Terms terms(String field) { |
| return fields.get(field); |
| } |
| |
| @Override |
| public int size() { |
| return fields.size(); |
| } |
| |
| @Override |
| public void close() { |
| // Drop ref to FST: |
| for(TermsReader termsReader : fields.values()) { |
| termsReader.fst = null; |
| } |
| } |
| |
| @Override |
| public long ramBytesUsed() { |
| long sizeInBytes = 0; |
| for(Map.Entry<String,TermsReader> entry: fields.entrySet()) { |
| sizeInBytes += (entry.getKey().length() * Character.BYTES); |
| sizeInBytes += entry.getValue().ramBytesUsed(); |
| } |
| return sizeInBytes; |
| } |
| |
| @Override |
| public Collection<Accountable> getChildResources() { |
| return Accountables.namedAccountables("field", fields); |
| } |
| |
| @Override |
| public String toString() { |
| return "MemoryPostings(fields=" + fields.size() + ")"; |
| } |
| |
| @Override |
| public void checkIntegrity() throws IOException {} |
| }; |
| } |
| } |