lucene/backward-codecs/src/java/org/apache/lucene/backward_codecs/lucene70/Lucene70SegmentInfoFormat.java - lucene-solr - Git at Google

 /*
  * Licensed to the Apache Software Foundation (ASF) under one or more
  * contributor license agreements.  See the NOTICE file distributed with
  * this work for additional information regarding copyright ownership.
  * The ASF licenses this file to You under the Apache License, Version 2.0
  * (the "License"); you may not use this file except in compliance with
  * the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
 package org.apache.lucene.backward_codecs.lucene70;

 import java.io.IOException;
 import java.util.Map;
 import java.util.Set;
 import org.apache.lucene.codecs.CodecUtil;
 import org.apache.lucene.codecs.SegmentInfoFormat;
 import org.apache.lucene.index.CorruptIndexException;
 import org.apache.lucene.index.IndexFileNames;
 import org.apache.lucene.index.IndexWriter;
 import org.apache.lucene.index.SegmentInfo;
 import org.apache.lucene.index.SegmentInfos;
 import org.apache.lucene.search.Sort;
 import org.apache.lucene.search.SortField;
 import org.apache.lucene.search.SortedNumericSelector;
 import org.apache.lucene.search.SortedNumericSortField;
 import org.apache.lucene.search.SortedSetSelector;
 import org.apache.lucene.search.SortedSetSortField;
 import org.apache.lucene.store.ChecksumIndexInput;
 import org.apache.lucene.store.DataInput;
 import org.apache.lucene.store.DataOutput;
 import org.apache.lucene.store.Directory;
 import org.apache.lucene.store.IOContext;
 import org.apache.lucene.util.Version;

 /**
  * Lucene 7.0 Segment info format.
  *
  * <p>Files:
  *
  * <ul>
  *   <li><code>.si</code>: Header, SegVersion, SegSize, IsCompoundFile, Diagnostics, Files,
  *       Attributes, IndexSort, Footer
  * </ul>
  *
  * Data types:
  *
  * <ul>
  *   <li>Header --&gt; {@link CodecUtil#writeIndexHeader IndexHeader}
  *   <li>SegSize --&gt; {@link DataOutput#writeInt Int32}
  *   <li>SegVersion --&gt; {@link DataOutput#writeString String}
  *   <li>SegMinVersion --&gt; {@link DataOutput#writeString String}
  *   <li>Files --&gt; {@link DataOutput#writeSetOfStrings Set&lt;String&gt;}
  *   <li>Diagnostics,Attributes --&gt; {@link DataOutput#writeMapOfStrings Map&lt;String,String&gt;}
  *   <li>IsCompoundFile --&gt; {@link DataOutput#writeByte Int8}
  *   <li>IndexSort --&gt; {@link DataOutput#writeVInt Int32} count, followed by {@code count}
  *       SortField
  *   <li>SortField --&gt; {@link DataOutput#writeString String} field name, followed by {@link
  *       DataOutput#writeVInt Int32} sort type ID, followed by {@link DataOutput#writeByte Int8}
  *       indicating reversed sort, followed by a type-specific encoding of the optional missing
  *       value
  *   <li>Footer --&gt; {@link CodecUtil#writeFooter CodecFooter}
  * </ul>
  *
  * Field Descriptions:
  *
  * <ul>
  *   <li>SegVersion is the code version that created the segment.
  *   <li>SegMinVersion is the minimum code version that contributed documents to the segment.
  *   <li>SegSize is the number of documents contained in the segment index.
  *   <li>IsCompoundFile records whether the segment is written as a compound file or not. If this is
  *       -1, the segment is not a compound file. If it is 1, the segment is a compound file.
  *   <li>The Diagnostics Map is privately written by {@link IndexWriter}, as a debugging aid, for
  *       each segment it creates. It includes metadata like the current Lucene version, OS, Java
  *       version, why the segment was created (merge, flush, addIndexes), etc.
  *   <li>Files is a list of files referred to by this segment.
  * </ul>
  *
  * @see SegmentInfos
  * @lucene.experimental
  */
 public class Lucene70SegmentInfoFormat extends SegmentInfoFormat {

   /** File extension used to store {@link SegmentInfo}. */
   public static final String SI_EXTENSION = "si";

   static final String CODEC_NAME = "Lucene70SegmentInfo";
   static final int VERSION_START = 0;
   static final int VERSION_CURRENT = VERSION_START;

   /** Sole constructor. */
   public Lucene70SegmentInfoFormat() {}

   @Override
   public SegmentInfo read(Directory dir, String segment, byte[] segmentID, IOContext context)
       throws IOException {
     final String fileName =
         IndexFileNames.segmentFileName(segment, "", Lucene70SegmentInfoFormat.SI_EXTENSION);
     try (ChecksumIndexInput input = dir.openChecksumInput(fileName, context)) {
       Throwable priorE = null;
       SegmentInfo si = null;
       try {
         int format =
             CodecUtil.checkIndexHeader(
                 input,
                 Lucene70SegmentInfoFormat.CODEC_NAME,
                 Lucene70SegmentInfoFormat.VERSION_START,
                 Lucene70SegmentInfoFormat.VERSION_CURRENT,
                 segmentID,
                 "");

         si = parseSegmentInfo(dir, input, segment, segmentID);

       } catch (Throwable exception) {
         priorE = exception;
       } finally {
         CodecUtil.checkFooter(input, priorE);
       }
       return si;
     }
   }

   private SegmentInfo parseSegmentInfo(
       Directory dir, DataInput input, String segment, byte[] segmentID) throws IOException {
     final Version version = Version.fromBits(input.readInt(), input.readInt(), input.readInt());
     byte hasMinVersion = input.readByte();
     final Version minVersion;
     switch (hasMinVersion) {
       case 0:
         minVersion = null;
         break;
       case 1:
         minVersion = Version.fromBits(input.readInt(), input.readInt(), input.readInt());
         break;
       default:
         throw new CorruptIndexException("Illegal boolean value " + hasMinVersion, input);
     }

     final int docCount = input.readInt();
     if (docCount < 0) {
       throw new CorruptIndexException("invalid docCount: " + docCount, input);
     }
     final boolean isCompoundFile = input.readByte() == SegmentInfo.YES;

     final Map<String, String> diagnostics = input.readMapOfStrings();
     final Set<String> files = input.readSetOfStrings();
     final Map<String, String> attributes = input.readMapOfStrings();

     int numSortFields = input.readVInt();
     Sort indexSort;
     if (numSortFields > 0) {
       SortField[] sortFields = new SortField[numSortFields];
       for (int i = 0; i < numSortFields; i++) {
         String fieldName = input.readString();
         int sortTypeID = input.readVInt();
         SortField.Type sortType;
         SortedSetSelector.Type sortedSetSelector = null;
         SortedNumericSelector.Type sortedNumericSelector = null;
         switch (sortTypeID) {
           case 0:
             sortType = SortField.Type.STRING;
             break;
           case 1:
             sortType = SortField.Type.LONG;
             break;
           case 2:
             sortType = SortField.Type.INT;
             break;
           case 3:
             sortType = SortField.Type.DOUBLE;
             break;
           case 4:
             sortType = SortField.Type.FLOAT;
             break;
           case 5:
             sortType = SortField.Type.STRING;
             byte selector = input.readByte();
             if (selector == 0) {
               sortedSetSelector = SortedSetSelector.Type.MIN;
             } else if (selector == 1) {
               sortedSetSelector = SortedSetSelector.Type.MAX;
             } else if (selector == 2) {
               sortedSetSelector = SortedSetSelector.Type.MIDDLE_MIN;
             } else if (selector == 3) {
               sortedSetSelector = SortedSetSelector.Type.MIDDLE_MAX;
             } else {
               throw new CorruptIndexException(
                   "invalid index SortedSetSelector ID: " + selector, input);
             }
             break;
           case 6:
             byte type = input.readByte();
             if (type == 0) {
               sortType = SortField.Type.LONG;
             } else if (type == 1) {
               sortType = SortField.Type.INT;
             } else if (type == 2) {
               sortType = SortField.Type.DOUBLE;
             } else if (type == 3) {
               sortType = SortField.Type.FLOAT;
             } else {
               throw new CorruptIndexException(
                   "invalid index SortedNumericSortField type ID: " + type, input);
             }
             byte numericSelector = input.readByte();
             if (numericSelector == 0) {
               sortedNumericSelector = SortedNumericSelector.Type.MIN;
             } else if (numericSelector == 1) {
               sortedNumericSelector = SortedNumericSelector.Type.MAX;
             } else {
               throw new CorruptIndexException(
                   "invalid index SortedNumericSelector ID: " + numericSelector, input);
             }
             break;
           default:
             throw new CorruptIndexException(
                 "invalid index sort field type ID: " + sortTypeID, input);
         }
         byte b = input.readByte();
         boolean reverse;
         if (b == 0) {
           reverse = true;
         } else if (b == 1) {
           reverse = false;
         } else {
           throw new CorruptIndexException("invalid index sort reverse: " + b, input);
         }

         if (sortedSetSelector != null) {
           sortFields[i] = new SortedSetSortField(fieldName, reverse, sortedSetSelector);
         } else if (sortedNumericSelector != null) {
           sortFields[i] =
               new SortedNumericSortField(fieldName, sortType, reverse, sortedNumericSelector);
         } else {
           sortFields[i] = new SortField(fieldName, sortType, reverse);
         }

         Object missingValue;
         b = input.readByte();
         if (b == 0) {
           missingValue = null;
         } else {
           switch (sortType) {
             case STRING:
               if (b == 1) {
                 missingValue = SortField.STRING_LAST;
               } else if (b == 2) {
                 missingValue = SortField.STRING_FIRST;
               } else {
                 throw new CorruptIndexException("invalid missing value flag: " + b, input);
               }
               break;
             case LONG:
               if (b != 1) {
                 throw new CorruptIndexException("invalid missing value flag: " + b, input);
               }
               missingValue = input.readLong();
               break;
             case INT:
               if (b != 1) {
                 throw new CorruptIndexException("invalid missing value flag: " + b, input);
               }
               missingValue = input.readInt();
               break;
             case DOUBLE:
               if (b != 1) {
                 throw new CorruptIndexException("invalid missing value flag: " + b, input);
               }
               missingValue = Double.longBitsToDouble(input.readLong());
               break;
             case FLOAT:
               if (b != 1) {
                 throw new CorruptIndexException("invalid missing value flag: " + b, input);
               }
               missingValue = Float.intBitsToFloat(input.readInt());
               break;
             default:
               throw new AssertionError("unhandled sortType=" + sortType);
           }
         }
         if (missingValue != null) {
           sortFields[i].setMissingValue(missingValue);
         }
       }
       indexSort = new Sort(sortFields);
     } else if (numSortFields < 0) {
       throw new CorruptIndexException("invalid index sort field count: " + numSortFields, input);
     } else {
       indexSort = null;
     }

     SegmentInfo si =
         new SegmentInfo(
             dir,
             version,
             minVersion,
             segment,
             docCount,
             isCompoundFile,
             null,
             diagnostics,
             segmentID,
             attributes,
             indexSort);
     si.setFiles(files);
     return si;
   }

   @Override
   public void write(Directory dir, SegmentInfo si, IOContext ioContext) throws IOException {
     throw new UnsupportedOperationException("Old formats can't be used for writing");
   }
 }
	/*
	* Licensed to the Apache Software Foundation (ASF) under one or more
	* contributor license agreements. See the NOTICE file distributed with
	* this work for additional information regarding copyright ownership.
	* The ASF licenses this file to You under the Apache License, Version 2.0
	* (the "License"); you may not use this file except in compliance with
	* the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/
	package org.apache.lucene.backward_codecs.lucene70;

	import java.io.IOException;
	import java.util.Map;
	import java.util.Set;
	import org.apache.lucene.codecs.CodecUtil;
	import org.apache.lucene.codecs.SegmentInfoFormat;
	import org.apache.lucene.index.CorruptIndexException;
	import org.apache.lucene.index.IndexFileNames;
	import org.apache.lucene.index.IndexWriter;
	import org.apache.lucene.index.SegmentInfo;
	import org.apache.lucene.index.SegmentInfos;
	import org.apache.lucene.search.Sort;
	import org.apache.lucene.search.SortField;
	import org.apache.lucene.search.SortedNumericSelector;
	import org.apache.lucene.search.SortedNumericSortField;
	import org.apache.lucene.search.SortedSetSelector;
	import org.apache.lucene.search.SortedSetSortField;
	import org.apache.lucene.store.ChecksumIndexInput;
	import org.apache.lucene.store.DataInput;
	import org.apache.lucene.store.DataOutput;
	import org.apache.lucene.store.Directory;
	import org.apache.lucene.store.IOContext;
	import org.apache.lucene.util.Version;

	/**
	* Lucene 7.0 Segment info format.
	*
	* <p>Files:
	*
	* <ul>
	* <li><code>.si</code>: Header, SegVersion, SegSize, IsCompoundFile, Diagnostics, Files,
	* Attributes, IndexSort, Footer
	* </ul>
	*
	* Data types:
	*
	* <ul>
	* <li>Header --> {@link CodecUtil#writeIndexHeader IndexHeader}
	* <li>SegSize --> {@link DataOutput#writeInt Int32}
	* <li>SegVersion --> {@link DataOutput#writeString String}
	* <li>SegMinVersion --> {@link DataOutput#writeString String}
	* <li>Files --> {@link DataOutput#writeSetOfStrings Set<String>}
	* <li>Diagnostics,Attributes --> {@link DataOutput#writeMapOfStrings Map<String,String>}
	* <li>IsCompoundFile --> {@link DataOutput#writeByte Int8}
	* <li>IndexSort --> {@link DataOutput#writeVInt Int32} count, followed by {@code count}
	* SortField
	* <li>SortField --> {@link DataOutput#writeString String} field name, followed by {@link
	* DataOutput#writeVInt Int32} sort type ID, followed by {@link DataOutput#writeByte Int8}
	* indicating reversed sort, followed by a type-specific encoding of the optional missing
	* value
	* <li>Footer --> {@link CodecUtil#writeFooter CodecFooter}
	* </ul>
	*
	* Field Descriptions:
	*
	* <ul>
	* <li>SegVersion is the code version that created the segment.
	* <li>SegMinVersion is the minimum code version that contributed documents to the segment.
	* <li>SegSize is the number of documents contained in the segment index.
	* <li>IsCompoundFile records whether the segment is written as a compound file or not. If this is
	* -1, the segment is not a compound file. If it is 1, the segment is a compound file.
	* <li>The Diagnostics Map is privately written by {@link IndexWriter}, as a debugging aid, for
	* each segment it creates. It includes metadata like the current Lucene version, OS, Java
	* version, why the segment was created (merge, flush, addIndexes), etc.
	* <li>Files is a list of files referred to by this segment.
	* </ul>
	*
	* @see SegmentInfos
	* @lucene.experimental
	*/
	public class Lucene70SegmentInfoFormat extends SegmentInfoFormat {

	/** File extension used to store {@link SegmentInfo}. */
	public static final String SI_EXTENSION = "si";

	static final String CODEC_NAME = "Lucene70SegmentInfo";
	static final int VERSION_START = 0;
	static final int VERSION_CURRENT = VERSION_START;

	/** Sole constructor. */
	public Lucene70SegmentInfoFormat() {}

	@Override
	public SegmentInfo read(Directory dir, String segment, byte[] segmentID, IOContext context)
	throws IOException {
	final String fileName =
	IndexFileNames.segmentFileName(segment, "", Lucene70SegmentInfoFormat.SI_EXTENSION);
	try (ChecksumIndexInput input = dir.openChecksumInput(fileName, context)) {
	Throwable priorE = null;
	SegmentInfo si = null;
	try {
	int format =
	CodecUtil.checkIndexHeader(
	input,
	Lucene70SegmentInfoFormat.CODEC_NAME,
	Lucene70SegmentInfoFormat.VERSION_START,
	Lucene70SegmentInfoFormat.VERSION_CURRENT,
	segmentID,
	"");

	si = parseSegmentInfo(dir, input, segment, segmentID);

	} catch (Throwable exception) {
	priorE = exception;
	} finally {
	CodecUtil.checkFooter(input, priorE);
	}
	return si;
	}
	}

	private SegmentInfo parseSegmentInfo(
	Directory dir, DataInput input, String segment, byte[] segmentID) throws IOException {
	final Version version = Version.fromBits(input.readInt(), input.readInt(), input.readInt());
	byte hasMinVersion = input.readByte();
	final Version minVersion;
	switch (hasMinVersion) {
	case 0:
	minVersion = null;
	break;
	case 1:
	minVersion = Version.fromBits(input.readInt(), input.readInt(), input.readInt());
	break;
	default:
	throw new CorruptIndexException("Illegal boolean value " + hasMinVersion, input);
	}

	final int docCount = input.readInt();
	if (docCount < 0) {
	throw new CorruptIndexException("invalid docCount: " + docCount, input);
	}
	final boolean isCompoundFile = input.readByte() == SegmentInfo.YES;

	final Map<String, String> diagnostics = input.readMapOfStrings();
	final Set<String> files = input.readSetOfStrings();
	final Map<String, String> attributes = input.readMapOfStrings();

	int numSortFields = input.readVInt();
	Sort indexSort;
	if (numSortFields > 0) {
	SortField[] sortFields = new SortField[numSortFields];
	for (int i = 0; i < numSortFields; i++) {
	String fieldName = input.readString();
	int sortTypeID = input.readVInt();
	SortField.Type sortType;
	SortedSetSelector.Type sortedSetSelector = null;
	SortedNumericSelector.Type sortedNumericSelector = null;
	switch (sortTypeID) {
	case 0:
	sortType = SortField.Type.STRING;
	break;
	case 1:
	sortType = SortField.Type.LONG;
	break;
	case 2:
	sortType = SortField.Type.INT;
	break;
	case 3:
	sortType = SortField.Type.DOUBLE;
	break;
	case 4:
	sortType = SortField.Type.FLOAT;
	break;
	case 5:
	sortType = SortField.Type.STRING;
	byte selector = input.readByte();
	if (selector == 0) {
	sortedSetSelector = SortedSetSelector.Type.MIN;
	} else if (selector == 1) {
	sortedSetSelector = SortedSetSelector.Type.MAX;
	} else if (selector == 2) {
	sortedSetSelector = SortedSetSelector.Type.MIDDLE_MIN;
	} else if (selector == 3) {
	sortedSetSelector = SortedSetSelector.Type.MIDDLE_MAX;
	} else {
	throw new CorruptIndexException(
	"invalid index SortedSetSelector ID: " + selector, input);
	}
	break;
	case 6:
	byte type = input.readByte();
	if (type == 0) {
	sortType = SortField.Type.LONG;
	} else if (type == 1) {
	sortType = SortField.Type.INT;
	} else if (type == 2) {
	sortType = SortField.Type.DOUBLE;
	} else if (type == 3) {
	sortType = SortField.Type.FLOAT;
	} else {
	throw new CorruptIndexException(
	"invalid index SortedNumericSortField type ID: " + type, input);
	}
	byte numericSelector = input.readByte();
	if (numericSelector == 0) {
	sortedNumericSelector = SortedNumericSelector.Type.MIN;
	} else if (numericSelector == 1) {
	sortedNumericSelector = SortedNumericSelector.Type.MAX;
	} else {
	throw new CorruptIndexException(
	"invalid index SortedNumericSelector ID: " + numericSelector, input);
	}
	break;
	default:
	throw new CorruptIndexException(
	"invalid index sort field type ID: " + sortTypeID, input);
	}
	byte b = input.readByte();
	boolean reverse;
	if (b == 0) {
	reverse = true;
	} else if (b == 1) {
	reverse = false;
	} else {
	throw new CorruptIndexException("invalid index sort reverse: " + b, input);
	}

	if (sortedSetSelector != null) {
	sortFields[i] = new SortedSetSortField(fieldName, reverse, sortedSetSelector);
	} else if (sortedNumericSelector != null) {
	sortFields[i] =
	new SortedNumericSortField(fieldName, sortType, reverse, sortedNumericSelector);
	} else {
	sortFields[i] = new SortField(fieldName, sortType, reverse);
	}

	Object missingValue;
	b = input.readByte();
	if (b == 0) {
	missingValue = null;
	} else {
	switch (sortType) {
	case STRING:
	if (b == 1) {
	missingValue = SortField.STRING_LAST;
	} else if (b == 2) {
	missingValue = SortField.STRING_FIRST;
	} else {
	throw new CorruptIndexException("invalid missing value flag: " + b, input);
	}
	break;
	case LONG:
	if (b != 1) {
	throw new CorruptIndexException("invalid missing value flag: " + b, input);
	}
	missingValue = input.readLong();
	break;
	case INT:
	if (b != 1) {
	throw new CorruptIndexException("invalid missing value flag: " + b, input);
	}
	missingValue = input.readInt();
	break;
	case DOUBLE:
	if (b != 1) {
	throw new CorruptIndexException("invalid missing value flag: " + b, input);
	}
	missingValue = Double.longBitsToDouble(input.readLong());
	break;
	case FLOAT:
	if (b != 1) {
	throw new CorruptIndexException("invalid missing value flag: " + b, input);
	}
	missingValue = Float.intBitsToFloat(input.readInt());
	break;
	default:
	throw new AssertionError("unhandled sortType=" + sortType);
	}
	}
	if (missingValue != null) {
	sortFields[i].setMissingValue(missingValue);
	}
	}
	indexSort = new Sort(sortFields);
	} else if (numSortFields < 0) {
	throw new CorruptIndexException("invalid index sort field count: " + numSortFields, input);
	} else {
	indexSort = null;
	}

	SegmentInfo si =
	new SegmentInfo(
	dir,
	version,
	minVersion,
	segment,
	docCount,
	isCompoundFile,
	null,
	diagnostics,
	segmentID,
	attributes,
	indexSort);
	si.setFiles(files);
	return si;
	}

	@Override
	public void write(Directory dir, SegmentInfo si, IOContext ioContext) throws IOException {
	throw new UnsupportedOperationException("Old formats can't be used for writing");
	}
	}