lucene/backward-codecs/src/java/org/apache/lucene/backward_codecs/lucene60/Lucene60PointsFormat.java - lucene-solr - Git at Google

 /*
  * Licensed to the Apache Software Foundation (ASF) under one or more
  * contributor license agreements.  See the NOTICE file distributed with
  * this work for additional information regarding copyright ownership.
  * The ASF licenses this file to You under the Apache License, Version 2.0
  * (the "License"); you may not use this file except in compliance with
  * the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
 package org.apache.lucene.backward_codecs.lucene60;

 import java.io.IOException;
 import org.apache.lucene.codecs.CodecUtil;
 import org.apache.lucene.codecs.PointsFormat;
 import org.apache.lucene.codecs.PointsReader;
 import org.apache.lucene.codecs.PointsWriter;
 import org.apache.lucene.index.SegmentReadState;
 import org.apache.lucene.index.SegmentWriteState;

 /**
  * Lucene 6.0 point format, which encodes dimensional values in a block KD-tree structure for fast
  * 1D range and N dimensional shape intersection filtering. See <a
  * href="https://www.cs.duke.edu/~pankaj/publications/papers/bkd-sstd.pdf">this paper</a> for
  * details.
  *
  * <p>This data structure is written as a series of blocks on disk, with an in-memory perfectly
  * balanced binary tree of split values referencing those blocks at the leaves.
  *
  * <p>The <code>.dim</code> file has both blocks and the index split values, for each field. The
  * file starts with {@link CodecUtil#writeIndexHeader}.
  *
  * <p>The blocks are written like this:
  *
  * <ul>
  *   <li>count (vInt)
  *   <li>delta-docID (vInt) <sup>count</sup> (delta coded docIDs, in sorted order)
  *   <li>packedValue<sup>count</sup> (the <code>byte[]</code> value of each dimension packed into a
  *       single <code>byte[]</code>)
  * </ul>
  *
  * <p>After all blocks for a field are written, then the index is written:
  *
  * <ul>
  *   <li>numDims (vInt)
  *   <li>maxPointsInLeafNode (vInt)
  *   <li>bytesPerDim (vInt)
  *   <li>count (vInt)
  *   <li>packed index (byte[])
  * </ul>
  *
  * <p>The packed index uses hierarchical delta and prefix coding to compactly encode the file
  * pointer for all leaf blocks, once the tree is traversed, as well as the split dimension and split
  * value for each inner node of the tree.
  *
  * <p>After all fields' blocks + index data are written, {@link CodecUtil#writeFooter} writes the
  * checksum.
  *
  * <p>The <code>.dii</code> file records the file pointer in the <code>.dim</code> file where each
  * field's index data was written. It starts with {@link CodecUtil#writeIndexHeader}, then has:
  *
  * <ul>
  *   <li>fieldCount (vInt)
  *   <li>(fieldNumber (vInt), fieldFilePointer (vLong))<sup>fieldCount</sup>
  * </ul>
  *
  * <p>After all per-field entries are written, {@link CodecUtil#writeFooter} writes the
  * checksum.
  *
  * @lucene.experimental
  */
 public class Lucene60PointsFormat extends PointsFormat {

   /** Filename extension for the leaf blocks */
   public static final String DATA_EXTENSION = "dim";

   /** Filename extension for the index per field */
   public static final String INDEX_EXTENSION = "dii";

   // Codec name constants. NOTE(review): presumably these are the names checked in the headers of
   // the data and index files -- confirm against Lucene60PointsReader.
   static final String DATA_CODEC_NAME = "Lucene60PointsFormatData";
   static final String META_CODEC_NAME = "Lucene60PointsFormatMeta";

   // Data format versions: only one version exists, so the current version is the initial one.
   static final int DATA_VERSION_START = 0;
   static final int DATA_VERSION_CURRENT = DATA_VERSION_START;

   // Index format versions: likewise, the current version is the initial one.
   static final int INDEX_VERSION_START = 0;
   static final int INDEX_VERSION_CURRENT = INDEX_VERSION_START;

   /** Sole constructor */
   public Lucene60PointsFormat() {}

   /**
    * Writing is not supported by this format.
    *
    * @param state the segment write state (unused)
    * @throws UnsupportedOperationException always
    */
   @Override
   public PointsWriter fieldsWriter(SegmentWriteState state) throws IOException {
     final String message = "Old codecs may only be used for reading";
     throw new UnsupportedOperationException(message);
   }

   /**
    * Creates a reader for the points of the given segment.
    *
    * @param state the segment read state handed to the new reader
    * @return a new {@link Lucene60PointsReader} constructed from {@code state}
    */
   @Override
   public PointsReader fieldsReader(SegmentReadState state) throws IOException {
     final PointsReader reader = new Lucene60PointsReader(state);
     return reader;
   }
 }
	/*
	* Licensed to the Apache Software Foundation (ASF) under one or more
	* contributor license agreements. See the NOTICE file distributed with
	* this work for additional information regarding copyright ownership.
	* The ASF licenses this file to You under the Apache License, Version 2.0
	* (the "License"); you may not use this file except in compliance with
	* the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/
	package org.apache.lucene.backward_codecs.lucene60;

	import java.io.IOException;
	import org.apache.lucene.codecs.CodecUtil;
	import org.apache.lucene.codecs.PointsFormat;
	import org.apache.lucene.codecs.PointsReader;
	import org.apache.lucene.codecs.PointsWriter;
	import org.apache.lucene.index.SegmentReadState;
	import org.apache.lucene.index.SegmentWriteState;

	/**
	* Lucene 6.0 point format, which encodes dimensional values in a block KD-tree structure for fast
	* 1D range and N dimensional shape intersection filtering. See <a
	* href="https://www.cs.duke.edu/~pankaj/publications/papers/bkd-sstd.pdf">this paper</a> for
	* details.
	*
	* <p>This data structure is written as a series of blocks on disk, with an in-memory perfectly
	* balanced binary tree of split values referencing those blocks at the leaves.
	*
	* <p>The <code>.dim</code> file has both blocks and the index split values, for each field. The
	* file starts with {@link CodecUtil#writeIndexHeader}.
	*
	* <p>The blocks are written like this:
	*
	* <ul>
	* <li>count (vInt)
	* <li>delta-docID (vInt) <sup>count</sup> (delta coded docIDs, in sorted order)
	* <li>packedValue<sup>count</sup> (the <code>byte[]</code> value of each dimension packed into a
	* single <code>byte[]</code>)
	* </ul>
	*
	* <p>After all blocks for a field are written, then the index is written:
	*
	* <ul>
	* <li>numDims (vInt)
	* <li>maxPointsInLeafNode (vInt)
	* <li>bytesPerDim (vInt)
	* <li>count (vInt)
	* <li>packed index (byte[])
	* </ul>
	*
	* <p>The packed index uses hierarchical delta and prefix coding to compactly encode the file
	* pointer for all leaf blocks, once the tree is traversed, as well as the split dimension and split
	* value for each inner node of the tree.
	*
	* <p>After all fields' blocks + index data are written, {@link CodecUtil#writeFooter} writes the
	* checksum.
	*
	* <p>The <code>.dii</code> file records the file pointer in the <code>.dim</code> file where each
	* field's index data was written. It starts with {@link CodecUtil#writeIndexHeader}, then has:
	*
	* <ul>
	* <li>fieldCount (vInt)
	* <li>(fieldNumber (vInt), fieldFilePointer (vLong))<sup>fieldCount</sup>
	* </ul>
	*
	* <p>After all per-field entries are written, {@link CodecUtil#writeFooter} writes the
	* checksum.
	*
	* @lucene.experimental
	*/
	public class Lucene60PointsFormat extends PointsFormat {

	  /** Filename extension for the leaf blocks */
	  public static final String DATA_EXTENSION = "dim";

	  /** Filename extension for the index per field */
	  public static final String INDEX_EXTENSION = "dii";

	  // Codec name constants. NOTE(review): presumably these are the names checked in the headers of
	  // the data and index files -- confirm against Lucene60PointsReader.
	  static final String DATA_CODEC_NAME = "Lucene60PointsFormatData";
	  static final String META_CODEC_NAME = "Lucene60PointsFormatMeta";

	  // Data format versions: only one version exists, so the current version is the initial one.
	  static final int DATA_VERSION_START = 0;
	  static final int DATA_VERSION_CURRENT = DATA_VERSION_START;

	  // Index format versions: likewise, the current version is the initial one.
	  static final int INDEX_VERSION_START = 0;
	  static final int INDEX_VERSION_CURRENT = INDEX_VERSION_START;

	  /** Sole constructor */
	  public Lucene60PointsFormat() {}

	  /**
	   * Writing is not supported by this format.
	   *
	   * @param state the segment write state (unused)
	   * @throws UnsupportedOperationException always
	   */
	  @Override
	  public PointsWriter fieldsWriter(SegmentWriteState state) throws IOException {
	    final String message = "Old codecs may only be used for reading";
	    throw new UnsupportedOperationException(message);
	  }

	  /**
	   * Creates a reader for the points of the given segment.
	   *
	   * @param state the segment read state handed to the new reader
	   * @return a new {@link Lucene60PointsReader} constructed from {@code state}
	   */
	  @Override
	  public PointsReader fieldsReader(SegmentReadState state) throws IOException {
	    final PointsReader reader = new Lucene60PointsReader(state);
	    return reader;
	  }
	}