| /* |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package org.apache.lucene.tests.index; |
| |
| import java.io.ByteArrayOutputStream; |
| import java.io.IOException; |
| import java.io.PrintStream; |
| import java.util.ArrayList; |
| import java.util.Arrays; |
| import java.util.Collection; |
| import java.util.Collections; |
| import java.util.HashMap; |
| import java.util.HashSet; |
| import java.util.IdentityHashMap; |
| import java.util.Iterator; |
| import java.util.List; |
| import java.util.Map; |
| import java.util.Set; |
| import java.util.TreeSet; |
| import java.util.concurrent.ConcurrentHashMap; |
| import java.util.function.IntConsumer; |
| import org.apache.lucene.analysis.Analyzer; |
| import org.apache.lucene.codecs.Codec; |
| import org.apache.lucene.codecs.DocValuesConsumer; |
| import org.apache.lucene.codecs.DocValuesProducer; |
| import org.apache.lucene.codecs.FieldsConsumer; |
| import org.apache.lucene.codecs.FieldsProducer; |
| import org.apache.lucene.codecs.NormsConsumer; |
| import org.apache.lucene.codecs.NormsProducer; |
| import org.apache.lucene.codecs.StoredFieldsReader; |
| import org.apache.lucene.codecs.StoredFieldsWriter; |
| import org.apache.lucene.codecs.TermVectorsReader; |
| import org.apache.lucene.codecs.TermVectorsWriter; |
| import org.apache.lucene.codecs.simpletext.SimpleTextCodec; |
| import org.apache.lucene.document.Document; |
| import org.apache.lucene.document.Field; |
| import org.apache.lucene.document.FieldType; |
| import org.apache.lucene.document.NumericDocValuesField; |
| import org.apache.lucene.document.TextField; |
| import org.apache.lucene.index.DirectoryReader; |
| import org.apache.lucene.index.EmptyDocValuesProducer; |
| import org.apache.lucene.index.FieldInfo; |
| import org.apache.lucene.index.FieldInfos; |
| import org.apache.lucene.index.Fields; |
| import org.apache.lucene.index.IndexFileNames; |
| import org.apache.lucene.index.IndexReader; |
| import org.apache.lucene.index.IndexReaderContext; |
| import org.apache.lucene.index.IndexWriter; |
| import org.apache.lucene.index.IndexWriterConfig; |
| import org.apache.lucene.index.LeafReader; |
| import org.apache.lucene.index.MergePolicy; |
| import org.apache.lucene.index.NumericDocValues; |
| import org.apache.lucene.index.SegmentCommitInfo; |
| import org.apache.lucene.index.SegmentInfo; |
| import org.apache.lucene.index.SegmentInfos; |
| import org.apache.lucene.index.SegmentReadState; |
| import org.apache.lucene.index.SegmentWriteState; |
| import org.apache.lucene.index.SerialMergeScheduler; |
| import org.apache.lucene.index.Term; |
| import org.apache.lucene.index.Terms; |
| import org.apache.lucene.internal.tests.IndexWriterAccess; |
| import org.apache.lucene.internal.tests.TestSecrets; |
| import org.apache.lucene.store.AlreadyClosedException; |
| import org.apache.lucene.store.ChecksumIndexInput; |
| import org.apache.lucene.store.Directory; |
| import org.apache.lucene.store.FilterDirectory; |
| import org.apache.lucene.store.FlushInfo; |
| import org.apache.lucene.store.IOContext; |
| import org.apache.lucene.store.IndexInput; |
| import org.apache.lucene.store.IndexOutput; |
| import org.apache.lucene.tests.analysis.MockAnalyzer; |
| import org.apache.lucene.tests.store.MockDirectoryWrapper; |
| import org.apache.lucene.tests.util.LuceneTestCase; |
| import org.apache.lucene.tests.util.RamUsageTester; |
| import org.apache.lucene.tests.util.Rethrow; |
| import org.apache.lucene.tests.util.TestUtil; |
| import org.apache.lucene.util.BytesRef; |
| import org.apache.lucene.util.CloseableThreadLocal; |
| import org.apache.lucene.util.FixedBitSet; |
| import org.apache.lucene.util.IOUtils; |
| import org.apache.lucene.util.RamUsageEstimator; |
| import org.apache.lucene.util.StringHelper; |
| import org.apache.lucene.util.Version; |
| |
| /** |
| * Common tests for all index formats. |
| * |
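| * <p>Concrete subclasses plug in the codec under test via {@link #getCodec()} and populate |
| * documents via {@link #addRandomFields(Document)}. A minimal, hypothetical sketch (the class |
| * and codec names are illustrative only): |
| * |
| * <pre>{@code |
| * class TestMyFormat extends BaseIndexFileFormatTestCase { |
| *   protected Codec getCodec() { |
| *     return new MyCodec(); // assumed: the codec under test |
| *   } |
| * |
| *   protected void addRandomFields(Document doc) { |
| *     doc.add(new TextField("body", TestUtil.randomUnicodeString(random()), Field.Store.NO)); |
| *   } |
| * } |
| * }</pre> |
| */ |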
| abstract class BaseIndexFileFormatTestCase extends LuceneTestCase { |
| |
| private static final IndexWriterAccess INDEX_WRITER_ACCESS = TestSecrets.getIndexWriterAccess(); |
| |
| // metadata or Directory-level objects |
| private static final Set<Class<?>> EXCLUDED_CLASSES = |
| Collections.newSetFromMap(new IdentityHashMap<Class<?>, Boolean>()); |
| |
| static { |
| // Directory objects: don't take into account e.g. the NIO buffers |
| EXCLUDED_CLASSES.add(Directory.class); |
| EXCLUDED_CLASSES.add(IndexInput.class); |
| |
| // used for thread management, not by the index |
| EXCLUDED_CLASSES.add(CloseableThreadLocal.class); |
| EXCLUDED_CLASSES.add(ThreadLocal.class); |
| |
| // don't follow references to the top-level reader |
| EXCLUDED_CLASSES.add(IndexReader.class); |
| EXCLUDED_CLASSES.add(IndexReaderContext.class); |
| |
| // usually small but can bump memory usage for |
| // memory-efficient things like stored fields |
| EXCLUDED_CLASSES.add(FieldInfos.class); |
| EXCLUDED_CLASSES.add(SegmentInfo.class); |
| EXCLUDED_CLASSES.add(SegmentCommitInfo.class); |
| EXCLUDED_CLASSES.add(FieldInfo.class); |
| |
| // constant overhead is typically due to strings |
| // TODO: can we remove this and still pass the test consistently |
| EXCLUDED_CLASSES.add(String.class); |
| } |
| |
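| /** |
| * {@link RamUsageTester.Accumulator} that ignores instances of the excluded classes above (unless |
| * they are the root object), counts only one object reference per entry for collections and maps |
| * rather than their internal structure, and does not follow the Thread references that |
| * AssertingCodec adds. |
| */ |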
| static class Accumulator extends RamUsageTester.Accumulator { |
| |
| private final Object root; |
| |
| Accumulator(Object root) { |
| this.root = root; |
| } |
| |
| @Override |
| public long accumulateObject( |
| Object o, |
| long shallowSize, |
| Map<java.lang.reflect.Field, Object> fieldValues, |
| Collection<Object> queue) { |
| for (Class<?> clazz = o.getClass(); clazz != null; clazz = clazz.getSuperclass()) { |
| if (EXCLUDED_CLASSES.contains(clazz) && o != root) { |
| return 0; |
| } |
| } |
| // We have no way to estimate the size of these things in codecs, although |
| // something like a Collections.newSetFromMap(new HashMap<>()) uses quite |
| // a bit of memory. So for now the test ignores the overhead of such |
| // collections; can we do better? |
| long v; |
| if (o instanceof Collection) { |
| Collection<?> coll = (Collection<?>) o; |
| queue.addAll(coll); |
| v = (long) coll.size() * RamUsageEstimator.NUM_BYTES_OBJECT_REF; |
| } else if (o instanceof Map) { |
| final Map<?, ?> map = (Map<?, ?>) o; |
| queue.addAll(map.keySet()); |
| queue.addAll(map.values()); |
| v = 2L * map.size() * RamUsageEstimator.NUM_BYTES_OBJECT_REF; |
| } else { |
| List<Object> references = new ArrayList<>(); |
| v = super.accumulateObject(o, shallowSize, fieldValues, references); |
| for (Object r : references) { |
| // AssertingCodec adds Thread references to make sure objects are consumed in the right |
| // thread |
| if (r instanceof Thread == false) { |
| queue.add(r); |
| } |
| } |
| } |
| return v; |
| } |
| |
| @Override |
| public long accumulateArray( |
| Object array, long shallowSize, List<Object> values, Collection<Object> queue) { |
| long v = super.accumulateArray(array, shallowSize, values, queue); |
| // System.out.println(array.getClass() + "=" + v); |
| return v; |
| } |
| } |
| |
| /** Returns the codec to run tests against. */ |
| protected abstract Codec getCodec(); |
| |
| /** Returns the major version that this codec is compatible with. */ |
| protected int getCreatedVersionMajor() { |
| return Version.LATEST.major; |
| } |
| |
| /** Set the created version of the given {@link Directory} and return it. */ |
| protected final <D extends Directory> D applyCreatedVersionMajor(D d) throws IOException { |
| if (SegmentInfos.getLastCommitGeneration(d) != -1) { |
| throw new IllegalArgumentException( |
| "Cannot set the created version on a Directory that already has segments"); |
| } |
| if (getCreatedVersionMajor() != Version.LATEST.major || random().nextBoolean()) { |
| new SegmentInfos(getCreatedVersionMajor()).commit(d); |
| } |
| return d; |
| } |
| |
| private Codec savedCodec; |
| |
| @Override |
| public void setUp() throws Exception { |
| super.setUp(); |
| // set the default codec, so adding test cases to this isn't fragile |
| savedCodec = Codec.getDefault(); |
| Codec.setDefault(getCodec()); |
| } |
| |
| @Override |
| public void tearDown() throws Exception { |
| Codec.setDefault(savedCodec); // restore |
| super.tearDown(); |
| } |
| |
| /** Add random fields to the provided document. */ |
| protected abstract void addRandomFields(Document doc); |
| |
| private Map<String, Long> bytesUsedByExtension(Directory d) throws IOException { |
| Map<String, Long> bytesUsedByExtension = new HashMap<>(); |
| for (String file : d.listAll()) { |
| if (IndexFileNames.CODEC_FILE_PATTERN.matcher(file).matches()) { |
| final String ext = IndexFileNames.getExtension(file); |
| final long previousLength = bytesUsedByExtension.getOrDefault(ext, 0L); |
| bytesUsedByExtension.put(ext, previousLength + d.fileLength(file)); |
| } |
| } |
| bytesUsedByExtension.keySet().removeAll(excludedExtensionsFromByteCounts()); |
| |
| return bytesUsedByExtension; |
| } |
| |
| /** |
| * Return the list of extensions that should be excluded from byte counts when comparing indices |
| * that store the same content. |
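| * |
| * <p>Subclasses whose formats produce files that may legitimately differ between the two indices |
| * can extend this set; a hypothetical sketch (the "foo" extension is illustrative only): |
| * |
| * <pre>{@code |
| * protected Collection<String> excludedExtensionsFromByteCounts() { |
| *   Collection<String> excluded = new HashSet<>(super.excludedExtensionsFromByteCounts()); |
| *   excluded.add("foo"); // assumed: an extension whose files may legitimately differ |
| *   return excluded; |
| * } |
| * }</pre> |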
| */ |
| protected Collection<String> excludedExtensionsFromByteCounts() { |
| return new HashSet<String>( |
| Arrays.asList( |
| new String[] { |
| // segment infos store various pieces of information in the diagnostics that don't solely |
| // depend on the content of the index (such as a timestamp), so we exclude this file from |
| // the byte counts |
| "si", |
| // lock files are 0 bytes (one directory in the test could be RAMDir, the other FSDir) |
| "lock" |
| })); |
| } |
| |
| /** |
| * The purpose of this test is to make sure that bulk merge doesn't accumulate useless data over |
| * runs. |
| */ |
| public void testMergeStability() throws Exception { |
| assumeTrue("merge is not stable", mergeIsStable()); |
| Directory dir = applyCreatedVersionMajor(newDirectory()); |
| |
| // do not use newMergePolicy that might return a MockMergePolicy that ignores the no-CFS ratio |
| // do not use RIW which will change things up! |
| MergePolicy mp = newTieredMergePolicy(); |
| mp.setNoCFSRatio(0); |
| IndexWriterConfig cfg = |
| new IndexWriterConfig(new MockAnalyzer(random())) |
| .setUseCompoundFile(false) |
| .setMergePolicy(mp); |
| IndexWriter w = new IndexWriter(dir, cfg); |
| final int numDocs = atLeast(500); |
| for (int i = 0; i < numDocs; ++i) { |
| Document d = new Document(); |
| addRandomFields(d); |
| w.addDocument(d); |
| } |
| w.forceMerge(1); |
| w.commit(); |
| w.close(); |
| DirectoryReader reader = DirectoryReader.open(dir); |
| |
| Directory dir2 = applyCreatedVersionMajor(newDirectory()); |
| mp = newTieredMergePolicy(); |
| mp.setNoCFSRatio(0); |
| cfg = |
| new IndexWriterConfig(new MockAnalyzer(random())) |
| .setUseCompoundFile(false) |
| .setMergePolicy(mp); |
| w = new IndexWriter(dir2, cfg); |
| TestUtil.addIndexesSlowly(w, reader); |
| |
| w.commit(); |
| w.close(); |
| |
| assertEquals(bytesUsedByExtension(dir), bytesUsedByExtension(dir2)); |
| |
| reader.close(); |
| dir.close(); |
| dir2.close(); |
| } |
| |
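| /** |
| * Whether merging the same content is expected to be stable and produce the same amount of data; |
| * {@link #testMergeStability()} is skipped when this returns {@code false}. |
| */ |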
| protected boolean mergeIsStable() { |
| return true; |
| } |
| |
| /** Calls close() multiple times on closeable codec APIs. */ |
| public void testMultiClose() throws IOException { |
| // first make a one doc index |
| Directory oneDocIndex = applyCreatedVersionMajor(newDirectory()); |
| IndexWriter iw = |
| new IndexWriter(oneDocIndex, new IndexWriterConfig(new MockAnalyzer(random()))); |
| Document oneDoc = new Document(); |
| FieldType customType = new FieldType(TextField.TYPE_STORED); |
| customType.setStoreTermVectors(true); |
| Field customField = new Field("field", "contents", customType); |
| oneDoc.add(customField); |
| oneDoc.add(new NumericDocValuesField("field", 5)); |
| iw.addDocument(oneDoc); |
| LeafReader oneDocReader = getOnlyLeafReader(DirectoryReader.open(iw)); |
| iw.close(); |
| |
| // now feed to codec APIs manually |
| // we use FSDir; things like a RAM directory are not guaranteed to cause failures if you write |
| // to them after close(), etc. |
| Directory dir = newFSDirectory(createTempDir("justSoYouGetSomeChannelErrors")); |
| Codec codec = getCodec(); |
| |
| SegmentInfo segmentInfo = |
| new SegmentInfo( |
| dir, |
| Version.LATEST, |
| Version.LATEST, |
| "_0", |
| 1, |
| false, |
| codec, |
| Collections.emptyMap(), |
| StringHelper.randomId(), |
| Collections.emptyMap(), |
| null); |
| FieldInfo proto = oneDocReader.getFieldInfos().fieldInfo("field"); |
| FieldInfo field = |
| new FieldInfo( |
| proto.name, |
| proto.number, |
| proto.hasVectors(), |
| proto.omitsNorms(), |
| proto.hasPayloads(), |
| proto.getIndexOptions(), |
| proto.getDocValuesType(), |
| proto.getDocValuesGen(), |
| new HashMap<>(), |
| proto.getPointDimensionCount(), |
| proto.getPointIndexDimensionCount(), |
| proto.getPointNumBytes(), |
| proto.getVectorDimension(), |
| proto.getVectorEncoding(), |
| proto.getVectorSimilarityFunction(), |
| proto.isSoftDeletesField()); |
| |
| FieldInfos fieldInfos = new FieldInfos(new FieldInfo[] {field}); |
| |
| SegmentWriteState writeState = |
| new SegmentWriteState( |
| null, dir, segmentInfo, fieldInfos, null, new IOContext(new FlushInfo(1, 20))); |
| |
| SegmentReadState readState = new SegmentReadState(dir, segmentInfo, fieldInfos, IOContext.READ); |
| |
| // PostingsFormat |
| NormsProducer fakeNorms = |
| new NormsProducer() { |
| |
| @Override |
| public void close() throws IOException {} |
| |
| @Override |
| public NumericDocValues getNorms(FieldInfo field) throws IOException { |
| if (field.hasNorms() == false) { |
| return null; |
| } |
| return oneDocReader.getNormValues(field.name); |
| } |
| |
| @Override |
| public void checkIntegrity() throws IOException {} |
| }; |
| try (FieldsConsumer consumer = codec.postingsFormat().fieldsConsumer(writeState)) { |
| final Fields fields = |
| new Fields() { |
| TreeSet<String> indexedFields = |
| new TreeSet<>(FieldInfos.getIndexedFields(oneDocReader)); |
| |
| @Override |
| public Iterator<String> iterator() { |
| return indexedFields.iterator(); |
| } |
| |
| @Override |
| public Terms terms(String field) throws IOException { |
| return oneDocReader.terms(field); |
| } |
| |
| @Override |
| public int size() { |
| return indexedFields.size(); |
| } |
| }; |
| consumer.write(fields, fakeNorms); |
| IOUtils.close(consumer); |
| IOUtils.close(consumer); |
| } |
| try (FieldsProducer producer = codec.postingsFormat().fieldsProducer(readState)) { |
| IOUtils.close(producer); |
| IOUtils.close(producer); |
| } |
| |
| // DocValuesFormat |
| try (DocValuesConsumer consumer = codec.docValuesFormat().fieldsConsumer(writeState)) { |
| consumer.addNumericField( |
| field, |
| new EmptyDocValuesProducer() { |
| @Override |
| public NumericDocValues getNumeric(FieldInfo field) { |
| return new NumericDocValues() { |
| int docID = -1; |
| |
| @Override |
| public int docID() { |
| return docID; |
| } |
| |
| @Override |
| public int nextDoc() { |
| docID++; |
| if (docID == 1) { |
| docID = NO_MORE_DOCS; |
| } |
| return docID; |
| } |
| |
| @Override |
| public int advance(int target) { |
| if (docID <= 0 && target == 0) { |
| docID = 0; |
| } else { |
| docID = NO_MORE_DOCS; |
| } |
| return docID; |
| } |
| |
| @Override |
| public boolean advanceExact(int target) throws IOException { |
| docID = target; |
| return target == 0; |
| } |
| |
| @Override |
| public long cost() { |
| return 1; |
| } |
| |
| @Override |
| public long longValue() { |
| return 5; |
| } |
| }; |
| } |
| }); |
| IOUtils.close(consumer); |
| IOUtils.close(consumer); |
| } |
| try (DocValuesProducer producer = codec.docValuesFormat().fieldsProducer(readState)) { |
| IOUtils.close(producer); |
| IOUtils.close(producer); |
| } |
| |
| // NormsFormat |
| try (NormsConsumer consumer = codec.normsFormat().normsConsumer(writeState)) { |
| consumer.addNormsField( |
| field, |
| new NormsProducer() { |
| @Override |
| public NumericDocValues getNorms(FieldInfo field) { |
| return new NumericDocValues() { |
| int docID = -1; |
| |
| @Override |
| public int docID() { |
| return docID; |
| } |
| |
| @Override |
| public int nextDoc() { |
| docID++; |
| if (docID == 1) { |
| docID = NO_MORE_DOCS; |
| } |
| return docID; |
| } |
| |
| @Override |
| public int advance(int target) { |
| if (docID <= 0 && target == 0) { |
| docID = 0; |
| } else { |
| docID = NO_MORE_DOCS; |
| } |
| return docID; |
| } |
| |
| @Override |
| public boolean advanceExact(int target) throws IOException { |
| docID = target; |
| return target == 0; |
| } |
| |
| @Override |
| public long cost() { |
| return 1; |
| } |
| |
| @Override |
| public long longValue() { |
| return 5; |
| } |
| }; |
| } |
| |
| @Override |
| public void checkIntegrity() {} |
| |
| @Override |
| public void close() {} |
| }); |
| IOUtils.close(consumer); |
| IOUtils.close(consumer); |
| } |
| try (NormsProducer producer = codec.normsFormat().normsProducer(readState)) { |
| IOUtils.close(producer); |
| IOUtils.close(producer); |
| } |
| |
| // TermVectorsFormat |
| try (TermVectorsWriter consumer = |
| codec.termVectorsFormat().vectorsWriter(dir, segmentInfo, writeState.context)) { |
| consumer.startDocument(1); |
| consumer.startField(field, 1, false, false, false); |
| consumer.startTerm(new BytesRef("testing"), 2); |
| consumer.finishTerm(); |
| consumer.finishField(); |
| consumer.finishDocument(); |
| consumer.finish(1); |
| IOUtils.close(consumer); |
| IOUtils.close(consumer); |
| } |
| try (TermVectorsReader producer = |
| codec.termVectorsFormat().vectorsReader(dir, segmentInfo, fieldInfos, readState.context)) { |
| IOUtils.close(producer); |
| IOUtils.close(producer); |
| } |
| |
| // StoredFieldsFormat |
| try (StoredFieldsWriter consumer = |
| codec.storedFieldsFormat().fieldsWriter(dir, segmentInfo, writeState.context)) { |
| consumer.startDocument(); |
| consumer.writeField(field, customField); |
| consumer.finishDocument(); |
| consumer.finish(1); |
| IOUtils.close(consumer); |
| IOUtils.close(consumer); |
| } |
| try (StoredFieldsReader producer = |
| codec.storedFieldsFormat().fieldsReader(dir, segmentInfo, fieldInfos, readState.context)) { |
| IOUtils.close(producer); |
| IOUtils.close(producer); |
| } |
| |
| IOUtils.close(oneDocReader, oneDocIndex, dir); |
| } |
| |
| /** Tests exception handling on write and openInput/createOutput. */ |
| // TODO: this is really not ideal. each BaseXXXTestCase should have unit tests doing this. |
| // but we use this shotgun approach to prevent bugs in the meantime: it just ensures the |
| // codec does not corrupt the index or leak file handles. |
| public void testRandomExceptions() throws Exception { |
| // disable slow things: we don't rely upon sleeps here. |
| MockDirectoryWrapper dir = applyCreatedVersionMajor(newMockDirectory()); |
| dir.setThrottling(MockDirectoryWrapper.Throttling.NEVER); |
| dir.setUseSlowOpenClosers(false); |
| dir.setRandomIOExceptionRate(0.001); // more rare |
| |
| // log all exceptions we hit, in case we fail (for debugging) |
| ByteArrayOutputStream exceptionLog = new ByteArrayOutputStream(); |
| PrintStream exceptionStream = new PrintStream(exceptionLog, true, "UTF-8"); |
| // PrintStream exceptionStream = System.out; |
| |
| Analyzer analyzer = new MockAnalyzer(random()); |
| |
| IndexWriterConfig conf = newIndexWriterConfig(analyzer); |
| // just for now, try to keep this test reproducible |
| conf.setMergeScheduler(new SerialMergeScheduler()); |
| conf.setCodec(getCodec()); |
| |
| int numDocs = atLeast(500); |
| |
| IndexWriter iw = new IndexWriter(dir, conf); |
| try { |
| boolean allowAlreadyClosed = false; |
| for (int i = 0; i < numDocs; i++) { |
| dir.setRandomIOExceptionRateOnOpen(0.02); // turn on exceptions for openInput/createOutput |
| |
| Document doc = new Document(); |
| doc.add(newStringField("id", Integer.toString(i), Field.Store.NO)); |
| addRandomFields(doc); |
| |
| // single doc |
| try { |
| iw.addDocument(doc); |
| // we made it, sometimes delete our doc |
| iw.deleteDocuments(new Term("id", Integer.toString(i))); |
| } catch ( |
| @SuppressWarnings("unused") |
| AlreadyClosedException ace) { |
| // OK: writer was closed by abort; we just reopen now: |
| dir.setRandomIOExceptionRateOnOpen( |
| 0.0); // disable exceptions on openInput until next iteration |
| assertTrue(INDEX_WRITER_ACCESS.isDeleterClosed(iw)); |
| assertTrue(allowAlreadyClosed); |
| allowAlreadyClosed = false; |
| conf = newIndexWriterConfig(analyzer); |
| // just for now, try to keep this test reproducible |
| conf.setMergeScheduler(new SerialMergeScheduler()); |
| conf.setCodec(getCodec()); |
| iw = new IndexWriter(dir, conf); |
| } catch (IOException e) { |
| handleFakeIOException(e, exceptionStream); |
| allowAlreadyClosed = true; |
| } |
| |
| if (random().nextInt(10) == 0) { |
| // trigger flush: |
| try { |
| if (random().nextBoolean()) { |
| DirectoryReader ir = null; |
| try { |
| ir = DirectoryReader.open(iw, random().nextBoolean(), false); |
| dir.setRandomIOExceptionRateOnOpen( |
| 0.0); // disable exceptions on openInput until next iteration |
| TestUtil.checkReader(ir); |
| } finally { |
| IOUtils.closeWhileHandlingException(ir); |
| } |
| } else { |
| dir.setRandomIOExceptionRateOnOpen( |
| 0.0); // disable exceptions on openInput until next iteration: |
| // or we make slowExists angry and trip a scarier assert! |
| iw.commit(); |
| } |
| if (DirectoryReader.indexExists(dir)) { |
| TestUtil.checkIndex(dir); |
| } |
| } catch ( |
| @SuppressWarnings("unused") |
| AlreadyClosedException ace) { |
| // OK: writer was closed by abort; we just reopen now: |
| dir.setRandomIOExceptionRateOnOpen( |
| 0.0); // disable exceptions on openInput until next iteration |
| assertTrue(INDEX_WRITER_ACCESS.isDeleterClosed(iw)); |
| assertTrue(allowAlreadyClosed); |
| allowAlreadyClosed = false; |
| conf = newIndexWriterConfig(analyzer); |
| // just for now, try to keep this test reproducible |
| conf.setMergeScheduler(new SerialMergeScheduler()); |
| conf.setCodec(getCodec()); |
| iw = new IndexWriter(dir, conf); |
| } catch (IOException e) { |
| handleFakeIOException(e, exceptionStream); |
| allowAlreadyClosed = true; |
| } |
| } |
| } |
| |
| try { |
| dir.setRandomIOExceptionRateOnOpen( |
| 0.0); // disable exceptions on openInput until next iteration: |
| // or we make slowExists angry and trip a scarier assert! |
| iw.close(); |
| } catch (IOException e) { |
| handleFakeIOException(e, exceptionStream); |
| try { |
| iw.rollback(); |
| } catch ( |
| @SuppressWarnings("unused") |
| Throwable t) { |
| } |
| } |
| dir.close(); |
| } catch (Throwable t) { |
| System.out.println("Unexpected exception: dumping fake-exception-log:..."); |
| exceptionStream.flush(); |
| System.out.println(exceptionLog.toString("UTF-8")); |
| System.out.flush(); |
| Rethrow.rethrow(t); |
| } |
| |
| if (VERBOSE) { |
| System.out.println("TEST PASSED: dumping fake-exception-log:..."); |
| System.out.println(exceptionLog.toString("UTF-8")); |
| } |
| } |
| |
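| /** |
| * Logs the exception to the given stream if it is (or wraps) one of the random IOExceptions |
| * injected by {@link MockDirectoryWrapper}; any other exception is rethrown. |
| */ |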
| private void handleFakeIOException(IOException e, PrintStream exceptionStream) { |
| Throwable ex = e; |
| while (ex != null) { |
| if (ex.getMessage() != null && ex.getMessage().startsWith("a random IOException")) { |
| exceptionStream.println("\nTEST: got expected fake exc:" + ex.getMessage()); |
| ex.printStackTrace(exceptionStream); |
| return; |
| } |
| ex = ex.getCause(); |
| } |
| |
| Rethrow.rethrow(e); |
| } |
| |
| /** |
| * Returns {@code false} if only the regular fields reader should be tested, and {@code true} if |
| * only the merge instance should be tested. |
| */ |
| protected boolean shouldTestMergeInstance() { |
| return false; |
| } |
| |
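| /** |
| * Wraps the given reader with a {@link MergingDirectoryReaderWrapper} when {@link |
| * #shouldTestMergeInstance()} returns {@code true}, so that the merge instances of the format |
| * readers are exercised. |
| */ |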
| protected final DirectoryReader maybeWrapWithMergingReader(DirectoryReader r) throws IOException { |
| if (shouldTestMergeInstance()) { |
| r = new MergingDirectoryReaderWrapper(r); |
| } |
| return r; |
| } |
| |
| /** A directory that tracks created files that haven't been deleted. */ |
| protected static class FileTrackingDirectoryWrapper extends FilterDirectory { |
| |
| private final Set<String> files = |
| Collections.newSetFromMap(new ConcurrentHashMap<String, Boolean>()); |
| |
| /** Sole constructor. */ |
| FileTrackingDirectoryWrapper(Directory in) { |
| super(in); |
| } |
| |
| /** Get the set of created files. */ |
| public Set<String> getFiles() { |
| return Set.copyOf(files); |
| } |
| |
| @Override |
| public IndexOutput createOutput(String name, IOContext context) throws IOException { |
| files.add(name); |
| return super.createOutput(name, context); |
| } |
| |
| @Override |
| public void rename(String source, String dest) throws IOException { |
| files.remove(source); |
| files.add(dest); |
| super.rename(source, dest); |
| } |
| |
| @Override |
| public void deleteFile(String name) throws IOException { |
| files.remove(name); |
| super.deleteFile(name); |
| } |
| } |
| |
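| /** |
| * {@link IndexInput} wrapper that reports the file offset of every byte that is read to the |
| * provided consumer. |
| */ |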
| private static class ReadBytesIndexInputWrapper extends IndexInput { |
| |
| private final IndexInput in; |
| private final IntConsumer readByte; |
| |
| ReadBytesIndexInputWrapper(IndexInput in, IntConsumer readByte) { |
| super(in.toString()); |
| this.in = in; |
| this.readByte = readByte; |
| } |
| |
| @Override |
| public IndexInput clone() { |
| return new ReadBytesIndexInputWrapper(in.clone(), readByte); |
| } |
| |
| @Override |
| public void close() throws IOException { |
| in.close(); |
| } |
| |
| @Override |
| public long getFilePointer() { |
| return in.getFilePointer(); |
| } |
| |
| @Override |
| public void seek(long pos) throws IOException { |
| in.seek(pos); |
| } |
| |
| @Override |
| public long length() { |
| return in.length(); |
| } |
| |
| @Override |
| public IndexInput slice(String sliceDescription, long offset, long length) throws IOException { |
| IndexInput slice = in.slice(sliceDescription, offset, length); |
| return new ReadBytesIndexInputWrapper( |
| slice, o -> readByte.accept(Math.toIntExact(offset + o))); |
| } |
| |
| @Override |
| public byte readByte() throws IOException { |
| readByte.accept(Math.toIntExact(getFilePointer())); |
| return in.readByte(); |
| } |
| |
| @Override |
| public void readBytes(byte[] b, int offset, int len) throws IOException { |
| final int fp = Math.toIntExact(getFilePointer()); |
| for (int i = 0; i < len; ++i) { |
| readByte.accept(Math.addExact(fp, i)); |
| } |
| in.readBytes(b, offset, len); |
| } |
| } |
| |
| /** A directory that tracks read bytes. */ |
| protected static class ReadBytesDirectoryWrapper extends FilterDirectory { |
| |
| /** Sole constructor. */ |
| public ReadBytesDirectoryWrapper(Directory in) { |
| super(in); |
| } |
| |
| private final Map<String, FixedBitSet> readBytes = new ConcurrentHashMap<>(); |
| |
| /** Get information about which bytes have been read. */ |
| public Map<String, FixedBitSet> getReadBytes() { |
| return Map.copyOf(readBytes); |
| } |
| |
| @Override |
| public IndexInput openInput(String name, IOContext context) throws IOException { |
| IndexInput in = super.openInput(name, context); |
| final FixedBitSet set = |
| readBytes.computeIfAbsent(name, n -> new FixedBitSet(Math.toIntExact(in.length()))); |
| if (set.length() != in.length()) { |
| throw new IllegalStateException(); |
| } |
| return new ReadBytesIndexInputWrapper(in, set::set); |
| } |
| |
| @Override |
| public ChecksumIndexInput openChecksumInput(String name, IOContext context) throws IOException { |
| ChecksumIndexInput in = super.openChecksumInput(name, context); |
| final FixedBitSet set = |
| readBytes.computeIfAbsent(name, n -> new FixedBitSet(Math.toIntExact(in.length()))); |
| if (set.length() != in.length()) { |
| throw new IllegalStateException(); |
| } |
| return new ChecksumIndexInput(in.toString()) { |
| |
| @Override |
| public void readBytes(byte[] b, int offset, int len) throws IOException { |
| final int fp = Math.toIntExact(getFilePointer()); |
| set.set(fp, Math.addExact(fp, len)); |
| in.readBytes(b, offset, len); |
| } |
| |
| @Override |
| public byte readByte() throws IOException { |
| set.set(Math.toIntExact(getFilePointer())); |
| return in.readByte(); |
| } |
| |
| @Override |
| public IndexInput slice(String sliceDescription, long offset, long length) |
| throws IOException { |
| throw new UnsupportedOperationException(); |
| } |
| |
| @Override |
| public long length() { |
| return in.length(); |
| } |
| |
| @Override |
| public long getFilePointer() { |
| return in.getFilePointer(); |
| } |
| |
| @Override |
| public void close() throws IOException { |
| in.close(); |
| } |
| |
| @Override |
| public long getChecksum() throws IOException { |
| return in.getChecksum(); |
| } |
| }; |
| } |
| |
| @Override |
| public IndexOutput createOutput(String name, IOContext context) throws IOException { |
| throw new UnsupportedOperationException(); |
| } |
| |
| @Override |
| public IndexOutput createTempOutput(String prefix, String suffix, IOContext context) |
| throws IOException { |
| throw new UnsupportedOperationException(); |
| } |
| } |
| |
| /** |
| * This test is a best effort at verifying that checkIntegrity doesn't miss any files. It tests |
| * that the combination of opening a reader and calling checkIntegrity on it reads all bytes of |
| * all files. |
| */ |
| public void testCheckIntegrityReadsAllBytes() throws Exception { |
| assumeFalse( |
| "SimpleText doesn't store checksums of its files", getCodec() instanceof SimpleTextCodec); |
| FileTrackingDirectoryWrapper dir = new FileTrackingDirectoryWrapper(newDirectory()); |
| applyCreatedVersionMajor(dir); |
| |
| IndexWriterConfig cfg = new IndexWriterConfig(new MockAnalyzer(random())); |
| IndexWriter w = new IndexWriter(dir, cfg); |
| final int numDocs = atLeast(100); |
| for (int i = 0; i < numDocs; ++i) { |
| Document d = new Document(); |
| addRandomFields(d); |
| w.addDocument(d); |
| } |
| w.forceMerge(1); |
| w.commit(); |
| w.close(); |
| |
| ReadBytesDirectoryWrapper readBytesWrapperDir = new ReadBytesDirectoryWrapper(dir); |
| IndexReader reader = DirectoryReader.open(readBytesWrapperDir); |
| LeafReader leafReader = getOnlyLeafReader(reader); |
| leafReader.checkIntegrity(); |
| |
| Map<String, FixedBitSet> readBytesMap = readBytesWrapperDir.getReadBytes(); |
| |
| Set<String> unreadFiles = new HashSet<>(dir.getFiles()); |
| System.out.println(Arrays.toString(dir.listAll())); |
| unreadFiles.removeAll(readBytesMap.keySet()); |
| unreadFiles.remove(IndexWriter.WRITE_LOCK_NAME); |
| assertTrue("Some files have not been open: " + unreadFiles, unreadFiles.isEmpty()); |
| |
| List<String> messages = new ArrayList<>(); |
| for (Map.Entry<String, FixedBitSet> entry : readBytesMap.entrySet()) { |
| String name = entry.getKey(); |
| FixedBitSet unreadBytes = entry.getValue().clone(); |
| unreadBytes.flip(0, unreadBytes.length()); |
| int unread = unreadBytes.nextSetBit(0); |
| if (unread != Integer.MAX_VALUE) { |
| messages.add( |
| "Offset " |
| + unread |
| + " of file " |
| + name |
| + "(" |
| + unreadBytes.length() |
| + "bytes) was not read."); |
| } |
| } |
| assertTrue(String.join("\n", messages), messages.isEmpty()); |
| reader.close(); |
| dir.close(); |
| } |
| } |