exec/java-exec/src/main/java/org/apache/drill/exec/physical/impl/xsort/ExternalSortBatch.java - drill - Git at Google

 /*
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  * http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
 package org.apache.drill.exec.physical.impl.xsort;

 import java.io.IOException;
 import java.util.Collection;
 import java.util.Iterator;
 import java.util.LinkedList;
 import java.util.List;
 import java.util.Set;
 import java.util.concurrent.TimeUnit;

 import org.apache.drill.shaded.guava.com.google.common.collect.Sets;
 import org.apache.calcite.rel.RelFieldCollation.Direction;
 import org.apache.drill.common.AutoCloseables;
 import org.apache.drill.common.config.DrillConfig;
 import org.apache.drill.common.exceptions.UserException;
 import org.apache.drill.common.expression.ErrorCollector;
 import org.apache.drill.common.expression.ErrorCollectorImpl;
 import org.apache.drill.common.expression.LogicalExpression;
 import org.apache.drill.common.expression.SchemaPath;
 import org.apache.drill.common.logical.data.Order.Ordering;
 import org.apache.drill.exec.ExecConstants;
 import org.apache.drill.exec.compile.sig.GeneratorMapping;
 import org.apache.drill.exec.compile.sig.MappingSet;
 import org.apache.drill.exec.exception.ClassTransformationException;
 import org.apache.drill.exec.exception.OutOfMemoryException;
 import org.apache.drill.exec.exception.SchemaChangeException;
 import org.apache.drill.exec.expr.ClassGenerator;
 import org.apache.drill.exec.expr.ClassGenerator.HoldingContainer;
 import org.apache.drill.exec.expr.CodeGenerator;
 import org.apache.drill.exec.expr.ExpressionTreeMaterializer;
 import org.apache.drill.exec.expr.TypeHelper;
 import org.apache.drill.exec.expr.fn.FunctionGenerationHelper;
 import org.apache.drill.exec.memory.BufferAllocator;
 import org.apache.drill.exec.ops.FragmentContext;
 import org.apache.drill.exec.ops.MetricDef;
 import org.apache.drill.exec.physical.config.ExternalSort;
 import org.apache.drill.exec.physical.impl.sort.RecordBatchData;
 import org.apache.drill.exec.physical.impl.sort.SortRecordBatchBuilder;
 import org.apache.drill.exec.proto.ExecProtos.FragmentHandle;
 import org.apache.drill.exec.proto.helper.QueryIdHelper;
 import org.apache.drill.exec.record.AbstractRecordBatch;
 import org.apache.drill.exec.record.BatchSchema;
 import org.apache.drill.exec.record.BatchSchema.SelectionVectorMode;
 import org.apache.drill.exec.record.MaterializedField;
 import org.apache.drill.exec.record.RecordBatch;
 import org.apache.drill.exec.record.SchemaUtil;
 import org.apache.drill.exec.record.VectorAccessible;
 import org.apache.drill.exec.record.VectorContainer;
 import org.apache.drill.exec.record.VectorWrapper;
 import org.apache.drill.exec.record.WritableBatch;
 import org.apache.drill.exec.record.selection.SelectionVector2;
 import org.apache.drill.exec.record.selection.SelectionVector4;
 import org.apache.drill.exec.testing.ControlsInjector;
 import org.apache.drill.exec.testing.ControlsInjectorFactory;
 import org.apache.drill.exec.vector.CopyUtil;
 import org.apache.drill.exec.vector.ValueVector;
 import org.apache.drill.exec.vector.complex.AbstractContainerVector;
 import org.apache.hadoop.conf.Configuration;
 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.Path;

 import org.apache.drill.shaded.guava.com.google.common.base.Joiner;
 import org.apache.drill.shaded.guava.com.google.common.base.Stopwatch;
 import org.apache.drill.shaded.guava.com.google.common.collect.Iterators;
 import org.apache.drill.shaded.guava.com.google.common.collect.Lists;
 import com.sun.codemodel.JConditional;
 import com.sun.codemodel.JExpr;

 public class ExternalSortBatch extends AbstractRecordBatch<ExternalSort> {
   private static final org.slf4j.Logger logger = org.slf4j.LoggerFactory.getLogger(ExternalSortBatch.class);
   private static final ControlsInjector injector = ControlsInjectorFactory.getInjector(ExternalSortBatch.class);

   private static final GeneratorMapping COPIER_MAPPING = new GeneratorMapping("doSetup", "doCopy", null, null);
   private final MappingSet MAIN_MAPPING = new MappingSet( (String) null, null, ClassGenerator.DEFAULT_SCALAR_MAP, ClassGenerator.DEFAULT_SCALAR_MAP);
   private final MappingSet LEFT_MAPPING = new MappingSet("leftIndex", null, ClassGenerator.DEFAULT_SCALAR_MAP, ClassGenerator.DEFAULT_SCALAR_MAP);
   private final MappingSet RIGHT_MAPPING = new MappingSet("rightIndex", null, ClassGenerator.DEFAULT_SCALAR_MAP, ClassGenerator.DEFAULT_SCALAR_MAP);
   private final MappingSet COPIER_MAPPING_SET = new MappingSet(COPIER_MAPPING, COPIER_MAPPING);

   private final int SPILL_BATCH_GROUP_SIZE;
   private final int SPILL_THRESHOLD;
   private final Iterator<String> dirs;
   private final RecordBatch incoming;
   private final BufferAllocator oAllocator;
   private final BufferAllocator copierAllocator;

   private BatchSchema schema;
   private SingleBatchSorter sorter;
   private SortRecordBatchBuilder builder;
   private MSorter mSorter;
   /**
    * A single PriorityQueueCopier instance is used for 2 purposes:
    * 1. Merge sorted batches before spilling
    * 2. Merge sorted batches when all incoming data fits in memory
    */
   private PriorityQueueCopier copier;
   private LinkedList<BatchGroup> batchGroups = Lists.newLinkedList();
   private LinkedList<BatchGroup> spilledBatchGroups = Lists.newLinkedList();
   private SelectionVector4 sv4;
   private FileSystem fs;
   private int spillCount = 0;
   private int batchesSinceLastSpill = 0;
   private boolean first = true;
   private int targetRecordCount;
   private final String fileName;
   private final Set<Path> currSpillDirs = Sets.newTreeSet();
   private int firstSpillBatchCount = 0;
   private int peakNumBatches = -1;

   /**
    * The copier uses the COPIER_BATCH_MEM_LIMIT to estimate the target
    * number of records to return in each batch.
    */
   private static final int COPIER_BATCH_MEM_LIMIT = 256 * 1024;

   public static final String INTERRUPTION_AFTER_SORT = "after-sort";
   public static final String INTERRUPTION_AFTER_SETUP = "after-setup";
   public static final String INTERRUPTION_WHILE_SPILLING = "spilling";

   // Be careful here! This enum is used in TWO places! First, it is used
   // in this code to build up metrics. Easy enough. But, it is also used
   // in OperatorMetricRegistry to define the metrics for the
   // operator ID defined in CoreOperatorType. As a result, the values
   // defined here are shared between this legacy version AND the new
   // managed version. (Though the new, managed version has its own
   // copy of this enum.) The two enums MUST be identical.

   public enum Metric implements MetricDef {
     SPILL_COUNT,            // number of times operator spilled to disk
     RETIRED1,               // Was: peak value for totalSizeInMemory
                             // But operator already provides this value
     PEAK_BATCHES_IN_MEMORY, // maximum number of batches kept in memory
     MERGE_COUNT,            // Used only by the managed version.
     MIN_BUFFER,             // Used only by the managed version.
     INPUT_BATCHES;          // Used only by the managed version.

     @Override
     public int metricId() {
       return ordinal();
     }
   }

   public ExternalSortBatch(ExternalSort popConfig, FragmentContext context, RecordBatch incoming) throws OutOfMemoryException {
     super(popConfig, context, true);
     this.incoming = incoming;
     DrillConfig config = context.getConfig();
     Configuration conf = new Configuration();
     conf.set(FileSystem.FS_DEFAULT_NAME_KEY, config.getString(ExecConstants.EXTERNAL_SORT_SPILL_FILESYSTEM));
     try {
       this.fs = FileSystem.get(conf);
     } catch (IOException e) {
       throw new RuntimeException(e);
     }
     SPILL_BATCH_GROUP_SIZE = config.getInt(ExecConstants.EXTERNAL_SORT_SPILL_GROUP_SIZE);
     SPILL_THRESHOLD = config.getInt(ExecConstants.EXTERNAL_SORT_SPILL_THRESHOLD);
     dirs = Iterators.cycle(config.getStringList(ExecConstants.EXTERNAL_SORT_SPILL_DIRS));
     oAllocator = oContext.getAllocator();
     copierAllocator = oAllocator.newChildAllocator(oAllocator.getName() + ":copier",
         PriorityQueueCopier.INITIAL_ALLOCATION, PriorityQueueCopier.MAX_ALLOCATION);
     FragmentHandle handle = context.getHandle();
     fileName = String.format("%s_majorfragment%s_minorfragment%s_operator%s", QueryIdHelper.getQueryId(handle.getQueryId()),
         handle.getMajorFragmentId(), handle.getMinorFragmentId(), popConfig.getOperatorId());
   }

   @Override
   public int getRecordCount() {
     if (sv4 != null) {
       return sv4.getCount();
     }
     return container.getRecordCount();
   }

   @Override
   public SelectionVector4 getSelectionVector4() {
     return sv4;
   }

   private void closeBatchGroups(Collection<BatchGroup> groups) {
     for (BatchGroup group: groups) {
       try {
         group.close();
       } catch (Exception e) {
         // collect all failure and make sure to cleanup all remaining batches
         // Originally we would have thrown a RuntimeException that would propagate to FragmentExecutor.closeOutResources()
         // where it would have been passed to context.fail()
         // passing the exception directly to context.fail(e) will let the cleanup process continue instead of stopping
         // right away, this will also make sure we collect any additional exception we may get while cleaning up
         context.getExecutorState().fail(e);
       }
     }
   }

   @Override
   public void close() {
     try {
       if (batchGroups != null) {
         closeBatchGroups(batchGroups);
         batchGroups = null;
       }
       if (spilledBatchGroups != null) {
         closeBatchGroups(spilledBatchGroups);
         spilledBatchGroups = null;
       }
     } finally {
       if (builder != null) {
         builder.clear();
         builder.close();
       }
       if (sv4 != null) {
         sv4.clear();
       }

       try {
         if (copier != null) {
           copier.close();
         }
       } catch (IOException e) {
         throw new RuntimeException(e);
       } finally {
         copierAllocator.close();
         super.close();

         if (mSorter != null) {
           mSorter.clear();
         }
         for(Iterator<Path> iter = this.currSpillDirs.iterator(); iter.hasNext(); iter.remove()) {
             Path path = iter.next();
             try {
                 if (fs != null && path != null && fs.exists(path)) {
                     if (fs.delete(path, true)) {
                         fs.cancelDeleteOnExit(path);
                     }
                 }
             } catch (IOException e) {
                 // since this is meant to be used in a batches's cleanup, we don't propagate the exception
                 logger.warn("Unable to delete spill directory " + path,  e);
             }
         }
       }

     }


   }

   @Override
   public void buildSchema() throws SchemaChangeException {
     IterOutcome outcome = next(incoming);
     switch (outcome) {
       case OK:
       case OK_NEW_SCHEMA:
         for (VectorWrapper<?> w : incoming) {
           ValueVector v = container.addOrGet(w.getField());
           if (v instanceof AbstractContainerVector) {
             w.getValueVector().makeTransferPair(v); // Can we remove this hack?
             v.clear();
           }
           v.allocateNew(); // Can we remove this? - SVR fails with NPE (TODO)
         }
         container.buildSchema(SelectionVectorMode.NONE);
         container.setRecordCount(0);
         break;
       case STOP:
         state = BatchState.STOP;
         break;
       case NONE:
         state = BatchState.DONE;
         break;
       default:
         break;
     }
   }

   @Override
   public IterOutcome innerNext() {
     if (schema != null) {
       if (spillCount == 0) {
         return (getSelectionVector4().next()) ? IterOutcome.OK : IterOutcome.NONE;
       } else {
         Stopwatch w = Stopwatch.createStarted();
         int count = copier.next(targetRecordCount);
         if (count > 0) {
           long t = w.elapsed(TimeUnit.MICROSECONDS);
           logger.debug("Took {} us to merge {} records", t, count);
           container.setRecordCount(count);
           return IterOutcome.OK;
         } else {
           logger.debug("copier returned 0 records");
           return IterOutcome.NONE;
         }
       }
     }

     int totalCount = 0;
     int totalBatches = 0; // total number of batches received so far

     try{
       container.clear();
       outer: while (true) {
         IterOutcome upstream;
         if (first) {
           upstream = IterOutcome.OK_NEW_SCHEMA;
         } else {
           upstream = next(incoming);
         }
         if (upstream == IterOutcome.OK && sorter == null) {
           upstream = IterOutcome.OK_NEW_SCHEMA;
         }
         switch (upstream) {
         case NONE:
           if (first) {
             return upstream;
           }
           break outer;
         case NOT_YET:
           throw new UnsupportedOperationException();
         case STOP:
           return upstream;
         case OK_NEW_SCHEMA:
         case OK:
           VectorContainer convertedBatch;
           // only change in the case that the schema truly changes.  Artificial schema changes are ignored.
           if (upstream == IterOutcome.OK_NEW_SCHEMA && !incoming.getSchema().equals(schema)) {
             if (schema != null) {
               if (unionTypeEnabled) {
                 this.schema = SchemaUtil.mergeSchemas(schema, incoming.getSchema());
               } else {
                 throw new SchemaChangeException("Schema changes not supported in External Sort. Please enable Union type");
               }
             } else {
               schema = incoming.getSchema();
             }
             convertedBatch = SchemaUtil.coerceContainer(incoming, schema, oContext);
             for (BatchGroup b : batchGroups) {
               b.setSchema(schema);
             }
             for (BatchGroup b : spilledBatchGroups) {
               b.setSchema(schema);
             }
             this.sorter = createNewSorter(context, convertedBatch);
           } else {
             convertedBatch = SchemaUtil.coerceContainer(incoming, schema, oContext);
           }
           if (first) {
             first = false;
           }
           if (convertedBatch.getRecordCount() == 0) {
             for (VectorWrapper<?> w : convertedBatch) {
               w.clear();
             }
             break;
           }
           SelectionVector2 sv2;
           if (incoming.getSchema().getSelectionVectorMode() == BatchSchema.SelectionVectorMode.TWO_BYTE) {
             sv2 = incoming.getSelectionVector2().clone();
           } else {
             try {
               sv2 = newSV2();
             } catch(InterruptedException e) {
               return IterOutcome.STOP;
             } catch (OutOfMemoryException e) {
               throw new OutOfMemoryException(e);
             }
           }

           int count = sv2.getCount();
           totalCount += count;
           totalBatches++;
           sorter.setup(context, sv2, convertedBatch);
           sorter.sort(sv2);
           RecordBatchData rbd = new RecordBatchData(convertedBatch, oAllocator);
           boolean success = false;
           try {
             rbd.setSv2(sv2);
             batchGroups.add(new BatchGroup(rbd.getContainer(), rbd.getSv2(), oContext));
             if (peakNumBatches < batchGroups.size()) {
               peakNumBatches = batchGroups.size();
               stats.setLongStat(Metric.PEAK_BATCHES_IN_MEMORY, peakNumBatches);
             }

             batchesSinceLastSpill++;
             if (// If we haven't spilled so far, do we have enough memory for MSorter if this turns out to be the last incoming batch?
                 (spillCount == 0 && !hasMemoryForInMemorySort(totalCount)) ||
                 // If we haven't spilled so far, make sure we don't exceed the maximum number of batches SV4 can address
                 (spillCount == 0 && totalBatches > Character.MAX_VALUE) ||
                 // TODO(DRILL-4438) - consider setting this threshold more intelligently,
                 // lowering caused a failing low memory condition (test in BasicPhysicalOpUnitTest)
                 // to complete successfully (although it caused perf decrease as there was more spilling)

                 // current memory used is more than 95% of memory usage limit of this operator
                 (oAllocator.getAllocatedMemory() > .95 * oAllocator.getLimit()) ||
                 // Number of incoming batches (BatchGroups) exceed the limit and number of incoming batches accumulated
                 // since the last spill exceed the defined limit
                 (batchGroups.size() > SPILL_THRESHOLD && batchesSinceLastSpill >= SPILL_BATCH_GROUP_SIZE)) {

               if (firstSpillBatchCount == 0) {
                 firstSpillBatchCount = batchGroups.size();
               }

               if (spilledBatchGroups.size() > firstSpillBatchCount / 2) {
                 logger.info("Merging spills");
                 final BatchGroup merged = mergeAndSpill(spilledBatchGroups);
                 if (merged != null) {
                   spilledBatchGroups.addFirst(merged);
                 }
               }
               final BatchGroup merged = mergeAndSpill(batchGroups);
               if (merged != null) { // make sure we don't add null to spilledBatchGroups
                 spilledBatchGroups.add(merged);
                 batchesSinceLastSpill = 0;
               }
             }
             success = true;
           } finally {
             if (!success) {
               rbd.clear();
             }
           }
           break;
         default:
           throw new UnsupportedOperationException();
         }
       }

       if (totalCount == 0) {
         return IterOutcome.NONE;
       }
       if (spillCount == 0) {

         if (builder != null) {
           builder.clear();
           builder.close();
         }
         builder = new SortRecordBatchBuilder(oAllocator);

         for (BatchGroup group : batchGroups) {
           RecordBatchData rbd = new RecordBatchData(group.getContainer(), oAllocator);
           rbd.setSv2(group.getSv2());
           builder.add(rbd);
         }

         builder.build(container);
         sv4 = builder.getSv4();
         mSorter = createNewMSorter();
         mSorter.setup(context, oAllocator, getSelectionVector4(), this.container);

         // For testing memory-leak purpose, inject exception after mSorter finishes setup
         injector.injectUnchecked(context.getExecutionControls(), INTERRUPTION_AFTER_SETUP);
         mSorter.sort(this.container);

         // sort may have prematurely exited due to should continue returning false.
         if (!context.getExecutorState().shouldContinue()) {
           return IterOutcome.STOP;
         }

         // For testing memory-leak purpose, inject exception after mSorter finishes sorting
         injector.injectUnchecked(context.getExecutionControls(), INTERRUPTION_AFTER_SORT);
         sv4 = mSorter.getSV4();

         container.buildSchema(SelectionVectorMode.FOUR_BYTE);
       } else { // some batches were spilled
         final BatchGroup merged = mergeAndSpill(batchGroups);
         if (merged != null) {
           spilledBatchGroups.add(merged);
         }
         batchGroups.addAll(spilledBatchGroups);
         spilledBatchGroups = null; // no need to cleanup spilledBatchGroups, all it's batches are in batchGroups now

         logger.warn("Starting to merge. {} batch groups. Current allocated memory: {}", batchGroups.size(), oAllocator.getAllocatedMemory());
         VectorContainer hyperBatch = constructHyperBatch(batchGroups);
         createCopier(hyperBatch, batchGroups, container, false);

         int estimatedRecordSize = 0;
         for (VectorWrapper<?> w : batchGroups.get(0)) {
           try {
             estimatedRecordSize += TypeHelper.getSize(w.getField().getType());
           } catch (UnsupportedOperationException e) {
             estimatedRecordSize += 50;
           }
         }
         targetRecordCount = Math.min(MAX_BATCH_ROW_COUNT, Math.max(1, COPIER_BATCH_MEM_LIMIT / estimatedRecordSize));
         int count = copier.next(targetRecordCount);
         container.buildSchema(SelectionVectorMode.NONE);
         container.setRecordCount(count);
       }

       return IterOutcome.OK_NEW_SCHEMA;

     } catch (SchemaChangeException ex) {
       kill(false);
       context.getExecutorState().fail(UserException.unsupportedError(ex)
         .message("Sort doesn't currently support sorts with changing schemas").build(logger));
       return IterOutcome.STOP;
     } catch(ClassTransformationException | IOException ex) {
       kill(false);
       context.getExecutorState().fail(ex);
       return IterOutcome.STOP;
     } catch (UnsupportedOperationException e) {
       throw new RuntimeException(e);
     }
   }

   private boolean hasMemoryForInMemorySort(int currentRecordCount) {
     long currentlyAvailable =  popConfig.getMaxAllocation() - oAllocator.getAllocatedMemory();

     long neededForInMemorySort = SortRecordBatchBuilder.memoryNeeded(currentRecordCount) +
         MSortTemplate.memoryNeeded(currentRecordCount);

     return currentlyAvailable > neededForInMemorySort;
   }

   public BatchGroup mergeAndSpill(LinkedList<BatchGroup> batchGroups) throws SchemaChangeException {
     logger.debug("Copier allocator current allocation {}", copierAllocator.getAllocatedMemory());
     logger.debug("mergeAndSpill: starting total size in memory = {}", oAllocator.getAllocatedMemory());
     VectorContainer outputContainer = new VectorContainer();
     List<BatchGroup> batchGroupList = Lists.newArrayList();
     int batchCount = batchGroups.size();
     for (int i = 0; i < batchCount / 2; i++) {
       if (batchGroups.size() == 0) {
         break;
       }
       BatchGroup batch = batchGroups.pollLast();
       assert batch != null : "Encountered a null batch during merge and spill operation";
       batchGroupList.add(batch);
     }

     if (batchGroupList.size() == 0) {
       return null;
     }
     int estimatedRecordSize = 0;
     for (VectorWrapper<?> w : batchGroupList.get(0)) {
       try {
         estimatedRecordSize += TypeHelper.getSize(w.getField().getType());
       } catch (UnsupportedOperationException e) {
         estimatedRecordSize += 50;
       }
     }
     int targetRecordCount = Math.max(1, COPIER_BATCH_MEM_LIMIT / estimatedRecordSize);
     VectorContainer hyperBatch = constructHyperBatch(batchGroupList);
     createCopier(hyperBatch, batchGroupList, outputContainer, true);

     int count = copier.next(targetRecordCount);
     assert count > 0;

     logger.debug("mergeAndSpill: estimated record size = {}, target record count = {}", estimatedRecordSize, targetRecordCount);

     // 1 output container is kept in memory, so we want to hold on to it and transferClone
     // allows keeping ownership
     VectorContainer c1 = VectorContainer.getTransferClone(outputContainer, oContext);
     c1.buildSchema(BatchSchema.SelectionVectorMode.NONE);
     c1.setRecordCount(count);

     String spillDir = dirs.next();
     Path currSpillPath = new Path(Joiner.on("/").join(spillDir, fileName));
     currSpillDirs.add(currSpillPath);
     String outputFile = Joiner.on("/").join(currSpillPath, spillCount++);
     try {
         fs.deleteOnExit(currSpillPath);
     } catch (IOException e) {
         // since this is meant to be used in a batches's spilling, we don't propagate the exception
         logger.warn("Unable to mark spill directory " + currSpillPath + " for deleting on exit", e);
     }
     stats.setLongStat(Metric.SPILL_COUNT, spillCount);
     BatchGroup newGroup = new BatchGroup(c1, fs, outputFile, oContext);
     try (AutoCloseable a = AutoCloseables.all(batchGroupList)) {
       logger.info("Merging and spilling to {}", outputFile);
       while ((count = copier.next(targetRecordCount)) > 0) {
         outputContainer.buildSchema(BatchSchema.SelectionVectorMode.NONE);
         outputContainer.setRecordCount(count);
         // note that addBatch also clears the outputContainer
         newGroup.addBatch(outputContainer);
       }
       injector.injectChecked(context.getExecutionControls(), INTERRUPTION_WHILE_SPILLING, IOException.class);
       newGroup.closeOutputStream();
     } catch (Throwable e) {
       // we only need to cleanup newGroup if spill failed
       try {
         AutoCloseables.close(e, newGroup);
       } catch (Throwable t) { /* close() may hit the same IO issue; just ignore */ }
       throw UserException.resourceError(e)
         .message("External Sort encountered an error while spilling to disk")
               .addContext(e.getMessage() /* more detail */)
         .build(logger);
     } finally {
       hyperBatch.clear();
     }
     logger.debug("mergeAndSpill: final total size in memory = {}", oAllocator.getAllocatedMemory());
     logger.info("Completed spilling to {}", outputFile);
     return newGroup;
   }

   private SelectionVector2 newSV2() throws OutOfMemoryException, InterruptedException {
     @SuppressWarnings("resource")
     SelectionVector2 sv2 = new SelectionVector2(oAllocator);
     if (!sv2.allocateNewSafe(incoming.getRecordCount())) {
       try {
         final BatchGroup merged = mergeAndSpill(batchGroups);
         if (merged != null) {
           spilledBatchGroups.add(merged);
         } else {
           throw UserException.memoryError("Unable to allocate sv2 for %d records, and not enough batchGroups to spill.",
               incoming.getRecordCount())
             .addContext("batchGroups.size", batchGroups.size())
             .addContext("spilledBatchGroups.size", spilledBatchGroups.size())
             .addContext("allocated memory", oAllocator.getAllocatedMemory())
             .addContext("allocator limit", oAllocator.getLimit())
             .build(logger);
         }
       } catch (SchemaChangeException e) {
         throw new RuntimeException(e);
       }
       int waitTime = 1;
       while (true) {
         try {
           Thread.sleep(waitTime * 1000);
         } catch(final InterruptedException e) {
           if (!context.getExecutorState().shouldContinue()) {
             throw e;
           }
         }
         waitTime *= 2;
         if (sv2.allocateNewSafe(incoming.getRecordCount())) {
           break;
         }
         if (waitTime >= 32) {
           throw new OutOfMemoryException("Unable to allocate sv2 buffer after repeated attempts");
         }
       }
     }
     for (int i = 0; i < incoming.getRecordCount(); i++) {
       sv2.setIndex(i, (char) i);
     }
     sv2.setRecordCount(incoming.getRecordCount());
     return sv2;
   }

   private VectorContainer constructHyperBatch(List<BatchGroup> batchGroupList) {
     VectorContainer cont = new VectorContainer();
     for (MaterializedField field : schema) {
       ValueVector[] vectors = new ValueVector[batchGroupList.size()];
       int i = 0;
       for (BatchGroup group : batchGroupList) {
         vectors[i++] = group.getValueAccessorById(
             field.getValueClass(),
             group.getValueVectorId(SchemaPath.getSimplePath(field.getName())).getFieldIds())
             .getValueVector();
       }
       cont.add(vectors);
     }
     cont.buildSchema(BatchSchema.SelectionVectorMode.FOUR_BYTE);
     return cont;
   }

   private MSorter createNewMSorter() throws ClassTransformationException, IOException, SchemaChangeException {
     return createNewMSorter(context, this.popConfig.getOrderings(), this, MAIN_MAPPING, LEFT_MAPPING, RIGHT_MAPPING);
   }

   private MSorter createNewMSorter(FragmentContext context, List<Ordering> orderings, VectorAccessible batch, MappingSet mainMapping, MappingSet leftMapping, MappingSet
     rightMapping)
           throws ClassTransformationException, IOException, SchemaChangeException {
     CodeGenerator<MSorter> cg = CodeGenerator.get(MSorter.TEMPLATE_DEFINITION, context.getOptions());
     ClassGenerator<MSorter> g = cg.getRoot();
     g.setMappingSet(mainMapping);

     for (Ordering od : orderings) {
       // first, we rewrite the evaluation stack for each side of the comparison.
       ErrorCollector collector = new ErrorCollectorImpl();
       final LogicalExpression expr = ExpressionTreeMaterializer.materialize(od.getExpr(), batch, collector, context.getFunctionRegistry());
       if (collector.hasErrors()) {
         throw new SchemaChangeException("Failure while materializing expression. " + collector.toErrorString());
       }
       g.setMappingSet(leftMapping);
       HoldingContainer left = g.addExpr(expr, ClassGenerator.BlkCreateMode.FALSE);
       g.setMappingSet(rightMapping);
       HoldingContainer right = g.addExpr(expr, ClassGenerator.BlkCreateMode.FALSE);
       g.setMappingSet(mainMapping);

       // next we wrap the two comparison sides and add the expression block for the comparison.
       LogicalExpression fh =
           FunctionGenerationHelper.getOrderingComparator(od.nullsSortHigh(), left, right,
                                                          context.getFunctionRegistry());
       HoldingContainer out = g.addExpr(fh, ClassGenerator.BlkCreateMode.FALSE);
       JConditional jc = g.getEvalBlock()._if(out.getValue().ne(JExpr.lit(0)));

       if (od.getDirection() == Direction.ASCENDING) {
         jc._then()._return(out.getValue());
       }else{
         jc._then()._return(out.getValue().minus());
       }
       g.rotateBlock();
     }

     g.rotateBlock();
     g.getEvalBlock()._return(JExpr.lit(0));

     cg.plainJavaCapable(true); // This class can generate plain-old Java.
     // Uncomment out this line to debug the generated code.
 //    cg.saveCodeForDebugging(true);
     return context.getImplementationClass(cg);
   }

   public SingleBatchSorter createNewSorter(FragmentContext context, VectorAccessible batch)
           throws ClassTransformationException, IOException, SchemaChangeException {
     CodeGenerator<SingleBatchSorter> cg = CodeGenerator.get(SingleBatchSorter.TEMPLATE_DEFINITION, context.getOptions());
     cg.plainJavaCapable(true); // This class can generate plain-old Java.

     // Uncomment out this line to debug the generated code.
 //    cg.saveCodeForDebugging(true);
     generateComparisons(cg.getRoot(), batch);
     return context.getImplementationClass(cg);
   }

   private void generateComparisons(ClassGenerator<?> g, VectorAccessible batch) throws SchemaChangeException {
     g.setMappingSet(MAIN_MAPPING);

     for (Ordering od : popConfig.getOrderings()) {
       // first, we rewrite the evaluation stack for each side of the comparison.
       ErrorCollector collector = new ErrorCollectorImpl();
       final LogicalExpression expr = ExpressionTreeMaterializer.materialize(od.getExpr(), batch, collector,context.getFunctionRegistry());
       if (collector.hasErrors()) {
         throw new SchemaChangeException("Failure while materializing expression. " + collector.toErrorString());
       }
       g.setMappingSet(LEFT_MAPPING);
       HoldingContainer left = g.addExpr(expr, ClassGenerator.BlkCreateMode.FALSE);
       g.setMappingSet(RIGHT_MAPPING);
       HoldingContainer right = g.addExpr(expr, ClassGenerator.BlkCreateMode.FALSE);
       g.setMappingSet(MAIN_MAPPING);

       // next we wrap the two comparison sides and add the expression block for the comparison.
       LogicalExpression fh =
           FunctionGenerationHelper.getOrderingComparator(od.nullsSortHigh(), left, right,
                                                          context.getFunctionRegistry());
       HoldingContainer out = g.addExpr(fh, ClassGenerator.BlkCreateMode.FALSE);
       JConditional jc = g.getEvalBlock()._if(out.getValue().ne(JExpr.lit(0)));

       if (od.getDirection() == Direction.ASCENDING) {
         jc._then()._return(out.getValue());
       }else{
         jc._then()._return(out.getValue().minus());
       }
       g.rotateBlock();
     }

     g.rotateBlock();
     g.getEvalBlock()._return(JExpr.lit(0));
   }

   private void createCopier(VectorAccessible batch, List<BatchGroup> batchGroupList, VectorContainer outputContainer, boolean spilling) throws SchemaChangeException {
     try {
       if (copier == null) {
         CodeGenerator<PriorityQueueCopier> cg = CodeGenerator.get(PriorityQueueCopier.TEMPLATE_DEFINITION, context.getOptions());
         cg.plainJavaCapable(true);
         // Uncomment out this line to debug the generated code.
 //        cg.saveCodeForDebugging(true);
         ClassGenerator<PriorityQueueCopier> g = cg.getRoot();

         generateComparisons(g, batch);

         g.setMappingSet(COPIER_MAPPING_SET);
         CopyUtil.generateCopies(g, batch, true);
         g.setMappingSet(MAIN_MAPPING);
         copier = context.getImplementationClass(cg);
       } else {
         copier.close();
       }

       BufferAllocator allocator = spilling ? copierAllocator : oAllocator;
       for (VectorWrapper<?> i : batch) {
         ValueVector v = TypeHelper.getNewVector(i.getField(), allocator);
         outputContainer.add(v);
       }
       copier.setup(context, allocator, batch, batchGroupList, outputContainer);
     } catch (ClassTransformationException | IOException e) {
       throw new RuntimeException(e);
     }
   }


   @Override
   public WritableBatch getWritableBatch() {
     throw new UnsupportedOperationException("A sort batch is not writable.");
   }

   @Override
   protected void killIncoming(boolean sendUpstream) {
     incoming.kill(sendUpstream);
   }

   @Override
   public void dump() {
     logger.error("ExternalSortBatch[schema={}, sorter={}, mSorter={}, container={}]", schema, sorter, mSorter, container);
   }
 }