blob: 2ecbcb97ca2159f19c7bf72913fd8bfd10604106 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.drill.exec.physical.impl.xsort;
import org.apache.drill.common.config.DrillConfig;
import org.apache.drill.exec.ExecConstants;
import org.apache.drill.exec.server.options.OptionManager;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
 * Holds the tuning parameters used by the sort code in this package.
 * Every value is read once, in the constructor, from the supplied
 * {@link DrillConfig} and {@link OptionManager}, sanitized against the
 * minimums declared below, and then exposed through read-only accessors.
 * All fields are final.
 */
public class SortConfig {
  private static final Logger logger = LoggerFactory.getLogger(SortConfig.class);

  /**
   * Smallest allowed output batch size. The smallest output batch
   * created even under constrained memory conditions.
   * (Not referenced inside this class.)
   */
  public static final int MIN_MERGED_BATCH_SIZE = 256 * 1024;

  /**
   * In the bizarre case where the user gave us an unrealistically low
   * spill file size, set a floor at some bare minimum size. (Note that,
   * at this size, big queries will create a huge number of files, which
   * is why the configuration default is on the order of hundreds of MB.)
   */
  public static final long MIN_SPILL_FILE_SIZE = 1 * 1024 * 1024;

  /** Spill batch size constant, 8 MiB. (Not referenced inside this class.) */
  public static final int DEFAULT_SPILL_BATCH_SIZE = 8 * 1024 * 1024;

  /** Floor applied to the configured spill batch size, 256 KiB. */
  public static final int MIN_SPILL_BATCH_SIZE = 256 * 1024;

  /** Floor applied to the merge (output) batch size option, 256 KiB. */
  public static final int MIN_MERGE_BATCH_SIZE = 256 * 1024;

  /** Merge limit constant. (Not referenced inside this class.) */
  public static final int DEFAULT_MERGE_LIMIT = 128;

  /** Floor applied to a positive configured merge limit. */
  public static final int MIN_MERGE_LIMIT = 2;

  /**
   * Configured memory limit, taken as-is from the configuration.
   */
  private final long maxMemory;

  /**
   * Maximum number of spilled runs that can be merged in a single pass.
   */
  private final int mergeLimit;

  /**
   * Target size of the first-generation spill files.
   */
  private final long spillFileSize;

  /**
   * Spill batch size in bytes, kept within
   * [{@link #MIN_SPILL_BATCH_SIZE}, {@link Integer#MAX_VALUE}].
   */
  private final int spillBatchSize;

  /**
   * Merge batch size in bytes, kept within
   * [{@link #MIN_MERGE_BATCH_SIZE}, {@link Integer#MAX_VALUE}].
   */
  private final int mergeBatchSize;

  /**
   * Limit on in-memory batches; {@link Integer#MAX_VALUE} when the
   * configured value is 0.
   */
  private final int bufferedBatchLimit;

  /**
   * Limit the size of the in-memory merge return batches.
   * Primarily for testing.
   */
  private final int mSortBatchSize;

  /**
   * Reads and sanitizes the sort settings.
   *
   * @param config source of the boot-time settings (memory limit, merge
   *        limit, spill file size, spill batch size, batch limit and the
   *        optional in-memory sort batch size)
   * @param options source of the output batch size option
   */
  public SortConfig(DrillConfig config, OptionManager options) {

    // Optional configured memory limit, typically used only for testing.
    maxMemory = config.getBytes(ExecConstants.EXTERNAL_SORT_MAX_MEMORY);

    // Optional limit on the number of spilled runs to merge in a single
    // pass. Limits the number of open file handles. Must allow at least
    // two batches to merge to make progress. A non-positive setting
    // means "no limit".
    final int configuredMergeLimit = config.getInt(ExecConstants.EXTERNAL_SORT_MERGE_LIMIT);
    if (configuredMergeLimit > 0) {
      mergeLimit = Math.max(configuredMergeLimit, MIN_MERGE_LIMIT);
    } else {
      mergeLimit = Integer.MAX_VALUE;
    }

    // Limits the size of first-generation spill files.
    // Ensure the size is reasonable.
    spillFileSize = Math.max(
        config.getBytes(ExecConstants.EXTERNAL_SORT_SPILL_FILE_SIZE),
        MIN_SPILL_FILE_SIZE);

    // The configured byte count is a long while the field is an int.
    // Clamp before narrowing: a bare (int) cast would wrap a setting of
    // 2 GiB or more into a negative or zero size, defeating the floor.
    spillBatchSize = clampToInt(
        config.getBytes(ExecConstants.EXTERNAL_SORT_SPILL_BATCH_SIZE),
        MIN_SPILL_BATCH_SIZE);

    // Size of the batch sent downstream from the sort operator during
    // the merge phase: the output batch size option, but never smaller
    // than MIN_MERGE_BATCH_SIZE and never larger than what fits an int.
    // Don't change defaults unless you know what you are doing,
    // larger sizes can result in memory fragmentation, smaller sizes
    // in excessive operator iterator overhead.
    // NOTE(review): an earlier comment cited a 16M default for this
    // option; confirm against the option's definition.
    mergeBatchSize = clampToInt(
        options.getOption(ExecConstants.OUTPUT_BATCH_SIZE_VALIDATOR),
        MIN_MERGE_BATCH_SIZE);

    // Limit on in-memory batches, primarily for testing. Zero means
    // "no limit"; any other value is raised to at least 2.
    final int configuredBatchLimit = config.getInt(ExecConstants.EXTERNAL_SORT_BATCH_LIMIT);
    if (configuredBatchLimit == 0) {
      bufferedBatchLimit = Integer.MAX_VALUE;
    } else {
      bufferedBatchLimit = Math.max(configuredBatchLimit, 2);
    }

    // Limit on memory merge batch size; primarily for testing. When set,
    // the value is forced into the range [1, Character.MAX_VALUE];
    // when absent, Character.MAX_VALUE is used.
    if (config.hasPath(ExecConstants.EXTERNAL_SORT_MSORT_MAX_BATCHSIZE)) {
      mSortBatchSize = Math.max(1,
          Math.min(Character.MAX_VALUE,
              config.getInt(ExecConstants.EXTERNAL_SORT_MSORT_MAX_BATCHSIZE)));
    } else {
      mSortBatchSize = Character.MAX_VALUE;
    }

    logConfig();
  }

  /**
   * Narrows a byte count to an {@code int} without wrap-around.
   *
   * @param value the requested size
   * @param floor the smallest acceptable result
   * @return {@code value} limited to the range
   *         [{@code floor}, {@link Integer#MAX_VALUE}]
   */
  private static int clampToInt(long value, int floor) {
    return (int) Math.min(Integer.MAX_VALUE, Math.max(value, floor));
  }

  /** Writes the spill and batch size settings to the debug log. */
  private void logConfig() {
    logger.debug("Config: " +
                 "spill file size = {}, spill batch size = {}, " +
                 "merge batch size = {}, mSort batch size = {}",
                 spillFileSize, spillBatchSize,
                 mergeBatchSize, mSortBatchSize);
  }

  /**
   * @return a one-line summary of the spill file size and the three
   *         batch sizes
   */
  @Override
  public String toString() {
    return "SortConfig[spillFileSize=" + spillFileSize
        + ", spillBatchSize=" + spillBatchSize
        + ", mergeBatchSize=" + mergeBatchSize
        + ", mSortBatchSize=" + mSortBatchSize
        + "]";
  }

  /** @return the configured memory limit */
  public long maxMemory() { return maxMemory; }

  /** @return the maximum number of spilled runs to merge in one pass */
  public int mergeLimit() { return mergeLimit; }

  /** @return the target size of first-generation spill files */
  public long spillFileSize() { return spillFileSize; }

  /** @return the spill batch size, at least {@link #MIN_SPILL_BATCH_SIZE} */
  public int spillBatchSize() { return spillBatchSize; }

  /** @return the merge batch size, at least {@link #MIN_MERGE_BATCH_SIZE} */
  public int mergeBatchSize() { return mergeBatchSize; }

  /** @return the limit on in-memory batches */
  public int getBufferedBatchLimit() { return bufferedBatchLimit; }

  /** @return the limit on the in-memory merge batch size */
  public int getMSortBatchSize() { return mSortBatchSize; }
}